diff --git "a/wandb/run-20220301_041848-29zl3b4i/files/wandb-summary.json" "b/wandb/run-20220301_041848-29zl3b4i/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220301_041848-29zl3b4i/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.3507, "train/learning_rate": 2.982e-05, "train/epoch": 0.56, "train/global_step": 500, "_runtime": 3841, "_timestamp": 1646112170, "_step": 500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 309.0, 696.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-90.60092163085938, -73.09754180908203, -55.59416198730469, -38.090782165527344, -20.58740234375, -3.0840225219726562, 14.419357299804688, 31.92273712158203, 49.426116943359375, 66.92949676513672, 84.43287658691406, 101.9362564086914, 119.43963623046875, 136.94302368164062, 154.44639587402344, 171.94976806640625, 189.45315551757812, 206.95654296875, 224.4599151611328, 241.96328735351562, 259.4666748046875, 276.9700622558594, 294.47344970703125, 311.976806640625, 329.4801940917969, 346.98358154296875, 364.4869384765625, 381.9903259277344, 399.49371337890625, 416.9971008300781, 434.50048828125, 452.00384521484375, 469.5072021484375, 487.0105895996094, 504.51397705078125, 522.017333984375, 539.520751953125, 557.0241088867188, 574.5274658203125, 592.0308837890625, 609.5342407226562, 627.03759765625, 644.541015625, 662.0443725585938, 679.5477294921875, 697.0511474609375, 714.5545043945312, 732.0579223632812, 749.561279296875, 767.0646362304688, 784.5680541992188, 802.0714111328125, 819.5748291015625, 837.0781860351562, 854.58154296875, 872.0849609375, 889.5883178710938, 907.0916748046875, 924.5950927734375, 942.0984497070312, 959.601806640625, 977.105224609375, 994.6085815429688, 1012.1119995117188, 1029.6153564453125]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 2.0, 6.0, 4.0, 9.0, 9.0, 13.0, 19.0, 9.0, 17.0, 22.0, 25.0, 27.0, 24.0, 37.0, 33.0, 35.0, 32.0, 48.0, 71.0, 47.0, 51.0, 45.0, 39.0, 40.0, 38.0, 35.0, 37.0, 31.0, 41.0, 27.0, 25.0, 16.0, 24.0, 12.0, 12.0, 9.0, 7.0, 5.0, 7.0, 4.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-70.16863250732422, -67.6971435546875, -65.22566223144531, -62.75417709350586, -60.282691955566406, -57.81120681762695, -55.3397216796875, -52.86823654174805, -50.396751403808594, -47.92526626586914, -45.45378112792969, -42.982295989990234, -40.51081085205078, -38.03932571411133, -35.567840576171875, -33.09635543823242, -30.62487030029297, -28.153385162353516, -25.681900024414062, -23.21041488647461, -20.738929748535156, -18.267444610595703, -15.79595947265625, -13.324474334716797, -10.852989196777344, -8.38150405883789, -5.9100189208984375, -3.4385337829589844, -0.9670486450195312, 1.5044364929199219, 3.975921630859375, 6.447406768798828, 8.918891906738281, 11.390377044677734, 13.861862182617188, 16.33334732055664, 18.804832458496094, 21.276317596435547, 23.747802734375, 26.219287872314453, 28.690773010253906, 31.16225814819336, 33.63374328613281, 36.105228424072266, 38.57671356201172, 41.04819869995117, 43.519683837890625, 45.99116897583008, 48.46265411376953, 50.934139251708984, 53.40562438964844, 55.87710952758789, 58.348594665527344, 60.8200798034668, 63.29156494140625, 65.76304626464844, 68.23453521728516, 70.70602416992188, 73.17750549316406, 75.64898681640625, 78.12047576904297, 80.59196472167969, 83.06344604492188, 85.53492736816406, 88.00641632080078]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 1.0, 3.0, 7.0, 10.0, 15.0, 27.0, 28.0, 28.0, 33.0, 44.0, 48.0, 53.0, 78.0, 81.0, 78.0, 68.0, 74.0, 54.0, 52.0, 46.0, 52.0, 32.0, 21.0, 24.0, 22.0, 10.0, 10.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -3.9495849609375, -3.727294921875, -3.5050048828125, -3.28271484375, -3.0604248046875, -2.838134765625, -2.6158447265625, -2.3935546875, -2.1712646484375, -1.948974609375, -1.7266845703125, -1.50439453125, -1.2821044921875, -1.059814453125, -0.8375244140625, -0.615234375, -0.3929443359375, -0.170654296875, 0.0516357421875, 0.27392578125, 0.4962158203125, 0.718505859375, 0.9407958984375, 1.1630859375, 1.3853759765625, 1.607666015625, 1.8299560546875, 2.05224609375, 2.2745361328125, 2.496826171875, 2.7191162109375, 2.94140625, 3.1636962890625, 3.385986328125, 3.6082763671875, 3.83056640625, 4.0528564453125, 4.275146484375, 4.4974365234375, 4.7197265625, 4.9420166015625, 5.164306640625, 5.3865966796875, 5.60888671875, 5.8311767578125, 6.053466796875, 6.2757568359375, 6.498046875, 6.7203369140625, 6.942626953125, 7.1649169921875, 7.38720703125, 7.6094970703125, 7.831787109375, 8.0540771484375, 8.2763671875, 8.4986572265625, 8.720947265625, 8.9432373046875, 9.16552734375, 9.3878173828125, 9.610107421875, 9.8323974609375, 10.0546875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 7.0, 13.0, 19.0, 7.0, 28.0, 67.0, 77.0, 138.0, 195.0, 319.0, 539.0, 1136.0, 2314.0, 5781.0, 20138.0, 127831.0, 2548164.0, 1393212.0, 71898.0, 13751.0, 4522.0, 1905.0, 898.0, 511.0, 296.0, 161.0, 123.0, 79.0, 43.0, 42.0, 22.0, 9.0, 13.0, 9.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.4779052734375, -10.869873046875, -10.2618408203125, -9.65380859375, -9.0457763671875, -8.437744140625, -7.8297119140625, -7.2216796875, -6.6136474609375, -6.005615234375, -5.3975830078125, -4.78955078125, -4.1815185546875, -3.573486328125, -2.9654541015625, -2.357421875, -1.7493896484375, -1.141357421875, -0.5333251953125, 0.07470703125, 0.6827392578125, 1.290771484375, 1.8988037109375, 2.5068359375, 3.1148681640625, 3.722900390625, 4.3309326171875, 4.93896484375, 5.5469970703125, 6.155029296875, 6.7630615234375, 7.37109375, 7.9791259765625, 8.587158203125, 9.1951904296875, 9.80322265625, 10.4112548828125, 11.019287109375, 11.6273193359375, 12.2353515625, 12.8433837890625, 13.451416015625, 14.0594482421875, 14.66748046875, 15.2755126953125, 15.883544921875, 16.4915771484375, 17.099609375, 17.7076416015625, 18.315673828125, 18.9237060546875, 19.53173828125, 20.1397705078125, 20.747802734375, 21.3558349609375, 21.9638671875, 22.5718994140625, 23.179931640625, 23.7879638671875, 24.39599609375, 25.0040283203125, 25.612060546875, 26.2200927734375, 26.828125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 9.0, 12.0, 10.0, 30.0, 35.0, 57.0, 85.0, 128.0, 216.0, 352.0, 568.0, 684.0, 591.0, 434.0, 280.0, 183.0, 121.0, 104.0, 58.0, 38.0, 21.0, 21.0, 10.0, 5.0, 10.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-20.984375, -20.322509765625, -19.66064453125, -18.998779296875, -18.3369140625, -17.675048828125, -17.01318359375, -16.351318359375, -15.689453125, -15.027587890625, -14.36572265625, -13.703857421875, -13.0419921875, -12.380126953125, -11.71826171875, -11.056396484375, -10.39453125, -9.732666015625, -9.07080078125, -8.408935546875, -7.7470703125, -7.085205078125, -6.42333984375, -5.761474609375, -5.099609375, -4.437744140625, -3.77587890625, -3.114013671875, -2.4521484375, -1.790283203125, -1.12841796875, -0.466552734375, 0.1953125, 0.857177734375, 1.51904296875, 2.180908203125, 2.8427734375, 3.504638671875, 4.16650390625, 4.828369140625, 5.490234375, 6.152099609375, 6.81396484375, 7.475830078125, 8.1376953125, 8.799560546875, 9.46142578125, 10.123291015625, 10.78515625, 11.447021484375, 12.10888671875, 12.770751953125, 13.4326171875, 14.094482421875, 14.75634765625, 15.418212890625, 16.080078125, 16.741943359375, 17.40380859375, 18.065673828125, 18.7275390625, 19.389404296875, 20.05126953125, 20.713134765625, 21.375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 4.0, 9.0, 12.0, 25.0, 33.0, 43.0, 68.0, 113.0, 193.0, 314.0, 590.0, 1323.0, 4263.0, 139117.0, 3996136.0, 46428.0, 3029.0, 1128.0, 539.0, 361.0, 215.0, 108.0, 80.0, 48.0, 27.0, 23.0, 14.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-69.375, -67.2333984375, -65.091796875, -62.9501953125, -60.80859375, -58.6669921875, -56.525390625, -54.3837890625, -52.2421875, -50.1005859375, -47.958984375, -45.8173828125, -43.67578125, -41.5341796875, -39.392578125, -37.2509765625, -35.109375, -32.9677734375, -30.826171875, -28.6845703125, -26.54296875, -24.4013671875, -22.259765625, -20.1181640625, -17.9765625, -15.8349609375, -13.693359375, -11.5517578125, -9.41015625, -7.2685546875, -5.126953125, -2.9853515625, -0.84375, 1.2978515625, 3.439453125, 5.5810546875, 7.72265625, 9.8642578125, 12.005859375, 14.1474609375, 16.2890625, 18.4306640625, 20.572265625, 22.7138671875, 24.85546875, 26.9970703125, 29.138671875, 31.2802734375, 33.421875, 35.5634765625, 37.705078125, 39.8466796875, 41.98828125, 44.1298828125, 46.271484375, 48.4130859375, 50.5546875, 52.6962890625, 54.837890625, 56.9794921875, 59.12109375, 61.2626953125, 63.404296875, 65.5458984375, 67.6875]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 18.0, 546.0, 430.0, 21.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-640.975830078125, -629.2928466796875, -617.60986328125, -605.9268798828125, -594.2439575195312, -582.5609741210938, -570.8779907226562, -559.1950073242188, -547.5120239257812, -535.8290405273438, -524.1460571289062, -512.463134765625, -500.7801208496094, -489.09716796875, -477.4141845703125, -465.731201171875, -454.0482482910156, -442.3652648925781, -430.68231201171875, -418.99932861328125, -407.31634521484375, -395.63336181640625, -383.9504089355469, -372.2674255371094, -360.58447265625, -348.9014892578125, -337.2185363769531, -325.5355529785156, -313.8525695800781, -302.16961669921875, -290.48663330078125, -278.80364990234375, -267.12066650390625, -255.4376983642578, -243.7547149658203, -232.07174682617188, -220.38876342773438, -208.70579528808594, -197.0228271484375, -185.33984375, -173.65687561035156, -161.97390747070312, -150.29092407226562, -138.6079559326172, -126.92498016357422, -115.24200439453125, -103.55903625488281, -91.87606048583984, -80.19308471679688, -68.5101089477539, -56.8271369934082, -45.1441650390625, -33.46118927001953, -21.778213500976562, -10.095245361328125, 1.5877304077148438, 13.270706176757812, 24.95368003845215, 36.636653900146484, 48.31962585449219, 60.002601623535156, 71.68557739257812, 83.36854553222656, 95.05152130126953, 106.7344970703125]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 6.0, 15.0, 16.0, 21.0, 14.0, 34.0, 31.0, 28.0, 42.0, 45.0, 52.0, 51.0, 47.0, 49.0, 51.0, 68.0, 60.0, 63.0, 51.0, 51.0, 41.0, 32.0, 30.0, 21.0, 16.0, 21.0, 14.0, 14.0, 12.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-102.01329040527344, -99.42792510986328, -96.84256744384766, -94.2572021484375, -91.67184448242188, -89.08647918701172, -86.50111389160156, -83.91575622558594, -81.33039093017578, -78.74502563476562, -76.15966796875, -73.57430267333984, -70.98893737792969, -68.40357971191406, -65.8182144165039, -63.232852935791016, -60.647491455078125, -58.062129974365234, -55.476768493652344, -52.89140319824219, -50.3060417175293, -47.720680236816406, -45.13531494140625, -42.54995346069336, -39.96459197998047, -37.37923049926758, -34.79386901855469, -32.20850372314453, -29.62314224243164, -27.03778076171875, -24.452417373657227, -21.867053985595703, -19.281688690185547, -16.696327209472656, -14.110963821411133, -11.525601387023926, -8.940238952636719, -6.354876518249512, -3.7695140838623047, -1.1841506958007812, 1.4012107849121094, 3.9865732192993164, 6.571935653686523, 9.15729808807373, 11.742660522460938, 14.328022956848145, 16.91338539123535, 19.498748779296875, 22.084110260009766, 24.669471740722656, 27.25483512878418, 29.840198516845703, 32.425559997558594, 35.010921478271484, 37.596282958984375, 40.18164825439453, 42.76700973510742, 45.35237121582031, 47.93773651123047, 50.52309799194336, 53.10845947265625, 55.69382095336914, 58.27918243408203, 60.86454772949219, 63.44990921020508]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 6.0, 9.0, 9.0, 16.0, 15.0, 16.0, 11.0, 19.0, 26.0, 22.0, 24.0, 29.0, 28.0, 40.0, 52.0, 46.0, 42.0, 52.0, 56.0, 41.0, 45.0, 47.0, 41.0, 47.0, 40.0, 44.0, 20.0, 20.0, 26.0, 23.0, 23.0, 18.0, 10.0, 9.0, 11.0, 6.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65234375, -4.490478515625, -4.32861328125, -4.166748046875, -4.0048828125, -3.843017578125, -3.68115234375, -3.519287109375, -3.357421875, -3.195556640625, -3.03369140625, -2.871826171875, -2.7099609375, -2.548095703125, -2.38623046875, -2.224365234375, -2.0625, -1.900634765625, -1.73876953125, -1.576904296875, -1.4150390625, -1.253173828125, -1.09130859375, -0.929443359375, -0.767578125, -0.605712890625, -0.44384765625, -0.281982421875, -0.1201171875, 0.041748046875, 0.20361328125, 0.365478515625, 0.52734375, 0.689208984375, 0.85107421875, 1.012939453125, 1.1748046875, 1.336669921875, 1.49853515625, 1.660400390625, 1.822265625, 1.984130859375, 2.14599609375, 2.307861328125, 2.4697265625, 2.631591796875, 2.79345703125, 2.955322265625, 3.1171875, 3.279052734375, 3.44091796875, 3.602783203125, 3.7646484375, 3.926513671875, 4.08837890625, 4.250244140625, 4.412109375, 4.573974609375, 4.73583984375, 4.897705078125, 5.0595703125, 5.221435546875, 5.38330078125, 5.545166015625, 5.70703125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 8.0, 11.0, 11.0, 16.0, 23.0, 34.0, 43.0, 82.0, 122.0, 170.0, 282.0, 384.0, 560.0, 772.0, 1151.0, 1684.0, 2488.0, 3676.0, 5459.0, 8034.0, 12286.0, 18092.0, 26964.0, 40300.0, 59297.0, 89203.0, 129571.0, 168125.0, 149818.0, 108232.0, 72654.0, 48865.0, 32823.0, 22140.0, 14726.0, 9902.0, 6573.0, 4500.0, 2986.0, 2069.0, 1390.0, 938.0, 687.0, 450.0, 312.0, 224.0, 150.0, 84.0, 62.0, 38.0, 34.0, 18.0, 19.0, 7.0, 4.0, 4.0, 0.0, 3.0], "bins": [-0.4482421875, -0.43495941162109375, -0.4216766357421875, -0.40839385986328125, -0.395111083984375, -0.38182830810546875, -0.3685455322265625, -0.35526275634765625, -0.34197998046875, -0.32869720458984375, -0.3154144287109375, -0.30213165283203125, -0.288848876953125, -0.27556610107421875, -0.2622833251953125, -0.24900054931640625, -0.2357177734375, -0.22243499755859375, -0.2091522216796875, -0.19586944580078125, -0.182586669921875, -0.16930389404296875, -0.1560211181640625, -0.14273834228515625, -0.12945556640625, -0.11617279052734375, -0.1028900146484375, -0.08960723876953125, -0.076324462890625, -0.06304168701171875, -0.0497589111328125, -0.03647613525390625, -0.023193359375, -0.00991058349609375, 0.0033721923828125, 0.01665496826171875, 0.029937744140625, 0.04322052001953125, 0.0565032958984375, 0.06978607177734375, 0.08306884765625, 0.09635162353515625, 0.1096343994140625, 0.12291717529296875, 0.136199951171875, 0.14948272705078125, 0.1627655029296875, 0.17604827880859375, 0.1893310546875, 0.20261383056640625, 0.2158966064453125, 0.22917938232421875, 0.242462158203125, 0.25574493408203125, 0.2690277099609375, 0.28231048583984375, 0.29559326171875, 0.30887603759765625, 0.3221588134765625, 0.33544158935546875, 0.348724365234375, 0.36200714111328125, 0.3752899169921875, 0.38857269287109375, 0.40185546875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 7.0, 10.0, 9.0, 11.0, 11.0, 12.0, 21.0, 23.0, 19.0, 26.0, 23.0, 28.0, 31.0, 36.0, 34.0, 31.0, 41.0, 35.0, 34.0, 37.0, 1069.0, 36.0, 35.0, 38.0, 31.0, 29.0, 32.0, 27.0, 29.0, 35.0, 19.0, 26.0, 24.0, 16.0, 17.0, 9.0, 8.0, 5.0, 14.0, 9.0, 7.0, 5.0, 8.0, 3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.638671875, -2.55474853515625, -2.4708251953125, -2.38690185546875, -2.302978515625, -2.21905517578125, -2.1351318359375, -2.05120849609375, -1.96728515625, -1.88336181640625, -1.7994384765625, -1.71551513671875, -1.631591796875, -1.54766845703125, -1.4637451171875, -1.37982177734375, -1.2958984375, -1.21197509765625, -1.1280517578125, -1.04412841796875, -0.960205078125, -0.87628173828125, -0.7923583984375, -0.70843505859375, -0.62451171875, -0.54058837890625, -0.4566650390625, -0.37274169921875, -0.288818359375, -0.20489501953125, -0.1209716796875, -0.03704833984375, 0.046875, 0.13079833984375, 0.2147216796875, 0.29864501953125, 0.382568359375, 0.46649169921875, 0.5504150390625, 0.63433837890625, 0.71826171875, 0.80218505859375, 0.8861083984375, 0.97003173828125, 1.053955078125, 1.13787841796875, 1.2218017578125, 1.30572509765625, 1.3896484375, 1.47357177734375, 1.5574951171875, 1.64141845703125, 1.725341796875, 1.80926513671875, 1.8931884765625, 1.97711181640625, 2.06103515625, 2.14495849609375, 2.2288818359375, 2.31280517578125, 2.396728515625, 2.48065185546875, 2.5645751953125, 2.64849853515625, 2.732421875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 9.0, 7.0, 12.0, 22.0, 23.0, 36.0, 69.0, 102.0, 131.0, 231.0, 352.0, 625.0, 847.0, 1438.0, 2241.0, 3572.0, 5565.0, 9402.0, 15089.0, 24150.0, 39196.0, 64687.0, 105151.0, 161947.0, 1246835.0, 155878.0, 100273.0, 61322.0, 36712.0, 22727.0, 14449.0, 8874.0, 5591.0, 3474.0, 2260.0, 1344.0, 896.0, 599.0, 358.0, 201.0, 143.0, 104.0, 56.0, 46.0, 38.0, 18.0, 6.0, 8.0, 6.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0], "bins": [-0.50634765625, -0.4912109375, -0.47607421875, -0.4609375, -0.44580078125, -0.4306640625, -0.41552734375, -0.400390625, -0.38525390625, -0.3701171875, -0.35498046875, -0.33984375, -0.32470703125, -0.3095703125, -0.29443359375, -0.279296875, -0.26416015625, -0.2490234375, -0.23388671875, -0.21875, -0.20361328125, -0.1884765625, -0.17333984375, -0.158203125, -0.14306640625, -0.1279296875, -0.11279296875, -0.09765625, -0.08251953125, -0.0673828125, -0.05224609375, -0.037109375, -0.02197265625, -0.0068359375, 0.00830078125, 0.0234375, 0.03857421875, 0.0537109375, 0.06884765625, 0.083984375, 0.09912109375, 0.1142578125, 0.12939453125, 0.14453125, 0.15966796875, 0.1748046875, 0.18994140625, 0.205078125, 0.22021484375, 0.2353515625, 0.25048828125, 0.265625, 0.28076171875, 0.2958984375, 0.31103515625, 0.326171875, 0.34130859375, 0.3564453125, 0.37158203125, 0.38671875, 0.40185546875, 0.4169921875, 0.43212890625, 0.447265625, 0.46240234375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 5.0, 9.0, 6.0, 7.0, 6.0, 11.0, 16.0, 15.0, 18.0, 23.0, 29.0, 19.0, 44.0, 37.0, 42.0, 54.0, 50.0, 48.0, 46.0, 56.0, 66.0, 45.0, 43.0, 57.0, 43.0, 31.0, 18.0, 30.0, 18.0, 16.0, 19.0, 12.0, 8.0, 6.0, 4.0, 9.0, 8.0, 0.0, 5.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0010738372802734375, -0.0010401159524917603, -0.001006394624710083, -0.0009726732969284058, -0.0009389519691467285, -0.0009052306413650513, -0.000871509313583374, -0.0008377879858016968, -0.0008040666580200195, -0.0007703453302383423, -0.000736624002456665, -0.0007029026746749878, -0.0006691813468933105, -0.0006354600191116333, -0.0006017386913299561, -0.0005680173635482788, -0.0005342960357666016, -0.0005005747079849243, -0.00046685338020324707, -0.0004331320524215698, -0.0003994107246398926, -0.00036568939685821533, -0.0003319680690765381, -0.00029824674129486084, -0.0002645254135131836, -0.00023080408573150635, -0.0001970827579498291, -0.00016336143016815186, -0.0001296401023864746, -9.591877460479736e-05, -6.219744682312012e-05, -2.847611904144287e-05, 5.245208740234375e-06, 3.896653652191162e-05, 7.268786430358887e-05, 0.00010640919208526611, 0.00014013051986694336, 0.0001738518476486206, 0.00020757317543029785, 0.0002412945032119751, 0.00027501583099365234, 0.0003087371587753296, 0.00034245848655700684, 0.0003761798143386841, 0.00040990114212036133, 0.0004436224699020386, 0.0004773437976837158, 0.0005110651254653931, 0.0005447864532470703, 0.0005785077810287476, 0.0006122291088104248, 0.000645950436592102, 0.0006796717643737793, 0.0007133930921554565, 0.0007471144199371338, 0.000780835747718811, 0.0008145570755004883, 0.0008482784032821655, 0.0008819997310638428, 0.00091572105884552, 0.0009494423866271973, 0.0009831637144088745, 0.0010168850421905518, 0.001050606369972229, 0.0010843276977539062]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 6.0, 5.0, 5.0, 9.0, 15.0, 18.0, 19.0, 19.0, 25.0, 21.0, 30.0, 47.0, 76.0, 74.0, 93.0, 105.0, 138.0, 185.0, 238.0, 330.0, 520.0, 1799.0, 948362.0, 93666.0, 912.0, 480.0, 317.0, 250.0, 162.0, 121.0, 114.0, 62.0, 55.0, 48.0, 43.0, 28.0, 28.0, 19.0, 17.0, 18.0, 14.0, 11.0, 8.0, 1.0, 6.0, 5.0, 7.0, 4.0, 8.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.020751953125, -0.02013850212097168, -0.01952505111694336, -0.01891160011291504, -0.01829814910888672, -0.0176846981048584, -0.017071247100830078, -0.016457796096801758, -0.015844345092773438, -0.015230894088745117, -0.014617443084716797, -0.014003992080688477, -0.013390541076660156, -0.012777090072631836, -0.012163639068603516, -0.011550188064575195, -0.010936737060546875, -0.010323286056518555, -0.009709835052490234, -0.009096384048461914, -0.008482933044433594, -0.007869482040405273, -0.007256031036376953, -0.006642580032348633, -0.0060291290283203125, -0.005415678024291992, -0.004802227020263672, -0.0041887760162353516, -0.0035753250122070312, -0.002961874008178711, -0.0023484230041503906, -0.0017349720001220703, -0.00112152099609375, -0.0005080699920654297, 0.00010538101196289062, 0.0007188320159912109, 0.0013322830200195312, 0.0019457340240478516, 0.002559185028076172, 0.003172636032104492, 0.0037860870361328125, 0.004399538040161133, 0.005012989044189453, 0.0056264400482177734, 0.006239891052246094, 0.006853342056274414, 0.007466793060302734, 0.008080244064331055, 0.008693695068359375, 0.009307146072387695, 0.009920597076416016, 0.010534048080444336, 0.011147499084472656, 0.011760950088500977, 0.012374401092529297, 0.012987852096557617, 0.013601303100585938, 0.014214754104614258, 0.014828205108642578, 0.015441656112670898, 0.01605510711669922, 0.01666855812072754, 0.01728200912475586, 0.01789546012878418, 0.0185089111328125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 16.0, 171.0, 579.0, 226.0, 20.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030368645675480366, -0.0029513761401176453, -0.0028658879455178976, -0.0027803995180875063, -0.002694911090657115, -0.0026094228960573673, -0.002523934468626976, -0.0024384460411965847, -0.0023529576137661934, -0.002267469186335802, -0.0021819809917360544, -0.002096492564305663, -0.002011004136875272, -0.0019255158258602023, -0.0018400275148451328, -0.0017545390874147415, -0.0016690508928149939, -0.0015835625817999244, -0.001498074154369533, -0.0014125858433544636, -0.0013270974159240723, -0.0012416091049090028, -0.0011561207938939333, -0.001070632366463542, -0.0009851440554484725, -0.0008996556862257421, -0.0008141673170030117, -0.0007286790059879422, -0.0006431906367652118, -0.0005577022675424814, -0.00047221395652741194, -0.00038672558730468154, -0.0003012369852513075, -0.00021574863058049232, -0.00013026027590967715, -4.4771935790777206e-05, 4.071643343195319e-05, 0.0001262048026546836, 0.00021169311366975307, 0.00029718148289248347, 0.00038266985211521387, 0.00046815822133794427, 0.0005536465905606747, 0.0006391349015757442, 0.0007246232707984746, 0.000810111640021205, 0.0008955999510362744, 0.000981088262051344, 0.0010665766894817352, 0.0011520650004968047, 0.001237553427927196, 0.0013230417389422655, 0.0014085301663726568, 0.0014940184773877263, 0.0015795067884027958, 0.001664995215833187, 0.0017504835268482566, 0.001835971837863326, 0.0019214602652937174, 0.002006948459893465, 0.0020924368873238564, 0.0021779253147542477, 0.002263413742184639, 0.0023489019367843866, 0.002434390364214778]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 3.0, 9.0, 9.0, 11.0, 9.0, 17.0, 26.0, 23.0, 22.0, 30.0, 34.0, 37.0, 22.0, 36.0, 38.0, 33.0, 46.0, 54.0, 41.0, 36.0, 40.0, 32.0, 40.0, 33.0, 40.0, 34.0, 37.0, 25.0, 18.0, 23.0, 18.0, 23.0, 18.0, 15.0, 11.0, 15.0, 8.0, 4.0, 6.0, 4.0, 6.0, 2.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006201863288879395, -0.0006003305315971375, -0.0005804747343063354, -0.0005606189370155334, -0.0005407631397247314, -0.0005209073424339294, -0.0005010515451431274, -0.00048119574785232544, -0.00046133995056152344, -0.00044148415327072144, -0.00042162835597991943, -0.00040177255868911743, -0.00038191676139831543, -0.00036206096410751343, -0.0003422051668167114, -0.0003223493695259094, -0.0003024935722351074, -0.0002826377749443054, -0.0002627819776535034, -0.00024292618036270142, -0.00022307038307189941, -0.0002032145857810974, -0.0001833587884902954, -0.0001635029911994934, -0.0001436471939086914, -0.0001237913966178894, -0.0001039355993270874, -8.40798020362854e-05, -6.42240047454834e-05, -4.4368207454681396e-05, -2.4512410163879395e-05, -4.656612873077393e-06, 1.519918441772461e-05, 3.505498170852661e-05, 5.491077899932861e-05, 7.476657629013062e-05, 9.462237358093262e-05, 0.00011447817087173462, 0.00013433396816253662, 0.00015418976545333862, 0.00017404556274414062, 0.00019390136003494263, 0.00021375715732574463, 0.00023361295461654663, 0.00025346875190734863, 0.00027332454919815063, 0.00029318034648895264, 0.00031303614377975464, 0.00033289194107055664, 0.00035274773836135864, 0.00037260353565216064, 0.00039245933294296265, 0.00041231513023376465, 0.00043217092752456665, 0.00045202672481536865, 0.00047188252210617065, 0.0004917383193969727, 0.0005115941166877747, 0.0005314499139785767, 0.0005513057112693787, 0.0005711615085601807, 0.0005910173058509827, 0.0006108731031417847, 0.0006307289004325867, 0.0006505846977233887]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 6.0, 9.0, 9.0, 16.0, 15.0, 16.0, 11.0, 19.0, 26.0, 22.0, 24.0, 29.0, 28.0, 40.0, 52.0, 46.0, 42.0, 52.0, 56.0, 41.0, 45.0, 47.0, 41.0, 47.0, 40.0, 44.0, 20.0, 20.0, 26.0, 23.0, 23.0, 18.0, 10.0, 9.0, 11.0, 6.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65234375, -4.490478515625, -4.32861328125, -4.166748046875, -4.0048828125, -3.843017578125, -3.68115234375, -3.519287109375, -3.357421875, -3.195556640625, -3.03369140625, -2.871826171875, -2.7099609375, -2.548095703125, -2.38623046875, -2.224365234375, -2.0625, -1.900634765625, -1.73876953125, -1.576904296875, -1.4150390625, -1.253173828125, -1.09130859375, -0.929443359375, -0.767578125, -0.605712890625, -0.44384765625, -0.281982421875, -0.1201171875, 0.041748046875, 0.20361328125, 0.365478515625, 0.52734375, 0.689208984375, 0.85107421875, 1.012939453125, 1.1748046875, 1.336669921875, 1.49853515625, 1.660400390625, 1.822265625, 1.984130859375, 2.14599609375, 2.307861328125, 2.4697265625, 2.631591796875, 2.79345703125, 2.955322265625, 3.1171875, 3.279052734375, 3.44091796875, 3.602783203125, 3.7646484375, 3.926513671875, 4.08837890625, 4.250244140625, 4.412109375, 4.573974609375, 4.73583984375, 4.897705078125, 5.0595703125, 5.221435546875, 5.38330078125, 5.545166015625, 5.70703125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 12.0, 9.0, 13.0, 15.0, 24.0, 35.0, 44.0, 36.0, 65.0, 102.0, 140.0, 182.0, 220.0, 359.0, 505.0, 737.0, 1012.0, 1362.0, 2196.0, 3282.0, 5657.0, 10595.0, 25028.0, 187245.0, 725598.0, 48722.0, 15220.0, 7522.0, 4234.0, 2675.0, 1638.0, 1158.0, 845.0, 559.0, 417.0, 307.0, 208.0, 168.0, 101.0, 81.0, 64.0, 47.0, 35.0, 23.0, 24.0, 12.0, 7.0, 9.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0], "bins": [-24.296875, -23.587158203125, -22.87744140625, -22.167724609375, -21.4580078125, -20.748291015625, -20.03857421875, -19.328857421875, -18.619140625, -17.909423828125, -17.19970703125, -16.489990234375, -15.7802734375, -15.070556640625, -14.36083984375, -13.651123046875, -12.94140625, -12.231689453125, -11.52197265625, -10.812255859375, -10.1025390625, -9.392822265625, -8.68310546875, -7.973388671875, -7.263671875, -6.553955078125, -5.84423828125, -5.134521484375, -4.4248046875, -3.715087890625, -3.00537109375, -2.295654296875, -1.5859375, -0.876220703125, -0.16650390625, 0.543212890625, 1.2529296875, 1.962646484375, 2.67236328125, 3.382080078125, 4.091796875, 4.801513671875, 5.51123046875, 6.220947265625, 6.9306640625, 7.640380859375, 8.35009765625, 9.059814453125, 9.76953125, 10.479248046875, 11.18896484375, 11.898681640625, 12.6083984375, 13.318115234375, 14.02783203125, 14.737548828125, 15.447265625, 16.156982421875, 16.86669921875, 17.576416015625, 18.2861328125, 18.995849609375, 19.70556640625, 20.415283203125, 21.125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 7.0, 1.0, 2.0, 8.0, 4.0, 12.0, 6.0, 14.0, 13.0, 14.0, 14.0, 12.0, 17.0, 25.0, 22.0, 22.0, 30.0, 31.0, 20.0, 28.0, 33.0, 43.0, 44.0, 114.0, 257.0, 1567.0, 189.0, 72.0, 44.0, 27.0, 30.0, 42.0, 36.0, 28.0, 19.0, 24.0, 26.0, 15.0, 14.0, 19.0, 19.0, 17.0, 13.0, 10.0, 6.0, 9.0, 4.0, 5.0, 8.0, 7.0, 3.0, 4.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-11.296875, -10.9244384765625, -10.552001953125, -10.1795654296875, -9.80712890625, -9.4346923828125, -9.062255859375, -8.6898193359375, -8.3173828125, -7.9449462890625, -7.572509765625, -7.2000732421875, -6.82763671875, -6.4552001953125, -6.082763671875, -5.7103271484375, -5.337890625, -4.9654541015625, -4.593017578125, -4.2205810546875, -3.84814453125, -3.4757080078125, -3.103271484375, -2.7308349609375, -2.3583984375, -1.9859619140625, -1.613525390625, -1.2410888671875, -0.86865234375, -0.4962158203125, -0.123779296875, 0.2486572265625, 0.62109375, 0.9935302734375, 1.365966796875, 1.7384033203125, 2.11083984375, 2.4832763671875, 2.855712890625, 3.2281494140625, 3.6005859375, 3.9730224609375, 4.345458984375, 4.7178955078125, 5.09033203125, 5.4627685546875, 5.835205078125, 6.2076416015625, 6.580078125, 6.9525146484375, 7.324951171875, 7.6973876953125, 8.06982421875, 8.4422607421875, 8.814697265625, 9.1871337890625, 9.5595703125, 9.9320068359375, 10.304443359375, 10.6768798828125, 11.04931640625, 11.4217529296875, 11.794189453125, 12.1666259765625, 12.5390625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 2.0, 6.0, 6.0, 6.0, 6.0, 5.0, 11.0, 15.0, 16.0, 11.0, 17.0, 22.0, 14.0, 14.0, 29.0, 32.0, 25.0, 40.0, 62.0, 72.0, 125.0, 245.0, 730.0, 9071.0, 3107470.0, 25980.0, 898.0, 257.0, 128.0, 78.0, 40.0, 29.0, 38.0, 31.0, 21.0, 24.0, 18.0, 17.0, 11.0, 14.0, 11.0, 19.0, 5.0, 7.0, 9.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-57.0625, -55.36328125, -53.6640625, -51.96484375, -50.265625, -48.56640625, -46.8671875, -45.16796875, -43.46875, -41.76953125, -40.0703125, -38.37109375, -36.671875, -34.97265625, -33.2734375, -31.57421875, -29.875, -28.17578125, -26.4765625, -24.77734375, -23.078125, -21.37890625, -19.6796875, -17.98046875, -16.28125, -14.58203125, -12.8828125, -11.18359375, -9.484375, -7.78515625, -6.0859375, -4.38671875, -2.6875, -0.98828125, 0.7109375, 2.41015625, 4.109375, 5.80859375, 7.5078125, 9.20703125, 10.90625, 12.60546875, 14.3046875, 16.00390625, 17.703125, 19.40234375, 21.1015625, 22.80078125, 24.5, 26.19921875, 27.8984375, 29.59765625, 31.296875, 32.99609375, 34.6953125, 36.39453125, 38.09375, 39.79296875, 41.4921875, 43.19140625, 44.890625, 46.58984375, 48.2890625, 49.98828125, 51.6875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 14.0, 979.0, 22.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.37266540527344, -65.7014389038086, -58.03021240234375, -50.358985900878906, -42.68775939941406, -35.01653289794922, -27.345306396484375, -19.67407989501953, -12.002853393554688, -4.331626892089844, 3.339599609375, 11.010826110839844, 18.682052612304688, 26.35327911376953, 34.024505615234375, 41.69573211669922, 49.36695861816406, 57.038185119628906, 64.70941162109375, 72.3806381225586, 80.05186462402344, 87.72309112548828, 95.39431762695312, 103.06554412841797, 110.73677062988281, 118.40799713134766, 126.0792236328125, 133.75045776367188, 141.4216766357422, 149.0928955078125, 156.76412963867188, 164.43536376953125, 172.1065673828125, 179.77780151367188, 187.4490203857422, 195.1202392578125, 202.79147338867188, 210.46270751953125, 218.13392639160156, 225.80514526367188, 233.47637939453125, 241.14761352539062, 248.81883239746094, 256.49005126953125, 264.1612854003906, 271.83251953125, 279.50372314453125, 287.1749572753906, 294.84619140625, 302.5174255371094, 310.18865966796875, 317.85986328125, 325.5310974121094, 333.20233154296875, 340.87353515625, 348.5447692871094, 356.21600341796875, 363.8872375488281, 371.5584716796875, 379.22967529296875, 386.9009094238281, 394.5721435546875, 402.24334716796875, 409.9145812988281, 417.5858154296875]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 9.0, 2.0, 9.0, 5.0, 10.0, 11.0, 11.0, 20.0, 22.0, 23.0, 34.0, 28.0, 39.0, 28.0, 33.0, 37.0, 27.0, 45.0, 51.0, 48.0, 48.0, 53.0, 35.0, 43.0, 37.0, 41.0, 22.0, 21.0, 17.0, 32.0, 29.0, 26.0, 22.0, 15.0, 13.0, 9.0, 12.0, 9.0, 5.0, 2.0, 6.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.27901840209961, -40.84931945800781, -39.41961669921875, -37.98991394042969, -36.56021499633789, -35.130516052246094, -33.70081329345703, -32.27111053466797, -30.841411590576172, -29.411710739135742, -27.982009887695312, -26.552309036254883, -25.122608184814453, -23.692907333374023, -22.263206481933594, -20.833505630493164, -19.403804779052734, -17.974103927612305, -16.544403076171875, -15.114702224731445, -13.685001373291016, -12.255300521850586, -10.825599670410156, -9.395898818969727, -7.966197967529297, -6.536497116088867, -5.1067962646484375, -3.677095413208008, -2.247394561767578, -0.8176937103271484, 0.6120071411132812, 2.041707992553711, 3.4714126586914062, 4.901113510131836, 6.330814361572266, 7.760515213012695, 9.190216064453125, 10.619916915893555, 12.049617767333984, 13.479318618774414, 14.909019470214844, 16.338720321655273, 17.768421173095703, 19.198122024536133, 20.627822875976562, 22.057523727416992, 23.487224578857422, 24.91692543029785, 26.34662628173828, 27.77632713317871, 29.20602798461914, 30.63572883605957, 32.0654296875, 33.49513244628906, 34.92483139038086, 36.354530334472656, 37.78423309326172, 39.21393585205078, 40.64363479614258, 42.073333740234375, 43.50303649902344, 44.9327392578125, 46.3624382019043, 47.792137145996094, 49.221839904785156]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 3.0, 9.0, 20.0, 12.0, 13.0, 19.0, 21.0, 16.0, 21.0, 13.0, 43.0, 29.0, 30.0, 49.0, 38.0, 47.0, 60.0, 44.0, 53.0, 44.0, 31.0, 33.0, 64.0, 43.0, 34.0, 15.0, 24.0, 30.0, 31.0, 17.0, 19.0, 14.0, 8.0, 10.0, 8.0, 6.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.875, -4.71240234375, -4.5498046875, -4.38720703125, -4.224609375, -4.06201171875, -3.8994140625, -3.73681640625, -3.57421875, -3.41162109375, -3.2490234375, -3.08642578125, -2.923828125, -2.76123046875, -2.5986328125, -2.43603515625, -2.2734375, -2.11083984375, -1.9482421875, -1.78564453125, -1.623046875, -1.46044921875, -1.2978515625, -1.13525390625, -0.97265625, -0.81005859375, -0.6474609375, -0.48486328125, -0.322265625, -0.15966796875, 0.0029296875, 0.16552734375, 0.328125, 0.49072265625, 0.6533203125, 0.81591796875, 0.978515625, 1.14111328125, 1.3037109375, 1.46630859375, 1.62890625, 1.79150390625, 1.9541015625, 2.11669921875, 2.279296875, 2.44189453125, 2.6044921875, 2.76708984375, 2.9296875, 3.09228515625, 3.2548828125, 3.41748046875, 3.580078125, 3.74267578125, 3.9052734375, 4.06787109375, 4.23046875, 4.39306640625, 4.5556640625, 4.71826171875, 4.880859375, 5.04345703125, 5.2060546875, 5.36865234375, 5.53125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 5.0, 8.0, 9.0, 13.0, 6.0, 18.0, 24.0, 36.0, 38.0, 60.0, 108.0, 135.0, 189.0, 279.0, 439.0, 808.0, 1468.0, 3021.0, 6550.0, 18478.0, 84091.0, 1620106.0, 2311719.0, 110512.0, 22151.0, 7362.0, 3010.0, 1511.0, 765.0, 458.0, 270.0, 190.0, 118.0, 103.0, 70.0, 44.0, 23.0, 20.0, 19.0, 14.0, 13.0, 6.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.34375, -18.572021484375, -17.80029296875, -17.028564453125, -16.2568359375, -15.485107421875, -14.71337890625, -13.941650390625, -13.169921875, -12.398193359375, -11.62646484375, -10.854736328125, -10.0830078125, -9.311279296875, -8.53955078125, -7.767822265625, -6.99609375, -6.224365234375, -5.45263671875, -4.680908203125, -3.9091796875, -3.137451171875, -2.36572265625, -1.593994140625, -0.822265625, -0.050537109375, 0.72119140625, 1.492919921875, 2.2646484375, 3.036376953125, 3.80810546875, 4.579833984375, 5.3515625, 6.123291015625, 6.89501953125, 7.666748046875, 8.4384765625, 9.210205078125, 9.98193359375, 10.753662109375, 11.525390625, 12.297119140625, 13.06884765625, 13.840576171875, 14.6123046875, 15.384033203125, 16.15576171875, 16.927490234375, 17.69921875, 18.470947265625, 19.24267578125, 20.014404296875, 20.7861328125, 21.557861328125, 22.32958984375, 23.101318359375, 23.873046875, 24.644775390625, 25.41650390625, 26.188232421875, 26.9599609375, 27.731689453125, 28.50341796875, 29.275146484375, 30.046875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 10.0, 13.0, 28.0, 42.0, 50.0, 85.0, 121.0, 170.0, 264.0, 372.0, 528.0, 633.0, 568.0, 370.0, 231.0, 191.0, 116.0, 80.0, 61.0, 40.0, 23.0, 22.0, 14.0, 12.0, 9.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.8125, -20.081787109375, -19.35107421875, -18.620361328125, -17.8896484375, -17.158935546875, -16.42822265625, -15.697509765625, -14.966796875, -14.236083984375, -13.50537109375, -12.774658203125, -12.0439453125, -11.313232421875, -10.58251953125, -9.851806640625, -9.12109375, -8.390380859375, -7.65966796875, -6.928955078125, -6.1982421875, -5.467529296875, -4.73681640625, -4.006103515625, -3.275390625, -2.544677734375, -1.81396484375, -1.083251953125, -0.3525390625, 0.378173828125, 1.10888671875, 1.839599609375, 2.5703125, 3.301025390625, 4.03173828125, 4.762451171875, 5.4931640625, 6.223876953125, 6.95458984375, 7.685302734375, 8.416015625, 9.146728515625, 9.87744140625, 10.608154296875, 11.3388671875, 12.069580078125, 12.80029296875, 13.531005859375, 14.26171875, 14.992431640625, 15.72314453125, 16.453857421875, 17.1845703125, 17.915283203125, 18.64599609375, 19.376708984375, 20.107421875, 20.838134765625, 21.56884765625, 22.299560546875, 23.0302734375, 23.760986328125, 24.49169921875, 25.222412109375, 25.953125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 7.0, 3.0, 7.0, 7.0, 13.0, 20.0, 30.0, 24.0, 35.0, 38.0, 95.0, 96.0, 166.0, 268.0, 471.0, 1492.0, 34498.0, 4049747.0, 103504.0, 2303.0, 650.0, 325.0, 144.0, 88.0, 73.0, 52.0, 30.0, 22.0, 16.0, 12.0, 11.0, 8.0, 5.0, 5.0, 5.0, 1.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-84.1875, -81.681640625, -79.17578125, -76.669921875, -74.1640625, -71.658203125, -69.15234375, -66.646484375, -64.140625, -61.634765625, -59.12890625, -56.623046875, -54.1171875, -51.611328125, -49.10546875, -46.599609375, -44.09375, -41.587890625, -39.08203125, -36.576171875, -34.0703125, -31.564453125, -29.05859375, -26.552734375, -24.046875, -21.541015625, -19.03515625, -16.529296875, -14.0234375, -11.517578125, -9.01171875, -6.505859375, -4.0, -1.494140625, 1.01171875, 3.517578125, 6.0234375, 8.529296875, 11.03515625, 13.541015625, 16.046875, 18.552734375, 21.05859375, 23.564453125, 26.0703125, 28.576171875, 31.08203125, 33.587890625, 36.09375, 38.599609375, 41.10546875, 43.611328125, 46.1171875, 48.623046875, 51.12890625, 53.634765625, 56.140625, 58.646484375, 61.15234375, 63.658203125, 66.1640625, 68.669921875, 71.17578125, 73.681640625, 76.1875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [2.0, 58.0, 782.0, 174.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.337581634521484, -22.602922439575195, -8.868263244628906, 4.866397857666016, 18.601055145263672, 32.33571243286133, 46.070377349853516, 59.80503463745117, 73.53968811035156, 87.27434539794922, 101.00900268554688, 114.74366760253906, 128.47833251953125, 142.21298217773438, 155.94764709472656, 169.68231201171875, 183.41696166992188, 197.15162658691406, 210.8862762451172, 224.62094116210938, 238.3555908203125, 252.0902557373047, 265.8249206542969, 279.5595703125, 293.29425048828125, 307.0289001464844, 320.7635803222656, 334.49822998046875, 348.2328796386719, 361.967529296875, 375.70220947265625, 389.4368591308594, 403.1715087890625, 416.9061584472656, 430.6408386230469, 444.37548828125, 458.1101379394531, 471.84478759765625, 485.5794677734375, 499.3141174316406, 513.0487670898438, 526.783447265625, 540.51806640625, 554.2527465820312, 567.9874267578125, 581.7220458984375, 595.4567260742188, 609.19140625, 622.926025390625, 636.6607055664062, 650.3953247070312, 664.1300048828125, 677.8646850585938, 691.5993041992188, 705.333984375, 719.0686645507812, 732.8033447265625, 746.5380249023438, 760.2726440429688, 774.00732421875, 787.7420043945312, 801.4766235351562, 815.2113037109375, 828.9459838867188, 842.6806030273438]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 8.0, 6.0, 5.0, 7.0, 5.0, 6.0, 6.0, 20.0, 15.0, 19.0, 23.0, 20.0, 23.0, 25.0, 21.0, 45.0, 31.0, 45.0, 42.0, 45.0, 44.0, 33.0, 47.0, 41.0, 38.0, 32.0, 31.0, 30.0, 29.0, 28.0, 34.0, 28.0, 22.0, 25.0, 18.0, 16.0, 18.0, 16.0, 9.0, 9.0, 8.0, 7.0, 5.0, 7.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-59.351253509521484, -57.520713806152344, -55.6901741027832, -53.85963439941406, -52.02909469604492, -50.19855499267578, -48.368011474609375, -46.537471771240234, -44.706932067871094, -42.87639236450195, -41.04585266113281, -39.21531295776367, -37.38477325439453, -35.554229736328125, -33.72369384765625, -31.893150329589844, -30.062612533569336, -28.232072830200195, -26.401533126831055, -24.57099151611328, -22.74045181274414, -20.909912109375, -19.07937240600586, -17.24883270263672, -15.418292045593262, -13.587752342224121, -11.757211685180664, -9.926671981811523, -8.096132278442383, -6.265591621398926, -4.435051918029785, -2.604511260986328, -0.7739715576171875, 1.0565685033798218, 2.887108564376831, 4.717648506164551, 6.54818868637085, 8.378728866577148, 10.209268569946289, 12.039809226989746, 13.870348930358887, 15.700888633728027, 17.531429290771484, 19.361968994140625, 21.192508697509766, 23.023048400878906, 24.853588104248047, 26.68412971496582, 28.51466941833496, 30.3452091217041, 32.175750732421875, 34.006290435791016, 35.836830139160156, 37.6673698425293, 39.49790954589844, 41.32844924926758, 43.15898895263672, 44.98952865600586, 46.820068359375, 48.65060806274414, 50.48114776611328, 52.31169128417969, 54.14222717285156, 55.97277069091797, 57.80331039428711]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 4.0, 11.0, 11.0, 19.0, 15.0, 23.0, 13.0, 25.0, 15.0, 40.0, 35.0, 44.0, 51.0, 40.0, 44.0, 55.0, 55.0, 56.0, 46.0, 56.0, 32.0, 39.0, 37.0, 37.0, 25.0, 29.0, 37.0, 23.0, 13.0, 9.0, 8.0, 18.0, 7.0, 9.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.3441162109375, -5.164794921875, -4.9854736328125, -4.80615234375, -4.6268310546875, -4.447509765625, -4.2681884765625, -4.0888671875, -3.9095458984375, -3.730224609375, -3.5509033203125, -3.37158203125, -3.1922607421875, -3.012939453125, -2.8336181640625, -2.654296875, -2.4749755859375, -2.295654296875, -2.1163330078125, -1.93701171875, -1.7576904296875, -1.578369140625, -1.3990478515625, -1.2197265625, -1.0404052734375, -0.861083984375, -0.6817626953125, -0.50244140625, -0.3231201171875, -0.143798828125, 0.0355224609375, 0.21484375, 0.3941650390625, 0.573486328125, 0.7528076171875, 0.93212890625, 1.1114501953125, 1.290771484375, 1.4700927734375, 1.6494140625, 1.8287353515625, 2.008056640625, 2.1873779296875, 2.36669921875, 2.5460205078125, 2.725341796875, 2.9046630859375, 3.083984375, 3.2633056640625, 3.442626953125, 3.6219482421875, 3.80126953125, 3.9805908203125, 4.159912109375, 4.3392333984375, 4.5185546875, 4.6978759765625, 4.877197265625, 5.0565185546875, 5.23583984375, 5.4151611328125, 5.594482421875, 5.7738037109375, 5.953125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 7.0, 11.0, 13.0, 16.0, 26.0, 24.0, 64.0, 83.0, 114.0, 150.0, 280.0, 378.0, 579.0, 856.0, 1209.0, 1935.0, 2724.0, 4118.0, 6026.0, 8971.0, 13248.0, 19873.0, 29575.0, 44382.0, 66647.0, 99552.0, 142482.0, 171275.0, 139399.0, 97303.0, 65618.0, 43298.0, 29046.0, 19398.0, 12893.0, 8643.0, 5970.0, 3968.0, 2756.0, 1852.0, 1246.0, 834.0, 577.0, 368.0, 252.0, 173.0, 113.0, 71.0, 45.0, 33.0, 32.0, 20.0, 14.0, 10.0, 8.0, 2.0, 0.0, 1.0], "bins": [-0.494384765625, -0.4796142578125, -0.46484375, -0.4500732421875, -0.435302734375, -0.4205322265625, -0.40576171875, -0.3909912109375, -0.376220703125, -0.3614501953125, -0.3466796875, -0.3319091796875, -0.317138671875, -0.3023681640625, -0.28759765625, -0.2728271484375, -0.258056640625, -0.2432861328125, -0.228515625, -0.2137451171875, -0.198974609375, -0.1842041015625, -0.16943359375, -0.1546630859375, -0.139892578125, -0.1251220703125, -0.1103515625, -0.0955810546875, -0.080810546875, -0.0660400390625, -0.05126953125, -0.0364990234375, -0.021728515625, -0.0069580078125, 0.0078125, 0.0225830078125, 0.037353515625, 0.0521240234375, 0.06689453125, 0.0816650390625, 0.096435546875, 0.1112060546875, 0.1259765625, 0.1407470703125, 0.155517578125, 0.1702880859375, 0.18505859375, 0.1998291015625, 0.214599609375, 0.2293701171875, 0.244140625, 0.2589111328125, 0.273681640625, 0.2884521484375, 0.30322265625, 0.3179931640625, 0.332763671875, 0.3475341796875, 0.3623046875, 0.3770751953125, 0.391845703125, 0.4066162109375, 0.42138671875, 0.4361572265625, 0.450927734375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 5.0, 3.0, 5.0, 7.0, 13.0, 10.0, 8.0, 14.0, 15.0, 16.0, 18.0, 18.0, 21.0, 26.0, 34.0, 38.0, 28.0, 29.0, 39.0, 46.0, 35.0, 43.0, 1072.0, 46.0, 36.0, 48.0, 36.0, 37.0, 39.0, 30.0, 31.0, 26.0, 22.0, 30.0, 16.0, 14.0, 13.0, 8.0, 9.0, 11.0, 11.0, 5.0, 4.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.96484375, -2.870697021484375, -2.77655029296875, -2.682403564453125, -2.5882568359375, -2.494110107421875, -2.39996337890625, -2.305816650390625, -2.211669921875, -2.117523193359375, -2.02337646484375, -1.929229736328125, -1.8350830078125, -1.740936279296875, -1.64678955078125, -1.552642822265625, -1.45849609375, -1.364349365234375, -1.27020263671875, -1.176055908203125, -1.0819091796875, -0.987762451171875, -0.89361572265625, -0.799468994140625, -0.705322265625, -0.611175537109375, -0.51702880859375, -0.422882080078125, -0.3287353515625, -0.234588623046875, -0.14044189453125, -0.046295166015625, 0.0478515625, 0.141998291015625, 0.23614501953125, 0.330291748046875, 0.4244384765625, 0.518585205078125, 0.61273193359375, 0.706878662109375, 0.801025390625, 0.895172119140625, 0.98931884765625, 1.083465576171875, 1.1776123046875, 1.271759033203125, 1.36590576171875, 1.460052490234375, 1.55419921875, 1.648345947265625, 1.74249267578125, 1.836639404296875, 1.9307861328125, 2.024932861328125, 2.11907958984375, 2.213226318359375, 2.307373046875, 2.401519775390625, 2.49566650390625, 2.589813232421875, 2.6839599609375, 2.778106689453125, 2.87225341796875, 2.966400146484375, 3.060546875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 7.0, 7.0, 10.0, 19.0, 22.0, 31.0, 68.0, 69.0, 106.0, 179.0, 240.0, 385.0, 596.0, 894.0, 1427.0, 2242.0, 3674.0, 5591.0, 9028.0, 14424.0, 22950.0, 37477.0, 60982.0, 100475.0, 162473.0, 1253100.0, 161236.0, 100144.0, 60671.0, 36999.0, 22851.0, 14088.0, 8819.0, 5640.0, 3567.0, 2352.0, 1483.0, 963.0, 615.0, 451.0, 254.0, 178.0, 131.0, 85.0, 50.0, 32.0, 26.0, 10.0, 8.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.475341796875, -0.4592247009277344, -0.44310760498046875, -0.4269905090332031, -0.4108734130859375, -0.3947563171386719, -0.37863922119140625, -0.3625221252441406, -0.346405029296875, -0.3302879333496094, -0.31417083740234375, -0.2980537414550781, -0.2819366455078125, -0.2658195495605469, -0.24970245361328125, -0.23358535766601562, -0.21746826171875, -0.20135116577148438, -0.18523406982421875, -0.16911697387695312, -0.1529998779296875, -0.13688278198242188, -0.12076568603515625, -0.10464859008789062, -0.088531494140625, -0.07241439819335938, -0.05629730224609375, -0.040180206298828125, -0.0240631103515625, -0.007946014404296875, 0.00817108154296875, 0.024288177490234375, 0.0404052734375, 0.056522369384765625, 0.07263946533203125, 0.08875656127929688, 0.1048736572265625, 0.12099075317382812, 0.13710784912109375, 0.15322494506835938, 0.169342041015625, 0.18545913696289062, 0.20157623291015625, 0.21769332885742188, 0.2338104248046875, 0.24992752075195312, 0.26604461669921875, 0.2821617126464844, 0.29827880859375, 0.3143959045410156, 0.33051300048828125, 0.3466300964355469, 0.3627471923828125, 0.3788642883300781, 0.39498138427734375, 0.4110984802246094, 0.427215576171875, 0.4433326721191406, 0.45944976806640625, 0.4755668640136719, 0.4916839599609375, 0.5078010559082031, 0.5239181518554688, 0.5400352478027344, 0.55615234375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 6.0, 2.0, 7.0, 6.0, 5.0, 13.0, 17.0, 18.0, 14.0, 20.0, 17.0, 29.0, 19.0, 41.0, 43.0, 31.0, 50.0, 48.0, 33.0, 52.0, 47.0, 54.0, 46.0, 46.0, 36.0, 32.0, 31.0, 34.0, 31.0, 22.0, 38.0, 22.0, 21.0, 11.0, 11.0, 8.0, 12.0, 6.0, 7.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010585784912109375, -0.0010240674018859863, -0.0009895563125610352, -0.000955045223236084, -0.0009205341339111328, -0.0008860230445861816, -0.0008515119552612305, -0.0008170008659362793, -0.0007824897766113281, -0.000747978687286377, -0.0007134675979614258, -0.0006789565086364746, -0.0006444454193115234, -0.0006099343299865723, -0.0005754232406616211, -0.0005409121513366699, -0.0005064010620117188, -0.0004718899726867676, -0.0004373788833618164, -0.00040286779403686523, -0.00036835670471191406, -0.0003338456153869629, -0.0002993345260620117, -0.00026482343673706055, -0.00023031234741210938, -0.0001958012580871582, -0.00016129016876220703, -0.00012677907943725586, -9.226799011230469e-05, -5.7756900787353516e-05, -2.3245811462402344e-05, 1.1265277862548828e-05, 4.57763671875e-05, 8.028745651245117e-05, 0.00011479854583740234, 0.00014930963516235352, 0.0001838207244873047, 0.00021833181381225586, 0.00025284290313720703, 0.0002873539924621582, 0.0003218650817871094, 0.00035637617111206055, 0.0003908872604370117, 0.0004253983497619629, 0.00045990943908691406, 0.0004944205284118652, 0.0005289316177368164, 0.0005634427070617676, 0.0005979537963867188, 0.0006324648857116699, 0.0006669759750366211, 0.0007014870643615723, 0.0007359981536865234, 0.0007705092430114746, 0.0008050203323364258, 0.000839531421661377, 0.0008740425109863281, 0.0009085536003112793, 0.0009430646896362305, 0.0009775757789611816, 0.0010120868682861328, 0.001046597957611084, 0.0010811090469360352, 0.0011156201362609863, 0.0011501312255859375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 5.0, 3.0, 7.0, 12.0, 17.0, 19.0, 25.0, 26.0, 40.0, 41.0, 59.0, 72.0, 102.0, 128.0, 176.0, 272.0, 522.0, 1632.0, 1001742.0, 41568.0, 795.0, 385.0, 218.0, 167.0, 110.0, 85.0, 65.0, 48.0, 29.0, 36.0, 39.0, 17.0, 21.0, 15.0, 10.0, 12.0, 4.0, 8.0, 9.0, 1.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.027618408203125, -0.02680039405822754, -0.025982379913330078, -0.025164365768432617, -0.024346351623535156, -0.023528337478637695, -0.022710323333740234, -0.021892309188842773, -0.021074295043945312, -0.02025628089904785, -0.01943826675415039, -0.01862025260925293, -0.01780223846435547, -0.016984224319458008, -0.016166210174560547, -0.015348196029663086, -0.014530181884765625, -0.013712167739868164, -0.012894153594970703, -0.012076139450073242, -0.011258125305175781, -0.01044011116027832, -0.00962209701538086, -0.008804082870483398, -0.007986068725585938, -0.0071680545806884766, -0.006350040435791016, -0.005532026290893555, -0.004714012145996094, -0.003895998001098633, -0.003077983856201172, -0.002259969711303711, -0.00144195556640625, -0.0006239414215087891, 0.00019407272338867188, 0.0010120868682861328, 0.0018301010131835938, 0.0026481151580810547, 0.0034661293029785156, 0.0042841434478759766, 0.0051021575927734375, 0.0059201717376708984, 0.006738185882568359, 0.00755620002746582, 0.008374214172363281, 0.009192228317260742, 0.010010242462158203, 0.010828256607055664, 0.011646270751953125, 0.012464284896850586, 0.013282299041748047, 0.014100313186645508, 0.014918327331542969, 0.01573634147644043, 0.01655435562133789, 0.01737236976623535, 0.018190383911132812, 0.019008398056030273, 0.019826412200927734, 0.020644426345825195, 0.021462440490722656, 0.022280454635620117, 0.023098468780517578, 0.02391648292541504, 0.0247344970703125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 65.0, 435.0, 440.0, 70.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029033408500254154, -0.002803163370117545, -0.002702985890209675, -0.002602808177471161, -0.0025026306975632906, -0.0024024532176554203, -0.00230227573774755, -0.0022020982578396797, -0.0021019207779318094, -0.002001743298023939, -0.001901565701700747, -0.0018013882217928767, -0.0017012107418850064, -0.0016010331455618143, -0.001500855665653944, -0.0014006781857460737, -0.0013005005894228816, -0.0012003231095150113, -0.0011001455131918192, -0.000999968033283949, -0.0008997905533760786, -0.0007996130152605474, -0.0006994354771450162, -0.0005992579972371459, -0.0004990804591216147, -0.00039890295010991395, -0.0002987254410982132, -0.000198547902982682, -9.837039397098124e-05, 1.8071150407195091e-06, 0.00010198465315625072, 0.000202162133064121, 0.0003023396711796522, 0.00040251718019135296, 0.0005026946892030537, 0.0006028722273185849, 0.0007030497072264552, 0.0008032272453419864, 0.0009034047834575176, 0.001003582263365388, 0.0011037597432732582, 0.0012039372231811285, 0.0013041148195043206, 0.001404292299412191, 0.0015044697793200612, 0.0016046473756432533, 0.0017048248555511236, 0.001805002335458994, 0.001905179931782186, 0.002005357528105378, 0.0021055350080132484, 0.0022057124879211187, 0.002305889967828989, 0.0024060674477368593, 0.0025062449276447296, 0.0026064226403832436, 0.002706600120291114, 0.002806777600198984, 0.0029069550801068544, 0.0030071325600147247, 0.0031073102727532387, 0.003207487752661109, 0.0033076652325689793, 0.0034078427124768496, 0.00350802019238472]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 3.0, 8.0, 10.0, 12.0, 17.0, 10.0, 20.0, 26.0, 24.0, 27.0, 36.0, 23.0, 27.0, 33.0, 41.0, 41.0, 38.0, 42.0, 42.0, 47.0, 36.0, 48.0, 42.0, 45.0, 32.0, 27.0, 23.0, 29.0, 21.0, 22.0, 14.0, 14.0, 18.0, 12.0, 19.0, 9.0, 14.0, 7.0, 8.0, 7.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0006064772605895996, -0.0005863811820745468, -0.000566285103559494, -0.0005461890250444412, -0.0005260929465293884, -0.0005059968680143356, -0.00048590078949928284, -0.00046580471098423004, -0.00044570863246917725, -0.00042561255395412445, -0.00040551647543907166, -0.00038542039692401886, -0.00036532431840896606, -0.00034522823989391327, -0.0003251321613788605, -0.0003050360828638077, -0.0002849400043487549, -0.0002648439258337021, -0.0002447478473186493, -0.0002246517688035965, -0.0002045556902885437, -0.0001844596117734909, -0.0001643635332584381, -0.00014426745474338531, -0.00012417137622833252, -0.00010407529771327972, -8.397921919822693e-05, -6.388314068317413e-05, -4.378706216812134e-05, -2.3690983653068542e-05, -3.594905138015747e-06, 1.650117337703705e-05, 3.6597251892089844e-05, 5.669333040714264e-05, 7.678940892219543e-05, 9.688548743724823e-05, 0.00011698156595230103, 0.00013707764446735382, 0.00015717372298240662, 0.0001772698014974594, 0.0001973658800125122, 0.000217461958527565, 0.0002375580370426178, 0.0002576541155576706, 0.0002777501940727234, 0.0002978462725877762, 0.000317942351102829, 0.0003380384296178818, 0.00035813450813293457, 0.00037823058664798737, 0.00039832666516304016, 0.00041842274367809296, 0.00043851882219314575, 0.00045861490070819855, 0.00047871097922325134, 0.0004988070577383041, 0.0005189031362533569, 0.0005389992147684097, 0.0005590952932834625, 0.0005791913717985153, 0.0005992874503135681, 0.0006193835288286209, 0.0006394796073436737, 0.0006595756858587265, 0.0006796717643737793]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 4.0, 11.0, 11.0, 19.0, 15.0, 23.0, 13.0, 25.0, 15.0, 40.0, 35.0, 44.0, 51.0, 40.0, 44.0, 55.0, 55.0, 56.0, 46.0, 56.0, 32.0, 39.0, 37.0, 37.0, 25.0, 29.0, 37.0, 23.0, 13.0, 9.0, 8.0, 18.0, 7.0, 9.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.3441162109375, -5.164794921875, -4.9854736328125, -4.80615234375, -4.6268310546875, -4.447509765625, -4.2681884765625, -4.0888671875, -3.9095458984375, -3.730224609375, -3.5509033203125, -3.37158203125, -3.1922607421875, -3.012939453125, -2.8336181640625, -2.654296875, -2.4749755859375, -2.295654296875, -2.1163330078125, -1.93701171875, -1.7576904296875, -1.578369140625, -1.3990478515625, -1.2197265625, -1.0404052734375, -0.861083984375, -0.6817626953125, -0.50244140625, -0.3231201171875, -0.143798828125, 0.0355224609375, 0.21484375, 0.3941650390625, 0.573486328125, 0.7528076171875, 0.93212890625, 1.1114501953125, 1.290771484375, 1.4700927734375, 1.6494140625, 1.8287353515625, 2.008056640625, 2.1873779296875, 2.36669921875, 2.5460205078125, 2.725341796875, 2.9046630859375, 3.083984375, 3.2633056640625, 3.442626953125, 3.6219482421875, 3.80126953125, 3.9805908203125, 4.159912109375, 4.3392333984375, 4.5185546875, 4.6978759765625, 4.877197265625, 5.0565185546875, 5.23583984375, 5.4151611328125, 5.594482421875, 5.7738037109375, 5.953125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 8.0, 7.0, 19.0, 28.0, 24.0, 38.0, 71.0, 82.0, 123.0, 158.0, 247.0, 375.0, 541.0, 896.0, 1620.0, 3124.0, 7424.0, 19418.0, 61889.0, 244655.0, 509287.0, 136263.0, 38007.0, 13100.0, 5259.0, 2434.0, 1283.0, 735.0, 436.0, 286.0, 235.0, 132.0, 112.0, 60.0, 56.0, 37.0, 27.0, 20.0, 12.0, 8.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.15234375, -4.9822998046875, -4.812255859375, -4.6422119140625, -4.47216796875, -4.3021240234375, -4.132080078125, -3.9620361328125, -3.7919921875, -3.6219482421875, -3.451904296875, -3.2818603515625, -3.11181640625, -2.9417724609375, -2.771728515625, -2.6016845703125, -2.431640625, -2.2615966796875, -2.091552734375, -1.9215087890625, -1.75146484375, -1.5814208984375, -1.411376953125, -1.2413330078125, -1.0712890625, -0.9012451171875, -0.731201171875, -0.5611572265625, -0.39111328125, -0.2210693359375, -0.051025390625, 0.1190185546875, 0.2890625, 0.4591064453125, 0.629150390625, 0.7991943359375, 0.96923828125, 1.1392822265625, 1.309326171875, 1.4793701171875, 1.6494140625, 1.8194580078125, 1.989501953125, 2.1595458984375, 2.32958984375, 2.4996337890625, 2.669677734375, 2.8397216796875, 3.009765625, 3.1798095703125, 3.349853515625, 3.5198974609375, 3.68994140625, 3.8599853515625, 4.030029296875, 4.2000732421875, 4.3701171875, 4.5401611328125, 4.710205078125, 4.8802490234375, 5.05029296875, 5.2203369140625, 5.390380859375, 5.5604248046875, 5.73046875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 2.0, 2.0, 6.0, 7.0, 11.0, 18.0, 10.0, 22.0, 25.0, 28.0, 30.0, 29.0, 35.0, 37.0, 35.0, 56.0, 59.0, 57.0, 84.0, 358.0, 1628.0, 73.0, 46.0, 47.0, 42.0, 42.0, 35.0, 34.0, 34.0, 29.0, 22.0, 21.0, 13.0, 8.0, 11.0, 10.0, 6.0, 7.0, 10.0, 2.0, 6.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-18.453125, -17.91162109375, -17.3701171875, -16.82861328125, -16.287109375, -15.74560546875, -15.2041015625, -14.66259765625, -14.12109375, -13.57958984375, -13.0380859375, -12.49658203125, -11.955078125, -11.41357421875, -10.8720703125, -10.33056640625, -9.7890625, -9.24755859375, -8.7060546875, -8.16455078125, -7.623046875, -7.08154296875, -6.5400390625, -5.99853515625, -5.45703125, -4.91552734375, -4.3740234375, -3.83251953125, -3.291015625, -2.74951171875, -2.2080078125, -1.66650390625, -1.125, -0.58349609375, -0.0419921875, 0.49951171875, 1.041015625, 1.58251953125, 2.1240234375, 2.66552734375, 3.20703125, 3.74853515625, 4.2900390625, 4.83154296875, 5.373046875, 5.91455078125, 6.4560546875, 6.99755859375, 7.5390625, 8.08056640625, 8.6220703125, 9.16357421875, 9.705078125, 10.24658203125, 10.7880859375, 11.32958984375, 11.87109375, 12.41259765625, 12.9541015625, 13.49560546875, 14.037109375, 14.57861328125, 15.1201171875, 15.66162109375, 16.203125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 7.0, 3.0, 5.0, 7.0, 6.0, 8.0, 10.0, 4.0, 14.0, 15.0, 17.0, 31.0, 35.0, 36.0, 57.0, 76.0, 108.0, 150.0, 314.0, 820.0, 5246.0, 2898841.0, 235655.0, 2797.0, 599.0, 279.0, 154.0, 86.0, 52.0, 51.0, 48.0, 37.0, 37.0, 14.0, 28.0, 9.0, 19.0, 12.0, 4.0, 5.0, 3.0, 1.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.09375, -36.818359375, -35.54296875, -34.267578125, -32.9921875, -31.716796875, -30.44140625, -29.166015625, -27.890625, -26.615234375, -25.33984375, -24.064453125, -22.7890625, -21.513671875, -20.23828125, -18.962890625, -17.6875, -16.412109375, -15.13671875, -13.861328125, -12.5859375, -11.310546875, -10.03515625, -8.759765625, -7.484375, -6.208984375, -4.93359375, -3.658203125, -2.3828125, -1.107421875, 0.16796875, 1.443359375, 2.71875, 3.994140625, 5.26953125, 6.544921875, 7.8203125, 9.095703125, 10.37109375, 11.646484375, 12.921875, 14.197265625, 15.47265625, 16.748046875, 18.0234375, 19.298828125, 20.57421875, 21.849609375, 23.125, 24.400390625, 25.67578125, 26.951171875, 28.2265625, 29.501953125, 30.77734375, 32.052734375, 33.328125, 34.603515625, 35.87890625, 37.154296875, 38.4296875, 39.705078125, 40.98046875, 42.255859375, 43.53125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 3.0, 966.0, 47.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.71988868713379, -14.966870307922363, -6.2138519287109375, 2.5391674041748047, 11.292184829711914, 20.045202255249023, 28.7982234954834, 37.551239013671875, 46.30426025390625, 55.05727767944336, 63.81029510498047, 72.56331634521484, 81.31632995605469, 90.06935119628906, 98.82237243652344, 107.57539367675781, 116.32840728759766, 125.08142852783203, 133.83444213867188, 142.58746337890625, 151.34048461914062, 160.093505859375, 168.84652709960938, 177.5995330810547, 186.35255432128906, 195.10557556152344, 203.8585968017578, 212.61160278320312, 221.3646240234375, 230.11764526367188, 238.87066650390625, 247.62368774414062, 256.3766784667969, 265.12969970703125, 273.8827209472656, 282.6357421875, 291.3887634277344, 300.14178466796875, 308.894775390625, 317.6477966308594, 326.40081787109375, 335.1538391113281, 343.9068603515625, 352.6598815917969, 361.41290283203125, 370.1658935546875, 378.9189453125, 387.67193603515625, 396.42498779296875, 405.1780090332031, 413.9310302734375, 422.6840515136719, 431.43707275390625, 440.1900634765625, 448.943115234375, 457.69610595703125, 466.4491271972656, 475.2021484375, 483.9551696777344, 492.70819091796875, 501.4612121582031, 510.2142333984375, 518.9672241210938, 527.7202758789062, 536.4732666015625]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 2.0, 4.0, 7.0, 11.0, 15.0, 20.0, 18.0, 19.0, 16.0, 23.0, 22.0, 23.0, 35.0, 28.0, 30.0, 30.0, 43.0, 40.0, 43.0, 26.0, 36.0, 35.0, 35.0, 26.0, 47.0, 34.0, 39.0, 35.0, 42.0, 24.0, 27.0, 26.0, 23.0, 11.0, 18.0, 21.0, 23.0, 9.0, 10.0, 3.0, 9.0, 2.0, 7.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-54.0447998046875, -52.430301666259766, -50.8158073425293, -49.20130920410156, -47.586814880371094, -45.97231674194336, -44.35782241821289, -42.743324279785156, -41.12882995605469, -39.51433181762695, -37.899837493896484, -36.28533935546875, -34.67084503173828, -33.05634689331055, -31.441852569580078, -29.827354431152344, -28.212858200073242, -26.59836196899414, -24.98386573791504, -23.369369506835938, -21.754873275756836, -20.140377044677734, -18.52587890625, -16.91138458251953, -15.296887397766113, -13.682391166687012, -12.06789493560791, -10.453397750854492, -8.83890151977539, -7.224405288696289, -5.6099090576171875, -3.995412826538086, -2.3809165954589844, -0.7664202451705933, 0.8480761051177979, 2.4625725746154785, 4.07706880569458, 5.69156551361084, 7.306061744689941, 8.920557975769043, 10.535054206848145, 12.149550437927246, 13.764046669006348, 15.378543853759766, 16.993040084838867, 18.60753631591797, 20.22203254699707, 21.836528778076172, 23.451025009155273, 25.065521240234375, 26.680017471313477, 28.294513702392578, 29.90900993347168, 31.52350616455078, 33.138004302978516, 34.752498626708984, 36.36699676513672, 37.98149490356445, 39.59598922729492, 41.210487365722656, 42.824981689453125, 44.43947982788086, 46.05397415161133, 47.66847229003906, 49.28296661376953]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 7.0, 7.0, 11.0, 16.0, 16.0, 11.0, 20.0, 23.0, 15.0, 21.0, 47.0, 26.0, 43.0, 48.0, 44.0, 47.0, 47.0, 59.0, 57.0, 53.0, 36.0, 50.0, 38.0, 38.0, 29.0, 39.0, 29.0, 17.0, 25.0, 17.0, 11.0, 15.0, 8.0, 10.0, 8.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.80078125, -5.61798095703125, -5.4351806640625, -5.25238037109375, -5.069580078125, -4.88677978515625, -4.7039794921875, -4.52117919921875, -4.33837890625, -4.15557861328125, -3.9727783203125, -3.78997802734375, -3.607177734375, -3.42437744140625, -3.2415771484375, -3.05877685546875, -2.8759765625, -2.69317626953125, -2.5103759765625, -2.32757568359375, -2.144775390625, -1.96197509765625, -1.7791748046875, -1.59637451171875, -1.41357421875, -1.23077392578125, -1.0479736328125, -0.86517333984375, -0.682373046875, -0.49957275390625, -0.3167724609375, -0.13397216796875, 0.048828125, 0.23162841796875, 0.4144287109375, 0.59722900390625, 0.780029296875, 0.96282958984375, 1.1456298828125, 1.32843017578125, 1.51123046875, 1.69403076171875, 1.8768310546875, 2.05963134765625, 2.242431640625, 2.42523193359375, 2.6080322265625, 2.79083251953125, 2.9736328125, 3.15643310546875, 3.3392333984375, 3.52203369140625, 3.704833984375, 3.88763427734375, 4.0704345703125, 4.25323486328125, 4.43603515625, 4.61883544921875, 4.8016357421875, 4.98443603515625, 5.167236328125, 5.35003662109375, 5.5328369140625, 5.71563720703125, 5.8984375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 8.0, 5.0, 9.0, 12.0, 15.0, 19.0, 24.0, 26.0, 36.0, 44.0, 54.0, 96.0, 124.0, 273.0, 638.0, 2571.0, 25027.0, 814083.0, 3221715.0, 119043.0, 8099.0, 1337.0, 408.0, 193.0, 116.0, 57.0, 61.0, 45.0, 26.0, 27.0, 25.0, 22.0, 11.0, 6.0, 7.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.38671875, -18.6484375, -17.91015625, -17.171875, -16.43359375, -15.6953125, -14.95703125, -14.21875, -13.48046875, -12.7421875, -12.00390625, -11.265625, -10.52734375, -9.7890625, -9.05078125, -8.3125, -7.57421875, -6.8359375, -6.09765625, -5.359375, -4.62109375, -3.8828125, -3.14453125, -2.40625, -1.66796875, -0.9296875, -0.19140625, 0.546875, 1.28515625, 2.0234375, 2.76171875, 3.5, 4.23828125, 4.9765625, 5.71484375, 6.453125, 7.19140625, 7.9296875, 8.66796875, 9.40625, 10.14453125, 10.8828125, 11.62109375, 12.359375, 13.09765625, 13.8359375, 14.57421875, 15.3125, 16.05078125, 16.7890625, 17.52734375, 18.265625, 19.00390625, 19.7421875, 20.48046875, 21.21875, 21.95703125, 22.6953125, 23.43359375, 24.171875, 24.91015625, 25.6484375, 26.38671875, 27.125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 14.0, 11.0, 20.0, 33.0, 39.0, 65.0, 67.0, 109.0, 172.0, 234.0, 385.0, 500.0, 575.0, 503.0, 420.0, 271.0, 222.0, 131.0, 89.0, 72.0, 41.0, 22.0, 27.0, 18.0, 15.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.125, -21.48583984375, -20.8466796875, -20.20751953125, -19.568359375, -18.92919921875, -18.2900390625, -17.65087890625, -17.01171875, -16.37255859375, -15.7333984375, -15.09423828125, -14.455078125, -13.81591796875, -13.1767578125, -12.53759765625, -11.8984375, -11.25927734375, -10.6201171875, -9.98095703125, -9.341796875, -8.70263671875, -8.0634765625, -7.42431640625, -6.78515625, -6.14599609375, -5.5068359375, -4.86767578125, -4.228515625, -3.58935546875, -2.9501953125, -2.31103515625, -1.671875, -1.03271484375, -0.3935546875, 0.24560546875, 0.884765625, 1.52392578125, 2.1630859375, 2.80224609375, 3.44140625, 4.08056640625, 4.7197265625, 5.35888671875, 5.998046875, 6.63720703125, 7.2763671875, 7.91552734375, 8.5546875, 9.19384765625, 9.8330078125, 10.47216796875, 11.111328125, 11.75048828125, 12.3896484375, 13.02880859375, 13.66796875, 14.30712890625, 14.9462890625, 15.58544921875, 16.224609375, 16.86376953125, 17.5029296875, 18.14208984375, 18.78125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 4.0, 7.0, 29.0, 26.0, 54.0, 97.0, 195.0, 463.0, 1359.0, 27814.0, 4030823.0, 130181.0, 2129.0, 557.0, 251.0, 114.0, 65.0, 40.0, 27.0, 12.0, 8.0, 8.0, 2.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.0625, -71.5634765625, -69.064453125, -66.5654296875, -64.06640625, -61.5673828125, -59.068359375, -56.5693359375, -54.0703125, -51.5712890625, -49.072265625, -46.5732421875, -44.07421875, -41.5751953125, -39.076171875, -36.5771484375, -34.078125, -31.5791015625, -29.080078125, -26.5810546875, -24.08203125, -21.5830078125, -19.083984375, -16.5849609375, -14.0859375, -11.5869140625, -9.087890625, -6.5888671875, -4.08984375, -1.5908203125, 0.908203125, 3.4072265625, 5.90625, 8.4052734375, 10.904296875, 13.4033203125, 15.90234375, 18.4013671875, 20.900390625, 23.3994140625, 25.8984375, 28.3974609375, 30.896484375, 33.3955078125, 35.89453125, 38.3935546875, 40.892578125, 43.3916015625, 45.890625, 48.3896484375, 50.888671875, 53.3876953125, 55.88671875, 58.3857421875, 60.884765625, 63.3837890625, 65.8828125, 68.3818359375, 70.880859375, 73.3798828125, 75.87890625, 78.3779296875, 80.876953125, 83.3759765625, 85.875]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 26.0, 168.0, 453.0, 313.0, 46.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-263.1459655761719, -255.32554626464844, -247.505126953125, -239.68470764160156, -231.86428833007812, -224.0438690185547, -216.22344970703125, -208.4030303955078, -200.58261108398438, -192.76219177246094, -184.9417724609375, -177.12135314941406, -169.30093383789062, -161.4805145263672, -153.66009521484375, -145.8396759033203, -138.01925659179688, -130.19883728027344, -122.37841796875, -114.55799865722656, -106.73757934570312, -98.91716003417969, -91.09674072265625, -83.27632141113281, -75.45590209960938, -67.63548278808594, -59.8150634765625, -51.99464416503906, -44.174224853515625, -36.35380554199219, -28.53338623046875, -20.712966918945312, -12.892532348632812, -5.072113037109375, 2.7483062744140625, 10.5687255859375, 18.389144897460938, 26.209564208984375, 34.02998352050781, 41.85040283203125, 49.67082214355469, 57.491241455078125, 65.31166076660156, 73.132080078125, 80.95249938964844, 88.77291870117188, 96.59333801269531, 104.41375732421875, 112.23417663574219, 120.05459594726562, 127.87501525878906, 135.6954345703125, 143.51585388183594, 151.33627319335938, 159.1566925048828, 166.97711181640625, 174.7975311279297, 182.61795043945312, 190.43836975097656, 198.2587890625, 206.07920837402344, 213.89962768554688, 221.7200469970703, 229.54046630859375, 237.3608856201172]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 9.0, 11.0, 15.0, 15.0, 16.0, 16.0, 21.0, 24.0, 21.0, 31.0, 20.0, 27.0, 40.0, 35.0, 32.0, 28.0, 36.0, 37.0, 33.0, 46.0, 46.0, 36.0, 31.0, 36.0, 33.0, 32.0, 39.0, 22.0, 31.0, 28.0, 16.0, 13.0, 20.0, 18.0, 15.0, 13.0, 10.0, 8.0, 10.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-56.86656188964844, -55.17795181274414, -53.489341735839844, -51.80073165893555, -50.11212158203125, -48.42351150512695, -46.734901428222656, -45.04629135131836, -43.35768127441406, -41.669071197509766, -39.98046112060547, -38.29185104370117, -36.603240966796875, -34.91463088989258, -33.22602081298828, -31.537410736083984, -29.84880256652832, -28.160192489624023, -26.471582412719727, -24.78297233581543, -23.094362258911133, -21.40575408935547, -19.717144012451172, -18.028533935546875, -16.339923858642578, -14.651313781738281, -12.962703704833984, -11.274093627929688, -9.58548355102539, -7.89687442779541, -6.208264350891113, -4.519654273986816, -2.831043243408203, -1.1424332857131958, 0.5461766719818115, 2.2347865104675293, 3.923396587371826, 5.612006187438965, 7.300616264343262, 8.989226341247559, 10.677836418151855, 12.366446495056152, 14.05505657196045, 15.74366569519043, 17.432275772094727, 19.120885848999023, 20.80949592590332, 22.498106002807617, 24.186716079711914, 25.87532615661621, 27.563936233520508, 29.252546310424805, 30.9411563873291, 32.629764556884766, 34.31837463378906, 36.00698471069336, 37.695594787597656, 39.38420486450195, 41.07281494140625, 42.76142501831055, 44.450035095214844, 46.13864517211914, 47.82725524902344, 49.515865325927734, 51.20447540283203]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 4.0, 8.0, 7.0, 10.0, 16.0, 17.0, 11.0, 19.0, 26.0, 23.0, 31.0, 27.0, 36.0, 37.0, 32.0, 42.0, 54.0, 50.0, 44.0, 57.0, 48.0, 50.0, 40.0, 39.0, 33.0, 32.0, 31.0, 25.0, 24.0, 27.0, 18.0, 17.0, 14.0, 10.0, 11.0, 7.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.37109375, -5.19659423828125, -5.0220947265625, -4.84759521484375, -4.673095703125, -4.49859619140625, -4.3240966796875, -4.14959716796875, -3.97509765625, -3.80059814453125, -3.6260986328125, -3.45159912109375, -3.277099609375, -3.10260009765625, -2.9281005859375, -2.75360107421875, -2.5791015625, -2.40460205078125, -2.2301025390625, -2.05560302734375, -1.881103515625, -1.70660400390625, -1.5321044921875, -1.35760498046875, -1.18310546875, -1.00860595703125, -0.8341064453125, -0.65960693359375, -0.485107421875, -0.31060791015625, -0.1361083984375, 0.03839111328125, 0.212890625, 0.38739013671875, 0.5618896484375, 0.73638916015625, 0.910888671875, 1.08538818359375, 1.2598876953125, 1.43438720703125, 1.60888671875, 1.78338623046875, 1.9578857421875, 2.13238525390625, 2.306884765625, 2.48138427734375, 2.6558837890625, 2.83038330078125, 3.0048828125, 3.17938232421875, 3.3538818359375, 3.52838134765625, 3.702880859375, 3.87738037109375, 4.0518798828125, 4.22637939453125, 4.40087890625, 4.57537841796875, 4.7498779296875, 4.92437744140625, 5.098876953125, 5.27337646484375, 5.4478759765625, 5.62237548828125, 5.796875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 9.0, 6.0, 20.0, 19.0, 38.0, 58.0, 65.0, 116.0, 142.0, 217.0, 332.0, 452.0, 673.0, 1031.0, 1421.0, 2052.0, 2966.0, 4328.0, 6263.0, 9193.0, 13445.0, 19364.0, 28683.0, 42150.0, 62821.0, 94404.0, 134966.0, 168157.0, 142955.0, 101012.0, 68158.0, 45652.0, 30592.0, 20884.0, 14230.0, 9984.0, 6709.0, 4672.0, 3299.0, 2203.0, 1556.0, 1018.0, 704.0, 463.0, 331.0, 246.0, 180.0, 117.0, 73.0, 37.0, 26.0, 23.0, 20.0, 13.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.443359375, -0.4288673400878906, -0.41437530517578125, -0.3998832702636719, -0.3853912353515625, -0.3708992004394531, -0.35640716552734375, -0.3419151306152344, -0.327423095703125, -0.3129310607910156, -0.29843902587890625, -0.2839469909667969, -0.2694549560546875, -0.2549629211425781, -0.24047088623046875, -0.22597885131835938, -0.21148681640625, -0.19699478149414062, -0.18250274658203125, -0.16801071166992188, -0.1535186767578125, -0.13902664184570312, -0.12453460693359375, -0.11004257202148438, -0.095550537109375, -0.08105850219726562, -0.06656646728515625, -0.052074432373046875, -0.0375823974609375, -0.023090362548828125, -0.00859832763671875, 0.005893707275390625, 0.0203857421875, 0.034877777099609375, 0.04936981201171875, 0.06386184692382812, 0.0783538818359375, 0.09284591674804688, 0.10733795166015625, 0.12182998657226562, 0.136322021484375, 0.15081405639648438, 0.16530609130859375, 0.17979812622070312, 0.1942901611328125, 0.20878219604492188, 0.22327423095703125, 0.23776626586914062, 0.25225830078125, 0.2667503356933594, 0.28124237060546875, 0.2957344055175781, 0.3102264404296875, 0.3247184753417969, 0.33921051025390625, 0.3537025451660156, 0.368194580078125, 0.3826866149902344, 0.39717864990234375, 0.4116706848144531, 0.4261627197265625, 0.4406547546386719, 0.45514678955078125, 0.4696388244628906, 0.484130859375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 10.0, 15.0, 9.0, 8.0, 19.0, 12.0, 19.0, 17.0, 16.0, 18.0, 18.0, 19.0, 28.0, 30.0, 29.0, 36.0, 36.0, 32.0, 40.0, 39.0, 1064.0, 42.0, 34.0, 44.0, 28.0, 31.0, 41.0, 40.0, 23.0, 32.0, 29.0, 22.0, 23.0, 16.0, 20.0, 10.0, 9.0, 8.0, 9.0, 9.0, 3.0, 7.0, 6.0, 6.0, 1.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.91015625, -2.81805419921875, -2.7259521484375, -2.63385009765625, -2.541748046875, -2.44964599609375, -2.3575439453125, -2.26544189453125, -2.17333984375, -2.08123779296875, -1.9891357421875, -1.89703369140625, -1.804931640625, -1.71282958984375, -1.6207275390625, -1.52862548828125, -1.4365234375, -1.34442138671875, -1.2523193359375, -1.16021728515625, -1.068115234375, -0.97601318359375, -0.8839111328125, -0.79180908203125, -0.69970703125, -0.60760498046875, -0.5155029296875, -0.42340087890625, -0.331298828125, -0.23919677734375, -0.1470947265625, -0.05499267578125, 0.037109375, 0.12921142578125, 0.2213134765625, 0.31341552734375, 0.405517578125, 0.49761962890625, 0.5897216796875, 0.68182373046875, 0.77392578125, 0.86602783203125, 0.9581298828125, 1.05023193359375, 1.142333984375, 1.23443603515625, 1.3265380859375, 1.41864013671875, 1.5107421875, 1.60284423828125, 1.6949462890625, 1.78704833984375, 1.879150390625, 1.97125244140625, 2.0633544921875, 2.15545654296875, 2.24755859375, 2.33966064453125, 2.4317626953125, 2.52386474609375, 2.615966796875, 2.70806884765625, 2.8001708984375, 2.89227294921875, 2.984375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 8.0, 10.0, 15.0, 25.0, 27.0, 40.0, 72.0, 110.0, 154.0, 209.0, 269.0, 389.0, 615.0, 923.0, 1296.0, 1874.0, 2806.0, 4136.0, 6210.0, 9185.0, 13853.0, 20931.0, 31817.0, 49114.0, 75745.0, 115804.0, 163152.0, 1220243.0, 130369.0, 86417.0, 55656.0, 35836.0, 23568.0, 15372.0, 10027.0, 6856.0, 4540.0, 3098.0, 2095.0, 1400.0, 925.0, 643.0, 399.0, 287.0, 188.0, 120.0, 99.0, 82.0, 45.0, 27.0, 23.0, 9.0, 8.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0], "bins": [-0.4814453125, -0.46646881103515625, -0.4514923095703125, -0.43651580810546875, -0.421539306640625, -0.40656280517578125, -0.3915863037109375, -0.37660980224609375, -0.36163330078125, -0.34665679931640625, -0.3316802978515625, -0.31670379638671875, -0.301727294921875, -0.28675079345703125, -0.2717742919921875, -0.25679779052734375, -0.2418212890625, -0.22684478759765625, -0.2118682861328125, -0.19689178466796875, -0.181915283203125, -0.16693878173828125, -0.1519622802734375, -0.13698577880859375, -0.12200927734375, -0.10703277587890625, -0.0920562744140625, -0.07707977294921875, -0.062103271484375, -0.04712677001953125, -0.0321502685546875, -0.01717376708984375, -0.002197265625, 0.01277923583984375, 0.0277557373046875, 0.04273223876953125, 0.057708740234375, 0.07268524169921875, 0.0876617431640625, 0.10263824462890625, 0.11761474609375, 0.13259124755859375, 0.1475677490234375, 0.16254425048828125, 0.177520751953125, 0.19249725341796875, 0.2074737548828125, 0.22245025634765625, 0.2374267578125, 0.25240325927734375, 0.2673797607421875, 0.28235626220703125, 0.297332763671875, 0.31230926513671875, 0.3272857666015625, 0.34226226806640625, 0.35723876953125, 0.37221527099609375, 0.3871917724609375, 0.40216827392578125, 0.417144775390625, 0.43212127685546875, 0.4470977783203125, 0.46207427978515625, 0.47705078125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 8.0, 1.0, 2.0, 6.0, 1.0, 10.0, 6.0, 11.0, 11.0, 13.0, 20.0, 15.0, 21.0, 30.0, 37.0, 40.0, 47.0, 51.0, 49.0, 60.0, 58.0, 53.0, 50.0, 49.0, 57.0, 36.0, 45.0, 29.0, 33.0, 22.0, 28.0, 21.0, 18.0, 15.0, 16.0, 11.0, 7.0, 7.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0012235641479492188, -0.0011858046054840088, -0.0011480450630187988, -0.0011102855205535889, -0.001072525978088379, -0.001034766435623169, -0.000997006893157959, -0.000959247350692749, -0.0009214878082275391, -0.0008837282657623291, -0.0008459687232971191, -0.0008082091808319092, -0.0007704496383666992, -0.0007326900959014893, -0.0006949305534362793, -0.0006571710109710693, -0.0006194114685058594, -0.0005816519260406494, -0.0005438923835754395, -0.0005061328411102295, -0.00046837329864501953, -0.00043061375617980957, -0.0003928542137145996, -0.00035509467124938965, -0.0003173351287841797, -0.0002795755863189697, -0.00024181604385375977, -0.0002040565013885498, -0.00016629695892333984, -0.00012853741645812988, -9.077787399291992e-05, -5.301833152770996e-05, -1.52587890625e-05, 2.250075340270996e-05, 6.026029586791992e-05, 9.801983833312988e-05, 0.00013577938079833984, 0.0001735389232635498, 0.00021129846572875977, 0.0002490580081939697, 0.0002868175506591797, 0.00032457709312438965, 0.0003623366355895996, 0.00040009617805480957, 0.00043785572052001953, 0.0004756152629852295, 0.0005133748054504395, 0.0005511343479156494, 0.0005888938903808594, 0.0006266534328460693, 0.0006644129753112793, 0.0007021725177764893, 0.0007399320602416992, 0.0007776916027069092, 0.0008154511451721191, 0.0008532106876373291, 0.0008909702301025391, 0.000928729772567749, 0.000966489315032959, 0.001004248857498169, 0.001042008399963379, 0.0010797679424285889, 0.0011175274848937988, 0.0011552870273590088, 0.0011930465698242188]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 9.0, 8.0, 11.0, 17.0, 19.0, 23.0, 42.0, 68.0, 70.0, 112.0, 220.0, 334.0, 688.0, 61553.0, 983115.0, 1141.0, 401.0, 202.0, 154.0, 103.0, 77.0, 42.0, 48.0, 20.0, 13.0, 12.0, 8.0, 9.0, 3.0, 5.0, 6.0, 5.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03338623046875, -0.0323486328125, -0.03131103515625, -0.0302734375, -0.02923583984375, -0.0281982421875, -0.02716064453125, -0.026123046875, -0.02508544921875, -0.0240478515625, -0.02301025390625, -0.02197265625, -0.02093505859375, -0.0198974609375, -0.01885986328125, -0.017822265625, -0.01678466796875, -0.0157470703125, -0.01470947265625, -0.013671875, -0.01263427734375, -0.0115966796875, -0.01055908203125, -0.009521484375, -0.00848388671875, -0.0074462890625, -0.00640869140625, -0.00537109375, -0.00433349609375, -0.0032958984375, -0.00225830078125, -0.001220703125, -0.00018310546875, 0.0008544921875, 0.00189208984375, 0.0029296875, 0.00396728515625, 0.0050048828125, 0.00604248046875, 0.007080078125, 0.00811767578125, 0.0091552734375, 0.01019287109375, 0.01123046875, 0.01226806640625, 0.0133056640625, 0.01434326171875, 0.015380859375, 0.01641845703125, 0.0174560546875, 0.01849365234375, 0.01953125, 0.02056884765625, 0.0216064453125, 0.02264404296875, 0.023681640625, 0.02471923828125, 0.0257568359375, 0.02679443359375, 0.02783203125, 0.02886962890625, 0.0299072265625, 0.03094482421875, 0.031982421875, 0.03302001953125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 6.0, 27.0, 175.0, 446.0, 284.0, 72.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00038046028930693865, -0.00029969491879455745, -0.00021892956283409148, -0.00013816420687362552, -5.739883636124432e-05, 2.3366534151136875e-05, 0.00010413187555968761, 0.00018489727517589927, 0.00026566261658445, 0.0003464279870968312, 0.0004271933576092124, 0.0005079586990177631, 0.0005887240404263139, 0.0006694894400425255, 0.0007502547814510763, 0.0008310201810672879, 0.0009117855224758387, 0.0009925508638843894, 0.0010733162052929401, 0.0011540816631168127, 0.0012348470045253634, 0.0013156123459339142, 0.001396377687342465, 0.0014771430287510157, 0.0015579084865748882, 0.001638673827983439, 0.0017194391693919897, 0.0018002046272158623, 0.001880969968624413, 0.0019617353100329638, 0.0020425007678568363, 0.0021232659928500652, 0.002204031450673938, 0.0022847969084978104, 0.0023655621334910393, 0.002446327591314912, 0.0025270928163081408, 0.0026078582741320133, 0.0026886234991252422, 0.002769388956949115, 0.0028501544147729874, 0.00293091987259686, 0.003011685097590089, 0.0030924505554139614, 0.0031732157804071903, 0.003253981238231063, 0.0033347466960549355, 0.0034155119210481644, 0.0034962771460413933, 0.003577042603865266, 0.0036578078288584948, 0.0037385732866823673, 0.0038193385116755962, 0.003900103969499469, 0.003980869427323341, 0.00406163465231657, 0.0041424003429710865, 0.004223165567964315, 0.004303931258618832, 0.0043846964836120605, 0.0044654617086052895, 0.004546226933598518, 0.004626992624253035, 0.0047077578492462635, 0.004788523074239492]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 16.0, 11.0, 14.0, 12.0, 24.0, 10.0, 18.0, 28.0, 27.0, 36.0, 39.0, 37.0, 36.0, 34.0, 38.0, 42.0, 50.0, 31.0, 34.0, 61.0, 41.0, 28.0, 35.0, 44.0, 37.0, 33.0, 25.0, 20.0, 28.0, 19.0, 15.0, 10.0, 13.0, 8.0, 10.0, 12.0, 8.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007579326629638672, -0.0007364675402641296, -0.0007150024175643921, -0.0006935372948646545, -0.000672072172164917, -0.0006506070494651794, -0.0006291419267654419, -0.0006076768040657043, -0.0005862116813659668, -0.0005647465586662292, -0.0005432814359664917, -0.0005218163132667542, -0.0005003511905670166, -0.00047888606786727905, -0.0004574209451675415, -0.00043595582246780396, -0.0004144906997680664, -0.00039302557706832886, -0.0003715604543685913, -0.00035009533166885376, -0.0003286302089691162, -0.00030716508626937866, -0.0002856999635696411, -0.00026423484086990356, -0.00024276971817016602, -0.00022130459547042847, -0.00019983947277069092, -0.00017837435007095337, -0.00015690922737121582, -0.00013544410467147827, -0.00011397898197174072, -9.251385927200317e-05, -7.104873657226562e-05, -4.9583613872528076e-05, -2.8118491172790527e-05, -6.6533684730529785e-06, 1.481175422668457e-05, 3.627687692642212e-05, 5.774199962615967e-05, 7.920712232589722e-05, 0.00010067224502563477, 0.00012213736772537231, 0.00014360249042510986, 0.0001650676131248474, 0.00018653273582458496, 0.0002079978585243225, 0.00022946298122406006, 0.0002509281039237976, 0.00027239322662353516, 0.0002938583493232727, 0.00031532347202301025, 0.0003367885947227478, 0.00035825371742248535, 0.0003797188401222229, 0.00040118396282196045, 0.000422649085521698, 0.00044411420822143555, 0.0004655793309211731, 0.00048704445362091064, 0.0005085095763206482, 0.0005299746990203857, 0.0005514398217201233, 0.0005729049444198608, 0.0005943700671195984, 0.0006158351898193359]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 4.0, 8.0, 7.0, 10.0, 16.0, 17.0, 11.0, 19.0, 26.0, 23.0, 31.0, 27.0, 36.0, 37.0, 32.0, 42.0, 54.0, 50.0, 44.0, 57.0, 48.0, 50.0, 40.0, 39.0, 33.0, 32.0, 31.0, 25.0, 24.0, 27.0, 18.0, 17.0, 14.0, 10.0, 11.0, 7.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.37109375, -5.19659423828125, -5.0220947265625, -4.84759521484375, -4.673095703125, -4.49859619140625, -4.3240966796875, -4.14959716796875, -3.97509765625, -3.80059814453125, -3.6260986328125, -3.45159912109375, -3.277099609375, -3.10260009765625, -2.9281005859375, -2.75360107421875, -2.5791015625, -2.40460205078125, -2.2301025390625, -2.05560302734375, -1.881103515625, -1.70660400390625, -1.5321044921875, -1.35760498046875, -1.18310546875, -1.00860595703125, -0.8341064453125, -0.65960693359375, -0.485107421875, -0.31060791015625, -0.1361083984375, 0.03839111328125, 0.212890625, 0.38739013671875, 0.5618896484375, 0.73638916015625, 0.910888671875, 1.08538818359375, 1.2598876953125, 1.43438720703125, 1.60888671875, 1.78338623046875, 1.9578857421875, 2.13238525390625, 2.306884765625, 2.48138427734375, 2.6558837890625, 2.83038330078125, 3.0048828125, 3.17938232421875, 3.3538818359375, 3.52838134765625, 3.702880859375, 3.87738037109375, 4.0518798828125, 4.22637939453125, 4.40087890625, 4.57537841796875, 4.7498779296875, 4.92437744140625, 5.098876953125, 5.27337646484375, 5.4478759765625, 5.62237548828125, 5.796875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 4.0, 8.0, 15.0, 18.0, 31.0, 36.0, 50.0, 58.0, 90.0, 117.0, 202.0, 276.0, 407.0, 648.0, 973.0, 1555.0, 2507.0, 4091.0, 7049.0, 12948.0, 26140.0, 58992.0, 150188.0, 419462.0, 213651.0, 77708.0, 33700.0, 16250.0, 8495.0, 4868.0, 2851.0, 1748.0, 1095.0, 777.0, 482.0, 327.0, 192.0, 158.0, 107.0, 82.0, 50.0, 41.0, 31.0, 20.0, 18.0, 14.0, 5.0, 8.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.419921875, -3.308380126953125, -3.19683837890625, -3.085296630859375, -2.9737548828125, -2.862213134765625, -2.75067138671875, -2.639129638671875, -2.527587890625, -2.416046142578125, -2.30450439453125, -2.192962646484375, -2.0814208984375, -1.969879150390625, -1.85833740234375, -1.746795654296875, -1.63525390625, -1.523712158203125, -1.41217041015625, -1.300628662109375, -1.1890869140625, -1.077545166015625, -0.96600341796875, -0.854461669921875, -0.742919921875, -0.631378173828125, -0.51983642578125, -0.408294677734375, -0.2967529296875, -0.185211181640625, -0.07366943359375, 0.037872314453125, 0.1494140625, 0.260955810546875, 0.37249755859375, 0.484039306640625, 0.5955810546875, 0.707122802734375, 0.81866455078125, 0.930206298828125, 1.041748046875, 1.153289794921875, 1.26483154296875, 1.376373291015625, 1.4879150390625, 1.599456787109375, 1.71099853515625, 1.822540283203125, 1.93408203125, 2.045623779296875, 2.15716552734375, 2.268707275390625, 2.3802490234375, 2.491790771484375, 2.60333251953125, 2.714874267578125, 2.826416015625, 2.937957763671875, 3.04949951171875, 3.161041259765625, 3.2725830078125, 3.384124755859375, 3.49566650390625, 3.607208251953125, 3.71875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 12.0, 4.0, 5.0, 8.0, 14.0, 17.0, 19.0, 17.0, 23.0, 24.0, 26.0, 24.0, 35.0, 33.0, 46.0, 52.0, 64.0, 131.0, 1644.0, 307.0, 98.0, 60.0, 49.0, 46.0, 43.0, 30.0, 37.0, 30.0, 16.0, 21.0, 18.0, 18.0, 19.0, 11.0, 10.0, 6.0, 6.0, 5.0, 2.0, 4.0, 0.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.15625, -19.541748046875, -18.92724609375, -18.312744140625, -17.6982421875, -17.083740234375, -16.46923828125, -15.854736328125, -15.240234375, -14.625732421875, -14.01123046875, -13.396728515625, -12.7822265625, -12.167724609375, -11.55322265625, -10.938720703125, -10.32421875, -9.709716796875, -9.09521484375, -8.480712890625, -7.8662109375, -7.251708984375, -6.63720703125, -6.022705078125, -5.408203125, -4.793701171875, -4.17919921875, -3.564697265625, -2.9501953125, -2.335693359375, -1.72119140625, -1.106689453125, -0.4921875, 0.122314453125, 0.73681640625, 1.351318359375, 1.9658203125, 2.580322265625, 3.19482421875, 3.809326171875, 4.423828125, 5.038330078125, 5.65283203125, 6.267333984375, 6.8818359375, 7.496337890625, 8.11083984375, 8.725341796875, 9.33984375, 9.954345703125, 10.56884765625, 11.183349609375, 11.7978515625, 12.412353515625, 13.02685546875, 13.641357421875, 14.255859375, 14.870361328125, 15.48486328125, 16.099365234375, 16.7138671875, 17.328369140625, 17.94287109375, 18.557373046875, 19.171875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 5.0, 10.0, 6.0, 17.0, 11.0, 15.0, 20.0, 33.0, 24.0, 48.0, 57.0, 60.0, 96.0, 184.0, 355.0, 835.0, 4797.0, 249757.0, 2871453.0, 15289.0, 1444.0, 469.0, 215.0, 121.0, 95.0, 49.0, 49.0, 30.0, 26.0, 20.0, 24.0, 15.0, 15.0, 11.0, 8.0, 9.0, 4.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.125, -32.09619140625, -31.0673828125, -30.03857421875, -29.009765625, -27.98095703125, -26.9521484375, -25.92333984375, -24.89453125, -23.86572265625, -22.8369140625, -21.80810546875, -20.779296875, -19.75048828125, -18.7216796875, -17.69287109375, -16.6640625, -15.63525390625, -14.6064453125, -13.57763671875, -12.548828125, -11.52001953125, -10.4912109375, -9.46240234375, -8.43359375, -7.40478515625, -6.3759765625, -5.34716796875, -4.318359375, -3.28955078125, -2.2607421875, -1.23193359375, -0.203125, 0.82568359375, 1.8544921875, 2.88330078125, 3.912109375, 4.94091796875, 5.9697265625, 6.99853515625, 8.02734375, 9.05615234375, 10.0849609375, 11.11376953125, 12.142578125, 13.17138671875, 14.2001953125, 15.22900390625, 16.2578125, 17.28662109375, 18.3154296875, 19.34423828125, 20.373046875, 21.40185546875, 22.4306640625, 23.45947265625, 24.48828125, 25.51708984375, 26.5458984375, 27.57470703125, 28.603515625, 29.63232421875, 30.6611328125, 31.68994140625, 32.71875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 12.0, 15.0, 18.0, 45.0, 74.0, 120.0, 146.0, 170.0, 139.0, 123.0, 66.0, 44.0, 18.0, 12.0, 9.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-39.19820785522461, -38.42173767089844, -37.645267486572266, -36.868797302246094, -36.09232711791992, -35.31585693359375, -34.53938674926758, -33.762916564941406, -32.986446380615234, -32.20997619628906, -31.43350601196289, -30.65703582763672, -29.880565643310547, -29.104095458984375, -28.327625274658203, -27.55115509033203, -26.77468490600586, -25.998214721679688, -25.221744537353516, -24.445274353027344, -23.668804168701172, -22.892333984375, -22.115863800048828, -21.339393615722656, -20.56292152404785, -19.78645133972168, -19.009981155395508, -18.233510971069336, -17.457040786743164, -16.680570602416992, -15.90410041809082, -15.127630233764648, -14.351160049438477, -13.574689865112305, -12.798219680786133, -12.021749496459961, -11.245279312133789, -10.468809127807617, -9.692338943481445, -8.915868759155273, -8.139398574829102, -7.36292839050293, -6.586458206176758, -5.809988021850586, -5.033517837524414, -4.257047653198242, -3.480576992034912, -2.7041068077087402, -1.9276361465454102, -1.1511659622192383, -0.37469565868377686, 0.40177464485168457, 1.1782448291778564, 1.9547150135040283, 2.7311854362487793, 3.507655620574951, 4.284125804901123, 5.060595989227295, 5.837066173553467, 6.613536834716797, 7.390007019042969, 8.16647720336914, 8.942947387695312, 9.719417572021484, 10.495887756347656]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 7.0, 10.0, 9.0, 13.0, 9.0, 21.0, 18.0, 19.0, 14.0, 15.0, 25.0, 27.0, 26.0, 29.0, 28.0, 21.0, 39.0, 37.0, 28.0, 45.0, 46.0, 31.0, 38.0, 51.0, 42.0, 37.0, 38.0, 26.0, 32.0, 31.0, 29.0, 20.0, 19.0, 16.0, 16.0, 17.0, 9.0, 15.0, 12.0, 8.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.617916107177734, -50.75606155395508, -48.89420700073242, -47.032352447509766, -45.170494079589844, -43.30863952636719, -41.44678497314453, -39.584930419921875, -37.72307586669922, -35.86122131347656, -33.999366760253906, -32.13751220703125, -30.27565574645996, -28.413801193237305, -26.551944732666016, -24.69009017944336, -22.828235626220703, -20.966381072998047, -19.10452651977539, -17.2426700592041, -15.380815505981445, -13.518960952758789, -11.657105445861816, -9.795249938964844, -7.9333953857421875, -6.071540355682373, -4.209685325622559, -2.347830295562744, -0.4859752655029297, 1.3758792877197266, 3.237734794616699, 5.099590301513672, 6.961448669433594, 8.82330322265625, 10.685158729553223, 12.547014236450195, 14.408868789672852, 16.270723342895508, 18.132579803466797, 19.994434356689453, 21.85628890991211, 23.718143463134766, 25.579998016357422, 27.44185447692871, 29.303709030151367, 31.165563583374023, 33.02742004394531, 34.88927459716797, 36.751129150390625, 38.61298370361328, 40.47483825683594, 42.336692810058594, 44.19854736328125, 46.060401916503906, 47.92226028442383, 49.784114837646484, 51.64596939086914, 53.5078239440918, 55.36967849731445, 57.23153305053711, 59.09339141845703, 60.95524597167969, 62.817100524902344, 64.678955078125, 66.54080963134766]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 9.0, 2.0, 10.0, 12.0, 14.0, 13.0, 12.0, 12.0, 25.0, 22.0, 30.0, 25.0, 36.0, 39.0, 32.0, 44.0, 49.0, 52.0, 56.0, 38.0, 48.0, 52.0, 36.0, 43.0, 47.0, 31.0, 31.0, 25.0, 21.0, 20.0, 23.0, 21.0, 13.0, 12.0, 10.0, 7.0, 9.0, 8.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.4453125, -5.264892578125, -5.08447265625, -4.904052734375, -4.7236328125, -4.543212890625, -4.36279296875, -4.182373046875, -4.001953125, -3.821533203125, -3.64111328125, -3.460693359375, -3.2802734375, -3.099853515625, -2.91943359375, -2.739013671875, -2.55859375, -2.378173828125, -2.19775390625, -2.017333984375, -1.8369140625, -1.656494140625, -1.47607421875, -1.295654296875, -1.115234375, -0.934814453125, -0.75439453125, -0.573974609375, -0.3935546875, -0.213134765625, -0.03271484375, 0.147705078125, 0.328125, 0.508544921875, 0.68896484375, 0.869384765625, 1.0498046875, 1.230224609375, 1.41064453125, 1.591064453125, 1.771484375, 1.951904296875, 2.13232421875, 2.312744140625, 2.4931640625, 2.673583984375, 2.85400390625, 3.034423828125, 3.21484375, 3.395263671875, 3.57568359375, 3.756103515625, 3.9365234375, 4.116943359375, 4.29736328125, 4.477783203125, 4.658203125, 4.838623046875, 5.01904296875, 5.199462890625, 5.3798828125, 5.560302734375, 5.74072265625, 5.921142578125, 6.1015625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 8.0, 4.0, 8.0, 16.0, 21.0, 18.0, 19.0, 20.0, 31.0, 38.0, 23.0, 67.0, 84.0, 228.0, 1179.0, 22194.0, 2692127.0, 1463850.0, 12855.0, 881.0, 211.0, 103.0, 47.0, 42.0, 35.0, 26.0, 29.0, 15.0, 17.0, 11.0, 16.0, 16.0, 6.0, 8.0, 11.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.03125, -30.923828125, -29.81640625, -28.708984375, -27.6015625, -26.494140625, -25.38671875, -24.279296875, -23.171875, -22.064453125, -20.95703125, -19.849609375, -18.7421875, -17.634765625, -16.52734375, -15.419921875, -14.3125, -13.205078125, -12.09765625, -10.990234375, -9.8828125, -8.775390625, -7.66796875, -6.560546875, -5.453125, -4.345703125, -3.23828125, -2.130859375, -1.0234375, 0.083984375, 1.19140625, 2.298828125, 3.40625, 4.513671875, 5.62109375, 6.728515625, 7.8359375, 8.943359375, 10.05078125, 11.158203125, 12.265625, 13.373046875, 14.48046875, 15.587890625, 16.6953125, 17.802734375, 18.91015625, 20.017578125, 21.125, 22.232421875, 23.33984375, 24.447265625, 25.5546875, 26.662109375, 27.76953125, 28.876953125, 29.984375, 31.091796875, 32.19921875, 33.306640625, 34.4140625, 35.521484375, 36.62890625, 37.736328125, 38.84375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 8.0, 8.0, 10.0, 12.0, 22.0, 39.0, 56.0, 79.0, 126.0, 145.0, 200.0, 254.0, 357.0, 475.0, 553.0, 472.0, 382.0, 265.0, 184.0, 127.0, 116.0, 65.0, 40.0, 32.0, 15.0, 12.0, 8.0, 10.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.765625, -22.2021484375, -21.638671875, -21.0751953125, -20.51171875, -19.9482421875, -19.384765625, -18.8212890625, -18.2578125, -17.6943359375, -17.130859375, -16.5673828125, -16.00390625, -15.4404296875, -14.876953125, -14.3134765625, -13.75, -13.1865234375, -12.623046875, -12.0595703125, -11.49609375, -10.9326171875, -10.369140625, -9.8056640625, -9.2421875, -8.6787109375, -8.115234375, -7.5517578125, -6.98828125, -6.4248046875, -5.861328125, -5.2978515625, -4.734375, -4.1708984375, -3.607421875, -3.0439453125, -2.48046875, -1.9169921875, -1.353515625, -0.7900390625, -0.2265625, 0.3369140625, 0.900390625, 1.4638671875, 2.02734375, 2.5908203125, 3.154296875, 3.7177734375, 4.28125, 4.8447265625, 5.408203125, 5.9716796875, 6.53515625, 7.0986328125, 7.662109375, 8.2255859375, 8.7890625, 9.3525390625, 9.916015625, 10.4794921875, 11.04296875, 11.6064453125, 12.169921875, 12.7333984375, 13.296875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 6.0, 11.0, 12.0, 15.0, 13.0, 41.0, 71.0, 84.0, 137.0, 197.0, 316.0, 827.0, 5986.0, 421980.0, 3726651.0, 34887.0, 1753.0, 481.0, 285.0, 172.0, 113.0, 87.0, 51.0, 39.0, 25.0, 17.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.1875, -60.197265625, -58.20703125, -56.216796875, -54.2265625, -52.236328125, -50.24609375, -48.255859375, -46.265625, -44.275390625, -42.28515625, -40.294921875, -38.3046875, -36.314453125, -34.32421875, -32.333984375, -30.34375, -28.353515625, -26.36328125, -24.373046875, -22.3828125, -20.392578125, -18.40234375, -16.412109375, -14.421875, -12.431640625, -10.44140625, -8.451171875, -6.4609375, -4.470703125, -2.48046875, -0.490234375, 1.5, 3.490234375, 5.48046875, 7.470703125, 9.4609375, 11.451171875, 13.44140625, 15.431640625, 17.421875, 19.412109375, 21.40234375, 23.392578125, 25.3828125, 27.373046875, 29.36328125, 31.353515625, 33.34375, 35.333984375, 37.32421875, 39.314453125, 41.3046875, 43.294921875, 45.28515625, 47.275390625, 49.265625, 51.255859375, 53.24609375, 55.236328125, 57.2265625, 59.216796875, 61.20703125, 63.197265625, 65.1875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 6.0, 10.0, 15.0, 18.0, 33.0, 60.0, 87.0, 96.0, 109.0, 106.0, 131.0, 95.0, 80.0, 64.0, 34.0, 33.0, 19.0, 5.0, 7.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.925573348999023, -26.835285186767578, -24.744997024536133, -22.654708862304688, -20.564422607421875, -18.474132537841797, -16.383846282958984, -14.293558120727539, -12.203269958496094, -10.112981796264648, -8.022693634033203, -5.932406425476074, -3.842118263244629, -1.7518301010131836, 0.3384571075439453, 2.4287452697753906, 4.519033432006836, 6.609321594238281, 8.699609756469727, 10.789896965026855, 12.8801851272583, 14.970473289489746, 17.060760498046875, 19.15104866027832, 21.241336822509766, 23.33162498474121, 25.421913146972656, 27.51219940185547, 29.602489471435547, 31.69277572631836, 33.78306579589844, 35.87335205078125, 37.963645935058594, 40.053932189941406, 42.144222259521484, 44.2345085144043, 46.324798583984375, 48.41508483886719, 50.50537109375, 52.59566116333008, 54.685951232910156, 56.77623748779297, 58.86652755737305, 60.95681381225586, 63.04710388183594, 65.13739013671875, 67.22767639160156, 69.31796264648438, 71.40824890136719, 73.49853515625, 75.58882141113281, 77.67911529541016, 79.76940155029297, 81.85968780517578, 83.9499740600586, 86.04026794433594, 88.13055419921875, 90.22084045410156, 92.31112670898438, 94.40142059326172, 96.49170684814453, 98.58199310302734, 100.67227935791016, 102.7625732421875, 104.85285949707031]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 2.0, 4.0, 4.0, 8.0, 12.0, 11.0, 16.0, 15.0, 17.0, 13.0, 24.0, 28.0, 29.0, 32.0, 24.0, 45.0, 35.0, 36.0, 33.0, 35.0, 44.0, 35.0, 48.0, 49.0, 38.0, 33.0, 34.0, 30.0, 37.0, 26.0, 27.0, 37.0, 16.0, 24.0, 19.0, 15.0, 11.0, 16.0, 8.0, 6.0, 3.0, 8.0, 3.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.36811828613281, -48.77981185913086, -47.191505432128906, -45.60319900512695, -44.014892578125, -42.42658233642578, -40.83827590942383, -39.249969482421875, -37.66166305541992, -36.07335662841797, -34.485050201416016, -32.89674377441406, -31.308435440063477, -29.720129013061523, -28.131820678710938, -26.543514251708984, -24.95520782470703, -23.366901397705078, -21.778594970703125, -20.19028663635254, -18.601980209350586, -17.013673782348633, -15.425366401672363, -13.837059020996094, -12.24875259399414, -10.660446166992188, -9.072138786315918, -7.483831882476807, -5.895524978637695, -4.307218074798584, -2.7189111709594727, -1.1306037902832031, 0.4577064514160156, 2.046013355255127, 3.6343202590942383, 5.22262716293335, 6.810934066772461, 8.399240493774414, 9.987547874450684, 11.575855255126953, 13.164161682128906, 14.75246810913086, 16.340774536132812, 17.9290828704834, 19.51738929748535, 21.105695724487305, 22.69400405883789, 24.282310485839844, 25.870616912841797, 27.45892333984375, 29.047229766845703, 30.63553810119629, 32.223846435546875, 33.81215286254883, 35.40045928955078, 36.988765716552734, 38.57707214355469, 40.16537857055664, 41.753684997558594, 43.34199142456055, 44.9302978515625, 46.51860809326172, 48.10691452026367, 49.695220947265625, 51.28352737426758]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 10.0, 7.0, 16.0, 27.0, 14.0, 19.0, 22.0, 15.0, 21.0, 28.0, 35.0, 41.0, 42.0, 37.0, 41.0, 51.0, 40.0, 55.0, 45.0, 44.0, 45.0, 45.0, 35.0, 29.0, 38.0, 22.0, 31.0, 23.0, 18.0, 21.0, 11.0, 12.0, 14.0, 10.0, 8.0, 2.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.171875, -4.9876708984375, -4.803466796875, -4.6192626953125, -4.43505859375, -4.2508544921875, -4.066650390625, -3.8824462890625, -3.6982421875, -3.5140380859375, -3.329833984375, -3.1456298828125, -2.96142578125, -2.7772216796875, -2.593017578125, -2.4088134765625, -2.224609375, -2.0404052734375, -1.856201171875, -1.6719970703125, -1.48779296875, -1.3035888671875, -1.119384765625, -0.9351806640625, -0.7509765625, -0.5667724609375, -0.382568359375, -0.1983642578125, -0.01416015625, 0.1700439453125, 0.354248046875, 0.5384521484375, 0.72265625, 0.9068603515625, 1.091064453125, 1.2752685546875, 1.45947265625, 1.6436767578125, 1.827880859375, 2.0120849609375, 2.1962890625, 2.3804931640625, 2.564697265625, 2.7489013671875, 2.93310546875, 3.1173095703125, 3.301513671875, 3.4857177734375, 3.669921875, 3.8541259765625, 4.038330078125, 4.2225341796875, 4.40673828125, 4.5909423828125, 4.775146484375, 4.9593505859375, 5.1435546875, 5.3277587890625, 5.511962890625, 5.6961669921875, 5.88037109375, 6.0645751953125, 6.248779296875, 6.4329833984375, 6.6171875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 9.0, 5.0, 17.0, 18.0, 29.0, 34.0, 72.0, 109.0, 159.0, 244.0, 312.0, 432.0, 680.0, 1054.0, 1509.0, 2269.0, 3424.0, 5201.0, 7763.0, 12182.0, 18905.0, 29713.0, 47151.0, 74350.0, 116617.0, 169135.0, 184449.0, 133856.0, 86320.0, 54511.0, 34987.0, 21996.0, 14159.0, 9127.0, 5947.0, 3851.0, 2574.0, 1805.0, 1173.0, 769.0, 526.0, 386.0, 250.0, 148.0, 124.0, 90.0, 52.0, 31.0, 17.0, 11.0, 4.0, 5.0, 1.0, 5.0, 1.0, 2.0], "bins": [-0.61962890625, -0.6014938354492188, -0.5833587646484375, -0.5652236938476562, -0.547088623046875, -0.5289535522460938, -0.5108184814453125, -0.49268341064453125, -0.47454833984375, -0.45641326904296875, -0.4382781982421875, -0.42014312744140625, -0.402008056640625, -0.38387298583984375, -0.3657379150390625, -0.34760284423828125, -0.3294677734375, -0.31133270263671875, -0.2931976318359375, -0.27506256103515625, -0.256927490234375, -0.23879241943359375, -0.2206573486328125, -0.20252227783203125, -0.18438720703125, -0.16625213623046875, -0.1481170654296875, -0.12998199462890625, -0.111846923828125, -0.09371185302734375, -0.0755767822265625, -0.05744171142578125, -0.039306640625, -0.02117156982421875, -0.0030364990234375, 0.01509857177734375, 0.033233642578125, 0.05136871337890625, 0.0695037841796875, 0.08763885498046875, 0.10577392578125, 0.12390899658203125, 0.1420440673828125, 0.16017913818359375, 0.178314208984375, 0.19644927978515625, 0.2145843505859375, 0.23271942138671875, 0.2508544921875, 0.26898956298828125, 0.2871246337890625, 0.30525970458984375, 0.323394775390625, 0.34152984619140625, 0.3596649169921875, 0.37779998779296875, 0.39593505859375, 0.41407012939453125, 0.4322052001953125, 0.45034027099609375, 0.468475341796875, 0.48661041259765625, 0.5047454833984375, 0.5228805541992188, 0.541015625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 7.0, 5.0, 6.0, 14.0, 12.0, 15.0, 16.0, 18.0, 26.0, 20.0, 20.0, 35.0, 28.0, 29.0, 45.0, 35.0, 48.0, 46.0, 45.0, 1063.0, 37.0, 50.0, 33.0, 40.0, 38.0, 37.0, 32.0, 30.0, 29.0, 27.0, 18.0, 23.0, 20.0, 12.0, 15.0, 12.0, 9.0, 7.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.28125, -4.1644287109375, -4.047607421875, -3.9307861328125, -3.81396484375, -3.6971435546875, -3.580322265625, -3.4635009765625, -3.3466796875, -3.2298583984375, -3.113037109375, -2.9962158203125, -2.87939453125, -2.7625732421875, -2.645751953125, -2.5289306640625, -2.412109375, -2.2952880859375, -2.178466796875, -2.0616455078125, -1.94482421875, -1.8280029296875, -1.711181640625, -1.5943603515625, -1.4775390625, -1.3607177734375, -1.243896484375, -1.1270751953125, -1.01025390625, -0.8934326171875, -0.776611328125, -0.6597900390625, -0.54296875, -0.4261474609375, -0.309326171875, -0.1925048828125, -0.07568359375, 0.0411376953125, 0.157958984375, 0.2747802734375, 0.3916015625, 0.5084228515625, 0.625244140625, 0.7420654296875, 0.85888671875, 0.9757080078125, 1.092529296875, 1.2093505859375, 1.326171875, 1.4429931640625, 1.559814453125, 1.6766357421875, 1.79345703125, 1.9102783203125, 2.027099609375, 2.1439208984375, 2.2607421875, 2.3775634765625, 2.494384765625, 2.6112060546875, 2.72802734375, 2.8448486328125, 2.961669921875, 3.0784912109375, 3.1953125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 16.0, 9.0, 11.0, 12.0, 25.0, 51.0, 71.0, 103.0, 138.0, 212.0, 338.0, 447.0, 766.0, 1148.0, 1648.0, 2558.0, 3878.0, 6169.0, 9211.0, 14367.0, 21638.0, 33773.0, 52000.0, 81846.0, 127891.0, 1197211.0, 198494.0, 122455.0, 78545.0, 50216.0, 32139.0, 20634.0, 13481.0, 8813.0, 5665.0, 3761.0, 2489.0, 1497.0, 1136.0, 748.0, 451.0, 344.0, 219.0, 169.0, 107.0, 73.0, 61.0, 28.0, 29.0, 18.0, 12.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0], "bins": [-0.556640625, -0.5397491455078125, -0.522857666015625, -0.5059661865234375, -0.48907470703125, -0.4721832275390625, -0.455291748046875, -0.4384002685546875, -0.4215087890625, -0.4046173095703125, -0.387725830078125, -0.3708343505859375, -0.35394287109375, -0.3370513916015625, -0.320159912109375, -0.3032684326171875, -0.286376953125, -0.2694854736328125, -0.252593994140625, -0.2357025146484375, -0.21881103515625, -0.2019195556640625, -0.185028076171875, -0.1681365966796875, -0.1512451171875, -0.1343536376953125, -0.117462158203125, -0.1005706787109375, -0.08367919921875, -0.0667877197265625, -0.049896240234375, -0.0330047607421875, -0.01611328125, 0.0007781982421875, 0.017669677734375, 0.0345611572265625, 0.05145263671875, 0.0683441162109375, 0.085235595703125, 0.1021270751953125, 0.1190185546875, 0.1359100341796875, 0.152801513671875, 0.1696929931640625, 0.18658447265625, 0.2034759521484375, 0.220367431640625, 0.2372589111328125, 0.254150390625, 0.2710418701171875, 0.287933349609375, 0.3048248291015625, 0.32171630859375, 0.3386077880859375, 0.355499267578125, 0.3723907470703125, 0.3892822265625, 0.4061737060546875, 0.423065185546875, 0.4399566650390625, 0.45684814453125, 0.4737396240234375, 0.490631103515625, 0.5075225830078125, 0.5244140625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 3.0, 4.0, 10.0, 4.0, 6.0, 8.0, 11.0, 19.0, 16.0, 20.0, 30.0, 32.0, 38.0, 41.0, 45.0, 54.0, 50.0, 46.0, 66.0, 72.0, 53.0, 59.0, 50.0, 44.0, 38.0, 34.0, 29.0, 20.0, 22.0, 20.0, 10.0, 10.0, 9.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00145721435546875, -0.001406162977218628, -0.0013551115989685059, -0.0013040602207183838, -0.0012530088424682617, -0.0012019574642181396, -0.0011509060859680176, -0.0010998547077178955, -0.0010488033294677734, -0.0009977519512176514, -0.0009467005729675293, -0.0008956491947174072, -0.0008445978164672852, -0.0007935464382171631, -0.000742495059967041, -0.0006914436817169189, -0.0006403923034667969, -0.0005893409252166748, -0.0005382895469665527, -0.00048723816871643066, -0.0004361867904663086, -0.0003851354122161865, -0.00033408403396606445, -0.0002830326557159424, -0.0002319812774658203, -0.00018092989921569824, -0.00012987852096557617, -7.88271427154541e-05, -2.777576446533203e-05, 2.327561378479004e-05, 7.432699203491211e-05, 0.00012537837028503418, 0.00017642974853515625, 0.00022748112678527832, 0.0002785325050354004, 0.00032958388328552246, 0.00038063526153564453, 0.0004316866397857666, 0.00048273801803588867, 0.0005337893962860107, 0.0005848407745361328, 0.0006358921527862549, 0.000686943531036377, 0.000737994909286499, 0.0007890462875366211, 0.0008400976657867432, 0.0008911490440368652, 0.0009422004222869873, 0.0009932518005371094, 0.0010443031787872314, 0.0010953545570373535, 0.0011464059352874756, 0.0011974573135375977, 0.0012485086917877197, 0.0012995600700378418, 0.0013506114482879639, 0.001401662826538086, 0.001452714204788208, 0.00150376558303833, 0.0015548169612884521, 0.0016058683395385742, 0.0016569197177886963, 0.0017079710960388184, 0.0017590224742889404, 0.0018100738525390625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 5.0, 6.0, 6.0, 8.0, 8.0, 13.0, 18.0, 36.0, 44.0, 55.0, 57.0, 104.0, 119.0, 196.0, 302.0, 579.0, 3853.0, 1032725.0, 8751.0, 627.0, 324.0, 198.0, 119.0, 108.0, 78.0, 41.0, 34.0, 34.0, 17.0, 21.0, 9.0, 9.0, 11.0, 9.0, 8.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.035064697265625, -0.033987998962402344, -0.03291130065917969, -0.03183460235595703, -0.030757904052734375, -0.02968120574951172, -0.028604507446289062, -0.027527809143066406, -0.02645111083984375, -0.025374412536621094, -0.024297714233398438, -0.02322101593017578, -0.022144317626953125, -0.02106761932373047, -0.019990921020507812, -0.018914222717285156, -0.0178375244140625, -0.016760826110839844, -0.015684127807617188, -0.014607429504394531, -0.013530731201171875, -0.012454032897949219, -0.011377334594726562, -0.010300636291503906, -0.00922393798828125, -0.008147239685058594, -0.0070705413818359375, -0.005993843078613281, -0.004917144775390625, -0.0038404464721679688, -0.0027637481689453125, -0.0016870498657226562, -0.0006103515625, 0.00046634674072265625, 0.0015430450439453125, 0.0026197433471679688, 0.003696441650390625, 0.004773139953613281, 0.0058498382568359375, 0.006926536560058594, 0.00800323486328125, 0.009079933166503906, 0.010156631469726562, 0.011233329772949219, 0.012310028076171875, 0.013386726379394531, 0.014463424682617188, 0.015540122985839844, 0.0166168212890625, 0.017693519592285156, 0.018770217895507812, 0.01984691619873047, 0.020923614501953125, 0.02200031280517578, 0.023077011108398438, 0.024153709411621094, 0.02523040771484375, 0.026307106018066406, 0.027383804321289062, 0.02846050262451172, 0.029537200927734375, 0.03061389923095703, 0.03169059753417969, 0.032767295837402344, 0.033843994140625]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 33.0, 116.0, 327.0, 351.0, 148.0, 33.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00282714469358325, -0.002736028516665101, -0.002644912339746952, -0.002553796162828803, -0.002462679985910654, -0.002371563808992505, -0.002280447632074356, -0.002189331455156207, -0.002098215278238058, -0.002007099101319909, -0.00191598292440176, -0.001824866747483611, -0.0017337505705654621, -0.0016426343936473131, -0.0015515182167291641, -0.0014604020398110151, -0.0013692858628928661, -0.0012781696859747171, -0.0011870535090565681, -0.0010959373321384192, -0.0010048211552202702, -0.0009137049783021212, -0.0008225888013839722, -0.0007314726244658232, -0.0006403564475476742, -0.0005492402706295252, -0.0004581240937113762, -0.0003670079167932272, -0.0002758917398750782, -0.0001847755629569292, -9.365938603878021e-05, -2.543209120631218e-06, 8.857273496687412e-05, 0.00017968891188502312, 0.0002708050888031721, 0.0003619212657213211, 0.0004530374426394701, 0.0005441536195576191, 0.0006352697964757681, 0.0007263859733939171, 0.0008175021503120661, 0.0009086183272302151, 0.000999734504148364, 0.001090850681066513, 0.001181966857984662, 0.001273083034902811, 0.00136419921182096, 0.001455315388739109, 0.001546431565657258, 0.001637547742575407, 0.001728663919493556, 0.001819780096411705, 0.001910896273329854, 0.002002012450248003, 0.002093128627166152, 0.002184244804084301, 0.00227536098100245, 0.002366477157920599, 0.002457593334838748, 0.002548709511756897, 0.002639825688675046, 0.002730941865593195, 0.002822058042511344, 0.002913174219429493, 0.003004290396347642]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 2.0, 4.0, 6.0, 7.0, 13.0, 9.0, 14.0, 12.0, 16.0, 23.0, 25.0, 18.0, 24.0, 42.0, 21.0, 21.0, 43.0, 46.0, 31.0, 36.0, 33.0, 37.0, 36.0, 41.0, 33.0, 39.0, 42.0, 29.0, 21.0, 39.0, 27.0, 38.0, 23.0, 18.0, 26.0, 18.0, 25.0, 7.0, 15.0, 4.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.0008667707443237305, -0.0008421819657087326, -0.0008175931870937347, -0.0007930044084787369, -0.000768415629863739, -0.0007438268512487411, -0.0007192380726337433, -0.0006946492940187454, -0.0006700605154037476, -0.0006454717367887497, -0.0006208829581737518, -0.000596294179558754, -0.0005717054009437561, -0.0005471166223287582, -0.0005225278437137604, -0.0004979390650987625, -0.00047335028648376465, -0.0004487615078687668, -0.0004241727292537689, -0.00039958395063877106, -0.0003749951720237732, -0.00035040639340877533, -0.00032581761479377747, -0.0003012288361787796, -0.00027664005756378174, -0.0002520512789487839, -0.000227462500333786, -0.00020287372171878815, -0.00017828494310379028, -0.00015369616448879242, -0.00012910738587379456, -0.00010451860725879669, -7.992982864379883e-05, -5.5341050028800964e-05, -3.07522714138031e-05, -6.163492798805237e-06, 1.8425285816192627e-05, 4.301406443119049e-05, 6.760284304618835e-05, 9.219162166118622e-05, 0.00011678040027618408, 0.00014136917889118195, 0.0001659579575061798, 0.00019054673612117767, 0.00021513551473617554, 0.0002397242933511734, 0.00026431307196617126, 0.00028890185058116913, 0.000313490629196167, 0.00033807940781116486, 0.0003626681864261627, 0.0003872569650411606, 0.00041184574365615845, 0.0004364345222711563, 0.0004610233008861542, 0.00048561207950115204, 0.0005102008581161499, 0.0005347896367311478, 0.0005593784153461456, 0.0005839671939611435, 0.0006085559725761414, 0.0006331447511911392, 0.0006577335298061371, 0.000682322308421135, 0.0007069110870361328]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 10.0, 7.0, 16.0, 27.0, 14.0, 19.0, 22.0, 15.0, 21.0, 28.0, 35.0, 41.0, 42.0, 37.0, 41.0, 51.0, 40.0, 55.0, 45.0, 44.0, 45.0, 45.0, 35.0, 29.0, 38.0, 22.0, 31.0, 23.0, 18.0, 21.0, 11.0, 12.0, 14.0, 10.0, 8.0, 2.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.171875, -4.9876708984375, -4.803466796875, -4.6192626953125, -4.43505859375, -4.2508544921875, -4.066650390625, -3.8824462890625, -3.6982421875, -3.5140380859375, -3.329833984375, -3.1456298828125, -2.96142578125, -2.7772216796875, -2.593017578125, -2.4088134765625, -2.224609375, -2.0404052734375, -1.856201171875, -1.6719970703125, -1.48779296875, -1.3035888671875, -1.119384765625, -0.9351806640625, -0.7509765625, -0.5667724609375, -0.382568359375, -0.1983642578125, -0.01416015625, 0.1700439453125, 0.354248046875, 0.5384521484375, 0.72265625, 0.9068603515625, 1.091064453125, 1.2752685546875, 1.45947265625, 1.6436767578125, 1.827880859375, 2.0120849609375, 2.1962890625, 2.3804931640625, 2.564697265625, 2.7489013671875, 2.93310546875, 3.1173095703125, 3.301513671875, 3.4857177734375, 3.669921875, 3.8541259765625, 4.038330078125, 4.2225341796875, 4.40673828125, 4.5909423828125, 4.775146484375, 4.9593505859375, 5.1435546875, 5.3277587890625, 5.511962890625, 5.6961669921875, 5.88037109375, 6.0645751953125, 6.248779296875, 6.4329833984375, 6.6171875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 12.0, 16.0, 20.0, 24.0, 45.0, 47.0, 83.0, 129.0, 185.0, 335.0, 465.0, 774.0, 1322.0, 2357.0, 4412.0, 9562.0, 25999.0, 103948.0, 561044.0, 259372.0, 48936.0, 15294.0, 6531.0, 3262.0, 1771.0, 933.0, 563.0, 351.0, 256.0, 151.0, 105.0, 81.0, 38.0, 37.0, 22.0, 21.0, 10.0, 14.0, 6.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.01171875, -4.84326171875, -4.6748046875, -4.50634765625, -4.337890625, -4.16943359375, -4.0009765625, -3.83251953125, -3.6640625, -3.49560546875, -3.3271484375, -3.15869140625, -2.990234375, -2.82177734375, -2.6533203125, -2.48486328125, -2.31640625, -2.14794921875, -1.9794921875, -1.81103515625, -1.642578125, -1.47412109375, -1.3056640625, -1.13720703125, -0.96875, -0.80029296875, -0.6318359375, -0.46337890625, -0.294921875, -0.12646484375, 0.0419921875, 0.21044921875, 0.37890625, 0.54736328125, 0.7158203125, 0.88427734375, 1.052734375, 1.22119140625, 1.3896484375, 1.55810546875, 1.7265625, 1.89501953125, 2.0634765625, 2.23193359375, 2.400390625, 2.56884765625, 2.7373046875, 2.90576171875, 3.07421875, 3.24267578125, 3.4111328125, 3.57958984375, 3.748046875, 3.91650390625, 4.0849609375, 4.25341796875, 4.421875, 4.59033203125, 4.7587890625, 4.92724609375, 5.095703125, 5.26416015625, 5.4326171875, 5.60107421875, 5.76953125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 11.0, 7.0, 5.0, 15.0, 14.0, 12.0, 18.0, 10.0, 22.0, 18.0, 29.0, 30.0, 32.0, 29.0, 29.0, 53.0, 45.0, 46.0, 84.0, 1572.0, 426.0, 75.0, 53.0, 53.0, 51.0, 28.0, 38.0, 37.0, 35.0, 30.0, 24.0, 17.0, 12.0, 13.0, 16.0, 12.0, 9.0, 4.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-18.6875, -18.1201171875, -17.552734375, -16.9853515625, -16.41796875, -15.8505859375, -15.283203125, -14.7158203125, -14.1484375, -13.5810546875, -13.013671875, -12.4462890625, -11.87890625, -11.3115234375, -10.744140625, -10.1767578125, -9.609375, -9.0419921875, -8.474609375, -7.9072265625, -7.33984375, -6.7724609375, -6.205078125, -5.6376953125, -5.0703125, -4.5029296875, -3.935546875, -3.3681640625, -2.80078125, -2.2333984375, -1.666015625, -1.0986328125, -0.53125, 0.0361328125, 0.603515625, 1.1708984375, 1.73828125, 2.3056640625, 2.873046875, 3.4404296875, 4.0078125, 4.5751953125, 5.142578125, 5.7099609375, 6.27734375, 6.8447265625, 7.412109375, 7.9794921875, 8.546875, 9.1142578125, 9.681640625, 10.2490234375, 10.81640625, 11.3837890625, 11.951171875, 12.5185546875, 13.0859375, 13.6533203125, 14.220703125, 14.7880859375, 15.35546875, 15.9228515625, 16.490234375, 17.0576171875, 17.625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 6.0, 7.0, 6.0, 6.0, 10.0, 14.0, 19.0, 14.0, 15.0, 31.0, 28.0, 41.0, 56.0, 66.0, 122.0, 151.0, 322.0, 652.0, 3184.0, 104387.0, 3021943.0, 12161.0, 1294.0, 411.0, 227.0, 136.0, 91.0, 63.0, 47.0, 42.0, 25.0, 21.0, 18.0, 20.0, 11.0, 15.0, 5.0, 5.0, 14.0, 6.0, 1.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-32.875, -31.886474609375, -30.89794921875, -29.909423828125, -28.9208984375, -27.932373046875, -26.94384765625, -25.955322265625, -24.966796875, -23.978271484375, -22.98974609375, -22.001220703125, -21.0126953125, -20.024169921875, -19.03564453125, -18.047119140625, -17.05859375, -16.070068359375, -15.08154296875, -14.093017578125, -13.1044921875, -12.115966796875, -11.12744140625, -10.138916015625, -9.150390625, -8.161865234375, -7.17333984375, -6.184814453125, -5.1962890625, -4.207763671875, -3.21923828125, -2.230712890625, -1.2421875, -0.253662109375, 0.73486328125, 1.723388671875, 2.7119140625, 3.700439453125, 4.68896484375, 5.677490234375, 6.666015625, 7.654541015625, 8.64306640625, 9.631591796875, 10.6201171875, 11.608642578125, 12.59716796875, 13.585693359375, 14.57421875, 15.562744140625, 16.55126953125, 17.539794921875, 18.5283203125, 19.516845703125, 20.50537109375, 21.493896484375, 22.482421875, 23.470947265625, 24.45947265625, 25.447998046875, 26.4365234375, 27.425048828125, 28.41357421875, 29.402099609375, 30.390625]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 36.0, 450.0, 490.0, 36.0, 2.0, 0.0, 0.0, 1.0], "bins": [-173.21722412109375, -170.23013305664062, -167.24305725097656, -164.25596618652344, -161.26889038085938, -158.28179931640625, -155.29470825195312, -152.30763244628906, -149.32054138183594, -146.3334503173828, -143.34637451171875, -140.35928344726562, -137.37220764160156, -134.38511657714844, -131.39804077148438, -128.41094970703125, -125.42386627197266, -122.43678283691406, -119.44969940185547, -116.46261596679688, -113.47552490234375, -110.48844146728516, -107.50135803222656, -104.51427459716797, -101.52719116210938, -98.54010772705078, -95.55302429199219, -92.56593322753906, -89.57884979248047, -86.59176635742188, -83.60468292236328, -80.61759948730469, -77.63050842285156, -74.64342498779297, -71.65634155273438, -68.66925048828125, -65.68216705322266, -62.69508361816406, -59.70800018310547, -56.720916748046875, -53.73383331298828, -50.74674987792969, -47.75966262817383, -44.772579193115234, -41.785491943359375, -38.79840850830078, -35.81132507324219, -32.824241638183594, -29.8371524810791, -26.850067138671875, -23.86298370361328, -20.875898361206055, -17.888813018798828, -14.901727676391602, -11.914644241333008, -8.927558898925781, -5.940473556518555, -2.9533886909484863, 0.03369617462158203, 3.020780563354492, 6.007865905761719, 8.994951248168945, 11.982034683227539, 14.969120025634766, 17.956205368041992]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 1.0, 7.0, 10.0, 5.0, 11.0, 11.0, 17.0, 22.0, 19.0, 25.0, 20.0, 27.0, 26.0, 36.0, 39.0, 36.0, 42.0, 35.0, 29.0, 33.0, 34.0, 38.0, 56.0, 39.0, 41.0, 42.0, 45.0, 27.0, 31.0, 14.0, 25.0, 26.0, 24.0, 29.0, 13.0, 6.0, 17.0, 7.0, 9.0, 8.0, 6.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-61.63927459716797, -59.73326873779297, -57.827266693115234, -55.921260833740234, -54.0152587890625, -52.1092529296875, -50.2032470703125, -48.2972412109375, -46.391239166259766, -44.485233306884766, -42.57923126220703, -40.67322540283203, -38.76721954345703, -36.8612174987793, -34.9552116394043, -33.04920959472656, -31.143203735351562, -29.237199783325195, -27.331195831298828, -25.425189971923828, -23.51918601989746, -21.613182067871094, -19.707176208496094, -17.801172256469727, -15.89516830444336, -13.989164352416992, -12.083159446716309, -10.177154541015625, -8.271150588989258, -6.365146636962891, -4.459141731262207, -2.5531368255615234, -0.6471328735351562, 1.2588715553283691, 3.1648759841918945, 5.07088041305542, 6.976884841918945, 8.882888793945312, 10.788893699645996, 12.69489860534668, 14.600902557373047, 16.506906509399414, 18.41291046142578, 20.31891632080078, 22.22492027282715, 24.130924224853516, 26.036930084228516, 27.942934036254883, 29.84893798828125, 31.754941940307617, 33.660945892333984, 35.566951751708984, 37.47295379638672, 39.37895965576172, 41.28496551513672, 43.19097137451172, 45.09697341918945, 47.00297927856445, 48.90898132324219, 50.81498718261719, 52.72099304199219, 54.62699508666992, 56.53300094604492, 58.439002990722656, 60.345008850097656]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 11.0, 13.0, 15.0, 20.0, 21.0, 16.0, 19.0, 28.0, 21.0, 30.0, 37.0, 32.0, 45.0, 32.0, 46.0, 49.0, 46.0, 54.0, 39.0, 47.0, 42.0, 36.0, 36.0, 36.0, 35.0, 22.0, 26.0, 25.0, 21.0, 18.0, 14.0, 12.0, 10.0, 11.0, 8.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.17578125, -4.98974609375, -4.8037109375, -4.61767578125, -4.431640625, -4.24560546875, -4.0595703125, -3.87353515625, -3.6875, -3.50146484375, -3.3154296875, -3.12939453125, -2.943359375, -2.75732421875, -2.5712890625, -2.38525390625, -2.19921875, -2.01318359375, -1.8271484375, -1.64111328125, -1.455078125, -1.26904296875, -1.0830078125, -0.89697265625, -0.7109375, -0.52490234375, -0.3388671875, -0.15283203125, 0.033203125, 0.21923828125, 0.4052734375, 0.59130859375, 0.77734375, 0.96337890625, 1.1494140625, 1.33544921875, 1.521484375, 1.70751953125, 1.8935546875, 2.07958984375, 2.265625, 2.45166015625, 2.6376953125, 2.82373046875, 3.009765625, 3.19580078125, 3.3818359375, 3.56787109375, 3.75390625, 3.93994140625, 4.1259765625, 4.31201171875, 4.498046875, 4.68408203125, 4.8701171875, 5.05615234375, 5.2421875, 5.42822265625, 5.6142578125, 5.80029296875, 5.986328125, 6.17236328125, 6.3583984375, 6.54443359375, 6.73046875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 4.0, 5.0, 6.0, 9.0, 12.0, 17.0, 22.0, 27.0, 31.0, 56.0, 69.0, 163.0, 250.0, 602.0, 1643.0, 6287.0, 31403.0, 245441.0, 2270847.0, 1476658.0, 134269.0, 19703.0, 4373.0, 1260.0, 479.0, 240.0, 152.0, 70.0, 39.0, 38.0, 20.0, 19.0, 24.0, 11.0, 15.0, 4.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.390625, -12.9267578125, -12.462890625, -11.9990234375, -11.53515625, -11.0712890625, -10.607421875, -10.1435546875, -9.6796875, -9.2158203125, -8.751953125, -8.2880859375, -7.82421875, -7.3603515625, -6.896484375, -6.4326171875, -5.96875, -5.5048828125, -5.041015625, -4.5771484375, -4.11328125, -3.6494140625, -3.185546875, -2.7216796875, -2.2578125, -1.7939453125, -1.330078125, -0.8662109375, -0.40234375, 0.0615234375, 0.525390625, 0.9892578125, 1.453125, 1.9169921875, 2.380859375, 2.8447265625, 3.30859375, 3.7724609375, 4.236328125, 4.7001953125, 5.1640625, 5.6279296875, 6.091796875, 6.5556640625, 7.01953125, 7.4833984375, 7.947265625, 8.4111328125, 8.875, 9.3388671875, 9.802734375, 10.2666015625, 10.73046875, 11.1943359375, 11.658203125, 12.1220703125, 12.5859375, 13.0498046875, 13.513671875, 13.9775390625, 14.44140625, 14.9052734375, 15.369140625, 15.8330078125, 16.296875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 8.0, 10.0, 14.0, 22.0, 31.0, 49.0, 67.0, 111.0, 151.0, 264.0, 443.0, 601.0, 677.0, 550.0, 398.0, 263.0, 162.0, 116.0, 49.0, 26.0, 25.0, 10.0, 9.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.203125, -17.483154296875, -16.76318359375, -16.043212890625, -15.3232421875, -14.603271484375, -13.88330078125, -13.163330078125, -12.443359375, -11.723388671875, -11.00341796875, -10.283447265625, -9.5634765625, -8.843505859375, -8.12353515625, -7.403564453125, -6.68359375, -5.963623046875, -5.24365234375, -4.523681640625, -3.8037109375, -3.083740234375, -2.36376953125, -1.643798828125, -0.923828125, -0.203857421875, 0.51611328125, 1.236083984375, 1.9560546875, 2.676025390625, 3.39599609375, 4.115966796875, 4.8359375, 5.555908203125, 6.27587890625, 6.995849609375, 7.7158203125, 8.435791015625, 9.15576171875, 9.875732421875, 10.595703125, 11.315673828125, 12.03564453125, 12.755615234375, 13.4755859375, 14.195556640625, 14.91552734375, 15.635498046875, 16.35546875, 17.075439453125, 17.79541015625, 18.515380859375, 19.2353515625, 19.955322265625, 20.67529296875, 21.395263671875, 22.115234375, 22.835205078125, 23.55517578125, 24.275146484375, 24.9951171875, 25.715087890625, 26.43505859375, 27.155029296875, 27.875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 9.0, 5.0, 17.0, 30.0, 38.0, 73.0, 109.0, 222.0, 505.0, 2504.0, 92671.0, 4040416.0, 54739.0, 1931.0, 480.0, 209.0, 109.0, 69.0, 55.0, 37.0, 10.0, 14.0, 12.0, 7.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.03125, -59.68603515625, -57.3408203125, -54.99560546875, -52.650390625, -50.30517578125, -47.9599609375, -45.61474609375, -43.26953125, -40.92431640625, -38.5791015625, -36.23388671875, -33.888671875, -31.54345703125, -29.1982421875, -26.85302734375, -24.5078125, -22.16259765625, -19.8173828125, -17.47216796875, -15.126953125, -12.78173828125, -10.4365234375, -8.09130859375, -5.74609375, -3.40087890625, -1.0556640625, 1.28955078125, 3.634765625, 5.97998046875, 8.3251953125, 10.67041015625, 13.015625, 15.36083984375, 17.7060546875, 20.05126953125, 22.396484375, 24.74169921875, 27.0869140625, 29.43212890625, 31.77734375, 34.12255859375, 36.4677734375, 38.81298828125, 41.158203125, 43.50341796875, 45.8486328125, 48.19384765625, 50.5390625, 52.88427734375, 55.2294921875, 57.57470703125, 59.919921875, 62.26513671875, 64.6103515625, 66.95556640625, 69.30078125, 71.64599609375, 73.9912109375, 76.33642578125, 78.681640625, 81.02685546875, 83.3720703125, 85.71728515625, 88.0625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 11.0, 50.0, 218.0, 321.0, 265.0, 119.0, 21.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-254.05181884765625, -247.65887451171875, -241.2659149169922, -234.87295532226562, -228.48001098632812, -222.08706665039062, -215.69410705566406, -209.3011474609375, -202.908203125, -196.5152587890625, -190.12229919433594, -183.72933959960938, -177.33639526367188, -170.94345092773438, -164.5504913330078, -158.15753173828125, -151.76458740234375, -145.37164306640625, -138.9786834716797, -132.58572387695312, -126.19277954101562, -119.7998275756836, -113.40687561035156, -107.01392364501953, -100.6209716796875, -94.22801971435547, -87.83506774902344, -81.4421157836914, -75.04916381835938, -68.65621185302734, -62.26325988769531, -55.87030792236328, -49.47734069824219, -43.084388732910156, -36.691436767578125, -30.298484802246094, -23.905532836914062, -17.51258087158203, -11.11962890625, -4.726676940917969, 1.6662750244140625, 8.059226989746094, 14.452178955078125, 20.845130920410156, 27.238082885742188, 33.63103485107422, 40.02398681640625, 46.41693878173828, 52.80989074707031, 59.202842712402344, 65.59579467773438, 71.9887466430664, 78.38169860839844, 84.77465057373047, 91.1676025390625, 97.56055450439453, 103.95350646972656, 110.3464584350586, 116.73941040039062, 123.13236236572266, 129.5253143310547, 135.91827392578125, 142.31121826171875, 148.70416259765625, 155.0971221923828]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 7.0, 8.0, 5.0, 13.0, 17.0, 17.0, 18.0, 15.0, 16.0, 22.0, 31.0, 35.0, 32.0, 35.0, 45.0, 43.0, 42.0, 35.0, 35.0, 44.0, 45.0, 44.0, 41.0, 42.0, 48.0, 35.0, 37.0, 29.0, 34.0, 29.0, 19.0, 18.0, 21.0, 10.0, 10.0, 13.0, 12.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-68.07278442382812, -66.25129699707031, -64.42980194091797, -62.608314514160156, -60.78682327270508, -58.96533203125, -57.14384078979492, -55.322349548339844, -53.50086212158203, -51.67937088012695, -49.857879638671875, -48.03639221191406, -46.214900970458984, -44.393409729003906, -42.57191848754883, -40.75042724609375, -38.92893600463867, -37.107444763183594, -35.285953521728516, -33.46446228027344, -31.642974853515625, -29.821483612060547, -27.99999237060547, -26.17850112915039, -24.357011795043945, -22.535520553588867, -20.714031219482422, -18.892539978027344, -17.071048736572266, -15.24955940246582, -13.428068161010742, -11.60657787322998, -9.785087585449219, -7.963597297668457, -6.142106533050537, -4.320615768432617, -2.4991254806518555, -0.6776351928710938, 1.1438560485839844, 2.965346336364746, 4.786836624145508, 6.6083269119262695, 8.429817199707031, 10.25130844116211, 12.072798728942871, 13.894289016723633, 15.715780258178711, 17.537269592285156, 19.358760833740234, 21.180252075195312, 23.001741409301758, 24.823232650756836, 26.64472198486328, 28.46621322631836, 30.287704467773438, 32.109195709228516, 33.930686950683594, 35.75217819213867, 37.57366943359375, 39.39515686035156, 41.21664810180664, 43.03813934326172, 44.8596305847168, 46.681121826171875, 48.50260925292969]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 8.0, 2.0, 10.0, 9.0, 20.0, 21.0, 23.0, 17.0, 24.0, 24.0, 26.0, 36.0, 42.0, 50.0, 44.0, 42.0, 42.0, 49.0, 46.0, 35.0, 51.0, 42.0, 40.0, 42.0, 49.0, 42.0, 25.0, 24.0, 15.0, 19.0, 18.0, 7.0, 13.0, 9.0, 5.0, 13.0, 4.0, 2.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.8515625, -5.649658203125, -5.44775390625, -5.245849609375, -5.0439453125, -4.842041015625, -4.64013671875, -4.438232421875, -4.236328125, -4.034423828125, -3.83251953125, -3.630615234375, -3.4287109375, -3.226806640625, -3.02490234375, -2.822998046875, -2.62109375, -2.419189453125, -2.21728515625, -2.015380859375, -1.8134765625, -1.611572265625, -1.40966796875, -1.207763671875, -1.005859375, -0.803955078125, -0.60205078125, -0.400146484375, -0.1982421875, 0.003662109375, 0.20556640625, 0.407470703125, 0.609375, 0.811279296875, 1.01318359375, 1.215087890625, 1.4169921875, 1.618896484375, 1.82080078125, 2.022705078125, 2.224609375, 2.426513671875, 2.62841796875, 2.830322265625, 3.0322265625, 3.234130859375, 3.43603515625, 3.637939453125, 3.83984375, 4.041748046875, 4.24365234375, 4.445556640625, 4.6474609375, 4.849365234375, 5.05126953125, 5.253173828125, 5.455078125, 5.656982421875, 5.85888671875, 6.060791015625, 6.2626953125, 6.464599609375, 6.66650390625, 6.868408203125, 7.0703125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 12.0, 8.0, 11.0, 22.0, 30.0, 48.0, 69.0, 96.0, 170.0, 263.0, 374.0, 552.0, 795.0, 1160.0, 1784.0, 2503.0, 3891.0, 5455.0, 8192.0, 11757.0, 17080.0, 25003.0, 36857.0, 54476.0, 82208.0, 123076.0, 165879.0, 159621.0, 114036.0, 75139.0, 50299.0, 34148.0, 23337.0, 15929.0, 11011.0, 7509.0, 4923.0, 3429.0, 2382.0, 1638.0, 1109.0, 780.0, 512.0, 333.0, 217.0, 142.0, 99.0, 70.0, 55.0, 29.0, 17.0, 10.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.53759765625, -0.5207443237304688, -0.5038909912109375, -0.48703765869140625, -0.470184326171875, -0.45333099365234375, -0.4364776611328125, -0.41962432861328125, -0.40277099609375, -0.38591766357421875, -0.3690643310546875, -0.35221099853515625, -0.335357666015625, -0.31850433349609375, -0.3016510009765625, -0.28479766845703125, -0.2679443359375, -0.25109100341796875, -0.2342376708984375, -0.21738433837890625, -0.200531005859375, -0.18367767333984375, -0.1668243408203125, -0.14997100830078125, -0.13311767578125, -0.11626434326171875, -0.0994110107421875, -0.08255767822265625, -0.065704345703125, -0.04885101318359375, -0.0319976806640625, -0.01514434814453125, 0.001708984375, 0.01856231689453125, 0.0354156494140625, 0.05226898193359375, 0.069122314453125, 0.08597564697265625, 0.1028289794921875, 0.11968231201171875, 0.13653564453125, 0.15338897705078125, 0.1702423095703125, 0.18709564208984375, 0.203948974609375, 0.22080230712890625, 0.2376556396484375, 0.25450897216796875, 0.2713623046875, 0.28821563720703125, 0.3050689697265625, 0.32192230224609375, 0.338775634765625, 0.35562896728515625, 0.3724822998046875, 0.38933563232421875, 0.40618896484375, 0.42304229736328125, 0.4398956298828125, 0.45674896240234375, 0.473602294921875, 0.49045562744140625, 0.5073089599609375, 0.5241622924804688, 0.541015625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 11.0, 4.0, 9.0, 15.0, 13.0, 13.0, 13.0, 12.0, 28.0, 23.0, 38.0, 20.0, 29.0, 24.0, 27.0, 32.0, 35.0, 45.0, 29.0, 45.0, 1057.0, 33.0, 43.0, 33.0, 41.0, 41.0, 51.0, 34.0, 33.0, 28.0, 28.0, 23.0, 18.0, 14.0, 15.0, 14.0, 12.0, 10.0, 12.0, 5.0, 4.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4921875, -3.3818359375, -3.271484375, -3.1611328125, -3.05078125, -2.9404296875, -2.830078125, -2.7197265625, -2.609375, -2.4990234375, -2.388671875, -2.2783203125, -2.16796875, -2.0576171875, -1.947265625, -1.8369140625, -1.7265625, -1.6162109375, -1.505859375, -1.3955078125, -1.28515625, -1.1748046875, -1.064453125, -0.9541015625, -0.84375, -0.7333984375, -0.623046875, -0.5126953125, -0.40234375, -0.2919921875, -0.181640625, -0.0712890625, 0.0390625, 0.1494140625, 0.259765625, 0.3701171875, 0.48046875, 0.5908203125, 0.701171875, 0.8115234375, 0.921875, 1.0322265625, 1.142578125, 1.2529296875, 1.36328125, 1.4736328125, 1.583984375, 1.6943359375, 1.8046875, 1.9150390625, 2.025390625, 2.1357421875, 2.24609375, 2.3564453125, 2.466796875, 2.5771484375, 2.6875, 2.7978515625, 2.908203125, 3.0185546875, 3.12890625, 3.2392578125, 3.349609375, 3.4599609375, 3.5703125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 7.0, 2.0, 9.0, 7.0, 14.0, 21.0, 36.0, 48.0, 65.0, 89.0, 123.0, 197.0, 253.0, 360.0, 531.0, 774.0, 1076.0, 1554.0, 2329.0, 3404.0, 4871.0, 7487.0, 10917.0, 16218.0, 24542.0, 37916.0, 58098.0, 90720.0, 134502.0, 1220252.0, 156876.0, 112175.0, 72875.0, 47308.0, 30232.0, 19767.0, 13256.0, 8853.0, 6086.0, 4134.0, 2819.0, 1966.0, 1344.0, 897.0, 636.0, 441.0, 323.0, 217.0, 169.0, 112.0, 72.0, 45.0, 36.0, 27.0, 17.0, 12.0, 11.0, 7.0, 9.0, 2.0, 1.0, 1.0], "bins": [-0.52685546875, -0.5102615356445312, -0.4936676025390625, -0.47707366943359375, -0.460479736328125, -0.44388580322265625, -0.4272918701171875, -0.41069793701171875, -0.39410400390625, -0.37751007080078125, -0.3609161376953125, -0.34432220458984375, -0.327728271484375, -0.31113433837890625, -0.2945404052734375, -0.27794647216796875, -0.2613525390625, -0.24475860595703125, -0.2281646728515625, -0.21157073974609375, -0.194976806640625, -0.17838287353515625, -0.1617889404296875, -0.14519500732421875, -0.12860107421875, -0.11200714111328125, -0.0954132080078125, -0.07881927490234375, -0.062225341796875, -0.04563140869140625, -0.0290374755859375, -0.01244354248046875, 0.004150390625, 0.02074432373046875, 0.0373382568359375, 0.05393218994140625, 0.070526123046875, 0.08712005615234375, 0.1037139892578125, 0.12030792236328125, 0.13690185546875, 0.15349578857421875, 0.1700897216796875, 0.18668365478515625, 0.203277587890625, 0.21987152099609375, 0.2364654541015625, 0.25305938720703125, 0.2696533203125, 0.28624725341796875, 0.3028411865234375, 0.31943511962890625, 0.336029052734375, 0.35262298583984375, 0.3692169189453125, 0.38581085205078125, 0.40240478515625, 0.41899871826171875, 0.4355926513671875, 0.45218658447265625, 0.468780517578125, 0.48537445068359375, 0.5019683837890625, 0.5185623168945312, 0.53515625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 2.0, 3.0, 4.0, 11.0, 11.0, 18.0, 19.0, 28.0, 36.0, 55.0, 71.0, 59.0, 81.0, 76.0, 72.0, 103.0, 78.0, 59.0, 41.0, 51.0, 28.0, 22.0, 16.0, 14.0, 15.0, 2.0, 6.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015592575073242188, -0.0014942437410354614, -0.001429229974746704, -0.0013642162084579468, -0.0012992024421691895, -0.0012341886758804321, -0.0011691749095916748, -0.0011041611433029175, -0.0010391473770141602, -0.0009741336107254028, -0.0009091198444366455, -0.0008441060781478882, -0.0007790923118591309, -0.0007140785455703735, -0.0006490647792816162, -0.0005840510129928589, -0.0005190372467041016, -0.00045402348041534424, -0.0003890097141265869, -0.0003239959478378296, -0.00025898218154907227, -0.00019396841526031494, -0.00012895464897155762, -6.394088268280029e-05, 1.0728836059570312e-06, 6.608664989471436e-05, 0.00013110041618347168, 0.000196114182472229, 0.00026112794876098633, 0.00032614171504974365, 0.000391155481338501, 0.0004561692476272583, 0.0005211830139160156, 0.000586196780204773, 0.0006512105464935303, 0.0007162243127822876, 0.0007812380790710449, 0.0008462518453598022, 0.0009112656116485596, 0.0009762793779373169, 0.0010412931442260742, 0.0011063069105148315, 0.0011713206768035889, 0.0012363344430923462, 0.0013013482093811035, 0.0013663619756698608, 0.0014313757419586182, 0.0014963895082473755, 0.0015614032745361328, 0.0016264170408248901, 0.0016914308071136475, 0.0017564445734024048, 0.0018214583396911621, 0.0018864721059799194, 0.0019514858722686768, 0.002016499638557434, 0.0020815134048461914, 0.0021465271711349487, 0.002211540937423706, 0.0022765547037124634, 0.0023415684700012207, 0.002406582236289978, 0.0024715960025787354, 0.0025366097688674927, 0.00260162353515625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 6.0, 4.0, 6.0, 7.0, 9.0, 15.0, 26.0, 38.0, 52.0, 86.0, 139.0, 291.0, 608.0, 11940.0, 1032997.0, 1356.0, 432.0, 217.0, 120.0, 65.0, 56.0, 25.0, 20.0, 8.0, 8.0, 8.0, 6.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.06756591796875, -0.06592988967895508, -0.06429386138916016, -0.06265783309936523, -0.06102180480957031, -0.05938577651977539, -0.05774974822998047, -0.05611371994018555, -0.054477691650390625, -0.0528416633605957, -0.05120563507080078, -0.04956960678100586, -0.04793357849121094, -0.046297550201416016, -0.044661521911621094, -0.04302549362182617, -0.04138946533203125, -0.03975343704223633, -0.038117408752441406, -0.036481380462646484, -0.03484535217285156, -0.03320932388305664, -0.03157329559326172, -0.029937267303466797, -0.028301239013671875, -0.026665210723876953, -0.02502918243408203, -0.02339315414428711, -0.021757125854492188, -0.020121097564697266, -0.018485069274902344, -0.016849040985107422, -0.0152130126953125, -0.013576984405517578, -0.011940956115722656, -0.010304927825927734, -0.008668899536132812, -0.007032871246337891, -0.005396842956542969, -0.003760814666748047, -0.002124786376953125, -0.0004887580871582031, 0.0011472702026367188, 0.0027832984924316406, 0.0044193267822265625, 0.006055355072021484, 0.007691383361816406, 0.009327411651611328, 0.01096343994140625, 0.012599468231201172, 0.014235496520996094, 0.015871524810791016, 0.017507553100585938, 0.01914358139038086, 0.02077960968017578, 0.022415637969970703, 0.024051666259765625, 0.025687694549560547, 0.02732372283935547, 0.02895975112915039, 0.030595779418945312, 0.032231807708740234, 0.033867835998535156, 0.03550386428833008, 0.037139892578125]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 13.0, 47.0, 94.0, 162.0, 252.0, 203.0, 129.0, 69.0, 21.0, 13.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020341684576123953, -0.0019720362033694983, -0.001909904065541923, -0.0018477719277143478, -0.0017856396734714508, -0.0017235074192285538, -0.0016613752814009786, -0.0015992431435734034, -0.0015371108893305063, -0.0014749786350876093, -0.001412846497260034, -0.0013507143594324589, -0.0012885821051895618, -0.0012264498509466648, -0.0011643177131190896, -0.0011021855752915144, -0.0010400533210486174, -0.0009779210668057203, -0.0009157889289781451, -0.000853656732942909, -0.0007915245369076729, -0.0007293923408724368, -0.0006672601448372006, -0.0006051279488019645, -0.0005429957527667284, -0.0004808635567314923, -0.00041873136069625616, -0.00035659916466102004, -0.0002944669686257839, -0.0002323347725905478, -0.00017020257655531168, -0.00010807038052007556, -4.5937951654195786e-05, 1.6194244381040335e-05, 7.832644041627645e-05, 0.00014045863645151258, 0.0002025908324867487, 0.0002647230285219848, 0.00032685522455722094, 0.00038898742059245706, 0.0004511196166276932, 0.0005132518126629293, 0.0005753840086981654, 0.0006375162047334015, 0.0006996484007686377, 0.0007617805968038738, 0.0008239127928391099, 0.000886044988874346, 0.0009481771849095821, 0.0010103094391524792, 0.0010724415769800544, 0.0011345737148076296, 0.0011967059690505266, 0.0012588382232934237, 0.0013209703611209989, 0.001383102498948574, 0.001445234753191471, 0.0015073670074343681, 0.0015694991452619433, 0.0016316312830895185, 0.0016937635373324156, 0.0017558957915753126, 0.0018180279294028878, 0.001880160067230463, 0.00194229232147336]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 6.0, 14.0, 6.0, 14.0, 17.0, 12.0, 14.0, 20.0, 19.0, 17.0, 16.0, 27.0, 31.0, 43.0, 37.0, 30.0, 36.0, 28.0, 41.0, 46.0, 34.0, 46.0, 29.0, 47.0, 31.0, 39.0, 33.0, 33.0, 23.0, 19.0, 28.0, 27.0, 21.0, 24.0, 11.0, 14.0, 16.0, 8.0, 7.0, 10.0, 9.0, 7.0, 4.0, 1.0, 6.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.000769197940826416, -0.0007457379251718521, -0.0007222779095172882, -0.0006988178938627243, -0.0006753578782081604, -0.0006518978625535965, -0.0006284378468990326, -0.0006049778312444687, -0.0005815178155899048, -0.0005580577999353409, -0.000534597784280777, -0.0005111377686262131, -0.00048767775297164917, -0.00046421773731708527, -0.00044075772166252136, -0.00041729770600795746, -0.00039383769035339355, -0.00037037767469882965, -0.00034691765904426575, -0.00032345764338970184, -0.00029999762773513794, -0.00027653761208057404, -0.00025307759642601013, -0.00022961758077144623, -0.00020615756511688232, -0.00018269754946231842, -0.00015923753380775452, -0.0001357775181531906, -0.00011231750249862671, -8.88574868440628e-05, -6.53974711894989e-05, -4.1937455534935e-05, -1.8477439880371094e-05, 4.98257577419281e-06, 2.8442591428756714e-05, 5.190260708332062e-05, 7.536262273788452e-05, 9.882263839244843e-05, 0.00012228265404701233, 0.00014574266970157623, 0.00016920268535614014, 0.00019266270101070404, 0.00021612271666526794, 0.00023958273231983185, 0.00026304274797439575, 0.00028650276362895966, 0.00030996277928352356, 0.00033342279493808746, 0.00035688281059265137, 0.00038034282624721527, 0.0004038028419017792, 0.0004272628575563431, 0.000450722873210907, 0.0004741828888654709, 0.0004976429045200348, 0.0005211029201745987, 0.0005445629358291626, 0.0005680229514837265, 0.0005914829671382904, 0.0006149429827928543, 0.0006384029984474182, 0.0006618630141019821, 0.000685323029756546, 0.0007087830454111099, 0.0007322430610656738]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 8.0, 2.0, 10.0, 9.0, 20.0, 21.0, 23.0, 17.0, 24.0, 24.0, 26.0, 36.0, 42.0, 50.0, 44.0, 42.0, 42.0, 49.0, 46.0, 35.0, 51.0, 42.0, 40.0, 42.0, 49.0, 42.0, 25.0, 24.0, 15.0, 19.0, 18.0, 7.0, 13.0, 9.0, 5.0, 13.0, 4.0, 2.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.8515625, -5.649658203125, -5.44775390625, -5.245849609375, -5.0439453125, -4.842041015625, -4.64013671875, -4.438232421875, -4.236328125, -4.034423828125, -3.83251953125, -3.630615234375, -3.4287109375, -3.226806640625, -3.02490234375, -2.822998046875, -2.62109375, -2.419189453125, -2.21728515625, -2.015380859375, -1.8134765625, -1.611572265625, -1.40966796875, -1.207763671875, -1.005859375, -0.803955078125, -0.60205078125, -0.400146484375, -0.1982421875, 0.003662109375, 0.20556640625, 0.407470703125, 0.609375, 0.811279296875, 1.01318359375, 1.215087890625, 1.4169921875, 1.618896484375, 1.82080078125, 2.022705078125, 2.224609375, 2.426513671875, 2.62841796875, 2.830322265625, 3.0322265625, 3.234130859375, 3.43603515625, 3.637939453125, 3.83984375, 4.041748046875, 4.24365234375, 4.445556640625, 4.6474609375, 4.849365234375, 5.05126953125, 5.253173828125, 5.455078125, 5.656982421875, 5.85888671875, 6.060791015625, 6.2626953125, 6.464599609375, 6.66650390625, 6.868408203125, 7.0703125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 2.0, 10.0, 8.0, 16.0, 26.0, 37.0, 63.0, 74.0, 100.0, 248.0, 359.0, 660.0, 1175.0, 2340.0, 4717.0, 10745.0, 27929.0, 89491.0, 362594.0, 397365.0, 98278.0, 30395.0, 11610.0, 5024.0, 2390.0, 1211.0, 651.0, 394.0, 229.0, 130.0, 97.0, 65.0, 22.0, 29.0, 21.0, 9.0, 16.0, 8.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.63671875, -3.511474609375, -3.38623046875, -3.260986328125, -3.1357421875, -3.010498046875, -2.88525390625, -2.760009765625, -2.634765625, -2.509521484375, -2.38427734375, -2.259033203125, -2.1337890625, -2.008544921875, -1.88330078125, -1.758056640625, -1.6328125, -1.507568359375, -1.38232421875, -1.257080078125, -1.1318359375, -1.006591796875, -0.88134765625, -0.756103515625, -0.630859375, -0.505615234375, -0.38037109375, -0.255126953125, -0.1298828125, -0.004638671875, 0.12060546875, 0.245849609375, 0.37109375, 0.496337890625, 0.62158203125, 0.746826171875, 0.8720703125, 0.997314453125, 1.12255859375, 1.247802734375, 1.373046875, 1.498291015625, 1.62353515625, 1.748779296875, 1.8740234375, 1.999267578125, 2.12451171875, 2.249755859375, 2.375, 2.500244140625, 2.62548828125, 2.750732421875, 2.8759765625, 3.001220703125, 3.12646484375, 3.251708984375, 3.376953125, 3.502197265625, 3.62744140625, 3.752685546875, 3.8779296875, 4.003173828125, 4.12841796875, 4.253662109375, 4.37890625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 3.0, 2.0, 13.0, 16.0, 18.0, 16.0, 23.0, 23.0, 30.0, 34.0, 27.0, 27.0, 46.0, 40.0, 46.0, 61.0, 104.0, 1616.0, 401.0, 103.0, 51.0, 53.0, 47.0, 44.0, 20.0, 39.0, 30.0, 14.0, 27.0, 15.0, 12.0, 13.0, 11.0, 9.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.375, -20.609375, -19.84375, -19.078125, -18.3125, -17.546875, -16.78125, -16.015625, -15.25, -14.484375, -13.71875, -12.953125, -12.1875, -11.421875, -10.65625, -9.890625, -9.125, -8.359375, -7.59375, -6.828125, -6.0625, -5.296875, -4.53125, -3.765625, -3.0, -2.234375, -1.46875, -0.703125, 0.0625, 0.828125, 1.59375, 2.359375, 3.125, 3.890625, 4.65625, 5.421875, 6.1875, 6.953125, 7.71875, 8.484375, 9.25, 10.015625, 10.78125, 11.546875, 12.3125, 13.078125, 13.84375, 14.609375, 15.375, 16.140625, 16.90625, 17.671875, 18.4375, 19.203125, 19.96875, 20.734375, 21.5, 22.265625, 23.03125, 23.796875, 24.5625, 25.328125, 26.09375, 26.859375, 27.625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 8.0, 18.0, 14.0, 15.0, 24.0, 24.0, 34.0, 39.0, 46.0, 38.0, 90.0, 174.0, 271.0, 590.0, 2180.0, 48831.0, 3071852.0, 18756.0, 1462.0, 440.0, 221.0, 145.0, 103.0, 71.0, 43.0, 45.0, 31.0, 17.0, 28.0, 20.0, 17.0, 16.0, 8.0, 6.0, 3.0, 4.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.0, -41.818359375, -40.63671875, -39.455078125, -38.2734375, -37.091796875, -35.91015625, -34.728515625, -33.546875, -32.365234375, -31.18359375, -30.001953125, -28.8203125, -27.638671875, -26.45703125, -25.275390625, -24.09375, -22.912109375, -21.73046875, -20.548828125, -19.3671875, -18.185546875, -17.00390625, -15.822265625, -14.640625, -13.458984375, -12.27734375, -11.095703125, -9.9140625, -8.732421875, -7.55078125, -6.369140625, -5.1875, -4.005859375, -2.82421875, -1.642578125, -0.4609375, 0.720703125, 1.90234375, 3.083984375, 4.265625, 5.447265625, 6.62890625, 7.810546875, 8.9921875, 10.173828125, 11.35546875, 12.537109375, 13.71875, 14.900390625, 16.08203125, 17.263671875, 18.4453125, 19.626953125, 20.80859375, 21.990234375, 23.171875, 24.353515625, 25.53515625, 26.716796875, 27.8984375, 29.080078125, 30.26171875, 31.443359375, 32.625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 15.0, 726.0, 274.0, 3.0, 0.0, 0.0, 1.0], "bins": [-383.7342834472656, -377.2065124511719, -370.6787414550781, -364.1509704589844, -357.6231994628906, -351.0954284667969, -344.5676574707031, -338.0398864746094, -331.5121154785156, -324.9843444824219, -318.4565734863281, -311.9288024902344, -305.4010314941406, -298.8732604980469, -292.3454895019531, -285.8177185058594, -279.2899475097656, -272.7621765136719, -266.2344055175781, -259.7066345214844, -253.17886352539062, -246.65109252929688, -240.12332153320312, -233.59555053710938, -227.06776428222656, -220.5399932861328, -214.01222229003906, -207.4844512939453, -200.95668029785156, -194.4289093017578, -187.90113830566406, -181.3733673095703, -174.84559631347656, -168.3178253173828, -161.79005432128906, -155.2622833251953, -148.73451232910156, -142.2067413330078, -135.67897033691406, -129.1511993408203, -122.62342834472656, -116.09565734863281, -109.56788635253906, -103.04011535644531, -96.51234436035156, -89.98457336425781, -83.45680236816406, -76.92903137207031, -70.40125274658203, -63.87348175048828, -57.34571075439453, -50.81793975830078, -44.29016876220703, -37.762393951416016, -31.234622955322266, -24.706851959228516, -18.179080963134766, -11.651309967041016, -5.123538017272949, 1.4042339324951172, 7.932004928588867, 14.45977783203125, 20.987548828125, 27.51531982421875, 34.0430908203125]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 3.0, 12.0, 5.0, 13.0, 11.0, 9.0, 14.0, 19.0, 16.0, 20.0, 12.0, 31.0, 32.0, 33.0, 32.0, 29.0, 24.0, 38.0, 44.0, 34.0, 35.0, 45.0, 34.0, 40.0, 36.0, 36.0, 26.0, 42.0, 30.0, 29.0, 31.0, 25.0, 27.0, 19.0, 11.0, 10.0, 17.0, 16.0, 18.0, 9.0, 5.0, 10.0, 5.0, 6.0, 0.0, 5.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.21676254272461, -57.24195098876953, -55.26714324951172, -53.29233169555664, -51.31752014160156, -49.34271240234375, -47.36790084838867, -45.393089294433594, -43.41828155517578, -41.4434700012207, -39.46866226196289, -37.49385070800781, -35.519039154052734, -33.544227600097656, -31.569419860839844, -29.594608306884766, -27.619796752929688, -25.644987106323242, -23.670175552368164, -21.69536590576172, -19.72055435180664, -17.745744705200195, -15.77093505859375, -13.796124458312988, -11.821313858032227, -9.846503257751465, -7.871693134307861, -5.896883010864258, -3.922072410583496, -1.9472618103027344, 0.027547836303710938, 2.0023584365844727, 3.9771728515625, 5.951983451843262, 7.926793575286865, 9.901603698730469, 11.87641429901123, 13.851224899291992, 15.826034545898438, 17.800846099853516, 19.77565574645996, 21.750465393066406, 23.725276947021484, 25.70008659362793, 27.674896240234375, 29.649707794189453, 31.6245174407959, 33.599327087402344, 35.57413864135742, 37.5489501953125, 39.52375793457031, 41.49856948852539, 43.47338104248047, 45.44818878173828, 47.42300033569336, 49.39781188964844, 51.37261962890625, 53.34743118286133, 55.32223892211914, 57.29705047607422, 59.2718620300293, 61.246673583984375, 63.22148132324219, 65.1962890625, 67.17110443115234]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 3.0, 4.0, 8.0, 9.0, 14.0, 14.0, 22.0, 29.0, 18.0, 16.0, 26.0, 33.0, 38.0, 45.0, 38.0, 52.0, 44.0, 43.0, 41.0, 41.0, 38.0, 48.0, 40.0, 41.0, 55.0, 35.0, 30.0, 29.0, 25.0, 24.0, 13.0, 10.0, 18.0, 12.0, 9.0, 5.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.84375, -5.64105224609375, -5.4383544921875, -5.23565673828125, -5.032958984375, -4.83026123046875, -4.6275634765625, -4.42486572265625, -4.22216796875, -4.01947021484375, -3.8167724609375, -3.61407470703125, -3.411376953125, -3.20867919921875, -3.0059814453125, -2.80328369140625, -2.6005859375, -2.39788818359375, -2.1951904296875, -1.99249267578125, -1.789794921875, -1.58709716796875, -1.3843994140625, -1.18170166015625, -0.97900390625, -0.77630615234375, -0.5736083984375, -0.37091064453125, -0.168212890625, 0.03448486328125, 0.2371826171875, 0.43988037109375, 0.642578125, 0.84527587890625, 1.0479736328125, 1.25067138671875, 1.453369140625, 1.65606689453125, 1.8587646484375, 2.06146240234375, 2.26416015625, 2.46685791015625, 2.6695556640625, 2.87225341796875, 3.074951171875, 3.27764892578125, 3.4803466796875, 3.68304443359375, 3.8857421875, 4.08843994140625, 4.2911376953125, 4.49383544921875, 4.696533203125, 4.89923095703125, 5.1019287109375, 5.30462646484375, 5.50732421875, 5.71002197265625, 5.9127197265625, 6.11541748046875, 6.318115234375, 6.52081298828125, 6.7235107421875, 6.92620849609375, 7.12890625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 2.0, 7.0, 5.0, 2.0, 14.0, 8.0, 13.0, 19.0, 20.0, 26.0, 34.0, 32.0, 43.0, 83.0, 135.0, 300.0, 1054.0, 5565.0, 47265.0, 1019626.0, 2932124.0, 170575.0, 14088.0, 2168.0, 483.0, 205.0, 116.0, 72.0, 45.0, 26.0, 18.0, 20.0, 17.0, 19.0, 10.0, 6.0, 9.0, 9.0, 8.0, 5.0, 2.0, 5.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.671875, -18.9990234375, -18.326171875, -17.6533203125, -16.98046875, -16.3076171875, -15.634765625, -14.9619140625, -14.2890625, -13.6162109375, -12.943359375, -12.2705078125, -11.59765625, -10.9248046875, -10.251953125, -9.5791015625, -8.90625, -8.2333984375, -7.560546875, -6.8876953125, -6.21484375, -5.5419921875, -4.869140625, -4.1962890625, -3.5234375, -2.8505859375, -2.177734375, -1.5048828125, -0.83203125, -0.1591796875, 0.513671875, 1.1865234375, 1.859375, 2.5322265625, 3.205078125, 3.8779296875, 4.55078125, 5.2236328125, 5.896484375, 6.5693359375, 7.2421875, 7.9150390625, 8.587890625, 9.2607421875, 9.93359375, 10.6064453125, 11.279296875, 11.9521484375, 12.625, 13.2978515625, 13.970703125, 14.6435546875, 15.31640625, 15.9892578125, 16.662109375, 17.3349609375, 18.0078125, 18.6806640625, 19.353515625, 20.0263671875, 20.69921875, 21.3720703125, 22.044921875, 22.7177734375, 23.390625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 3.0, 5.0, 12.0, 19.0, 18.0, 33.0, 49.0, 64.0, 118.0, 188.0, 254.0, 386.0, 519.0, 601.0, 588.0, 426.0, 266.0, 179.0, 113.0, 93.0, 45.0, 39.0, 22.0, 8.0, 10.0, 7.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.734375, -29.0523681640625, -28.370361328125, -27.6883544921875, -27.00634765625, -26.3243408203125, -25.642333984375, -24.9603271484375, -24.2783203125, -23.5963134765625, -22.914306640625, -22.2322998046875, -21.55029296875, -20.8682861328125, -20.186279296875, -19.5042724609375, -18.822265625, -18.1402587890625, -17.458251953125, -16.7762451171875, -16.09423828125, -15.4122314453125, -14.730224609375, -14.0482177734375, -13.3662109375, -12.6842041015625, -12.002197265625, -11.3201904296875, -10.63818359375, -9.9561767578125, -9.274169921875, -8.5921630859375, -7.91015625, -7.2281494140625, -6.546142578125, -5.8641357421875, -5.18212890625, -4.5001220703125, -3.818115234375, -3.1361083984375, -2.4541015625, -1.7720947265625, -1.090087890625, -0.4080810546875, 0.27392578125, 0.9559326171875, 1.637939453125, 2.3199462890625, 3.001953125, 3.6839599609375, 4.365966796875, 5.0479736328125, 5.72998046875, 6.4119873046875, 7.093994140625, 7.7760009765625, 8.4580078125, 9.1400146484375, 9.822021484375, 10.5040283203125, 11.18603515625, 11.8680419921875, 12.550048828125, 13.2320556640625, 13.9140625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 9.0, 15.0, 17.0, 34.0, 38.0, 84.0, 110.0, 195.0, 268.0, 646.0, 2663.0, 82421.0, 3983236.0, 119854.0, 3124.0, 698.0, 308.0, 183.0, 113.0, 80.0, 64.0, 37.0, 25.0, 15.0, 14.0, 7.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.0, -49.9638671875, -47.927734375, -45.8916015625, -43.85546875, -41.8193359375, -39.783203125, -37.7470703125, -35.7109375, -33.6748046875, -31.638671875, -29.6025390625, -27.56640625, -25.5302734375, -23.494140625, -21.4580078125, -19.421875, -17.3857421875, -15.349609375, -13.3134765625, -11.27734375, -9.2412109375, -7.205078125, -5.1689453125, -3.1328125, -1.0966796875, 0.939453125, 2.9755859375, 5.01171875, 7.0478515625, 9.083984375, 11.1201171875, 13.15625, 15.1923828125, 17.228515625, 19.2646484375, 21.30078125, 23.3369140625, 25.373046875, 27.4091796875, 29.4453125, 31.4814453125, 33.517578125, 35.5537109375, 37.58984375, 39.6259765625, 41.662109375, 43.6982421875, 45.734375, 47.7705078125, 49.806640625, 51.8427734375, 53.87890625, 55.9150390625, 57.951171875, 59.9873046875, 62.0234375, 64.0595703125, 66.095703125, 68.1318359375, 70.16796875, 72.2041015625, 74.240234375, 76.2763671875, 78.3125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 24.0, 82.0, 182.0, 308.0, 238.0, 106.0, 47.0, 15.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-232.390625, -226.9712677001953, -221.55191040039062, -216.13253784179688, -210.7131805419922, -205.2938232421875, -199.8744659423828, -194.45510864257812, -189.03575134277344, -183.61639404296875, -178.19703674316406, -172.77767944335938, -167.35830688476562, -161.93894958496094, -156.51959228515625, -151.10023498535156, -145.68087768554688, -140.2615203857422, -134.8421630859375, -129.42279052734375, -124.0034408569336, -118.58407592773438, -113.16471862792969, -107.745361328125, -102.32598876953125, -96.90663146972656, -91.48726654052734, -86.06790924072266, -80.64855194091797, -75.22918701171875, -69.80982971191406, -64.39047241210938, -58.971107482910156, -53.5517463684082, -48.132389068603516, -42.71302795410156, -37.293670654296875, -31.874309539794922, -26.45494842529297, -21.03559112548828, -15.616230010986328, -10.196870803833008, -4.777510643005371, 0.6418495178222656, 6.061208724975586, 11.480567932128906, 16.89992904663086, 22.319286346435547, 27.7386474609375, 33.15800857543945, 38.57736587524414, 43.996726989746094, 49.41608428955078, 54.835445404052734, 60.25480651855469, 65.67416381835938, 71.09352111816406, 76.51287841796875, 81.93224334716797, 87.35160064697266, 92.77095794677734, 98.19032287597656, 103.60968017578125, 109.02903747558594, 114.44840240478516]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 11.0, 11.0, 8.0, 8.0, 17.0, 11.0, 17.0, 16.0, 25.0, 31.0, 20.0, 28.0, 48.0, 39.0, 39.0, 38.0, 50.0, 39.0, 52.0, 47.0, 39.0, 32.0, 40.0, 37.0, 32.0, 27.0, 28.0, 34.0, 28.0, 17.0, 26.0, 14.0, 14.0, 16.0, 14.0, 8.0, 6.0, 6.0, 4.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-62.817142486572266, -60.92501449584961, -59.03288269042969, -57.14075469970703, -55.248626708984375, -53.35649871826172, -51.46437072753906, -49.57223892211914, -47.680110931396484, -45.78798294067383, -43.895851135253906, -42.00372314453125, -40.111595153808594, -38.21946716308594, -36.32733917236328, -34.43520736694336, -32.5430793762207, -30.650951385498047, -28.758821487426758, -26.86669158935547, -24.974563598632812, -23.082435607910156, -21.190305709838867, -19.298175811767578, -17.406047821044922, -15.51391887664795, -13.621789932250977, -11.729660987854004, -9.837532043457031, -7.945403099060059, -6.053274154663086, -4.161145210266113, -2.269012451171875, -0.37688350677490234, 1.5152454376220703, 3.407374382019043, 5.299503326416016, 7.191632270812988, 9.083761215209961, 10.975890159606934, 12.868019104003906, 14.760148048400879, 16.65227699279785, 18.54440689086914, 20.436534881591797, 22.328662872314453, 24.220792770385742, 26.11292266845703, 28.005050659179688, 29.897178649902344, 31.789308547973633, 33.68143844604492, 35.57356643676758, 37.465694427490234, 39.357826232910156, 41.24995422363281, 43.14208221435547, 45.034210205078125, 46.92633819580078, 48.8184700012207, 50.71059799194336, 52.602725982666016, 54.49485778808594, 56.386985778808594, 58.27911376953125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 3.0, 5.0, 4.0, 4.0, 12.0, 12.0, 21.0, 14.0, 18.0, 32.0, 31.0, 30.0, 37.0, 46.0, 43.0, 32.0, 45.0, 36.0, 38.0, 55.0, 52.0, 50.0, 39.0, 27.0, 46.0, 48.0, 31.0, 35.0, 22.0, 17.0, 25.0, 10.0, 15.0, 11.0, 11.0, 7.0, 7.0, 9.0, 9.0, 5.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.33984375, -6.13116455078125, -5.9224853515625, -5.71380615234375, -5.505126953125, -5.29644775390625, -5.0877685546875, -4.87908935546875, -4.67041015625, -4.46173095703125, -4.2530517578125, -4.04437255859375, -3.835693359375, -3.62701416015625, -3.4183349609375, -3.20965576171875, -3.0009765625, -2.79229736328125, -2.5836181640625, -2.37493896484375, -2.166259765625, -1.95758056640625, -1.7489013671875, -1.54022216796875, -1.33154296875, -1.12286376953125, -0.9141845703125, -0.70550537109375, -0.496826171875, -0.28814697265625, -0.0794677734375, 0.12921142578125, 0.337890625, 0.54656982421875, 0.7552490234375, 0.96392822265625, 1.172607421875, 1.38128662109375, 1.5899658203125, 1.79864501953125, 2.00732421875, 2.21600341796875, 2.4246826171875, 2.63336181640625, 2.842041015625, 3.05072021484375, 3.2593994140625, 3.46807861328125, 3.6767578125, 3.88543701171875, 4.0941162109375, 4.30279541015625, 4.511474609375, 4.72015380859375, 4.9288330078125, 5.13751220703125, 5.34619140625, 5.55487060546875, 5.7635498046875, 5.97222900390625, 6.180908203125, 6.38958740234375, 6.5982666015625, 6.80694580078125, 7.015625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 12.0, 16.0, 21.0, 37.0, 58.0, 91.0, 121.0, 205.0, 289.0, 479.0, 714.0, 989.0, 1419.0, 2243.0, 3358.0, 5001.0, 7554.0, 11377.0, 17211.0, 26223.0, 39790.0, 61213.0, 94121.0, 142761.0, 188485.0, 152836.0, 100725.0, 65166.0, 42881.0, 28269.0, 18484.0, 12239.0, 8104.0, 5254.0, 3593.0, 2389.0, 1592.0, 1086.0, 695.0, 485.0, 332.0, 224.0, 129.0, 104.0, 60.0, 44.0, 26.0, 23.0, 15.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.64208984375, -0.6229705810546875, -0.603851318359375, -0.5847320556640625, -0.56561279296875, -0.5464935302734375, -0.527374267578125, -0.5082550048828125, -0.4891357421875, -0.4700164794921875, -0.450897216796875, -0.4317779541015625, -0.41265869140625, -0.3935394287109375, -0.374420166015625, -0.3553009033203125, -0.336181640625, -0.3170623779296875, -0.297943115234375, -0.2788238525390625, -0.25970458984375, -0.2405853271484375, -0.221466064453125, -0.2023468017578125, -0.1832275390625, -0.1641082763671875, -0.144989013671875, -0.1258697509765625, -0.10675048828125, -0.0876312255859375, -0.068511962890625, -0.0493927001953125, -0.0302734375, -0.0111541748046875, 0.007965087890625, 0.0270843505859375, 0.04620361328125, 0.0653228759765625, 0.084442138671875, 0.1035614013671875, 0.1226806640625, 0.1417999267578125, 0.160919189453125, 0.1800384521484375, 0.19915771484375, 0.2182769775390625, 0.237396240234375, 0.2565155029296875, 0.275634765625, 0.2947540283203125, 0.313873291015625, 0.3329925537109375, 0.35211181640625, 0.3712310791015625, 0.390350341796875, 0.4094696044921875, 0.4285888671875, 0.4477081298828125, 0.466827392578125, 0.4859466552734375, 0.50506591796875, 0.5241851806640625, 0.543304443359375, 0.5624237060546875, 0.58154296875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 5.0, 5.0, 8.0, 8.0, 13.0, 14.0, 11.0, 20.0, 23.0, 23.0, 33.0, 30.0, 24.0, 29.0, 37.0, 39.0, 50.0, 41.0, 39.0, 1074.0, 35.0, 41.0, 34.0, 38.0, 32.0, 39.0, 42.0, 26.0, 28.0, 15.0, 25.0, 26.0, 25.0, 15.0, 12.0, 10.0, 14.0, 8.0, 7.0, 4.0, 6.0, 4.0, 3.0, 0.0, 3.0, 2.0, 3.0], "bins": [-4.4375, -4.316070556640625, -4.19464111328125, -4.073211669921875, -3.9517822265625, -3.830352783203125, -3.70892333984375, -3.587493896484375, -3.466064453125, -3.344635009765625, -3.22320556640625, -3.101776123046875, -2.9803466796875, -2.858917236328125, -2.73748779296875, -2.616058349609375, -2.49462890625, -2.373199462890625, -2.25177001953125, -2.130340576171875, -2.0089111328125, -1.887481689453125, -1.76605224609375, -1.644622802734375, -1.523193359375, -1.401763916015625, -1.28033447265625, -1.158905029296875, -1.0374755859375, -0.916046142578125, -0.79461669921875, -0.673187255859375, -0.5517578125, -0.430328369140625, -0.30889892578125, -0.187469482421875, -0.0660400390625, 0.055389404296875, 0.17681884765625, 0.298248291015625, 0.419677734375, 0.541107177734375, 0.66253662109375, 0.783966064453125, 0.9053955078125, 1.026824951171875, 1.14825439453125, 1.269683837890625, 1.39111328125, 1.512542724609375, 1.63397216796875, 1.755401611328125, 1.8768310546875, 1.998260498046875, 2.11968994140625, 2.241119384765625, 2.362548828125, 2.483978271484375, 2.60540771484375, 2.726837158203125, 2.8482666015625, 2.969696044921875, 3.09112548828125, 3.212554931640625, 3.333984375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 10.0, 20.0, 32.0, 34.0, 47.0, 78.0, 124.0, 176.0, 248.0, 391.0, 611.0, 842.0, 1294.0, 2005.0, 2843.0, 4448.0, 6802.0, 10373.0, 15806.0, 24885.0, 39062.0, 62602.0, 100148.0, 154392.0, 1238029.0, 155974.0, 101117.0, 63522.0, 39511.0, 25363.0, 16184.0, 10434.0, 6679.0, 4413.0, 2908.0, 1877.0, 1261.0, 829.0, 554.0, 376.0, 258.0, 188.0, 125.0, 75.0, 52.0, 53.0, 23.0, 17.0, 14.0, 10.0, 8.0, 6.0, 0.0, 0.0, 1.0], "bins": [-0.6376953125, -0.6186676025390625, -0.599639892578125, -0.5806121826171875, -0.56158447265625, -0.5425567626953125, -0.523529052734375, -0.5045013427734375, -0.4854736328125, -0.4664459228515625, -0.447418212890625, -0.4283905029296875, -0.40936279296875, -0.3903350830078125, -0.371307373046875, -0.3522796630859375, -0.333251953125, -0.3142242431640625, -0.295196533203125, -0.2761688232421875, -0.25714111328125, -0.2381134033203125, -0.219085693359375, -0.2000579833984375, -0.1810302734375, -0.1620025634765625, -0.142974853515625, -0.1239471435546875, -0.10491943359375, -0.0858917236328125, -0.066864013671875, -0.0478363037109375, -0.02880859375, -0.0097808837890625, 0.009246826171875, 0.0282745361328125, 0.04730224609375, 0.0663299560546875, 0.085357666015625, 0.1043853759765625, 0.1234130859375, 0.1424407958984375, 0.161468505859375, 0.1804962158203125, 0.19952392578125, 0.2185516357421875, 0.237579345703125, 0.2566070556640625, 0.275634765625, 0.2946624755859375, 0.313690185546875, 0.3327178955078125, 0.35174560546875, 0.3707733154296875, 0.389801025390625, 0.4088287353515625, 0.4278564453125, 0.4468841552734375, 0.465911865234375, 0.4849395751953125, 0.50396728515625, 0.5229949951171875, 0.542022705078125, 0.5610504150390625, 0.580078125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 9.0, 6.0, 9.0, 7.0, 11.0, 11.0, 19.0, 20.0, 35.0, 36.0, 45.0, 37.0, 49.0, 71.0, 57.0, 51.0, 74.0, 46.0, 39.0, 47.0, 55.0, 45.0, 41.0, 26.0, 32.0, 23.0, 15.0, 18.0, 14.0, 13.0, 8.0, 2.0, 4.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010890960693359375, -0.0010444670915603638, -0.00099983811378479, -0.0009552091360092163, -0.0009105801582336426, -0.0008659511804580688, -0.0008213222026824951, -0.0007766932249069214, -0.0007320642471313477, -0.0006874352693557739, -0.0006428062915802002, -0.0005981773138046265, -0.0005535483360290527, -0.000508919358253479, -0.0004642903804779053, -0.00041966140270233154, -0.0003750324249267578, -0.0003304034471511841, -0.00028577446937561035, -0.00024114549160003662, -0.0001965165138244629, -0.00015188753604888916, -0.00010725855827331543, -6.26295804977417e-05, -1.800060272216797e-05, 2.6628375053405762e-05, 7.125735282897949e-05, 0.00011588633060455322, 0.00016051530838012695, 0.00020514428615570068, 0.0002497732639312744, 0.00029440224170684814, 0.0003390312194824219, 0.0003836601972579956, 0.00042828917503356934, 0.00047291815280914307, 0.0005175471305847168, 0.0005621761083602905, 0.0006068050861358643, 0.000651434063911438, 0.0006960630416870117, 0.0007406920194625854, 0.0007853209972381592, 0.0008299499750137329, 0.0008745789527893066, 0.0009192079305648804, 0.0009638369083404541, 0.0010084658861160278, 0.0010530948638916016, 0.0010977238416671753, 0.001142352819442749, 0.0011869817972183228, 0.0012316107749938965, 0.0012762397527694702, 0.001320868730545044, 0.0013654977083206177, 0.0014101266860961914, 0.0014547556638717651, 0.0014993846416473389, 0.0015440136194229126, 0.0015886425971984863, 0.00163327157497406, 0.0016779005527496338, 0.0017225295305252075, 0.0017671585083007812]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 1.0, 4.0, 7.0, 6.0, 7.0, 7.0, 7.0, 16.0, 25.0, 32.0, 32.0, 48.0, 63.0, 121.0, 195.0, 314.0, 573.0, 2985.0, 983400.0, 58739.0, 866.0, 411.0, 232.0, 127.0, 98.0, 56.0, 50.0, 21.0, 29.0, 14.0, 16.0, 7.0, 7.0, 12.0, 4.0, 6.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.04132080078125, -0.040280818939208984, -0.03924083709716797, -0.03820085525512695, -0.03716087341308594, -0.03612089157104492, -0.035080909729003906, -0.03404092788696289, -0.033000946044921875, -0.03196096420288086, -0.030920982360839844, -0.029881000518798828, -0.028841018676757812, -0.027801036834716797, -0.02676105499267578, -0.025721073150634766, -0.02468109130859375, -0.023641109466552734, -0.02260112762451172, -0.021561145782470703, -0.020521163940429688, -0.019481182098388672, -0.018441200256347656, -0.01740121841430664, -0.016361236572265625, -0.01532125473022461, -0.014281272888183594, -0.013241291046142578, -0.012201309204101562, -0.011161327362060547, -0.010121345520019531, -0.009081363677978516, -0.0080413818359375, -0.007001399993896484, -0.005961418151855469, -0.004921436309814453, -0.0038814544677734375, -0.002841472625732422, -0.0018014907836914062, -0.0007615089416503906, 0.000278472900390625, 0.0013184547424316406, 0.0023584365844726562, 0.003398418426513672, 0.0044384002685546875, 0.005478382110595703, 0.006518363952636719, 0.007558345794677734, 0.00859832763671875, 0.009638309478759766, 0.010678291320800781, 0.011718273162841797, 0.012758255004882812, 0.013798236846923828, 0.014838218688964844, 0.01587820053100586, 0.016918182373046875, 0.01795816421508789, 0.018998146057128906, 0.020038127899169922, 0.021078109741210938, 0.022118091583251953, 0.02315807342529297, 0.024198055267333984, 0.025238037109375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 169.0, 761.0, 81.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030418625101447105, -0.0027967325877398252, -0.00255160266533494, -0.002306472510099411, -0.0020613425876945257, -0.0018162126652896404, -0.0015710826264694333, -0.0013259525876492262, -0.001080822665244341, -0.0008356926846317947, -0.0005905627040192485, -0.0003454327234067023, -0.00010030274279415607, 0.00014482717961072922, 0.00038995721843093634, 0.0006350872572511435, 0.0008802171796560287, 0.001125347102060914, 0.0013704771408811212, 0.0016156071797013283, 0.0018607371021062136, 0.002105867024511099, 0.002350997179746628, 0.002596127102151513, 0.0028412570245563984, 0.0030863869469612837, 0.003331516869366169, 0.003576647024601698, 0.003821776947006583, 0.0040669068694114685, 0.0043120370246469975, 0.004557167179882526, 0.004802297800779343, 0.005047427956014872, 0.005292557645589113, 0.005537687800824642, 0.005782817490398884, 0.006027947645634413, 0.006273077800869942, 0.006518207490444183, 0.006763337645679712, 0.007008467800915241, 0.007253597490489483, 0.007498727645725012, 0.007743857800960541, 0.007988987490534782, 0.008234117180109024, 0.00847924780100584, 0.008724377490580082, 0.008969507180154324, 0.00921463780105114, 0.009459767490625381, 0.009704897180199623, 0.009950026869773865, 0.010195157490670681, 0.010440287180244923, 0.010685417801141739, 0.01093054749071598, 0.011175678111612797, 0.011420807801187038, 0.01166593749076128, 0.011911068111658096, 0.012156197801232338, 0.01240132749080658, 0.012646457180380821]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 5.0, 2.0, 6.0, 3.0, 9.0, 7.0, 10.0, 8.0, 13.0, 14.0, 22.0, 19.0, 20.0, 26.0, 32.0, 30.0, 31.0, 26.0, 33.0, 30.0, 33.0, 49.0, 34.0, 45.0, 34.0, 37.0, 43.0, 36.0, 28.0, 28.0, 31.0, 31.0, 30.0, 28.0, 36.0, 19.0, 16.0, 17.0, 16.0, 17.0, 16.0, 7.0, 9.0, 7.0, 3.0, 6.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006739497184753418, -0.0006525153294205666, -0.0006310809403657913, -0.0006096465513110161, -0.0005882121622562408, -0.0005667777732014656, -0.0005453433841466904, -0.0005239089950919151, -0.0005024746060371399, -0.00048104021698236465, -0.0004596058279275894, -0.0004381714388728142, -0.00041673704981803894, -0.0003953026607632637, -0.00037386827170848846, -0.0003524338826537132, -0.000330999493598938, -0.00030956510454416275, -0.0002881307154893875, -0.0002666963264346123, -0.00024526193737983704, -0.0002238275483250618, -0.00020239315927028656, -0.00018095877021551132, -0.00015952438116073608, -0.00013808999210596085, -0.00011665560305118561, -9.522121399641037e-05, -7.378682494163513e-05, -5.2352435886859894e-05, -3.0918046832084656e-05, -9.483657777309418e-06, 1.195073127746582e-05, 3.338512033224106e-05, 5.4819509387016296e-05, 7.625389844179153e-05, 9.768828749656677e-05, 0.00011912267655134201, 0.00014055706560611725, 0.0001619914546608925, 0.00018342584371566772, 0.00020486023277044296, 0.0002262946218252182, 0.00024772901087999344, 0.0002691633999347687, 0.0002905977889895439, 0.00031203217804431915, 0.0003334665670990944, 0.00035490095615386963, 0.00037633534520864487, 0.0003977697342634201, 0.00041920412331819534, 0.0004406385123729706, 0.0004620729014277458, 0.00048350729048252106, 0.0005049416795372963, 0.0005263760685920715, 0.0005478104576468468, 0.000569244846701622, 0.0005906792357563972, 0.0006121136248111725, 0.0006335480138659477, 0.000654982402920723, 0.0006764167919754982, 0.0006978511810302734]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 3.0, 5.0, 4.0, 4.0, 12.0, 12.0, 21.0, 14.0, 18.0, 32.0, 31.0, 30.0, 37.0, 46.0, 43.0, 32.0, 45.0, 36.0, 38.0, 56.0, 51.0, 50.0, 39.0, 27.0, 46.0, 48.0, 31.0, 35.0, 22.0, 17.0, 25.0, 10.0, 15.0, 11.0, 11.0, 7.0, 7.0, 9.0, 9.0, 5.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.33984375, -6.13116455078125, -5.9224853515625, -5.71380615234375, -5.505126953125, -5.29644775390625, -5.0877685546875, -4.87908935546875, -4.67041015625, -4.46173095703125, -4.2530517578125, -4.04437255859375, -3.835693359375, -3.62701416015625, -3.4183349609375, -3.20965576171875, -3.0009765625, -2.79229736328125, -2.5836181640625, -2.37493896484375, -2.166259765625, -1.95758056640625, -1.7489013671875, -1.54022216796875, -1.33154296875, -1.12286376953125, -0.9141845703125, -0.70550537109375, -0.496826171875, -0.28814697265625, -0.0794677734375, 0.12921142578125, 0.337890625, 0.54656982421875, 0.7552490234375, 0.96392822265625, 1.172607421875, 1.38128662109375, 1.5899658203125, 1.79864501953125, 2.00732421875, 2.21600341796875, 2.4246826171875, 2.63336181640625, 2.842041015625, 3.05072021484375, 3.2593994140625, 3.46807861328125, 3.6767578125, 3.88543701171875, 4.0941162109375, 4.30279541015625, 4.511474609375, 4.72015380859375, 4.9288330078125, 5.13751220703125, 5.34619140625, 5.55487060546875, 5.7635498046875, 5.97222900390625, 6.180908203125, 6.38958740234375, 6.5982666015625, 6.80694580078125, 7.015625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 11.0, 24.0, 20.0, 34.0, 41.0, 52.0, 68.0, 109.0, 167.0, 234.0, 366.0, 650.0, 943.0, 1372.0, 2329.0, 3744.0, 6349.0, 11564.0, 24852.0, 70875.0, 339293.0, 439994.0, 86144.0, 28427.0, 12893.0, 7114.0, 4035.0, 2472.0, 1520.0, 988.0, 613.0, 423.0, 282.0, 178.0, 112.0, 72.0, 58.0, 32.0, 32.0, 18.0, 9.0, 6.0, 3.0, 5.0, 8.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.796875, -4.63189697265625, -4.4669189453125, -4.30194091796875, -4.136962890625, -3.97198486328125, -3.8070068359375, -3.64202880859375, -3.47705078125, -3.31207275390625, -3.1470947265625, -2.98211669921875, -2.817138671875, -2.65216064453125, -2.4871826171875, -2.32220458984375, -2.1572265625, -1.99224853515625, -1.8272705078125, -1.66229248046875, -1.497314453125, -1.33233642578125, -1.1673583984375, -1.00238037109375, -0.83740234375, -0.67242431640625, -0.5074462890625, -0.34246826171875, -0.177490234375, -0.01251220703125, 0.1524658203125, 0.31744384765625, 0.482421875, 0.64739990234375, 0.8123779296875, 0.97735595703125, 1.142333984375, 1.30731201171875, 1.4722900390625, 1.63726806640625, 1.80224609375, 1.96722412109375, 2.1322021484375, 2.29718017578125, 2.462158203125, 2.62713623046875, 2.7921142578125, 2.95709228515625, 3.1220703125, 3.28704833984375, 3.4520263671875, 3.61700439453125, 3.781982421875, 3.94696044921875, 4.1119384765625, 4.27691650390625, 4.44189453125, 4.60687255859375, 4.7718505859375, 4.93682861328125, 5.101806640625, 5.26678466796875, 5.4317626953125, 5.59674072265625, 5.76171875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 2.0, 1.0, 3.0, 8.0, 10.0, 6.0, 7.0, 16.0, 12.0, 12.0, 21.0, 22.0, 21.0, 19.0, 29.0, 31.0, 29.0, 40.0, 44.0, 47.0, 68.0, 97.0, 435.0, 1494.0, 101.0, 60.0, 53.0, 51.0, 41.0, 39.0, 30.0, 25.0, 29.0, 20.0, 25.0, 20.0, 14.0, 10.0, 19.0, 7.0, 6.0, 7.0, 6.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-21.96875, -21.282470703125, -20.59619140625, -19.909912109375, -19.2236328125, -18.537353515625, -17.85107421875, -17.164794921875, -16.478515625, -15.792236328125, -15.10595703125, -14.419677734375, -13.7333984375, -13.047119140625, -12.36083984375, -11.674560546875, -10.98828125, -10.302001953125, -9.61572265625, -8.929443359375, -8.2431640625, -7.556884765625, -6.87060546875, -6.184326171875, -5.498046875, -4.811767578125, -4.12548828125, -3.439208984375, -2.7529296875, -2.066650390625, -1.38037109375, -0.694091796875, -0.0078125, 0.678466796875, 1.36474609375, 2.051025390625, 2.7373046875, 3.423583984375, 4.10986328125, 4.796142578125, 5.482421875, 6.168701171875, 6.85498046875, 7.541259765625, 8.2275390625, 8.913818359375, 9.60009765625, 10.286376953125, 10.97265625, 11.658935546875, 12.34521484375, 13.031494140625, 13.7177734375, 14.404052734375, 15.09033203125, 15.776611328125, 16.462890625, 17.149169921875, 17.83544921875, 18.521728515625, 19.2080078125, 19.894287109375, 20.58056640625, 21.266845703125, 21.953125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 9.0, 14.0, 11.0, 12.0, 12.0, 17.0, 19.0, 35.0, 44.0, 35.0, 58.0, 77.0, 133.0, 177.0, 322.0, 566.0, 2433.0, 56864.0, 3063160.0, 18967.0, 1495.0, 431.0, 226.0, 137.0, 111.0, 71.0, 65.0, 45.0, 25.0, 23.0, 20.0, 23.0, 15.0, 7.0, 11.0, 10.0, 4.0, 4.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-48.25, -46.84619140625, -45.4423828125, -44.03857421875, -42.634765625, -41.23095703125, -39.8271484375, -38.42333984375, -37.01953125, -35.61572265625, -34.2119140625, -32.80810546875, -31.404296875, -30.00048828125, -28.5966796875, -27.19287109375, -25.7890625, -24.38525390625, -22.9814453125, -21.57763671875, -20.173828125, -18.77001953125, -17.3662109375, -15.96240234375, -14.55859375, -13.15478515625, -11.7509765625, -10.34716796875, -8.943359375, -7.53955078125, -6.1357421875, -4.73193359375, -3.328125, -1.92431640625, -0.5205078125, 0.88330078125, 2.287109375, 3.69091796875, 5.0947265625, 6.49853515625, 7.90234375, 9.30615234375, 10.7099609375, 12.11376953125, 13.517578125, 14.92138671875, 16.3251953125, 17.72900390625, 19.1328125, 20.53662109375, 21.9404296875, 23.34423828125, 24.748046875, 26.15185546875, 27.5556640625, 28.95947265625, 30.36328125, 31.76708984375, 33.1708984375, 34.57470703125, 35.978515625, 37.38232421875, 38.7861328125, 40.18994140625, 41.59375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 36.0, 369.0, 500.0, 98.0, 9.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-197.15797424316406, -193.44810485839844, -189.7382354736328, -186.02835083007812, -182.3184814453125, -178.60861206054688, -174.89874267578125, -171.18885803222656, -167.47898864746094, -163.7691192626953, -160.0592498779297, -156.349365234375, -152.63949584960938, -148.92962646484375, -145.21975708007812, -141.50987243652344, -137.8000030517578, -134.0901336669922, -130.38026428222656, -126.6703872680664, -122.96051025390625, -119.25064086914062, -115.54076385498047, -111.83089447021484, -108.12102508544922, -104.4111557006836, -100.70127868652344, -96.99140930175781, -93.28153228759766, -89.57166290283203, -85.86178588867188, -82.15191650390625, -78.44204711914062, -74.732177734375, -71.02230072021484, -67.31243133544922, -63.60255432128906, -59.89268493652344, -56.18280792236328, -52.472938537597656, -48.7630615234375, -45.05318832397461, -41.34331512451172, -37.63344192504883, -33.92356872558594, -30.21369743347168, -26.50382423400879, -22.7939510345459, -19.084075927734375, -15.374202728271484, -11.664329528808594, -7.9544572830200195, -4.244584083557129, -0.5347118377685547, 3.175161361694336, 6.885034561157227, 10.594907760620117, 14.304780960083008, 18.0146541595459, 21.724525451660156, 25.434398651123047, 29.144271850585938, 32.85414505004883, 36.56401824951172, 40.27389144897461]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 5.0, 3.0, 11.0, 10.0, 16.0, 16.0, 17.0, 19.0, 24.0, 31.0, 22.0, 33.0, 39.0, 36.0, 29.0, 34.0, 37.0, 43.0, 44.0, 41.0, 40.0, 36.0, 39.0, 42.0, 51.0, 24.0, 30.0, 34.0, 27.0, 19.0, 25.0, 16.0, 22.0, 17.0, 11.0, 12.0, 12.0, 9.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.47752380371094, -67.2846908569336, -65.09185028076172, -62.899017333984375, -60.706180572509766, -58.513343811035156, -56.32051086425781, -54.1276741027832, -51.934837341308594, -49.742000579833984, -47.549163818359375, -45.35633087158203, -43.16349411010742, -40.97065734863281, -38.77782440185547, -36.58498764038086, -34.39215087890625, -32.19931411743164, -30.006479263305664, -27.813644409179688, -25.620807647705078, -23.42797088623047, -21.235136032104492, -19.042301177978516, -16.849464416503906, -14.656628608703613, -12.46379280090332, -10.270956993103027, -8.078121185302734, -5.885285377502441, -3.6924495697021484, -1.4996137619018555, 0.6932220458984375, 2.8860578536987305, 5.078893661499023, 7.271729469299316, 9.46456527709961, 11.657401084899902, 13.850236892700195, 16.043071746826172, 18.23590850830078, 20.42874526977539, 22.621580123901367, 24.814414978027344, 27.007251739501953, 29.200088500976562, 31.39292335510254, 33.585758209228516, 35.778594970703125, 37.971431732177734, 40.164268493652344, 42.35710144042969, 44.5499382019043, 46.742774963378906, 48.93560791015625, 51.12844467163086, 53.32128143310547, 55.51411819458008, 57.70695495605469, 59.89978790283203, 62.09262466430664, 64.28546142578125, 66.4782943725586, 68.67113494873047, 70.86396789550781]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 3.0, 1.0, 9.0, 8.0, 16.0, 12.0, 15.0, 16.0, 23.0, 16.0, 34.0, 40.0, 33.0, 41.0, 52.0, 33.0, 36.0, 42.0, 42.0, 53.0, 46.0, 53.0, 23.0, 43.0, 47.0, 33.0, 31.0, 39.0, 28.0, 21.0, 18.0, 12.0, 14.0, 7.0, 13.0, 12.0, 4.0, 9.0, 6.0, 9.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.37109375, -6.1612548828125, -5.951416015625, -5.7415771484375, -5.53173828125, -5.3218994140625, -5.112060546875, -4.9022216796875, -4.6923828125, -4.4825439453125, -4.272705078125, -4.0628662109375, -3.85302734375, -3.6431884765625, -3.433349609375, -3.2235107421875, -3.013671875, -2.8038330078125, -2.593994140625, -2.3841552734375, -2.17431640625, -1.9644775390625, -1.754638671875, -1.5447998046875, -1.3349609375, -1.1251220703125, -0.915283203125, -0.7054443359375, -0.49560546875, -0.2857666015625, -0.075927734375, 0.1339111328125, 0.34375, 0.5535888671875, 0.763427734375, 0.9732666015625, 1.18310546875, 1.3929443359375, 1.602783203125, 1.8126220703125, 2.0224609375, 2.2322998046875, 2.442138671875, 2.6519775390625, 2.86181640625, 3.0716552734375, 3.281494140625, 3.4913330078125, 3.701171875, 3.9110107421875, 4.120849609375, 4.3306884765625, 4.54052734375, 4.7503662109375, 4.960205078125, 5.1700439453125, 5.3798828125, 5.5897216796875, 5.799560546875, 6.0093994140625, 6.21923828125, 6.4290771484375, 6.638916015625, 6.8487548828125, 7.05859375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 6.0, 8.0, 8.0, 8.0, 9.0, 11.0, 26.0, 33.0, 34.0, 57.0, 79.0, 148.0, 218.0, 339.0, 585.0, 1068.0, 1928.0, 3717.0, 7375.0, 15639.0, 37233.0, 105761.0, 365095.0, 1093905.0, 1515747.0, 722036.0, 207422.0, 67642.0, 25548.0, 10908.0, 5357.0, 2808.0, 1490.0, 762.0, 482.0, 280.0, 156.0, 105.0, 72.0, 48.0, 41.0, 32.0, 20.0, 13.0, 7.0, 9.0, 4.0, 4.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.97265625, -6.73455810546875, -6.4964599609375, -6.25836181640625, -6.020263671875, -5.78216552734375, -5.5440673828125, -5.30596923828125, -5.06787109375, -4.82977294921875, -4.5916748046875, -4.35357666015625, -4.115478515625, -3.87738037109375, -3.6392822265625, -3.40118408203125, -3.1630859375, -2.92498779296875, -2.6868896484375, -2.44879150390625, -2.210693359375, -1.97259521484375, -1.7344970703125, -1.49639892578125, -1.25830078125, -1.02020263671875, -0.7821044921875, -0.54400634765625, -0.305908203125, -0.06781005859375, 0.1702880859375, 0.40838623046875, 0.646484375, 0.88458251953125, 1.1226806640625, 1.36077880859375, 1.598876953125, 1.83697509765625, 2.0750732421875, 2.31317138671875, 2.55126953125, 2.78936767578125, 3.0274658203125, 3.26556396484375, 3.503662109375, 3.74176025390625, 3.9798583984375, 4.21795654296875, 4.4560546875, 4.69415283203125, 4.9322509765625, 5.17034912109375, 5.408447265625, 5.64654541015625, 5.8846435546875, 6.12274169921875, 6.36083984375, 6.59893798828125, 6.8370361328125, 7.07513427734375, 7.313232421875, 7.55133056640625, 7.7894287109375, 8.02752685546875, 8.265625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 12.0, 15.0, 15.0, 25.0, 32.0, 36.0, 41.0, 51.0, 93.0, 94.0, 141.0, 181.0, 230.0, 338.0, 397.0, 439.0, 391.0, 357.0, 261.0, 209.0, 184.0, 127.0, 98.0, 75.0, 60.0, 46.0, 31.0, 19.0, 21.0, 14.0, 12.0, 8.0, 2.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.34375, -14.8897705078125, -14.435791015625, -13.9818115234375, -13.52783203125, -13.0738525390625, -12.619873046875, -12.1658935546875, -11.7119140625, -11.2579345703125, -10.803955078125, -10.3499755859375, -9.89599609375, -9.4420166015625, -8.988037109375, -8.5340576171875, -8.080078125, -7.6260986328125, -7.172119140625, -6.7181396484375, -6.26416015625, -5.8101806640625, -5.356201171875, -4.9022216796875, -4.4482421875, -3.9942626953125, -3.540283203125, -3.0863037109375, -2.63232421875, -2.1783447265625, -1.724365234375, -1.2703857421875, -0.81640625, -0.3624267578125, 0.091552734375, 0.5455322265625, 0.99951171875, 1.4534912109375, 1.907470703125, 2.3614501953125, 2.8154296875, 3.2694091796875, 3.723388671875, 4.1773681640625, 4.63134765625, 5.0853271484375, 5.539306640625, 5.9932861328125, 6.447265625, 6.9012451171875, 7.355224609375, 7.8092041015625, 8.26318359375, 8.7171630859375, 9.171142578125, 9.6251220703125, 10.0791015625, 10.5330810546875, 10.987060546875, 11.4410400390625, 11.89501953125, 12.3489990234375, 12.802978515625, 13.2569580078125, 13.7109375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 9.0, 6.0, 16.0, 15.0, 34.0, 35.0, 56.0, 78.0, 107.0, 192.0, 385.0, 1270.0, 19193.0, 2883042.0, 1276794.0, 11291.0, 912.0, 336.0, 174.0, 115.0, 64.0, 35.0, 36.0, 32.0, 19.0, 7.0, 13.0, 7.0, 4.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.75, -47.8310546875, -45.912109375, -43.9931640625, -42.07421875, -40.1552734375, -38.236328125, -36.3173828125, -34.3984375, -32.4794921875, -30.560546875, -28.6416015625, -26.72265625, -24.8037109375, -22.884765625, -20.9658203125, -19.046875, -17.1279296875, -15.208984375, -13.2900390625, -11.37109375, -9.4521484375, -7.533203125, -5.6142578125, -3.6953125, -1.7763671875, 0.142578125, 2.0615234375, 3.98046875, 5.8994140625, 7.818359375, 9.7373046875, 11.65625, 13.5751953125, 15.494140625, 17.4130859375, 19.33203125, 21.2509765625, 23.169921875, 25.0888671875, 27.0078125, 28.9267578125, 30.845703125, 32.7646484375, 34.68359375, 36.6025390625, 38.521484375, 40.4404296875, 42.359375, 44.2783203125, 46.197265625, 48.1162109375, 50.03515625, 51.9541015625, 53.873046875, 55.7919921875, 57.7109375, 59.6298828125, 61.548828125, 63.4677734375, 65.38671875, 67.3056640625, 69.224609375, 71.1435546875, 73.0625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 17.0, 42.0, 104.0, 214.0, 291.0, 178.0, 109.0, 39.0, 10.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-264.9073486328125, -259.5574951171875, -254.2076416015625, -248.8577880859375, -243.5079345703125, -238.1580810546875, -232.8082275390625, -227.4583740234375, -222.1085205078125, -216.7586669921875, -211.4088134765625, -206.0589599609375, -200.7091064453125, -195.3592529296875, -190.0093994140625, -184.6595458984375, -179.3096923828125, -173.9598388671875, -168.6099853515625, -163.2601318359375, -157.9102783203125, -152.5604248046875, -147.2105712890625, -141.8607177734375, -136.51084899902344, -131.16099548339844, -125.81114196777344, -120.46128845214844, -115.11143493652344, -109.76158142089844, -104.41172790527344, -99.06187438964844, -93.71202850341797, -88.36217498779297, -83.01232147216797, -77.66246795654297, -72.31261444091797, -66.96276092529297, -61.6129035949707, -56.2630500793457, -50.9131965637207, -45.5633430480957, -40.2134895324707, -34.86363220214844, -29.51378059387207, -24.16392707824707, -18.814071655273438, -13.464218139648438, -8.114364624023438, -2.7645106315612793, 2.585343360900879, 7.935197830200195, 13.285051345825195, 18.634904861450195, 23.984760284423828, 29.334613800048828, 34.68446731567383, 40.03432083129883, 45.38417434692383, 50.734031677246094, 56.083885192871094, 61.433738708496094, 66.7835922241211, 72.1334457397461, 77.4832992553711]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 6.0, 11.0, 14.0, 14.0, 11.0, 16.0, 11.0, 15.0, 19.0, 21.0, 27.0, 24.0, 33.0, 32.0, 34.0, 34.0, 36.0, 39.0, 35.0, 35.0, 44.0, 38.0, 46.0, 47.0, 44.0, 32.0, 36.0, 29.0, 29.0, 23.0, 21.0, 18.0, 18.0, 14.0, 19.0, 16.0, 11.0, 13.0, 7.0, 6.0, 5.0, 5.0, 4.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.63923645019531, -45.09027862548828, -43.54132080078125, -41.99236297607422, -40.44340515136719, -38.89445114135742, -37.34549331665039, -35.79653549194336, -34.24757766723633, -32.6986198425293, -31.149662017822266, -29.600706100463867, -28.051748275756836, -26.502790451049805, -24.953834533691406, -23.404876708984375, -21.855918884277344, -20.306961059570312, -18.75800323486328, -17.209047317504883, -15.660089492797852, -14.11113166809082, -12.562174797058105, -11.01321792602539, -9.46426010131836, -7.915302753448486, -6.366345405578613, -4.81738805770874, -3.268430709838867, -1.7194733619689941, -0.1705160140991211, 1.3784408569335938, 2.9273948669433594, 4.476352214813232, 6.0253095626831055, 7.5742669105529785, 9.123224258422852, 10.672182083129883, 12.221138954162598, 13.770095825195312, 15.319053649902344, 16.868011474609375, 18.416969299316406, 19.965925216674805, 21.514883041381836, 23.063840866088867, 24.612796783447266, 26.161754608154297, 27.710712432861328, 29.25967025756836, 30.80862808227539, 32.35758590698242, 33.90653991699219, 35.45549774169922, 37.00445556640625, 38.55341339111328, 40.10237121582031, 41.651329040527344, 43.200286865234375, 44.749244689941406, 46.29820251464844, 47.8471565246582, 49.396114349365234, 50.945072174072266, 52.4940299987793]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 10.0, 5.0, 7.0, 13.0, 11.0, 14.0, 14.0, 22.0, 21.0, 26.0, 28.0, 35.0, 36.0, 50.0, 31.0, 39.0, 36.0, 51.0, 40.0, 49.0, 53.0, 56.0, 33.0, 34.0, 50.0, 37.0, 24.0, 25.0, 25.0, 27.0, 13.0, 20.0, 8.0, 15.0, 12.0, 8.0, 6.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.421875, -7.20269775390625, -6.9835205078125, -6.76434326171875, -6.545166015625, -6.32598876953125, -6.1068115234375, -5.88763427734375, -5.66845703125, -5.44927978515625, -5.2301025390625, -5.01092529296875, -4.791748046875, -4.57257080078125, -4.3533935546875, -4.13421630859375, -3.9150390625, -3.69586181640625, -3.4766845703125, -3.25750732421875, -3.038330078125, -2.81915283203125, -2.5999755859375, -2.38079833984375, -2.16162109375, -1.94244384765625, -1.7232666015625, -1.50408935546875, -1.284912109375, -1.06573486328125, -0.8465576171875, -0.62738037109375, -0.408203125, -0.18902587890625, 0.0301513671875, 0.24932861328125, 0.468505859375, 0.68768310546875, 0.9068603515625, 1.12603759765625, 1.34521484375, 1.56439208984375, 1.7835693359375, 2.00274658203125, 2.221923828125, 2.44110107421875, 2.6602783203125, 2.87945556640625, 3.0986328125, 3.31781005859375, 3.5369873046875, 3.75616455078125, 3.975341796875, 4.19451904296875, 4.4136962890625, 4.63287353515625, 4.85205078125, 5.07122802734375, 5.2904052734375, 5.50958251953125, 5.728759765625, 5.94793701171875, 6.1671142578125, 6.38629150390625, 6.60546875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 13.0, 14.0, 18.0, 47.0, 53.0, 86.0, 101.0, 141.0, 238.0, 357.0, 517.0, 744.0, 1037.0, 1559.0, 2328.0, 3363.0, 4913.0, 7489.0, 11303.0, 17080.0, 26640.0, 40820.0, 63668.0, 99486.0, 150787.0, 185090.0, 150112.0, 99005.0, 63050.0, 40508.0, 26026.0, 17060.0, 11387.0, 7618.0, 5078.0, 3445.0, 2341.0, 1597.0, 1085.0, 730.0, 534.0, 339.0, 260.0, 167.0, 93.0, 86.0, 51.0, 38.0, 15.0, 21.0, 7.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.6708984375, -0.6502532958984375, -0.629608154296875, -0.6089630126953125, -0.58831787109375, -0.5676727294921875, -0.547027587890625, -0.5263824462890625, -0.5057373046875, -0.4850921630859375, -0.464447021484375, -0.4438018798828125, -0.42315673828125, -0.4025115966796875, -0.381866455078125, -0.3612213134765625, -0.340576171875, -0.3199310302734375, -0.299285888671875, -0.2786407470703125, -0.25799560546875, -0.2373504638671875, -0.216705322265625, -0.1960601806640625, -0.1754150390625, -0.1547698974609375, -0.134124755859375, -0.1134796142578125, -0.09283447265625, -0.0721893310546875, -0.051544189453125, -0.0308990478515625, -0.01025390625, 0.0103912353515625, 0.031036376953125, 0.0516815185546875, 0.07232666015625, 0.0929718017578125, 0.113616943359375, 0.1342620849609375, 0.1549072265625, 0.1755523681640625, 0.196197509765625, 0.2168426513671875, 0.23748779296875, 0.2581329345703125, 0.278778076171875, 0.2994232177734375, 0.320068359375, 0.3407135009765625, 0.361358642578125, 0.3820037841796875, 0.40264892578125, 0.4232940673828125, 0.443939208984375, 0.4645843505859375, 0.4852294921875, 0.5058746337890625, 0.526519775390625, 0.5471649169921875, 0.56781005859375, 0.5884552001953125, 0.609100341796875, 0.6297454833984375, 0.650390625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 10.0, 17.0, 14.0, 22.0, 17.0, 22.0, 19.0, 31.0, 27.0, 30.0, 33.0, 40.0, 38.0, 47.0, 37.0, 45.0, 1064.0, 48.0, 40.0, 40.0, 28.0, 38.0, 30.0, 31.0, 23.0, 24.0, 22.0, 19.0, 22.0, 21.0, 16.0, 15.0, 10.0, 9.0, 12.0, 6.0, 3.0, 6.0, 8.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.923828125, -3.800079345703125, -3.67633056640625, -3.552581787109375, -3.4288330078125, -3.305084228515625, -3.18133544921875, -3.057586669921875, -2.933837890625, -2.810089111328125, -2.68634033203125, -2.562591552734375, -2.4388427734375, -2.315093994140625, -2.19134521484375, -2.067596435546875, -1.94384765625, -1.820098876953125, -1.69635009765625, -1.572601318359375, -1.4488525390625, -1.325103759765625, -1.20135498046875, -1.077606201171875, -0.953857421875, -0.830108642578125, -0.70635986328125, -0.582611083984375, -0.4588623046875, -0.335113525390625, -0.21136474609375, -0.087615966796875, 0.0361328125, 0.159881591796875, 0.28363037109375, 0.407379150390625, 0.5311279296875, 0.654876708984375, 0.77862548828125, 0.902374267578125, 1.026123046875, 1.149871826171875, 1.27362060546875, 1.397369384765625, 1.5211181640625, 1.644866943359375, 1.76861572265625, 1.892364501953125, 2.01611328125, 2.139862060546875, 2.26361083984375, 2.387359619140625, 2.5111083984375, 2.634857177734375, 2.75860595703125, 2.882354736328125, 3.006103515625, 3.129852294921875, 3.25360107421875, 3.377349853515625, 3.5010986328125, 3.624847412109375, 3.74859619140625, 3.872344970703125, 3.99609375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 9.0, 13.0, 20.0, 27.0, 43.0, 72.0, 93.0, 144.0, 233.0, 296.0, 418.0, 616.0, 917.0, 1275.0, 1866.0, 2684.0, 3809.0, 5537.0, 7768.0, 11189.0, 16103.0, 23093.0, 33515.0, 48631.0, 70803.0, 101758.0, 137040.0, 1199263.0, 128170.0, 92665.0, 64258.0, 44338.0, 30433.0, 21282.0, 14930.0, 10381.0, 6994.0, 4994.0, 3569.0, 2415.0, 1602.0, 1238.0, 792.0, 557.0, 409.0, 291.0, 200.0, 119.0, 98.0, 61.0, 38.0, 30.0, 17.0, 11.0, 9.0, 3.0, 3.0, 2.0], "bins": [-0.5439453125, -0.5276451110839844, -0.5113449096679688, -0.4950447082519531, -0.4787445068359375, -0.4624443054199219, -0.44614410400390625, -0.4298439025878906, -0.413543701171875, -0.3972434997558594, -0.38094329833984375, -0.3646430969238281, -0.3483428955078125, -0.3320426940917969, -0.31574249267578125, -0.2994422912597656, -0.28314208984375, -0.2668418884277344, -0.25054168701171875, -0.23424148559570312, -0.2179412841796875, -0.20164108276367188, -0.18534088134765625, -0.16904067993164062, -0.152740478515625, -0.13644027709960938, -0.12014007568359375, -0.10383987426757812, -0.0875396728515625, -0.07123947143554688, -0.05493927001953125, -0.038639068603515625, -0.0223388671875, -0.006038665771484375, 0.01026153564453125, 0.026561737060546875, 0.0428619384765625, 0.059162139892578125, 0.07546234130859375, 0.09176254272460938, 0.108062744140625, 0.12436294555664062, 0.14066314697265625, 0.15696334838867188, 0.1732635498046875, 0.18956375122070312, 0.20586395263671875, 0.22216415405273438, 0.23846435546875, 0.2547645568847656, 0.27106475830078125, 0.2873649597167969, 0.3036651611328125, 0.3199653625488281, 0.33626556396484375, 0.3525657653808594, 0.368865966796875, 0.3851661682128906, 0.40146636962890625, 0.4177665710449219, 0.4340667724609375, 0.4503669738769531, 0.46666717529296875, 0.4829673767089844, 0.499267578125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 4.0, 5.0, 9.0, 11.0, 18.0, 6.0, 20.0, 30.0, 27.0, 38.0, 56.0, 54.0, 73.0, 58.0, 80.0, 90.0, 68.0, 71.0, 63.0, 41.0, 48.0, 26.0, 22.0, 17.0, 17.0, 7.0, 15.0, 4.0, 7.0, 5.0, 3.0, 1.0, 5.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020885467529296875, -0.002019524574279785, -0.0019505023956298828, -0.0018814802169799805, -0.0018124580383300781, -0.0017434358596801758, -0.0016744136810302734, -0.001605391502380371, -0.0015363693237304688, -0.0014673471450805664, -0.001398324966430664, -0.0013293027877807617, -0.0012602806091308594, -0.001191258430480957, -0.0011222362518310547, -0.0010532140731811523, -0.00098419189453125, -0.0009151697158813477, -0.0008461475372314453, -0.000777125358581543, -0.0007081031799316406, -0.0006390810012817383, -0.0005700588226318359, -0.0005010366439819336, -0.00043201446533203125, -0.0003629922866821289, -0.00029397010803222656, -0.00022494792938232422, -0.00015592575073242188, -8.690357208251953e-05, -1.7881393432617188e-05, 5.1140785217285156e-05, 0.0001201629638671875, 0.00018918514251708984, 0.0002582073211669922, 0.00032722949981689453, 0.0003962516784667969, 0.0004652738571166992, 0.0005342960357666016, 0.0006033182144165039, 0.0006723403930664062, 0.0007413625717163086, 0.0008103847503662109, 0.0008794069290161133, 0.0009484291076660156, 0.001017451286315918, 0.0010864734649658203, 0.0011554956436157227, 0.001224517822265625, 0.0012935400009155273, 0.0013625621795654297, 0.001431584358215332, 0.0015006065368652344, 0.0015696287155151367, 0.001638650894165039, 0.0017076730728149414, 0.0017766952514648438, 0.001845717430114746, 0.0019147396087646484, 0.0019837617874145508, 0.002052783966064453, 0.0021218061447143555, 0.002190828323364258, 0.00225985050201416, 0.0023288726806640625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 4.0, 7.0, 4.0, 2.0, 10.0, 13.0, 14.0, 10.0, 24.0, 48.0, 62.0, 73.0, 157.0, 251.0, 550.0, 2639.0, 1023477.0, 19618.0, 752.0, 335.0, 152.0, 103.0, 59.0, 51.0, 36.0, 19.0, 14.0, 22.0, 10.0, 9.0, 9.0, 5.0, 2.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05377197265625, -0.05230522155761719, -0.050838470458984375, -0.04937171936035156, -0.04790496826171875, -0.04643821716308594, -0.044971466064453125, -0.04350471496582031, -0.0420379638671875, -0.04057121276855469, -0.039104461669921875, -0.03763771057128906, -0.03617095947265625, -0.03470420837402344, -0.033237457275390625, -0.03177070617675781, -0.030303955078125, -0.028837203979492188, -0.027370452880859375, -0.025903701782226562, -0.02443695068359375, -0.022970199584960938, -0.021503448486328125, -0.020036697387695312, -0.0185699462890625, -0.017103195190429688, -0.015636444091796875, -0.014169692993164062, -0.01270294189453125, -0.011236190795898438, -0.009769439697265625, -0.008302688598632812, -0.0068359375, -0.0053691864013671875, -0.003902435302734375, -0.0024356842041015625, -0.00096893310546875, 0.0004978179931640625, 0.001964569091796875, 0.0034313201904296875, 0.0048980712890625, 0.0063648223876953125, 0.007831573486328125, 0.009298324584960938, 0.01076507568359375, 0.012231826782226562, 0.013698577880859375, 0.015165328979492188, 0.016632080078125, 0.018098831176757812, 0.019565582275390625, 0.021032333374023438, 0.02249908447265625, 0.023965835571289062, 0.025432586669921875, 0.026899337768554688, 0.0283660888671875, 0.029832839965820312, 0.031299591064453125, 0.03276634216308594, 0.03423309326171875, 0.03569984436035156, 0.037166595458984375, 0.03863334655761719, 0.04010009765625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 44.0, 417.0, 490.0, 64.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029400296043604612, -0.0027150525711476803, -0.002490075770765543, -0.002265098737552762, -0.002040121704339981, -0.001815144787542522, -0.0015901678707450628, -0.0013651908375322819, -0.0011402139207348228, -0.0009152369457297027, -0.0006902599707245827, -0.00046528305392712355, -0.0002403060789220035, -1.532910391688347e-05, 0.00020964781288057566, 0.0004346248460933566, 0.0006596017628908157, 0.0008845787378959358, 0.0011095557129010558, 0.001334532629698515, 0.0015595096629112959, 0.001784486579708755, 0.002009463496506214, 0.002234440529718995, 0.002459417562931776, 0.002684394596144557, 0.0029093713965266943, 0.0031343484297394753, 0.003359325462952256, 0.003584302496165037, 0.0038092792965471745, 0.004034256562590599, 0.004259232897311449, 0.004484209697693586, 0.004709186963737011, 0.004934163764119148, 0.0051591405645012856, 0.00538411783054471, 0.0056090946309268475, 0.005834071896970272, 0.006059048697352409, 0.006284025497734547, 0.006509002763777971, 0.0067339795641601086, 0.006958956364542246, 0.0071839336305856705, 0.007408910430967808, 0.007633887231349945, 0.007858864031732082, 0.00808384083211422, 0.008308817632496357, 0.008533794432878494, 0.008758772164583206, 0.008983748964965343, 0.00920872576534748, 0.009433702565729618, 0.00965868029743433, 0.009883657097816467, 0.010108633898198605, 0.010333610698580742, 0.010558588430285454, 0.010783565230667591, 0.011008542031049728, 0.011233518831431866, 0.011458495631814003]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 11.0, 3.0, 10.0, 8.0, 12.0, 10.0, 15.0, 18.0, 26.0, 25.0, 20.0, 44.0, 38.0, 37.0, 47.0, 31.0, 55.0, 36.0, 45.0, 49.0, 48.0, 39.0, 47.0, 48.0, 37.0, 32.0, 31.0, 25.0, 24.0, 25.0, 24.0, 15.0, 16.0, 10.0, 11.0, 9.0, 8.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008756518363952637, -0.0008439505472779274, -0.0008122492581605911, -0.0007805479690432549, -0.0007488466799259186, -0.0007171453908085823, -0.000685444101691246, -0.0006537428125739098, -0.0006220415234565735, -0.0005903402343392372, -0.0005586389452219009, -0.0005269376561045647, -0.0004952363669872284, -0.0004635350778698921, -0.00043183378875255585, -0.0004001324996352196, -0.0003684312105178833, -0.00033672992140054703, -0.00030502863228321075, -0.0002733273431658745, -0.0002416260540485382, -0.00020992476493120193, -0.00017822347581386566, -0.0001465221866965294, -0.00011482089757919312, -8.311960846185684e-05, -5.141831934452057e-05, -1.9717030227184296e-05, 1.1984258890151978e-05, 4.368554800748825e-05, 7.538683712482452e-05, 0.0001070881262421608, 0.00013878941535949707, 0.00017049070447683334, 0.00020219199359416962, 0.0002338932827115059, 0.00026559457182884216, 0.00029729586094617844, 0.0003289971500635147, 0.000360698439180851, 0.00039239972829818726, 0.00042410101741552353, 0.0004558023065328598, 0.0004875035956501961, 0.0005192048847675323, 0.0005509061738848686, 0.0005826074630022049, 0.0006143087521195412, 0.0006460100412368774, 0.0006777113303542137, 0.00070941261947155, 0.0007411139085888863, 0.0007728151977062225, 0.0008045164868235588, 0.0008362177759408951, 0.0008679190650582314, 0.0008996203541755676, 0.0009313216432929039, 0.0009630229324102402, 0.0009947242215275764, 0.0010264255106449127, 0.001058126799762249, 0.0010898280888795853, 0.0011215293779969215, 0.0011532306671142578]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 10.0, 5.0, 7.0, 13.0, 11.0, 14.0, 14.0, 22.0, 21.0, 26.0, 28.0, 36.0, 35.0, 50.0, 31.0, 39.0, 36.0, 51.0, 40.0, 49.0, 53.0, 56.0, 33.0, 34.0, 50.0, 37.0, 24.0, 25.0, 25.0, 27.0, 13.0, 20.0, 8.0, 15.0, 12.0, 8.0, 6.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.421875, -7.20269775390625, -6.9835205078125, -6.76434326171875, -6.545166015625, -6.32598876953125, -6.1068115234375, -5.88763427734375, -5.66845703125, -5.44927978515625, -5.2301025390625, -5.01092529296875, -4.791748046875, -4.57257080078125, -4.3533935546875, -4.13421630859375, -3.9150390625, -3.69586181640625, -3.4766845703125, -3.25750732421875, -3.038330078125, -2.81915283203125, -2.5999755859375, -2.38079833984375, -2.16162109375, -1.94244384765625, -1.7232666015625, -1.50408935546875, -1.284912109375, -1.06573486328125, -0.8465576171875, -0.62738037109375, -0.408203125, -0.18902587890625, 0.0301513671875, 0.24932861328125, 0.468505859375, 0.68768310546875, 0.9068603515625, 1.12603759765625, 1.34521484375, 1.56439208984375, 1.7835693359375, 2.00274658203125, 2.221923828125, 2.44110107421875, 2.6602783203125, 2.87945556640625, 3.0986328125, 3.31781005859375, 3.5369873046875, 3.75616455078125, 3.975341796875, 4.19451904296875, 4.4136962890625, 4.63287353515625, 4.85205078125, 5.07122802734375, 5.2904052734375, 5.50958251953125, 5.728759765625, 5.94793701171875, 6.1671142578125, 6.38629150390625, 6.60546875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 10.0, 14.0, 19.0, 21.0, 27.0, 39.0, 45.0, 57.0, 91.0, 153.0, 222.0, 321.0, 493.0, 760.0, 1272.0, 2102.0, 3968.0, 7564.0, 15943.0, 37630.0, 109448.0, 424906.0, 304831.0, 81402.0, 29548.0, 13013.0, 6310.0, 3330.0, 1835.0, 1088.0, 690.0, 463.0, 287.0, 199.0, 151.0, 79.0, 54.0, 50.0, 38.0, 18.0, 14.0, 13.0, 14.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.09375, -4.943359375, -4.79296875, -4.642578125, -4.4921875, -4.341796875, -4.19140625, -4.041015625, -3.890625, -3.740234375, -3.58984375, -3.439453125, -3.2890625, -3.138671875, -2.98828125, -2.837890625, -2.6875, -2.537109375, -2.38671875, -2.236328125, -2.0859375, -1.935546875, -1.78515625, -1.634765625, -1.484375, -1.333984375, -1.18359375, -1.033203125, -0.8828125, -0.732421875, -0.58203125, -0.431640625, -0.28125, -0.130859375, 0.01953125, 0.169921875, 0.3203125, 0.470703125, 0.62109375, 0.771484375, 0.921875, 1.072265625, 1.22265625, 1.373046875, 1.5234375, 1.673828125, 1.82421875, 1.974609375, 2.125, 2.275390625, 2.42578125, 2.576171875, 2.7265625, 2.876953125, 3.02734375, 3.177734375, 3.328125, 3.478515625, 3.62890625, 3.779296875, 3.9296875, 4.080078125, 4.23046875, 4.380859375, 4.53125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 6.0, 2.0, 10.0, 7.0, 8.0, 9.0, 17.0, 15.0, 20.0, 24.0, 26.0, 21.0, 35.0, 30.0, 39.0, 37.0, 45.0, 59.0, 67.0, 116.0, 1639.0, 279.0, 89.0, 55.0, 56.0, 46.0, 38.0, 40.0, 30.0, 36.0, 26.0, 18.0, 19.0, 18.0, 14.0, 9.0, 9.0, 11.0, 6.0, 4.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.609375, -19.866455078125, -19.12353515625, -18.380615234375, -17.6376953125, -16.894775390625, -16.15185546875, -15.408935546875, -14.666015625, -13.923095703125, -13.18017578125, -12.437255859375, -11.6943359375, -10.951416015625, -10.20849609375, -9.465576171875, -8.72265625, -7.979736328125, -7.23681640625, -6.493896484375, -5.7509765625, -5.008056640625, -4.26513671875, -3.522216796875, -2.779296875, -2.036376953125, -1.29345703125, -0.550537109375, 0.1923828125, 0.935302734375, 1.67822265625, 2.421142578125, 3.1640625, 3.906982421875, 4.64990234375, 5.392822265625, 6.1357421875, 6.878662109375, 7.62158203125, 8.364501953125, 9.107421875, 9.850341796875, 10.59326171875, 11.336181640625, 12.0791015625, 12.822021484375, 13.56494140625, 14.307861328125, 15.05078125, 15.793701171875, 16.53662109375, 17.279541015625, 18.0224609375, 18.765380859375, 19.50830078125, 20.251220703125, 20.994140625, 21.737060546875, 22.47998046875, 23.222900390625, 23.9658203125, 24.708740234375, 25.45166015625, 26.194580078125, 26.9375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 13.0, 21.0, 23.0, 46.0, 79.0, 136.0, 309.0, 994.0, 51605.0, 3089864.0, 1786.0, 445.0, 153.0, 89.0, 52.0, 41.0, 24.0, 12.0, 14.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.375, -148.58203125, -144.7890625, -140.99609375, -137.203125, -133.41015625, -129.6171875, -125.82421875, -122.03125, -118.23828125, -114.4453125, -110.65234375, -106.859375, -103.06640625, -99.2734375, -95.48046875, -91.6875, -87.89453125, -84.1015625, -80.30859375, -76.515625, -72.72265625, -68.9296875, -65.13671875, -61.34375, -57.55078125, -53.7578125, -49.96484375, -46.171875, -42.37890625, -38.5859375, -34.79296875, -31.0, -27.20703125, -23.4140625, -19.62109375, -15.828125, -12.03515625, -8.2421875, -4.44921875, -0.65625, 3.13671875, 6.9296875, 10.72265625, 14.515625, 18.30859375, 22.1015625, 25.89453125, 29.6875, 33.48046875, 37.2734375, 41.06640625, 44.859375, 48.65234375, 52.4453125, 56.23828125, 60.03125, 63.82421875, 67.6171875, 71.41015625, 75.203125, 78.99609375, 82.7890625, 86.58203125, 90.375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [6.0, 983.0, 30.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.737899780273438, -9.958105087280273, 4.821689605712891, 19.601486206054688, 34.38127899169922, 49.16107177734375, 63.94087219238281, 78.72066497802734, 93.50045776367188, 108.2802505493164, 123.06004333496094, 137.83984375, 152.61962890625, 167.39942932128906, 182.17922973632812, 196.95901489257812, 211.7388153076172, 226.51861572265625, 241.29840087890625, 256.07818603515625, 270.8580017089844, 285.6377868652344, 300.4176025390625, 315.1973876953125, 329.9771728515625, 344.7569580078125, 359.5367736816406, 374.3165588378906, 389.0963439941406, 403.87615966796875, 418.65594482421875, 433.43572998046875, 448.21551513671875, 462.99530029296875, 477.7751159667969, 492.5549011230469, 507.3346862792969, 522.114501953125, 536.894287109375, 551.674072265625, 566.453857421875, 581.233642578125, 596.013427734375, 610.793212890625, 625.5730590820312, 640.3528442382812, 655.1326293945312, 669.9124145507812, 684.6922607421875, 699.4720458984375, 714.2518310546875, 729.0316162109375, 743.8114624023438, 758.5912475585938, 773.3710327148438, 788.1508178710938, 802.9306030273438, 817.7103881835938, 832.4901733398438, 847.27001953125, 862.0498046875, 876.82958984375, 891.609375, 906.38916015625, 921.1689453125]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 9.0, 10.0, 8.0, 4.0, 15.0, 18.0, 15.0, 10.0, 22.0, 18.0, 24.0, 21.0, 33.0, 21.0, 21.0, 34.0, 30.0, 32.0, 41.0, 31.0, 39.0, 46.0, 36.0, 37.0, 41.0, 36.0, 21.0, 42.0, 39.0, 17.0, 30.0, 23.0, 23.0, 23.0, 23.0, 24.0, 11.0, 12.0, 13.0, 6.0, 8.0, 5.0, 5.0, 5.0, 8.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0], "bins": [-57.706512451171875, -55.98161697387695, -54.25672149658203, -52.531822204589844, -50.80692672729492, -49.08203125, -47.35713195800781, -45.63223648071289, -43.90734100341797, -42.18244552612305, -40.457550048828125, -38.73265075683594, -37.007755279541016, -35.282859802246094, -33.557960510253906, -31.833065032958984, -30.108169555664062, -28.38327407836914, -26.658376693725586, -24.93347930908203, -23.20858383178711, -21.483688354492188, -19.758790969848633, -18.033893585205078, -16.308998107910156, -14.584101676940918, -12.85920524597168, -11.134308815002441, -9.409412384033203, -7.684515953063965, -5.959619522094727, -4.234723091125488, -2.50982666015625, -0.7849302291870117, 0.9399662017822266, 2.664862632751465, 4.389759063720703, 6.114655494689941, 7.83955192565918, 9.564448356628418, 11.289344787597656, 13.014241218566895, 14.739137649536133, 16.464035034179688, 18.18893051147461, 19.91382598876953, 21.638723373413086, 23.36362075805664, 25.088516235351562, 26.813411712646484, 28.53830909729004, 30.263206481933594, 31.988101959228516, 33.71299743652344, 35.437896728515625, 37.16279220581055, 38.88768768310547, 40.61258316040039, 42.33747863769531, 44.0623779296875, 45.78727340698242, 47.512168884277344, 49.23706817626953, 50.96196365356445, 52.686859130859375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 10.0, 7.0, 7.0, 9.0, 12.0, 11.0, 19.0, 31.0, 21.0, 25.0, 31.0, 33.0, 34.0, 33.0, 47.0, 38.0, 45.0, 40.0, 43.0, 41.0, 57.0, 49.0, 35.0, 44.0, 37.0, 27.0, 30.0, 18.0, 29.0, 30.0, 11.0, 21.0, 11.0, 13.0, 8.0, 11.0, 10.0, 6.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.6875, -7.46563720703125, -7.2437744140625, -7.02191162109375, -6.800048828125, -6.57818603515625, -6.3563232421875, -6.13446044921875, -5.91259765625, -5.69073486328125, -5.4688720703125, -5.24700927734375, -5.025146484375, -4.80328369140625, -4.5814208984375, -4.35955810546875, -4.1376953125, -3.91583251953125, -3.6939697265625, -3.47210693359375, -3.250244140625, -3.02838134765625, -2.8065185546875, -2.58465576171875, -2.36279296875, -2.14093017578125, -1.9190673828125, -1.69720458984375, -1.475341796875, -1.25347900390625, -1.0316162109375, -0.80975341796875, -0.587890625, -0.36602783203125, -0.1441650390625, 0.07769775390625, 0.299560546875, 0.52142333984375, 0.7432861328125, 0.96514892578125, 1.18701171875, 1.40887451171875, 1.6307373046875, 1.85260009765625, 2.074462890625, 2.29632568359375, 2.5181884765625, 2.74005126953125, 2.9619140625, 3.18377685546875, 3.4056396484375, 3.62750244140625, 3.849365234375, 4.07122802734375, 4.2930908203125, 4.51495361328125, 4.73681640625, 4.95867919921875, 5.1805419921875, 5.40240478515625, 5.624267578125, 5.84613037109375, 6.0679931640625, 6.28985595703125, 6.51171875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 5.0, 7.0, 4.0, 3.0, 9.0, 15.0, 9.0, 18.0, 18.0, 15.0, 28.0, 34.0, 35.0, 58.0, 74.0, 101.0, 149.0, 342.0, 1824.0, 30750.0, 2932027.0, 1214169.0, 12724.0, 1038.0, 258.0, 151.0, 96.0, 71.0, 44.0, 39.0, 25.0, 27.0, 18.0, 18.0, 13.0, 14.0, 9.0, 6.0, 7.0, 10.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-37.3125, -36.2109375, -35.109375, -34.0078125, -32.90625, -31.8046875, -30.703125, -29.6015625, -28.5, -27.3984375, -26.296875, -25.1953125, -24.09375, -22.9921875, -21.890625, -20.7890625, -19.6875, -18.5859375, -17.484375, -16.3828125, -15.28125, -14.1796875, -13.078125, -11.9765625, -10.875, -9.7734375, -8.671875, -7.5703125, -6.46875, -5.3671875, -4.265625, -3.1640625, -2.0625, -0.9609375, 0.140625, 1.2421875, 2.34375, 3.4453125, 4.546875, 5.6484375, 6.75, 7.8515625, 8.953125, 10.0546875, 11.15625, 12.2578125, 13.359375, 14.4609375, 15.5625, 16.6640625, 17.765625, 18.8671875, 19.96875, 21.0703125, 22.171875, 23.2734375, 24.375, 25.4765625, 26.578125, 27.6796875, 28.78125, 29.8828125, 30.984375, 32.0859375, 33.1875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 6.0, 11.0, 15.0, 26.0, 36.0, 37.0, 60.0, 93.0, 132.0, 193.0, 278.0, 421.0, 534.0, 560.0, 460.0, 351.0, 297.0, 166.0, 124.0, 87.0, 50.0, 48.0, 25.0, 19.0, 11.0, 5.0, 7.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.296875, -18.717529296875, -18.13818359375, -17.558837890625, -16.9794921875, -16.400146484375, -15.82080078125, -15.241455078125, -14.662109375, -14.082763671875, -13.50341796875, -12.924072265625, -12.3447265625, -11.765380859375, -11.18603515625, -10.606689453125, -10.02734375, -9.447998046875, -8.86865234375, -8.289306640625, -7.7099609375, -7.130615234375, -6.55126953125, -5.971923828125, -5.392578125, -4.813232421875, -4.23388671875, -3.654541015625, -3.0751953125, -2.495849609375, -1.91650390625, -1.337158203125, -0.7578125, -0.178466796875, 0.40087890625, 0.980224609375, 1.5595703125, 2.138916015625, 2.71826171875, 3.297607421875, 3.876953125, 4.456298828125, 5.03564453125, 5.614990234375, 6.1943359375, 6.773681640625, 7.35302734375, 7.932373046875, 8.51171875, 9.091064453125, 9.67041015625, 10.249755859375, 10.8291015625, 11.408447265625, 11.98779296875, 12.567138671875, 13.146484375, 13.725830078125, 14.30517578125, 14.884521484375, 15.4638671875, 16.043212890625, 16.62255859375, 17.201904296875, 17.78125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 8.0, 15.0, 20.0, 21.0, 39.0, 33.0, 60.0, 59.0, 113.0, 150.0, 215.0, 342.0, 721.0, 1998.0, 21394.0, 2316762.0, 1830759.0, 17978.0, 1920.0, 647.0, 278.0, 196.0, 130.0, 100.0, 81.0, 56.0, 41.0, 30.0, 32.0, 21.0, 15.0, 10.0, 7.0, 5.0, 3.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.53125, -47.87890625, -46.2265625, -44.57421875, -42.921875, -41.26953125, -39.6171875, -37.96484375, -36.3125, -34.66015625, -33.0078125, -31.35546875, -29.703125, -28.05078125, -26.3984375, -24.74609375, -23.09375, -21.44140625, -19.7890625, -18.13671875, -16.484375, -14.83203125, -13.1796875, -11.52734375, -9.875, -8.22265625, -6.5703125, -4.91796875, -3.265625, -1.61328125, 0.0390625, 1.69140625, 3.34375, 4.99609375, 6.6484375, 8.30078125, 9.953125, 11.60546875, 13.2578125, 14.91015625, 16.5625, 18.21484375, 19.8671875, 21.51953125, 23.171875, 24.82421875, 26.4765625, 28.12890625, 29.78125, 31.43359375, 33.0859375, 34.73828125, 36.390625, 38.04296875, 39.6953125, 41.34765625, 43.0, 44.65234375, 46.3046875, 47.95703125, 49.609375, 51.26171875, 52.9140625, 54.56640625, 56.21875]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 19.0, 58.0, 136.0, 206.0, 240.0, 181.0, 100.0, 47.0, 12.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.32273864746094, -199.71424865722656, -195.10574340820312, -190.49725341796875, -185.88876342773438, -181.2802734375, -176.67176818847656, -172.0632781982422, -167.45477294921875, -162.84628295898438, -158.23777770996094, -153.62928771972656, -149.0207977294922, -144.41229248046875, -139.80380249023438, -135.1953125, -130.58682250976562, -125.97832489013672, -121.36983489990234, -116.76133728027344, -112.15284729003906, -107.54434967041016, -102.93585205078125, -98.32736206054688, -93.71886444091797, -89.11036682128906, -84.50187683105469, -79.89337921142578, -75.28488159179688, -70.6763916015625, -66.0678939819336, -61.45940017700195, -56.850914001464844, -52.2424201965332, -47.63392639160156, -43.025428771972656, -38.416934967041016, -33.808441162109375, -29.1999454498291, -24.591449737548828, -19.982955932617188, -15.37446117401123, -10.765966415405273, -6.157471656799316, -1.5489768981933594, 3.0595169067382812, 7.668012619018555, 12.276508331298828, 16.88500213623047, 21.49349594116211, 26.101991653442383, 30.710487365722656, 35.3189811706543, 39.92747497558594, 44.535972595214844, 49.144466400146484, 53.752960205078125, 58.361454010009766, 62.969947814941406, 67.57844543457031, 72.18693542480469, 76.7954330444336, 81.4039306640625, 86.01242065429688, 90.62091827392578]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 9.0, 4.0, 8.0, 5.0, 7.0, 13.0, 15.0, 13.0, 14.0, 25.0, 18.0, 33.0, 32.0, 35.0, 37.0, 43.0, 43.0, 45.0, 45.0, 55.0, 39.0, 55.0, 46.0, 40.0, 42.0, 34.0, 36.0, 29.0, 39.0, 23.0, 24.0, 21.0, 14.0, 15.0, 9.0, 8.0, 4.0, 11.0, 6.0, 9.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.94585418701172, -51.18500900268555, -49.42416763305664, -47.66332244873047, -45.90248107910156, -44.14163589477539, -42.38079071044922, -40.61994934082031, -38.85910415649414, -37.09825897216797, -35.33741760253906, -33.57657241821289, -31.81572914123535, -30.054885864257812, -28.294042587280273, -26.533199310302734, -24.772356033325195, -23.011512756347656, -21.250669479370117, -19.489826202392578, -17.728981018066406, -15.968137741088867, -14.207294464111328, -12.446450233459473, -10.685606956481934, -8.924763679504395, -7.163919448852539, -5.403076171875, -3.6422324180603027, -1.8813886642456055, -0.1205453872680664, 1.640298843383789, 3.401142120361328, 5.161985874176025, 6.922829627990723, 8.683672904968262, 10.444517135620117, 12.205360412597656, 13.966203689575195, 15.72704792022705, 17.487892150878906, 19.248735427856445, 21.009578704833984, 22.770423889160156, 24.531267166137695, 26.292110443115234, 28.052953720092773, 29.813796997070312, 31.57464027404785, 33.33548355102539, 35.09632873535156, 36.85717010498047, 38.61801528930664, 40.37886047363281, 42.13970184326172, 43.90054702758789, 45.6613883972168, 47.42223358154297, 49.183074951171875, 50.94392013549805, 52.70476150512695, 54.465606689453125, 56.22644805908203, 57.9872932434082, 59.748138427734375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 6.0, 11.0, 10.0, 11.0, 12.0, 12.0, 16.0, 24.0, 20.0, 32.0, 35.0, 32.0, 36.0, 38.0, 30.0, 36.0, 42.0, 43.0, 41.0, 50.0, 42.0, 53.0, 34.0, 42.0, 36.0, 41.0, 31.0, 26.0, 30.0, 18.0, 15.0, 18.0, 11.0, 12.0, 14.0, 8.0, 9.0, 7.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.6484375, -7.42230224609375, -7.1961669921875, -6.97003173828125, -6.743896484375, -6.51776123046875, -6.2916259765625, -6.06549072265625, -5.83935546875, -5.61322021484375, -5.3870849609375, -5.16094970703125, -4.934814453125, -4.70867919921875, -4.4825439453125, -4.25640869140625, -4.0302734375, -3.80413818359375, -3.5780029296875, -3.35186767578125, -3.125732421875, -2.89959716796875, -2.6734619140625, -2.44732666015625, -2.22119140625, -1.99505615234375, -1.7689208984375, -1.54278564453125, -1.316650390625, -1.09051513671875, -0.8643798828125, -0.63824462890625, -0.412109375, -0.18597412109375, 0.0401611328125, 0.26629638671875, 0.492431640625, 0.71856689453125, 0.9447021484375, 1.17083740234375, 1.39697265625, 1.62310791015625, 1.8492431640625, 2.07537841796875, 2.301513671875, 2.52764892578125, 2.7537841796875, 2.97991943359375, 3.2060546875, 3.43218994140625, 3.6583251953125, 3.88446044921875, 4.110595703125, 4.33673095703125, 4.5628662109375, 4.78900146484375, 5.01513671875, 5.24127197265625, 5.4674072265625, 5.69354248046875, 5.919677734375, 6.14581298828125, 6.3719482421875, 6.59808349609375, 6.82421875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 5.0, 10.0, 16.0, 26.0, 37.0, 65.0, 77.0, 129.0, 162.0, 206.0, 335.0, 420.0, 625.0, 863.0, 1173.0, 1606.0, 2193.0, 3008.0, 4315.0, 5976.0, 8348.0, 11598.0, 16375.0, 23388.0, 33466.0, 47998.0, 68617.0, 96997.0, 131394.0, 148472.0, 126607.0, 92813.0, 65522.0, 45557.0, 32215.0, 22412.0, 15868.0, 11314.0, 7781.0, 5617.0, 4119.0, 3005.0, 2177.0, 1541.0, 1204.0, 816.0, 620.0, 435.0, 319.0, 224.0, 150.0, 127.0, 80.0, 57.0, 32.0, 23.0, 15.0, 9.0, 7.0, 6.0], "bins": [-0.58984375, -0.57220458984375, -0.5545654296875, -0.53692626953125, -0.519287109375, -0.50164794921875, -0.4840087890625, -0.46636962890625, -0.44873046875, -0.43109130859375, -0.4134521484375, -0.39581298828125, -0.378173828125, -0.36053466796875, -0.3428955078125, -0.32525634765625, -0.3076171875, -0.28997802734375, -0.2723388671875, -0.25469970703125, -0.237060546875, -0.21942138671875, -0.2017822265625, -0.18414306640625, -0.16650390625, -0.14886474609375, -0.1312255859375, -0.11358642578125, -0.095947265625, -0.07830810546875, -0.0606689453125, -0.04302978515625, -0.025390625, -0.00775146484375, 0.0098876953125, 0.02752685546875, 0.045166015625, 0.06280517578125, 0.0804443359375, 0.09808349609375, 0.11572265625, 0.13336181640625, 0.1510009765625, 0.16864013671875, 0.186279296875, 0.20391845703125, 0.2215576171875, 0.23919677734375, 0.2568359375, 0.27447509765625, 0.2921142578125, 0.30975341796875, 0.327392578125, 0.34503173828125, 0.3626708984375, 0.38031005859375, 0.39794921875, 0.41558837890625, 0.4332275390625, 0.45086669921875, 0.468505859375, 0.48614501953125, 0.5037841796875, 0.52142333984375, 0.5390625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 8.0, 5.0, 1.0, 9.0, 9.0, 13.0, 15.0, 18.0, 13.0, 22.0, 17.0, 23.0, 24.0, 28.0, 39.0, 25.0, 29.0, 40.0, 33.0, 49.0, 40.0, 1061.0, 46.0, 37.0, 37.0, 42.0, 45.0, 38.0, 24.0, 36.0, 33.0, 23.0, 19.0, 21.0, 16.0, 14.0, 13.0, 13.0, 13.0, 7.0, 5.0, 4.0, 4.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -4.0296630859375, -3.899169921875, -3.7686767578125, -3.63818359375, -3.5076904296875, -3.377197265625, -3.2467041015625, -3.1162109375, -2.9857177734375, -2.855224609375, -2.7247314453125, -2.59423828125, -2.4637451171875, -2.333251953125, -2.2027587890625, -2.072265625, -1.9417724609375, -1.811279296875, -1.6807861328125, -1.55029296875, -1.4197998046875, -1.289306640625, -1.1588134765625, -1.0283203125, -0.8978271484375, -0.767333984375, -0.6368408203125, -0.50634765625, -0.3758544921875, -0.245361328125, -0.1148681640625, 0.015625, 0.1461181640625, 0.276611328125, 0.4071044921875, 0.53759765625, 0.6680908203125, 0.798583984375, 0.9290771484375, 1.0595703125, 1.1900634765625, 1.320556640625, 1.4510498046875, 1.58154296875, 1.7120361328125, 1.842529296875, 1.9730224609375, 2.103515625, 2.2340087890625, 2.364501953125, 2.4949951171875, 2.62548828125, 2.7559814453125, 2.886474609375, 3.0169677734375, 3.1474609375, 3.2779541015625, 3.408447265625, 3.5389404296875, 3.66943359375, 3.7999267578125, 3.930419921875, 4.0609130859375, 4.19140625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 17.0, 26.0, 29.0, 60.0, 57.0, 103.0, 164.0, 217.0, 346.0, 483.0, 717.0, 1014.0, 1462.0, 2335.0, 3323.0, 4892.0, 7333.0, 11012.0, 15988.0, 23801.0, 35554.0, 53167.0, 81219.0, 122355.0, 1169542.0, 208846.0, 118475.0, 78326.0, 51361.0, 34189.0, 22733.0, 15550.0, 10463.0, 7105.0, 4721.0, 3257.0, 2184.0, 1494.0, 997.0, 716.0, 478.0, 355.0, 210.0, 137.0, 99.0, 80.0, 44.0, 30.0, 18.0, 13.0, 12.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.6005859375, -0.5817947387695312, -0.5630035400390625, -0.5442123413085938, -0.525421142578125, -0.5066299438476562, -0.4878387451171875, -0.46904754638671875, -0.45025634765625, -0.43146514892578125, -0.4126739501953125, -0.39388275146484375, -0.375091552734375, -0.35630035400390625, -0.3375091552734375, -0.31871795654296875, -0.2999267578125, -0.28113555908203125, -0.2623443603515625, -0.24355316162109375, -0.224761962890625, -0.20597076416015625, -0.1871795654296875, -0.16838836669921875, -0.14959716796875, -0.13080596923828125, -0.1120147705078125, -0.09322357177734375, -0.074432373046875, -0.05564117431640625, -0.0368499755859375, -0.01805877685546875, 0.000732421875, 0.01952362060546875, 0.0383148193359375, 0.05710601806640625, 0.075897216796875, 0.09468841552734375, 0.1134796142578125, 0.13227081298828125, 0.15106201171875, 0.16985321044921875, 0.1886444091796875, 0.20743560791015625, 0.226226806640625, 0.24501800537109375, 0.2638092041015625, 0.28260040283203125, 0.3013916015625, 0.32018280029296875, 0.3389739990234375, 0.35776519775390625, 0.376556396484375, 0.39534759521484375, 0.4141387939453125, 0.43292999267578125, 0.45172119140625, 0.47051239013671875, 0.4893035888671875, 0.5080947875976562, 0.526885986328125, 0.5456771850585938, 0.5644683837890625, 0.5832595825195312, 0.60205078125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 6.0, 7.0, 3.0, 9.0, 15.0, 22.0, 13.0, 21.0, 16.0, 27.0, 26.0, 44.0, 30.0, 33.0, 49.0, 45.0, 52.0, 46.0, 55.0, 59.0, 53.0, 45.0, 45.0, 50.0, 43.0, 32.0, 26.0, 22.0, 22.0, 14.0, 6.0, 16.0, 11.0, 8.0, 4.0, 4.0, 5.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013914108276367188, -0.001341506838798523, -0.0012916028499603271, -0.0012416988611221313, -0.0011917948722839355, -0.0011418908834457397, -0.001091986894607544, -0.0010420829057693481, -0.0009921789169311523, -0.0009422749280929565, -0.0008923709392547607, -0.0008424669504165649, -0.0007925629615783691, -0.0007426589727401733, -0.0006927549839019775, -0.0006428509950637817, -0.0005929470062255859, -0.0005430430173873901, -0.0004931390285491943, -0.00044323503971099854, -0.00039333105087280273, -0.00034342706203460693, -0.00029352307319641113, -0.00024361908435821533, -0.00019371509552001953, -0.00014381110668182373, -9.390711784362793e-05, -4.400312900543213e-05, 5.900859832763672e-06, 5.580484867095947e-05, 0.00010570883750915527, 0.00015561282634735107, 0.00020551681518554688, 0.0002554208040237427, 0.0003053247928619385, 0.0003552287817001343, 0.0004051327705383301, 0.0004550367593765259, 0.0005049407482147217, 0.0005548447370529175, 0.0006047487258911133, 0.0006546527147293091, 0.0007045567035675049, 0.0007544606924057007, 0.0008043646812438965, 0.0008542686700820923, 0.0009041726589202881, 0.0009540766477584839, 0.0010039806365966797, 0.0010538846254348755, 0.0011037886142730713, 0.001153692603111267, 0.0012035965919494629, 0.0012535005807876587, 0.0013034045696258545, 0.0013533085584640503, 0.001403212547302246, 0.001453116536140442, 0.0015030205249786377, 0.0015529245138168335, 0.0016028285026550293, 0.001652732491493225, 0.001702636480331421, 0.0017525404691696167, 0.0018024444580078125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 10.0, 6.0, 9.0, 14.0, 16.0, 21.0, 18.0, 33.0, 52.0, 87.0, 113.0, 202.0, 270.0, 616.0, 2333.0, 789214.0, 252779.0, 1482.0, 528.0, 251.0, 141.0, 89.0, 59.0, 47.0, 36.0, 18.0, 29.0, 14.0, 15.0, 12.0, 7.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0], "bins": [-0.046630859375, -0.04543185234069824, -0.044232845306396484, -0.04303383827209473, -0.04183483123779297, -0.04063582420349121, -0.03943681716918945, -0.038237810134887695, -0.03703880310058594, -0.03583979606628418, -0.03464078903198242, -0.033441781997680664, -0.032242774963378906, -0.03104376792907715, -0.02984476089477539, -0.028645753860473633, -0.027446746826171875, -0.026247739791870117, -0.02504873275756836, -0.0238497257232666, -0.022650718688964844, -0.021451711654663086, -0.020252704620361328, -0.01905369758605957, -0.017854690551757812, -0.016655683517456055, -0.015456676483154297, -0.014257669448852539, -0.013058662414550781, -0.011859655380249023, -0.010660648345947266, -0.009461641311645508, -0.00826263427734375, -0.007063627243041992, -0.005864620208740234, -0.0046656131744384766, -0.0034666061401367188, -0.002267599105834961, -0.0010685920715332031, 0.0001304149627685547, 0.0013294219970703125, 0.0025284290313720703, 0.003727436065673828, 0.004926443099975586, 0.006125450134277344, 0.0073244571685791016, 0.00852346420288086, 0.009722471237182617, 0.010921478271484375, 0.012120485305786133, 0.01331949234008789, 0.014518499374389648, 0.015717506408691406, 0.016916513442993164, 0.018115520477294922, 0.01931452751159668, 0.020513534545898438, 0.021712541580200195, 0.022911548614501953, 0.02411055564880371, 0.02530956268310547, 0.026508569717407227, 0.027707576751708984, 0.028906583786010742, 0.0301055908203125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 39.0, 395.0, 490.0, 88.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002618564059957862, -0.0023828439880162477, -0.00214712368324399, -0.0019114036113023758, -0.001675683306530118, -0.0014399632345885038, -0.0012042430462315679, -0.0009685228578746319, -0.0007328026695176959, -0.0004970824811607599, -0.0002613623219076544, -2.5642162654548883e-05, 0.0002100780257023871, 0.00044579815585166216, 0.0006815183442085981, 0.0009172385325655341, 0.00115295872092247, 0.001388678909279406, 0.001624399097636342, 0.0018601191695779562, 0.002095839474350214, 0.002331559546291828, 0.0025672796182334423, 0.0028029999230057, 0.003038720227777958, 0.003274440299719572, 0.00351016060449183, 0.003745880676433444, 0.003981600981205702, 0.004217321053147316, 0.00445304112508893, 0.004688761197030544, 0.004924481268972158, 0.005160201340913773, 0.005395921412855387, 0.005631641950458288, 0.005867362022399902, 0.0061030820943415165, 0.006338802166283131, 0.006574522703886032, 0.006810242775827646, 0.00704596284776926, 0.0072816829197108746, 0.007517403457313776, 0.00775312352925539, 0.007988844066858292, 0.008224563673138618, 0.00846028421074152, 0.008696003817021847, 0.008931724354624748, 0.009167443960905075, 0.009403164498507977, 0.009638884104788303, 0.009874604642391205, 0.010110325179994106, 0.010346044786274433, 0.010581765323877335, 0.010817485861480236, 0.011053205467760563, 0.011288926005363464, 0.011524645611643791, 0.011760366149246693, 0.011996086686849594, 0.012231806293129921, 0.012467526830732822]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 7.0, 1.0, 7.0, 7.0, 4.0, 13.0, 14.0, 16.0, 16.0, 20.0, 26.0, 34.0, 30.0, 32.0, 37.0, 29.0, 39.0, 50.0, 44.0, 45.0, 55.0, 43.0, 45.0, 57.0, 34.0, 41.0, 33.0, 23.0, 35.0, 30.0, 22.0, 25.0, 16.0, 17.0, 12.0, 7.0, 11.0, 8.0, 5.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.00109100341796875, -0.0010602055117487907, -0.0010294076055288315, -0.0009986096993088722, -0.000967811793088913, -0.0009370138868689537, -0.0009062159806489944, -0.0008754180744290352, -0.0008446201682090759, -0.0008138222619891167, -0.0007830243557691574, -0.0007522264495491982, -0.0007214285433292389, -0.0006906306371092796, -0.0006598327308893204, -0.0006290348246693611, -0.0005982369184494019, -0.0005674390122294426, -0.0005366411060094833, -0.0005058431997895241, -0.0004750452935695648, -0.00044424738734960556, -0.0004134494811296463, -0.00038265157490968704, -0.0003518536686897278, -0.0003210557624697685, -0.00029025785624980927, -0.00025945995002985, -0.00022866204380989075, -0.0001978641375899315, -0.00016706623136997223, -0.00013626832515001297, -0.00010547041893005371, -7.467251271009445e-05, -4.387460649013519e-05, -1.3076700270175934e-05, 1.7721205949783325e-05, 4.8519112169742584e-05, 7.931701838970184e-05, 0.0001101149246096611, 0.00014091283082962036, 0.00017171073704957962, 0.00020250864326953888, 0.00023330654948949814, 0.0002641044557094574, 0.00029490236192941666, 0.0003257002681493759, 0.0003564981743693352, 0.00038729608058929443, 0.0004180939868092537, 0.00044889189302921295, 0.0004796897992491722, 0.0005104877054691315, 0.0005412856116890907, 0.00057208351790905, 0.0006028814241290092, 0.0006336793303489685, 0.0006644772365689278, 0.000695275142788887, 0.0007260730490088463, 0.0007568709552288055, 0.0007876688614487648, 0.0008184667676687241, 0.0008492646738886833, 0.0008800625801086426]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 6.0, 11.0, 10.0, 11.0, 12.0, 12.0, 16.0, 24.0, 20.0, 32.0, 35.0, 32.0, 36.0, 38.0, 30.0, 36.0, 42.0, 43.0, 41.0, 50.0, 42.0, 53.0, 34.0, 42.0, 36.0, 41.0, 31.0, 26.0, 30.0, 18.0, 15.0, 18.0, 11.0, 12.0, 14.0, 8.0, 9.0, 7.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.6484375, -7.42230224609375, -7.1961669921875, -6.97003173828125, -6.743896484375, -6.51776123046875, -6.2916259765625, -6.06549072265625, -5.83935546875, -5.61322021484375, -5.3870849609375, -5.16094970703125, -4.934814453125, -4.70867919921875, -4.4825439453125, -4.25640869140625, -4.0302734375, -3.80413818359375, -3.5780029296875, -3.35186767578125, -3.125732421875, -2.89959716796875, -2.6734619140625, -2.44732666015625, -2.22119140625, -1.99505615234375, -1.7689208984375, -1.54278564453125, -1.316650390625, -1.09051513671875, -0.8643798828125, -0.63824462890625, -0.412109375, -0.18597412109375, 0.0401611328125, 0.26629638671875, 0.492431640625, 0.71856689453125, 0.9447021484375, 1.17083740234375, 1.39697265625, 1.62310791015625, 1.8492431640625, 2.07537841796875, 2.301513671875, 2.52764892578125, 2.7537841796875, 2.97991943359375, 3.2060546875, 3.43218994140625, 3.6583251953125, 3.88446044921875, 4.110595703125, 4.33673095703125, 4.5628662109375, 4.78900146484375, 5.01513671875, 5.24127197265625, 5.4674072265625, 5.69354248046875, 5.919677734375, 6.14581298828125, 6.3719482421875, 6.59808349609375, 6.82421875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 5.0, 9.0, 15.0, 20.0, 26.0, 42.0, 53.0, 80.0, 124.0, 202.0, 319.0, 462.0, 715.0, 1189.0, 2075.0, 3401.0, 5929.0, 10161.0, 18419.0, 35236.0, 72997.0, 193475.0, 426037.0, 148908.0, 60598.0, 29903.0, 16093.0, 9152.0, 5209.0, 3020.0, 1754.0, 1094.0, 655.0, 388.0, 241.0, 171.0, 121.0, 89.0, 50.0, 39.0, 24.0, 13.0, 8.0, 8.0, 11.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1328125, -4.00518798828125, -3.8775634765625, -3.74993896484375, -3.622314453125, -3.49468994140625, -3.3670654296875, -3.23944091796875, -3.11181640625, -2.98419189453125, -2.8565673828125, -2.72894287109375, -2.601318359375, -2.47369384765625, -2.3460693359375, -2.21844482421875, -2.0908203125, -1.96319580078125, -1.8355712890625, -1.70794677734375, -1.580322265625, -1.45269775390625, -1.3250732421875, -1.19744873046875, -1.06982421875, -0.94219970703125, -0.8145751953125, -0.68695068359375, -0.559326171875, -0.43170166015625, -0.3040771484375, -0.17645263671875, -0.048828125, 0.07879638671875, 0.2064208984375, 0.33404541015625, 0.461669921875, 0.58929443359375, 0.7169189453125, 0.84454345703125, 0.97216796875, 1.09979248046875, 1.2274169921875, 1.35504150390625, 1.482666015625, 1.61029052734375, 1.7379150390625, 1.86553955078125, 1.9931640625, 2.12078857421875, 2.2484130859375, 2.37603759765625, 2.503662109375, 2.63128662109375, 2.7589111328125, 2.88653564453125, 3.01416015625, 3.14178466796875, 3.2694091796875, 3.39703369140625, 3.524658203125, 3.65228271484375, 3.7799072265625, 3.90753173828125, 4.03515625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 6.0, 8.0, 6.0, 8.0, 7.0, 11.0, 15.0, 14.0, 16.0, 24.0, 29.0, 30.0, 44.0, 36.0, 59.0, 68.0, 68.0, 97.0, 314.0, 1640.0, 134.0, 64.0, 48.0, 35.0, 49.0, 50.0, 30.0, 27.0, 28.0, 21.0, 12.0, 8.0, 13.0, 6.0, 9.0, 6.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.34375, -31.33837890625, -30.3330078125, -29.32763671875, -28.322265625, -27.31689453125, -26.3115234375, -25.30615234375, -24.30078125, -23.29541015625, -22.2900390625, -21.28466796875, -20.279296875, -19.27392578125, -18.2685546875, -17.26318359375, -16.2578125, -15.25244140625, -14.2470703125, -13.24169921875, -12.236328125, -11.23095703125, -10.2255859375, -9.22021484375, -8.21484375, -7.20947265625, -6.2041015625, -5.19873046875, -4.193359375, -3.18798828125, -2.1826171875, -1.17724609375, -0.171875, 0.83349609375, 1.8388671875, 2.84423828125, 3.849609375, 4.85498046875, 5.8603515625, 6.86572265625, 7.87109375, 8.87646484375, 9.8818359375, 10.88720703125, 11.892578125, 12.89794921875, 13.9033203125, 14.90869140625, 15.9140625, 16.91943359375, 17.9248046875, 18.93017578125, 19.935546875, 20.94091796875, 21.9462890625, 22.95166015625, 23.95703125, 24.96240234375, 25.9677734375, 26.97314453125, 27.978515625, 28.98388671875, 29.9892578125, 30.99462890625, 32.0]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 11.0, 12.0, 12.0, 28.0, 28.0, 43.0, 66.0, 95.0, 175.0, 291.0, 631.0, 4149.0, 3088068.0, 49802.0, 1219.0, 430.0, 215.0, 141.0, 84.0, 55.0, 47.0, 21.0, 24.0, 16.0, 12.0, 7.0, 4.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-111.3125, -108.439453125, -105.56640625, -102.693359375, -99.8203125, -96.947265625, -94.07421875, -91.201171875, -88.328125, -85.455078125, -82.58203125, -79.708984375, -76.8359375, -73.962890625, -71.08984375, -68.216796875, -65.34375, -62.470703125, -59.59765625, -56.724609375, -53.8515625, -50.978515625, -48.10546875, -45.232421875, -42.359375, -39.486328125, -36.61328125, -33.740234375, -30.8671875, -27.994140625, -25.12109375, -22.248046875, -19.375, -16.501953125, -13.62890625, -10.755859375, -7.8828125, -5.009765625, -2.13671875, 0.736328125, 3.609375, 6.482421875, 9.35546875, 12.228515625, 15.1015625, 17.974609375, 20.84765625, 23.720703125, 26.59375, 29.466796875, 32.33984375, 35.212890625, 38.0859375, 40.958984375, 43.83203125, 46.705078125, 49.578125, 52.451171875, 55.32421875, 58.197265625, 61.0703125, 63.943359375, 66.81640625, 69.689453125, 72.5625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 11.0, 11.0, 40.0, 71.0, 124.0, 184.0, 192.0, 170.0, 112.0, 51.0, 24.0, 7.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.09598159790039, -42.64164352416992, -41.18730545043945, -39.732967376708984, -38.278629302978516, -36.82429122924805, -35.36995315551758, -33.91561508178711, -32.46127700805664, -31.006938934326172, -29.552600860595703, -28.098262786865234, -26.643924713134766, -25.189586639404297, -23.735248565673828, -22.28091049194336, -20.826570510864258, -19.37223243713379, -17.91789436340332, -16.46355628967285, -15.009218215942383, -13.554880142211914, -12.100541114807129, -10.64620304107666, -9.191864967346191, -7.737526893615723, -6.283188819885254, -4.828850269317627, -3.374512195587158, -1.9201741218566895, -0.4658355712890625, 0.9885025024414062, 2.442840576171875, 3.8971786499023438, 5.3515167236328125, 6.8058552742004395, 8.26019287109375, 9.714530944824219, 11.168869972229004, 12.623208045959473, 14.077546119689941, 15.53188419342041, 16.986223220825195, 18.440561294555664, 19.894899368286133, 21.3492374420166, 22.80357551574707, 24.25791358947754, 25.712251663208008, 27.166589736938477, 28.620927810668945, 30.075265884399414, 31.529603958129883, 32.983943939208984, 34.43828201293945, 35.89262008666992, 37.34695816040039, 38.80129623413086, 40.25563430786133, 41.7099723815918, 43.164310455322266, 44.618648529052734, 46.0729866027832, 47.52732467651367, 48.98166275024414]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 12.0, 9.0, 15.0, 14.0, 17.0, 12.0, 27.0, 16.0, 28.0, 31.0, 35.0, 27.0, 42.0, 56.0, 41.0, 43.0, 39.0, 55.0, 42.0, 41.0, 41.0, 23.0, 49.0, 35.0, 36.0, 23.0, 32.0, 25.0, 20.0, 20.0, 20.0, 15.0, 8.0, 9.0, 8.0, 6.0, 4.0, 8.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-83.60529327392578, -81.07646179199219, -78.54763793945312, -76.01880645751953, -73.48998260498047, -70.96115112304688, -68.43232727050781, -65.90349578857422, -63.37466812133789, -60.84584045410156, -58.317012786865234, -55.788185119628906, -53.25935363769531, -50.73052978515625, -48.201698303222656, -45.67287063598633, -43.14404296875, -40.61521530151367, -38.086387634277344, -35.557559967041016, -33.02873229980469, -30.499902725219727, -27.971073150634766, -25.442245483398438, -22.91341781616211, -20.38459014892578, -17.855762481689453, -15.326932907104492, -12.798105239868164, -10.269277572631836, -7.740448951721191, -5.211620330810547, -2.68280029296875, -0.15397214889526367, 2.3748559951782227, 4.903684139251709, 7.432512283325195, 9.961339950561523, 12.490168571472168, 15.018997192382812, 17.54782485961914, 20.07665252685547, 22.605480194091797, 25.134309768676758, 27.663137435913086, 30.191965103149414, 32.720794677734375, 35.2496223449707, 37.77845001220703, 40.30727767944336, 42.83610534667969, 45.364933013916016, 47.893760681152344, 50.42259216308594, 52.951419830322266, 55.480247497558594, 58.00907516479492, 60.53790283203125, 63.06673049926758, 65.5955581665039, 68.1243896484375, 70.65321350097656, 73.18204498291016, 75.71087646484375, 78.23970031738281]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 8.0, 9.0, 10.0, 16.0, 11.0, 20.0, 19.0, 29.0, 21.0, 32.0, 34.0, 30.0, 32.0, 37.0, 41.0, 52.0, 35.0, 54.0, 48.0, 45.0, 47.0, 41.0, 40.0, 36.0, 37.0, 26.0, 34.0, 28.0, 25.0, 20.0, 12.0, 12.0, 11.0, 12.0, 12.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0, -7.7496337890625, -7.499267578125, -7.2489013671875, -6.99853515625, -6.7481689453125, -6.497802734375, -6.2474365234375, -5.9970703125, -5.7467041015625, -5.496337890625, -5.2459716796875, -4.99560546875, -4.7452392578125, -4.494873046875, -4.2445068359375, -3.994140625, -3.7437744140625, -3.493408203125, -3.2430419921875, -2.99267578125, -2.7423095703125, -2.491943359375, -2.2415771484375, -1.9912109375, -1.7408447265625, -1.490478515625, -1.2401123046875, -0.98974609375, -0.7393798828125, -0.489013671875, -0.2386474609375, 0.01171875, 0.2620849609375, 0.512451171875, 0.7628173828125, 1.01318359375, 1.2635498046875, 1.513916015625, 1.7642822265625, 2.0146484375, 2.2650146484375, 2.515380859375, 2.7657470703125, 3.01611328125, 3.2664794921875, 3.516845703125, 3.7672119140625, 4.017578125, 4.2679443359375, 4.518310546875, 4.7686767578125, 5.01904296875, 5.2694091796875, 5.519775390625, 5.7701416015625, 6.0205078125, 6.2708740234375, 6.521240234375, 6.7716064453125, 7.02197265625, 7.2723388671875, 7.522705078125, 7.7730712890625, 8.0234375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 6.0, 15.0, 13.0, 30.0, 35.0, 46.0, 57.0, 84.0, 128.0, 202.0, 350.0, 514.0, 1043.0, 2091.0, 4845.0, 13016.0, 43629.0, 214307.0, 1037868.0, 1863385.0, 805085.0, 154706.0, 34369.0, 10530.0, 4002.0, 1726.0, 843.0, 451.0, 298.0, 185.0, 124.0, 81.0, 50.0, 44.0, 28.0, 26.0, 18.0, 14.0, 8.0, 8.0, 5.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.4609375, -11.1278076171875, -10.794677734375, -10.4615478515625, -10.12841796875, -9.7952880859375, -9.462158203125, -9.1290283203125, -8.7958984375, -8.4627685546875, -8.129638671875, -7.7965087890625, -7.46337890625, -7.1302490234375, -6.797119140625, -6.4639892578125, -6.130859375, -5.7977294921875, -5.464599609375, -5.1314697265625, -4.79833984375, -4.4652099609375, -4.132080078125, -3.7989501953125, -3.4658203125, -3.1326904296875, -2.799560546875, -2.4664306640625, -2.13330078125, -1.8001708984375, -1.467041015625, -1.1339111328125, -0.80078125, -0.4676513671875, -0.134521484375, 0.1986083984375, 0.53173828125, 0.8648681640625, 1.197998046875, 1.5311279296875, 1.8642578125, 2.1973876953125, 2.530517578125, 2.8636474609375, 3.19677734375, 3.5299072265625, 3.863037109375, 4.1961669921875, 4.529296875, 4.8624267578125, 5.195556640625, 5.5286865234375, 5.86181640625, 6.1949462890625, 6.528076171875, 6.8612060546875, 7.1943359375, 7.5274658203125, 7.860595703125, 8.1937255859375, 8.52685546875, 8.8599853515625, 9.193115234375, 9.5262451171875, 9.859375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 4.0, 9.0, 9.0, 17.0, 19.0, 26.0, 36.0, 57.0, 78.0, 127.0, 177.0, 288.0, 391.0, 551.0, 606.0, 527.0, 403.0, 273.0, 161.0, 119.0, 61.0, 45.0, 31.0, 21.0, 15.0, 12.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.375, -18.71484375, -18.0546875, -17.39453125, -16.734375, -16.07421875, -15.4140625, -14.75390625, -14.09375, -13.43359375, -12.7734375, -12.11328125, -11.453125, -10.79296875, -10.1328125, -9.47265625, -8.8125, -8.15234375, -7.4921875, -6.83203125, -6.171875, -5.51171875, -4.8515625, -4.19140625, -3.53125, -2.87109375, -2.2109375, -1.55078125, -0.890625, -0.23046875, 0.4296875, 1.08984375, 1.75, 2.41015625, 3.0703125, 3.73046875, 4.390625, 5.05078125, 5.7109375, 6.37109375, 7.03125, 7.69140625, 8.3515625, 9.01171875, 9.671875, 10.33203125, 10.9921875, 11.65234375, 12.3125, 12.97265625, 13.6328125, 14.29296875, 14.953125, 15.61328125, 16.2734375, 16.93359375, 17.59375, 18.25390625, 18.9140625, 19.57421875, 20.234375, 20.89453125, 21.5546875, 22.21484375, 22.875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 11.0, 2.0, 10.0, 8.0, 12.0, 17.0, 30.0, 41.0, 43.0, 73.0, 97.0, 124.0, 161.0, 280.0, 578.0, 1565.0, 14224.0, 1043569.0, 3097047.0, 32368.0, 2225.0, 703.0, 344.0, 221.0, 112.0, 100.0, 81.0, 39.0, 43.0, 35.0, 27.0, 22.0, 15.0, 7.0, 8.0, 10.0, 5.0, 8.0, 7.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.75, -43.15869140625, -41.5673828125, -39.97607421875, -38.384765625, -36.79345703125, -35.2021484375, -33.61083984375, -32.01953125, -30.42822265625, -28.8369140625, -27.24560546875, -25.654296875, -24.06298828125, -22.4716796875, -20.88037109375, -19.2890625, -17.69775390625, -16.1064453125, -14.51513671875, -12.923828125, -11.33251953125, -9.7412109375, -8.14990234375, -6.55859375, -4.96728515625, -3.3759765625, -1.78466796875, -0.193359375, 1.39794921875, 2.9892578125, 4.58056640625, 6.171875, 7.76318359375, 9.3544921875, 10.94580078125, 12.537109375, 14.12841796875, 15.7197265625, 17.31103515625, 18.90234375, 20.49365234375, 22.0849609375, 23.67626953125, 25.267578125, 26.85888671875, 28.4501953125, 30.04150390625, 31.6328125, 33.22412109375, 34.8154296875, 36.40673828125, 37.998046875, 39.58935546875, 41.1806640625, 42.77197265625, 44.36328125, 45.95458984375, 47.5458984375, 49.13720703125, 50.728515625, 52.31982421875, 53.9111328125, 55.50244140625, 57.09375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 13.0, 12.0, 59.0, 73.0, 147.0, 185.0, 188.0, 159.0, 86.0, 53.0, 15.0, 12.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-184.10665893554688, -180.5732421875, -177.03982543945312, -173.50640869140625, -169.97299194335938, -166.4395751953125, -162.90615844726562, -159.37274169921875, -155.83932495117188, -152.305908203125, -148.77249145507812, -145.23907470703125, -141.70565795898438, -138.1722412109375, -134.63882446289062, -131.10540771484375, -127.57199096679688, -124.03857421875, -120.50515747070312, -116.97174072265625, -113.43832397460938, -109.9049072265625, -106.37149047851562, -102.83807373046875, -99.30465698242188, -95.771240234375, -92.23782348632812, -88.70440673828125, -85.17098999023438, -81.6375732421875, -78.10415649414062, -74.57073974609375, -71.03732299804688, -67.50390625, -63.970489501953125, -60.43707275390625, -56.903656005859375, -53.3702392578125, -49.836822509765625, -46.30340576171875, -42.76999282836914, -39.236576080322266, -35.70315933227539, -32.169742584228516, -28.63632583618164, -25.102909088134766, -21.56949234008789, -18.036075592041016, -14.50265884399414, -10.969242095947266, -7.435825347900391, -3.9024085998535156, -0.3689918518066406, 3.1644248962402344, 6.697841644287109, 10.231258392333984, 13.76467514038086, 17.298091888427734, 20.83150863647461, 24.364925384521484, 27.89834213256836, 31.431758880615234, 34.96517562866211, 38.498592376708984, 42.03200912475586]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 8.0, 8.0, 6.0, 5.0, 11.0, 5.0, 12.0, 13.0, 19.0, 17.0, 19.0, 27.0, 21.0, 26.0, 22.0, 42.0, 39.0, 40.0, 33.0, 34.0, 44.0, 45.0, 32.0, 41.0, 33.0, 49.0, 37.0, 32.0, 38.0, 36.0, 28.0, 18.0, 20.0, 13.0, 23.0, 11.0, 18.0, 9.0, 12.0, 16.0, 8.0, 7.0, 8.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-47.17701721191406, -45.66553497314453, -44.154052734375, -42.64257049560547, -41.13108825683594, -39.619606018066406, -38.108123779296875, -36.596641540527344, -35.08515930175781, -33.57367706298828, -32.06219482421875, -30.55071258544922, -29.039230346679688, -27.527748107910156, -26.016263961791992, -24.50478172302246, -22.993297576904297, -21.481815338134766, -19.970333099365234, -18.458850860595703, -16.947368621826172, -15.435885429382324, -13.924402236938477, -12.412919998168945, -10.901437759399414, -9.389955520629883, -7.878472805023193, -6.366990089416504, -4.855507850646973, -3.3440256118774414, -1.8325424194335938, -0.3210601806640625, 1.1904182434082031, 2.7019007205963135, 4.213383197784424, 5.724865913391113, 7.2363481521606445, 8.747830390930176, 10.259313583374023, 11.770795822143555, 13.282278060913086, 14.793760299682617, 16.30524253845215, 17.816726684570312, 19.328208923339844, 20.839691162109375, 22.351173400878906, 23.862655639648438, 25.37413787841797, 26.8856201171875, 28.39710235595703, 29.908584594726562, 31.420066833496094, 32.931549072265625, 34.443031311035156, 35.95451354980469, 37.46599578857422, 38.97747802734375, 40.48896026611328, 42.00044250488281, 43.511924743652344, 45.023406982421875, 46.534889221191406, 48.04637145996094, 49.557857513427734]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 7.0, 8.0, 10.0, 11.0, 10.0, 13.0, 22.0, 19.0, 22.0, 29.0, 29.0, 42.0, 26.0, 24.0, 39.0, 41.0, 49.0, 47.0, 44.0, 42.0, 59.0, 41.0, 45.0, 39.0, 34.0, 29.0, 38.0, 31.0, 22.0, 28.0, 19.0, 9.0, 14.0, 10.0, 7.0, 12.0, 3.0, 5.0, 6.0, 7.0, 0.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.240234375, -7.99609375, -7.751953125, -7.5078125, -7.263671875, -7.01953125, -6.775390625, -6.53125, -6.287109375, -6.04296875, -5.798828125, -5.5546875, -5.310546875, -5.06640625, -4.822265625, -4.578125, -4.333984375, -4.08984375, -3.845703125, -3.6015625, -3.357421875, -3.11328125, -2.869140625, -2.625, -2.380859375, -2.13671875, -1.892578125, -1.6484375, -1.404296875, -1.16015625, -0.916015625, -0.671875, -0.427734375, -0.18359375, 0.060546875, 0.3046875, 0.548828125, 0.79296875, 1.037109375, 1.28125, 1.525390625, 1.76953125, 2.013671875, 2.2578125, 2.501953125, 2.74609375, 2.990234375, 3.234375, 3.478515625, 3.72265625, 3.966796875, 4.2109375, 4.455078125, 4.69921875, 4.943359375, 5.1875, 5.431640625, 5.67578125, 5.919921875, 6.1640625, 6.408203125, 6.65234375, 6.896484375, 7.140625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 6.0, 11.0, 17.0, 20.0, 31.0, 46.0, 46.0, 80.0, 145.0, 192.0, 293.0, 422.0, 568.0, 910.0, 1284.0, 1859.0, 2584.0, 3808.0, 5453.0, 7714.0, 11778.0, 17339.0, 26093.0, 39349.0, 59801.0, 92994.0, 141301.0, 177259.0, 153554.0, 103839.0, 67036.0, 43192.0, 28700.0, 19212.0, 13080.0, 8850.0, 5991.0, 4185.0, 2933.0, 1932.0, 1392.0, 972.0, 721.0, 451.0, 350.0, 228.0, 176.0, 99.0, 86.0, 63.0, 45.0, 21.0, 22.0, 10.0, 9.0, 9.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.70849609375, -0.68609619140625, -0.6636962890625, -0.64129638671875, -0.618896484375, -0.59649658203125, -0.5740966796875, -0.55169677734375, -0.529296875, -0.50689697265625, -0.4844970703125, -0.46209716796875, -0.439697265625, -0.41729736328125, -0.3948974609375, -0.37249755859375, -0.35009765625, -0.32769775390625, -0.3052978515625, -0.28289794921875, -0.260498046875, -0.23809814453125, -0.2156982421875, -0.19329833984375, -0.1708984375, -0.14849853515625, -0.1260986328125, -0.10369873046875, -0.081298828125, -0.05889892578125, -0.0364990234375, -0.01409912109375, 0.00830078125, 0.03070068359375, 0.0531005859375, 0.07550048828125, 0.097900390625, 0.12030029296875, 0.1427001953125, 0.16510009765625, 0.1875, 0.20989990234375, 0.2322998046875, 0.25469970703125, 0.277099609375, 0.29949951171875, 0.3218994140625, 0.34429931640625, 0.36669921875, 0.38909912109375, 0.4114990234375, 0.43389892578125, 0.456298828125, 0.47869873046875, 0.5010986328125, 0.52349853515625, 0.5458984375, 0.56829833984375, 0.5906982421875, 0.61309814453125, 0.635498046875, 0.65789794921875, 0.6802978515625, 0.70269775390625, 0.72509765625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 7.0, 12.0, 7.0, 12.0, 19.0, 13.0, 17.0, 20.0, 25.0, 27.0, 40.0, 37.0, 35.0, 37.0, 28.0, 35.0, 31.0, 37.0, 49.0, 1056.0, 33.0, 34.0, 47.0, 33.0, 40.0, 38.0, 33.0, 28.0, 35.0, 25.0, 18.0, 23.0, 18.0, 16.0, 6.0, 8.0, 7.0, 7.0, 6.0, 3.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.02734375, -4.87554931640625, -4.7237548828125, -4.57196044921875, -4.420166015625, -4.26837158203125, -4.1165771484375, -3.96478271484375, -3.81298828125, -3.66119384765625, -3.5093994140625, -3.35760498046875, -3.205810546875, -3.05401611328125, -2.9022216796875, -2.75042724609375, -2.5986328125, -2.44683837890625, -2.2950439453125, -2.14324951171875, -1.991455078125, -1.83966064453125, -1.6878662109375, -1.53607177734375, -1.38427734375, -1.23248291015625, -1.0806884765625, -0.92889404296875, -0.777099609375, -0.62530517578125, -0.4735107421875, -0.32171630859375, -0.169921875, -0.01812744140625, 0.1336669921875, 0.28546142578125, 0.437255859375, 0.58905029296875, 0.7408447265625, 0.89263916015625, 1.04443359375, 1.19622802734375, 1.3480224609375, 1.49981689453125, 1.651611328125, 1.80340576171875, 1.9552001953125, 2.10699462890625, 2.2587890625, 2.41058349609375, 2.5623779296875, 2.71417236328125, 2.865966796875, 3.01776123046875, 3.1695556640625, 3.32135009765625, 3.47314453125, 3.62493896484375, 3.7767333984375, 3.92852783203125, 4.080322265625, 4.23211669921875, 4.3839111328125, 4.53570556640625, 4.6875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 8.0, 4.0, 11.0, 20.0, 20.0, 37.0, 58.0, 86.0, 105.0, 187.0, 247.0, 342.0, 491.0, 766.0, 1106.0, 1641.0, 2396.0, 3420.0, 4895.0, 7309.0, 10374.0, 15040.0, 21613.0, 31114.0, 45422.0, 65573.0, 94704.0, 132677.0, 1206016.0, 135478.0, 97698.0, 67650.0, 45944.0, 32105.0, 21973.0, 15441.0, 10651.0, 7577.0, 5093.0, 3613.0, 2488.0, 1806.0, 1220.0, 808.0, 609.0, 407.0, 277.0, 190.0, 164.0, 101.0, 70.0, 39.0, 30.0, 12.0, 10.0, 4.0, 3.0, 1.0, 3.0], "bins": [-0.63916015625, -0.6201019287109375, -0.601043701171875, -0.5819854736328125, -0.56292724609375, -0.5438690185546875, -0.524810791015625, -0.5057525634765625, -0.4866943359375, -0.4676361083984375, -0.448577880859375, -0.4295196533203125, -0.41046142578125, -0.3914031982421875, -0.372344970703125, -0.3532867431640625, -0.334228515625, -0.3151702880859375, -0.296112060546875, -0.2770538330078125, -0.25799560546875, -0.2389373779296875, -0.219879150390625, -0.2008209228515625, -0.1817626953125, -0.1627044677734375, -0.143646240234375, -0.1245880126953125, -0.10552978515625, -0.0864715576171875, -0.067413330078125, -0.0483551025390625, -0.029296875, -0.0102386474609375, 0.008819580078125, 0.0278778076171875, 0.04693603515625, 0.0659942626953125, 0.085052490234375, 0.1041107177734375, 0.1231689453125, 0.1422271728515625, 0.161285400390625, 0.1803436279296875, 0.19940185546875, 0.2184600830078125, 0.237518310546875, 0.2565765380859375, 0.275634765625, 0.2946929931640625, 0.313751220703125, 0.3328094482421875, 0.35186767578125, 0.3709259033203125, 0.389984130859375, 0.4090423583984375, 0.4281005859375, 0.4471588134765625, 0.466217041015625, 0.4852752685546875, 0.50433349609375, 0.5233917236328125, 0.542449951171875, 0.5615081787109375, 0.58056640625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 6.0, 12.0, 13.0, 9.0, 16.0, 24.0, 24.0, 28.0, 40.0, 37.0, 44.0, 67.0, 53.0, 60.0, 61.0, 71.0, 41.0, 53.0, 45.0, 46.0, 47.0, 33.0, 29.0, 29.0, 18.0, 16.0, 15.0, 7.0, 6.0, 16.0, 3.0, 1.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0022411346435546875, -0.0021685659885406494, -0.0020959973335266113, -0.0020234286785125732, -0.0019508600234985352, -0.001878291368484497, -0.001805722713470459, -0.001733154058456421, -0.0016605854034423828, -0.0015880167484283447, -0.0015154480934143066, -0.0014428794384002686, -0.0013703107833862305, -0.0012977421283721924, -0.0012251734733581543, -0.0011526048183441162, -0.0010800361633300781, -0.00100746750831604, -0.000934898853302002, -0.0008623301982879639, -0.0007897615432739258, -0.0007171928882598877, -0.0006446242332458496, -0.0005720555782318115, -0.0004994869232177734, -0.00042691826820373535, -0.00035434961318969727, -0.0002817809581756592, -0.0002092123031616211, -0.000136643648147583, -6.407499313354492e-05, 8.493661880493164e-06, 8.106231689453125e-05, 0.00015363097190856934, 0.00022619962692260742, 0.0002987682819366455, 0.0003713369369506836, 0.0004439055919647217, 0.0005164742469787598, 0.0005890429019927979, 0.0006616115570068359, 0.000734180212020874, 0.0008067488670349121, 0.0008793175220489502, 0.0009518861770629883, 0.0010244548320770264, 0.0010970234870910645, 0.0011695921421051025, 0.0012421607971191406, 0.0013147294521331787, 0.0013872981071472168, 0.0014598667621612549, 0.001532435417175293, 0.001605004072189331, 0.0016775727272033691, 0.0017501413822174072, 0.0018227100372314453, 0.0018952786922454834, 0.0019678473472595215, 0.0020404160022735596, 0.0021129846572875977, 0.0021855533123016357, 0.002258121967315674, 0.002330690622329712, 0.00240325927734375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 0.0, 2.0, 6.0, 7.0, 13.0, 12.0, 18.0, 19.0, 22.0, 37.0, 51.0, 64.0, 120.0, 142.0, 340.0, 934.0, 38400.0, 1004724.0, 2416.0, 542.0, 246.0, 132.0, 85.0, 44.0, 31.0, 28.0, 22.0, 23.0, 18.0, 6.0, 10.0, 9.0, 6.0, 4.0, 5.0, 1.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.057037353515625, -0.05532264709472656, -0.053607940673828125, -0.05189323425292969, -0.05017852783203125, -0.04846382141113281, -0.046749114990234375, -0.04503440856933594, -0.0433197021484375, -0.04160499572753906, -0.039890289306640625, -0.03817558288574219, -0.03646087646484375, -0.03474617004394531, -0.033031463623046875, -0.03131675720214844, -0.02960205078125, -0.027887344360351562, -0.026172637939453125, -0.024457931518554688, -0.02274322509765625, -0.021028518676757812, -0.019313812255859375, -0.017599105834960938, -0.0158843994140625, -0.014169692993164062, -0.012454986572265625, -0.010740280151367188, -0.00902557373046875, -0.0073108673095703125, -0.005596160888671875, -0.0038814544677734375, -0.002166748046875, -0.0004520416259765625, 0.001262664794921875, 0.0029773712158203125, 0.00469207763671875, 0.0064067840576171875, 0.008121490478515625, 0.009836196899414062, 0.0115509033203125, 0.013265609741210938, 0.014980316162109375, 0.016695022583007812, 0.01840972900390625, 0.020124435424804688, 0.021839141845703125, 0.023553848266601562, 0.0252685546875, 0.026983261108398438, 0.028697967529296875, 0.030412673950195312, 0.03212738037109375, 0.03384208679199219, 0.035556793212890625, 0.03727149963378906, 0.0389862060546875, 0.04070091247558594, 0.042415618896484375, 0.04413032531738281, 0.04584503173828125, 0.04755973815917969, 0.049274444580078125, 0.05098915100097656, 0.052703857421875]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 196.0, 733.0, 79.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014533390058204532, -0.0011199330911040306, -0.0007865271181799471, -0.00045312114525586367, -0.00011971523053944111, 0.00021369068417698145, 0.0005470967153087258, 0.0008805025136098266, 0.001213908544741571, 0.0015473144594579935, 0.001880720490589738, 0.0022141262888908386, 0.002547532320022583, 0.0028809383511543274, 0.0032143443822860718, 0.003547749947756529, 0.0038811559788882732, 0.004214562010020018, 0.004547968041151762, 0.004881373606622219, 0.0052147796377539635, 0.005548185668885708, 0.005881591700017452, 0.006214997731149197, 0.006548403762280941, 0.006881809793412685, 0.00721521582454443, 0.007548621855676174, 0.007882027886807919, 0.008215432986617088, 0.008548839017748833, 0.008882245048880577, 0.009215652011334896, 0.00954905804246664, 0.009882464073598385, 0.01021587010473013, 0.010549276135861874, 0.010882681235671043, 0.011216087266802788, 0.011549493297934532, 0.011882899329066277, 0.012216305360198021, 0.012549711391329765, 0.01288311742246151, 0.013216523453593254, 0.013549929484724998, 0.013883335515856743, 0.014216740615665913, 0.014550147578120232, 0.014883553609251976, 0.01521695964038372, 0.015550365671515465, 0.01588377170264721, 0.016217177733778954, 0.016550583764910698, 0.016883989796042442, 0.017217393964529037, 0.017550799995660782, 0.017884206026792526, 0.01821761205792427, 0.018551018089056015, 0.01888442412018776, 0.019217830151319504, 0.019551236182451248, 0.019884642213582993]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 4.0, 5.0, 8.0, 13.0, 8.0, 14.0, 9.0, 22.0, 19.0, 17.0, 16.0, 32.0, 31.0, 27.0, 29.0, 30.0, 36.0, 31.0, 33.0, 43.0, 51.0, 32.0, 37.0, 43.0, 32.0, 40.0, 39.0, 46.0, 42.0, 33.0, 22.0, 19.0, 21.0, 14.0, 16.0, 14.0, 17.0, 16.0, 8.0, 5.0, 9.0, 2.0, 5.0, 2.0, 7.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012045502662658691, -0.0011683376505970955, -0.0011321250349283218, -0.0010959124192595482, -0.0010596998035907745, -0.0010234871879220009, -0.0009872745722532272, -0.0009510619565844536, -0.0009148493409156799, -0.0008786367252469063, -0.0008424241095781326, -0.000806211493909359, -0.0007699988782405853, -0.0007337862625718117, -0.000697573646903038, -0.0006613610312342644, -0.0006251484155654907, -0.0005889357998967171, -0.0005527231842279434, -0.0005165105685591698, -0.0004802979528903961, -0.00044408533722162247, -0.0004078727215528488, -0.00037166010588407516, -0.0003354474902153015, -0.00029923487454652786, -0.0002630222588777542, -0.00022680964320898056, -0.0001905970275402069, -0.00015438441187143326, -0.00011817179620265961, -8.195918053388596e-05, -4.5746564865112305e-05, -9.533949196338654e-06, 2.6678666472434998e-05, 6.289128214120865e-05, 9.91038978099823e-05, 0.00013531651347875595, 0.0001715291291475296, 0.00020774174481630325, 0.0002439543604850769, 0.00028016697615385056, 0.0003163795918226242, 0.00035259220749139786, 0.0003888048231601715, 0.00042501743882894516, 0.0004612300544977188, 0.0004974426701664925, 0.0005336552858352661, 0.0005698679015040398, 0.0006060805171728134, 0.0006422931328415871, 0.0006785057485103607, 0.0007147183641791344, 0.000750930979847908, 0.0007871435955166817, 0.0008233562111854553, 0.000859568826854229, 0.0008957814425230026, 0.0009319940581917763, 0.0009682066738605499, 0.0010044192895293236, 0.0010406319051980972, 0.0010768445208668709, 0.0011130571365356445]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 7.0, 8.0, 10.0, 11.0, 10.0, 13.0, 22.0, 19.0, 22.0, 29.0, 29.0, 42.0, 26.0, 24.0, 39.0, 41.0, 49.0, 47.0, 44.0, 42.0, 59.0, 41.0, 45.0, 39.0, 34.0, 29.0, 38.0, 31.0, 22.0, 28.0, 19.0, 9.0, 14.0, 10.0, 7.0, 12.0, 3.0, 5.0, 6.0, 7.0, 0.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.240234375, -7.99609375, -7.751953125, -7.5078125, -7.263671875, -7.01953125, -6.775390625, -6.53125, -6.287109375, -6.04296875, -5.798828125, -5.5546875, -5.310546875, -5.06640625, -4.822265625, -4.578125, -4.333984375, -4.08984375, -3.845703125, -3.6015625, -3.357421875, -3.11328125, -2.869140625, -2.625, -2.380859375, -2.13671875, -1.892578125, -1.6484375, -1.404296875, -1.16015625, -0.916015625, -0.671875, -0.427734375, -0.18359375, 0.060546875, 0.3046875, 0.548828125, 0.79296875, 1.037109375, 1.28125, 1.525390625, 1.76953125, 2.013671875, 2.2578125, 2.501953125, 2.74609375, 2.990234375, 3.234375, 3.478515625, 3.72265625, 3.966796875, 4.2109375, 4.455078125, 4.69921875, 4.943359375, 5.1875, 5.431640625, 5.67578125, 5.919921875, 6.1640625, 6.408203125, 6.65234375, 6.896484375, 7.140625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 15.0, 18.0, 23.0, 36.0, 59.0, 96.0, 129.0, 213.0, 341.0, 504.0, 937.0, 1674.0, 3493.0, 7606.0, 19435.0, 59588.0, 269532.0, 527949.0, 105225.0, 30607.0, 11034.0, 4742.0, 2271.0, 1236.0, 701.0, 379.0, 259.0, 160.0, 99.0, 70.0, 42.0, 27.0, 16.0, 12.0, 9.0, 3.0, 3.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.71875, -7.4791259765625, -7.239501953125, -6.9998779296875, -6.76025390625, -6.5206298828125, -6.281005859375, -6.0413818359375, -5.8017578125, -5.5621337890625, -5.322509765625, -5.0828857421875, -4.84326171875, -4.6036376953125, -4.364013671875, -4.1243896484375, -3.884765625, -3.6451416015625, -3.405517578125, -3.1658935546875, -2.92626953125, -2.6866455078125, -2.447021484375, -2.2073974609375, -1.9677734375, -1.7281494140625, -1.488525390625, -1.2489013671875, -1.00927734375, -0.7696533203125, -0.530029296875, -0.2904052734375, -0.05078125, 0.1888427734375, 0.428466796875, 0.6680908203125, 0.90771484375, 1.1473388671875, 1.386962890625, 1.6265869140625, 1.8662109375, 2.1058349609375, 2.345458984375, 2.5850830078125, 2.82470703125, 3.0643310546875, 3.303955078125, 3.5435791015625, 3.783203125, 4.0228271484375, 4.262451171875, 4.5020751953125, 4.74169921875, 4.9813232421875, 5.220947265625, 5.4605712890625, 5.7001953125, 5.9398193359375, 6.179443359375, 6.4190673828125, 6.65869140625, 6.8983154296875, 7.137939453125, 7.3775634765625, 7.6171875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 6.0, 4.0, 8.0, 11.0, 10.0, 16.0, 12.0, 23.0, 16.0, 20.0, 30.0, 32.0, 33.0, 35.0, 43.0, 55.0, 63.0, 94.0, 317.0, 1616.0, 122.0, 70.0, 53.0, 41.0, 44.0, 52.0, 22.0, 25.0, 26.0, 22.0, 21.0, 13.0, 16.0, 8.0, 14.0, 11.0, 9.0, 5.0, 5.0, 5.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-27.171875, -26.32666015625, -25.4814453125, -24.63623046875, -23.791015625, -22.94580078125, -22.1005859375, -21.25537109375, -20.41015625, -19.56494140625, -18.7197265625, -17.87451171875, -17.029296875, -16.18408203125, -15.3388671875, -14.49365234375, -13.6484375, -12.80322265625, -11.9580078125, -11.11279296875, -10.267578125, -9.42236328125, -8.5771484375, -7.73193359375, -6.88671875, -6.04150390625, -5.1962890625, -4.35107421875, -3.505859375, -2.66064453125, -1.8154296875, -0.97021484375, -0.125, 0.72021484375, 1.5654296875, 2.41064453125, 3.255859375, 4.10107421875, 4.9462890625, 5.79150390625, 6.63671875, 7.48193359375, 8.3271484375, 9.17236328125, 10.017578125, 10.86279296875, 11.7080078125, 12.55322265625, 13.3984375, 14.24365234375, 15.0888671875, 15.93408203125, 16.779296875, 17.62451171875, 18.4697265625, 19.31494140625, 20.16015625, 21.00537109375, 21.8505859375, 22.69580078125, 23.541015625, 24.38623046875, 25.2314453125, 26.07666015625, 26.921875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 6.0, 4.0, 3.0, 9.0, 9.0, 11.0, 17.0, 20.0, 25.0, 25.0, 41.0, 43.0, 74.0, 81.0, 131.0, 151.0, 225.0, 361.0, 995.0, 11526.0, 3085771.0, 43346.0, 1530.0, 388.0, 244.0, 169.0, 124.0, 106.0, 63.0, 40.0, 38.0, 25.0, 27.0, 26.0, 12.0, 10.0, 8.0, 3.0, 10.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-77.6875, -75.5078125, -73.328125, -71.1484375, -68.96875, -66.7890625, -64.609375, -62.4296875, -60.25, -58.0703125, -55.890625, -53.7109375, -51.53125, -49.3515625, -47.171875, -44.9921875, -42.8125, -40.6328125, -38.453125, -36.2734375, -34.09375, -31.9140625, -29.734375, -27.5546875, -25.375, -23.1953125, -21.015625, -18.8359375, -16.65625, -14.4765625, -12.296875, -10.1171875, -7.9375, -5.7578125, -3.578125, -1.3984375, 0.78125, 2.9609375, 5.140625, 7.3203125, 9.5, 11.6796875, 13.859375, 16.0390625, 18.21875, 20.3984375, 22.578125, 24.7578125, 26.9375, 29.1171875, 31.296875, 33.4765625, 35.65625, 37.8359375, 40.015625, 42.1953125, 44.375, 46.5546875, 48.734375, 50.9140625, 53.09375, 55.2734375, 57.453125, 59.6328125, 61.8125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 4.0, 102.0, 733.0, 172.0, 9.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.06592559814453, -16.613964080810547, -10.162003517150879, -3.710042953491211, 2.7419185638427734, 9.193878173828125, 15.64583969116211, 22.097801208496094, 28.549762725830078, 35.00172424316406, 41.45368576049805, 47.90564727783203, 54.35760498046875, 60.809566497802734, 67.26152801513672, 73.71348571777344, 80.16545104980469, 86.6174087524414, 93.06937408447266, 99.52133178710938, 105.97329711914062, 112.42525482177734, 118.87721252441406, 125.32917785644531, 131.78114318847656, 138.2331085205078, 144.68505859375, 151.13702392578125, 157.5889892578125, 164.04095458984375, 170.49290466308594, 176.9448699951172, 183.39683532714844, 189.8488006591797, 196.30075073242188, 202.75271606445312, 209.20468139648438, 215.65664672851562, 222.1085968017578, 228.56056213378906, 235.0125274658203, 241.46449279785156, 247.91644287109375, 254.368408203125, 260.82037353515625, 267.2723388671875, 273.72430419921875, 280.17626953125, 286.6282043457031, 293.0801696777344, 299.5321350097656, 305.9841003417969, 312.43603515625, 318.88800048828125, 325.3399658203125, 331.79193115234375, 338.243896484375, 344.69586181640625, 351.1478271484375, 357.59979248046875, 364.0517272949219, 370.5036926269531, 376.9556579589844, 383.4076232910156, 389.8595886230469]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 6.0, 2.0, 5.0, 15.0, 12.0, 13.0, 18.0, 15.0, 18.0, 20.0, 21.0, 37.0, 32.0, 42.0, 41.0, 42.0, 45.0, 44.0, 34.0, 43.0, 39.0, 42.0, 39.0, 45.0, 39.0, 45.0, 31.0, 30.0, 20.0, 17.0, 32.0, 23.0, 16.0, 13.0, 10.0, 13.0, 10.0, 10.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-71.73987579345703, -69.42201232910156, -67.10415649414062, -64.78629302978516, -62.46843719482422, -60.15057373046875, -57.83271408081055, -55.514854431152344, -53.19699478149414, -50.87913513183594, -48.561275482177734, -46.24341583251953, -43.92555236816406, -41.607696533203125, -39.289833068847656, -36.97197341918945, -34.65411376953125, -32.33625411987305, -30.018394470214844, -27.700532913208008, -25.382673263549805, -23.0648136138916, -20.746952056884766, -18.429092407226562, -16.11123275756836, -13.793373107910156, -11.475512504577637, -9.157651901245117, -6.839792251586914, -4.521932601928711, -2.2040719985961914, 0.11378860473632812, 2.4316482543945312, 4.749508380889893, 7.067368507385254, 9.385229110717773, 11.703088760375977, 14.02094841003418, 16.338809967041016, 18.65666961669922, 20.974529266357422, 23.292388916015625, 25.610248565673828, 27.928110122680664, 30.245969772338867, 32.56382751464844, 34.881690979003906, 37.19955062866211, 39.51741027832031, 41.835269927978516, 44.15312957763672, 46.47098922729492, 48.788848876953125, 51.106712341308594, 53.4245719909668, 55.742431640625, 58.0602912902832, 60.378150939941406, 62.69601058959961, 65.01387023925781, 67.33173370361328, 69.64958953857422, 71.96745300292969, 74.28530883789062, 76.6031723022461]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 10.0, 9.0, 18.0, 18.0, 17.0, 19.0, 25.0, 20.0, 38.0, 24.0, 28.0, 24.0, 42.0, 37.0, 45.0, 44.0, 42.0, 52.0, 43.0, 54.0, 50.0, 31.0, 29.0, 29.0, 37.0, 26.0, 35.0, 29.0, 11.0, 17.0, 11.0, 11.0, 14.0, 8.0, 13.0, 4.0, 3.0, 6.0, 4.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7109375, -8.46295166015625, -8.2149658203125, -7.96697998046875, -7.718994140625, -7.47100830078125, -7.2230224609375, -6.97503662109375, -6.72705078125, -6.47906494140625, -6.2310791015625, -5.98309326171875, -5.735107421875, -5.48712158203125, -5.2391357421875, -4.99114990234375, -4.7431640625, -4.49517822265625, -4.2471923828125, -3.99920654296875, -3.751220703125, -3.50323486328125, -3.2552490234375, -3.00726318359375, -2.75927734375, -2.51129150390625, -2.2633056640625, -2.01531982421875, -1.767333984375, -1.51934814453125, -1.2713623046875, -1.02337646484375, -0.775390625, -0.52740478515625, -0.2794189453125, -0.03143310546875, 0.216552734375, 0.46453857421875, 0.7125244140625, 0.96051025390625, 1.20849609375, 1.45648193359375, 1.7044677734375, 1.95245361328125, 2.200439453125, 2.44842529296875, 2.6964111328125, 2.94439697265625, 3.1923828125, 3.44036865234375, 3.6883544921875, 3.93634033203125, 4.184326171875, 4.43231201171875, 4.6802978515625, 4.92828369140625, 5.17626953125, 5.42425537109375, 5.6722412109375, 5.92022705078125, 6.168212890625, 6.41619873046875, 6.6641845703125, 6.91217041015625, 7.16015625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 1.0, 3.0, 5.0, 6.0, 6.0, 12.0, 7.0, 11.0, 12.0, 30.0, 22.0, 21.0, 27.0, 25.0, 29.0, 37.0, 78.0, 185.0, 482.0, 1842.0, 13763.0, 656972.0, 3403885.0, 109534.0, 5502.0, 1032.0, 299.0, 133.0, 63.0, 43.0, 32.0, 31.0, 23.0, 24.0, 24.0, 7.0, 12.0, 14.0, 7.0, 7.0, 13.0, 6.0, 3.0, 5.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.390625, -30.4189453125, -29.447265625, -28.4755859375, -27.50390625, -26.5322265625, -25.560546875, -24.5888671875, -23.6171875, -22.6455078125, -21.673828125, -20.7021484375, -19.73046875, -18.7587890625, -17.787109375, -16.8154296875, -15.84375, -14.8720703125, -13.900390625, -12.9287109375, -11.95703125, -10.9853515625, -10.013671875, -9.0419921875, -8.0703125, -7.0986328125, -6.126953125, -5.1552734375, -4.18359375, -3.2119140625, -2.240234375, -1.2685546875, -0.296875, 0.6748046875, 1.646484375, 2.6181640625, 3.58984375, 4.5615234375, 5.533203125, 6.5048828125, 7.4765625, 8.4482421875, 9.419921875, 10.3916015625, 11.36328125, 12.3349609375, 13.306640625, 14.2783203125, 15.25, 16.2216796875, 17.193359375, 18.1650390625, 19.13671875, 20.1083984375, 21.080078125, 22.0517578125, 23.0234375, 23.9951171875, 24.966796875, 25.9384765625, 26.91015625, 27.8818359375, 28.853515625, 29.8251953125, 30.796875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 4.0, 7.0, 21.0, 26.0, 36.0, 49.0, 64.0, 109.0, 138.0, 209.0, 333.0, 503.0, 648.0, 569.0, 440.0, 291.0, 220.0, 129.0, 81.0, 54.0, 45.0, 27.0, 10.0, 21.0, 12.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.96875, -24.32568359375, -23.6826171875, -23.03955078125, -22.396484375, -21.75341796875, -21.1103515625, -20.46728515625, -19.82421875, -19.18115234375, -18.5380859375, -17.89501953125, -17.251953125, -16.60888671875, -15.9658203125, -15.32275390625, -14.6796875, -14.03662109375, -13.3935546875, -12.75048828125, -12.107421875, -11.46435546875, -10.8212890625, -10.17822265625, -9.53515625, -8.89208984375, -8.2490234375, -7.60595703125, -6.962890625, -6.31982421875, -5.6767578125, -5.03369140625, -4.390625, -3.74755859375, -3.1044921875, -2.46142578125, -1.818359375, -1.17529296875, -0.5322265625, 0.11083984375, 0.75390625, 1.39697265625, 2.0400390625, 2.68310546875, 3.326171875, 3.96923828125, 4.6123046875, 5.25537109375, 5.8984375, 6.54150390625, 7.1845703125, 7.82763671875, 8.470703125, 9.11376953125, 9.7568359375, 10.39990234375, 11.04296875, 11.68603515625, 12.3291015625, 12.97216796875, 13.615234375, 14.25830078125, 14.9013671875, 15.54443359375, 16.1875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 10.0, 22.0, 28.0, 26.0, 44.0, 43.0, 75.0, 93.0, 123.0, 193.0, 338.0, 720.0, 3030.0, 79522.0, 3969478.0, 135024.0, 3642.0, 786.0, 331.0, 196.0, 149.0, 91.0, 73.0, 57.0, 42.0, 27.0, 21.0, 18.0, 11.0, 9.0, 13.0, 9.0, 6.0, 4.0, 4.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.75, -46.9140625, -45.078125, -43.2421875, -41.40625, -39.5703125, -37.734375, -35.8984375, -34.0625, -32.2265625, -30.390625, -28.5546875, -26.71875, -24.8828125, -23.046875, -21.2109375, -19.375, -17.5390625, -15.703125, -13.8671875, -12.03125, -10.1953125, -8.359375, -6.5234375, -4.6875, -2.8515625, -1.015625, 0.8203125, 2.65625, 4.4921875, 6.328125, 8.1640625, 10.0, 11.8359375, 13.671875, 15.5078125, 17.34375, 19.1796875, 21.015625, 22.8515625, 24.6875, 26.5234375, 28.359375, 30.1953125, 32.03125, 33.8671875, 35.703125, 37.5390625, 39.375, 41.2109375, 43.046875, 44.8828125, 46.71875, 48.5546875, 50.390625, 52.2265625, 54.0625, 55.8984375, 57.734375, 59.5703125, 61.40625, 63.2421875, 65.078125, 66.9140625, 68.75]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 30.0, 65.0, 129.0, 200.0, 233.0, 178.0, 97.0, 35.0, 24.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.06806182861328, -122.05321502685547, -118.03836822509766, -114.02352142333984, -110.00867462158203, -105.99382781982422, -101.97898864746094, -97.96414184570312, -93.94929504394531, -89.9344482421875, -85.91960144042969, -81.90475463867188, -77.88990783691406, -73.87506103515625, -69.86021423339844, -65.84536743164062, -61.83052062988281, -57.815673828125, -53.80082702636719, -49.785980224609375, -45.77113342285156, -41.75628662109375, -37.7414436340332, -33.72659683227539, -29.711750030517578, -25.696903228759766, -21.682056427001953, -17.667211532592773, -13.652364730834961, -9.637517929077148, -5.622673034667969, -1.6078262329101562, 2.4070281982421875, 6.421874523162842, 10.436720848083496, 14.451566696166992, 18.466413497924805, 22.481260299682617, 26.496105194091797, 30.51095199584961, 34.52579879760742, 38.540645599365234, 42.55549240112305, 46.570335388183594, 50.585182189941406, 54.60002899169922, 58.61487579345703, 62.629722595214844, 66.64456939697266, 70.65941619873047, 74.67426300048828, 78.6891098022461, 82.7039566040039, 86.71880340576172, 90.733642578125, 94.74848937988281, 98.76333618164062, 102.77818298339844, 106.79302978515625, 110.80787658691406, 114.82272338867188, 118.83757019042969, 122.8524169921875, 126.86726379394531, 130.88211059570312]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 8.0, 9.0, 5.0, 7.0, 9.0, 14.0, 15.0, 12.0, 15.0, 24.0, 16.0, 18.0, 16.0, 17.0, 27.0, 39.0, 31.0, 37.0, 22.0, 37.0, 43.0, 43.0, 30.0, 27.0, 32.0, 33.0, 36.0, 33.0, 36.0, 48.0, 29.0, 35.0, 21.0, 23.0, 24.0, 21.0, 20.0, 15.0, 10.0, 11.0, 9.0, 11.0, 6.0, 11.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-53.89176559448242, -52.38570785522461, -50.8796501159668, -49.373592376708984, -47.867530822753906, -46.361473083496094, -44.85541534423828, -43.34935760498047, -41.843299865722656, -40.337242126464844, -38.83118438720703, -37.32512664794922, -35.819068908691406, -34.31300735473633, -32.806949615478516, -31.300891876220703, -29.79483413696289, -28.288776397705078, -26.782718658447266, -25.27665901184082, -23.770601272583008, -22.264543533325195, -20.75848388671875, -19.252426147460938, -17.746368408203125, -16.240310668945312, -14.734251976013184, -13.228193283081055, -11.722135543823242, -10.21607780456543, -8.7100191116333, -7.203960418701172, -5.697898864746094, -4.191840648651123, -2.6857824325561523, -1.1797242164611816, 0.32633399963378906, 1.8323922157287598, 3.3384504318237305, 4.844509124755859, 6.350566864013672, 7.856625080108643, 9.362683296203613, 10.868741989135742, 12.374799728393555, 13.880857467651367, 15.386916160583496, 16.892974853515625, 18.399032592773438, 19.90509033203125, 21.411148071289062, 22.917207717895508, 24.42326545715332, 25.929323196411133, 27.435382843017578, 28.94144058227539, 30.447498321533203, 31.953556060791016, 33.45961380004883, 34.96567153930664, 36.47173309326172, 37.97779083251953, 39.483848571777344, 40.989906311035156, 42.49596405029297]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 4.0, 5.0, 10.0, 15.0, 13.0, 19.0, 32.0, 16.0, 28.0, 42.0, 26.0, 48.0, 38.0, 42.0, 46.0, 53.0, 61.0, 44.0, 47.0, 56.0, 41.0, 57.0, 44.0, 37.0, 44.0, 29.0, 19.0, 16.0, 8.0, 12.0, 16.0, 4.0, 5.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0], "bins": [-12.4375, -12.1390380859375, -11.840576171875, -11.5421142578125, -11.24365234375, -10.9451904296875, -10.646728515625, -10.3482666015625, -10.0498046875, -9.7513427734375, -9.452880859375, -9.1544189453125, -8.85595703125, -8.5574951171875, -8.259033203125, -7.9605712890625, -7.662109375, -7.3636474609375, -7.065185546875, -6.7667236328125, -6.46826171875, -6.1697998046875, -5.871337890625, -5.5728759765625, -5.2744140625, -4.9759521484375, -4.677490234375, -4.3790283203125, -4.08056640625, -3.7821044921875, -3.483642578125, -3.1851806640625, -2.88671875, -2.5882568359375, -2.289794921875, -1.9913330078125, -1.69287109375, -1.3944091796875, -1.095947265625, -0.7974853515625, -0.4990234375, -0.2005615234375, 0.097900390625, 0.3963623046875, 0.69482421875, 0.9932861328125, 1.291748046875, 1.5902099609375, 1.888671875, 2.1871337890625, 2.485595703125, 2.7840576171875, 3.08251953125, 3.3809814453125, 3.679443359375, 3.9779052734375, 4.2763671875, 4.5748291015625, 4.873291015625, 5.1717529296875, 5.47021484375, 5.7686767578125, 6.067138671875, 6.3656005859375, 6.6640625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 6.0, 6.0, 8.0, 12.0, 15.0, 32.0, 39.0, 62.0, 68.0, 102.0, 166.0, 248.0, 383.0, 598.0, 838.0, 1241.0, 1805.0, 2707.0, 4120.0, 6179.0, 9380.0, 14347.0, 22094.0, 34250.0, 53545.0, 83825.0, 129496.0, 175473.0, 169578.0, 119992.0, 77645.0, 49346.0, 31368.0, 20497.0, 13125.0, 8511.0, 5817.0, 3850.0, 2496.0, 1671.0, 1153.0, 817.0, 531.0, 380.0, 236.0, 147.0, 112.0, 86.0, 53.0, 37.0, 27.0, 14.0, 14.0, 10.0, 6.0, 1.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.77294921875, -0.7487258911132812, -0.7245025634765625, -0.7002792358398438, -0.676055908203125, -0.6518325805664062, -0.6276092529296875, -0.6033859252929688, -0.57916259765625, -0.5549392700195312, -0.5307159423828125, -0.5064926147460938, -0.482269287109375, -0.45804595947265625, -0.4338226318359375, -0.40959930419921875, -0.3853759765625, -0.36115264892578125, -0.3369293212890625, -0.31270599365234375, -0.288482666015625, -0.26425933837890625, -0.2400360107421875, -0.21581268310546875, -0.19158935546875, -0.16736602783203125, -0.1431427001953125, -0.11891937255859375, -0.094696044921875, -0.07047271728515625, -0.0462493896484375, -0.02202606201171875, 0.002197265625, 0.02642059326171875, 0.0506439208984375, 0.07486724853515625, 0.099090576171875, 0.12331390380859375, 0.1475372314453125, 0.17176055908203125, 0.19598388671875, 0.22020721435546875, 0.2444305419921875, 0.26865386962890625, 0.292877197265625, 0.31710052490234375, 0.3413238525390625, 0.36554718017578125, 0.3897705078125, 0.41399383544921875, 0.4382171630859375, 0.46244049072265625, 0.486663818359375, 0.5108871459960938, 0.5351104736328125, 0.5593338012695312, 0.58355712890625, 0.6077804565429688, 0.6320037841796875, 0.6562271118164062, 0.680450439453125, 0.7046737670898438, 0.7288970947265625, 0.7531204223632812, 0.77734375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 9.0, 6.0, 7.0, 12.0, 17.0, 19.0, 28.0, 21.0, 29.0, 35.0, 37.0, 26.0, 44.0, 47.0, 52.0, 42.0, 40.0, 1071.0, 45.0, 43.0, 45.0, 52.0, 52.0, 35.0, 28.0, 26.0, 27.0, 19.0, 20.0, 16.0, 14.0, 13.0, 15.0, 10.0, 5.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.11328125, -5.9371337890625, -5.760986328125, -5.5848388671875, -5.40869140625, -5.2325439453125, -5.056396484375, -4.8802490234375, -4.7041015625, -4.5279541015625, -4.351806640625, -4.1756591796875, -3.99951171875, -3.8233642578125, -3.647216796875, -3.4710693359375, -3.294921875, -3.1187744140625, -2.942626953125, -2.7664794921875, -2.59033203125, -2.4141845703125, -2.238037109375, -2.0618896484375, -1.8857421875, -1.7095947265625, -1.533447265625, -1.3572998046875, -1.18115234375, -1.0050048828125, -0.828857421875, -0.6527099609375, -0.4765625, -0.3004150390625, -0.124267578125, 0.0518798828125, 0.22802734375, 0.4041748046875, 0.580322265625, 0.7564697265625, 0.9326171875, 1.1087646484375, 1.284912109375, 1.4610595703125, 1.63720703125, 1.8133544921875, 1.989501953125, 2.1656494140625, 2.341796875, 2.5179443359375, 2.694091796875, 2.8702392578125, 3.04638671875, 3.2225341796875, 3.398681640625, 3.5748291015625, 3.7509765625, 3.9271240234375, 4.103271484375, 4.2794189453125, 4.45556640625, 4.6317138671875, 4.807861328125, 4.9840087890625, 5.16015625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 3.0, 8.0, 5.0, 10.0, 12.0, 20.0, 35.0, 47.0, 63.0, 121.0, 157.0, 245.0, 359.0, 518.0, 737.0, 1119.0, 1680.0, 2569.0, 3993.0, 5874.0, 9044.0, 13536.0, 20908.0, 32458.0, 49521.0, 76373.0, 116018.0, 163149.0, 1220341.0, 129512.0, 86249.0, 55674.0, 36470.0, 23736.0, 15655.0, 10371.0, 6967.0, 4459.0, 3057.0, 2032.0, 1383.0, 900.0, 578.0, 364.0, 251.0, 178.0, 122.0, 96.0, 56.0, 46.0, 17.0, 18.0, 10.0, 8.0, 6.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.68212890625, -0.6602249145507812, -0.6383209228515625, -0.6164169311523438, -0.594512939453125, -0.5726089477539062, -0.5507049560546875, -0.5288009643554688, -0.50689697265625, -0.48499298095703125, -0.4630889892578125, -0.44118499755859375, -0.419281005859375, -0.39737701416015625, -0.3754730224609375, -0.35356903076171875, -0.3316650390625, -0.30976104736328125, -0.2878570556640625, -0.26595306396484375, -0.244049072265625, -0.22214508056640625, -0.2002410888671875, -0.17833709716796875, -0.15643310546875, -0.13452911376953125, -0.1126251220703125, -0.09072113037109375, -0.068817138671875, -0.04691314697265625, -0.0250091552734375, -0.00310516357421875, 0.018798828125, 0.04070281982421875, 0.0626068115234375, 0.08451080322265625, 0.106414794921875, 0.12831878662109375, 0.1502227783203125, 0.17212677001953125, 0.19403076171875, 0.21593475341796875, 0.2378387451171875, 0.25974273681640625, 0.281646728515625, 0.30355072021484375, 0.3254547119140625, 0.34735870361328125, 0.3692626953125, 0.39116668701171875, 0.4130706787109375, 0.43497467041015625, 0.456878662109375, 0.47878265380859375, 0.5006866455078125, 0.5225906372070312, 0.54449462890625, 0.5663986206054688, 0.5883026123046875, 0.6102066040039062, 0.632110595703125, 0.6540145874023438, 0.6759185791015625, 0.6978225708007812, 0.7197265625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 6.0, 6.0, 8.0, 12.0, 10.0, 15.0, 16.0, 28.0, 35.0, 26.0, 50.0, 51.0, 57.0, 67.0, 64.0, 87.0, 71.0, 58.0, 46.0, 72.0, 42.0, 30.0, 36.0, 25.0, 18.0, 18.0, 14.0, 5.0, 7.0, 4.0, 5.0, 7.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0030231475830078125, -0.002939939498901367, -0.002856731414794922, -0.0027735233306884766, -0.0026903152465820312, -0.002607107162475586, -0.0025238990783691406, -0.0024406909942626953, -0.00235748291015625, -0.0022742748260498047, -0.0021910667419433594, -0.002107858657836914, -0.0020246505737304688, -0.0019414424896240234, -0.0018582344055175781, -0.0017750263214111328, -0.0016918182373046875, -0.0016086101531982422, -0.0015254020690917969, -0.0014421939849853516, -0.0013589859008789062, -0.001275777816772461, -0.0011925697326660156, -0.0011093616485595703, -0.001026153564453125, -0.0009429454803466797, -0.0008597373962402344, -0.0007765293121337891, -0.0006933212280273438, -0.0006101131439208984, -0.0005269050598144531, -0.0004436969757080078, -0.0003604888916015625, -0.0002772808074951172, -0.00019407272338867188, -0.00011086463928222656, -2.765655517578125e-05, 5.555152893066406e-05, 0.00013875961303710938, 0.0002219676971435547, 0.00030517578125, 0.0003883838653564453, 0.0004715919494628906, 0.0005548000335693359, 0.0006380081176757812, 0.0007212162017822266, 0.0008044242858886719, 0.0008876323699951172, 0.0009708404541015625, 0.0010540485382080078, 0.0011372566223144531, 0.0012204647064208984, 0.0013036727905273438, 0.001386880874633789, 0.0014700889587402344, 0.0015532970428466797, 0.001636505126953125, 0.0017197132110595703, 0.0018029212951660156, 0.001886129379272461, 0.0019693374633789062, 0.0020525455474853516, 0.002135753631591797, 0.002218961715698242, 0.0023021697998046875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 8.0, 8.0, 4.0, 5.0, 9.0, 7.0, 9.0, 20.0, 21.0, 34.0, 45.0, 55.0, 73.0, 122.0, 203.0, 559.0, 3706.0, 1038087.0, 4411.0, 574.0, 225.0, 119.0, 72.0, 51.0, 24.0, 31.0, 21.0, 14.0, 10.0, 13.0, 7.0, 4.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05108642578125, -0.049160003662109375, -0.04723358154296875, -0.045307159423828125, -0.0433807373046875, -0.041454315185546875, -0.03952789306640625, -0.037601470947265625, -0.035675048828125, -0.033748626708984375, -0.03182220458984375, -0.029895782470703125, -0.0279693603515625, -0.026042938232421875, -0.02411651611328125, -0.022190093994140625, -0.020263671875, -0.018337249755859375, -0.01641082763671875, -0.014484405517578125, -0.0125579833984375, -0.010631561279296875, -0.00870513916015625, -0.006778717041015625, -0.004852294921875, -0.002925872802734375, -0.00099945068359375, 0.000926971435546875, 0.0028533935546875, 0.004779815673828125, 0.00670623779296875, 0.008632659912109375, 0.01055908203125, 0.012485504150390625, 0.01441192626953125, 0.016338348388671875, 0.0182647705078125, 0.020191192626953125, 0.02211761474609375, 0.024044036865234375, 0.025970458984375, 0.027896881103515625, 0.02982330322265625, 0.031749725341796875, 0.0336761474609375, 0.035602569580078125, 0.03752899169921875, 0.039455413818359375, 0.0413818359375, 0.043308258056640625, 0.04523468017578125, 0.047161102294921875, 0.0490875244140625, 0.051013946533203125, 0.05294036865234375, 0.054866790771484375, 0.056793212890625, 0.058719635009765625, 0.06064605712890625, 0.06257247924804688, 0.0644989013671875, 0.06642532348632812, 0.06835174560546875, 0.07027816772460938, 0.07220458984375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 8.0, 19.0, 47.0, 92.0, 202.0, 215.0, 210.0, 145.0, 53.0, 12.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020850494038313627, -0.0019967141561210155, -0.001908379141241312, -0.0018200440099462867, -0.0017317088786512613, -0.001643373747356236, -0.0015550386160612106, -0.0014667034847661853, -0.00137836835347116, -0.0012900332221761346, -0.0012016980908811092, -0.0011133629595860839, -0.0010250278282910585, -0.0009366926969960332, -0.0008483575657010078, -0.0007600224344059825, -0.0006716873031109571, -0.0005833521718159318, -0.0004950170405209064, -0.0004066819092258811, -0.00031834677793085575, -0.0002300116466358304, -0.00014167651534080505, -5.3341384045779705e-05, 3.4993747249245644e-05, 0.000123328878544271, 0.00021166400983929634, 0.0002999991411343217, 0.00038833427242934704, 0.0004766694037243724, 0.0005650045350193977, 0.0006533396663144231, 0.0007416745647788048, 0.0008300096960738301, 0.0009183448273688555, 0.0010066799586638808, 0.0010950150899589062, 0.0011833502212539315, 0.0012716853525489569, 0.0013600204838439822, 0.0014483556151390076, 0.001536690746434033, 0.0016250258777290583, 0.0017133610090240836, 0.001801696140319109, 0.0018900312716141343, 0.0019783664029091597, 0.002066701650619507, 0.0021550366654992104, 0.002243371680378914, 0.002331706928089261, 0.0024200421757996082, 0.0025083771906793118, 0.0025967122055590153, 0.0026850474532693624, 0.0027733827009797096, 0.002861717715859413, 0.0029500527307391167, 0.003038387978449464, 0.003126723226159811, 0.0032150582410395145, 0.003303393255919218, 0.0033917285036295652, 0.0034800637513399124, 0.003568398766219616]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 8.0, 6.0, 6.0, 17.0, 14.0, 8.0, 13.0, 22.0, 17.0, 25.0, 26.0, 26.0, 32.0, 36.0, 42.0, 35.0, 39.0, 44.0, 43.0, 42.0, 43.0, 43.0, 35.0, 39.0, 30.0, 41.0, 35.0, 44.0, 26.0, 29.0, 22.0, 23.0, 11.0, 14.0, 12.0, 14.0, 5.0, 12.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0012227296829223633, -0.001185067929327488, -0.0011474061757326126, -0.0011097444221377373, -0.001072082668542862, -0.0010344209149479866, -0.0009967591613531113, -0.0009590974077582359, -0.0009214356541633606, -0.0008837739005684853, -0.0008461121469736099, -0.0008084503933787346, -0.0007707886397838593, -0.0007331268861889839, -0.0006954651325941086, -0.0006578033789992332, -0.0006201416254043579, -0.0005824798718094826, -0.0005448181182146072, -0.0005071563646197319, -0.00046949461102485657, -0.00043183285742998123, -0.0003941711038351059, -0.00035650935024023056, -0.0003188475966453552, -0.0002811858430504799, -0.00024352408945560455, -0.00020586233586072922, -0.00016820058226585388, -0.00013053882867097855, -9.287707507610321e-05, -5.5215321481227875e-05, -1.755356788635254e-05, 2.0108185708522797e-05, 5.776993930339813e-05, 9.543169289827347e-05, 0.0001330934464931488, 0.00017075520008802414, 0.00020841695368289948, 0.0002460787072777748, 0.00028374046087265015, 0.0003214022144675255, 0.0003590639680624008, 0.00039672572165727615, 0.0004343874752521515, 0.0004720492288470268, 0.0005097109824419022, 0.0005473727360367775, 0.0005850344896316528, 0.0006226962432265282, 0.0006603579968214035, 0.0006980197504162788, 0.0007356815040111542, 0.0007733432576060295, 0.0008110050112009048, 0.0008486667647957802, 0.0008863285183906555, 0.0009239902719855309, 0.0009616520255804062, 0.0009993137791752815, 0.0010369755327701569, 0.0010746372863650322, 0.0011122990399599075, 0.0011499607935547829, 0.0011876225471496582]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 4.0, 5.0, 10.0, 15.0, 13.0, 17.0, 34.0, 16.0, 28.0, 42.0, 26.0, 46.0, 40.0, 41.0, 47.0, 53.0, 61.0, 44.0, 45.0, 58.0, 41.0, 57.0, 44.0, 36.0, 45.0, 29.0, 19.0, 16.0, 8.0, 12.0, 16.0, 4.0, 5.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0], "bins": [-12.4453125, -12.146728515625, -11.84814453125, -11.549560546875, -11.2509765625, -10.952392578125, -10.65380859375, -10.355224609375, -10.056640625, -9.758056640625, -9.45947265625, -9.160888671875, -8.8623046875, -8.563720703125, -8.26513671875, -7.966552734375, -7.66796875, -7.369384765625, -7.07080078125, -6.772216796875, -6.4736328125, -6.175048828125, -5.87646484375, -5.577880859375, -5.279296875, -4.980712890625, -4.68212890625, -4.383544921875, -4.0849609375, -3.786376953125, -3.48779296875, -3.189208984375, -2.890625, -2.592041015625, -2.29345703125, -1.994873046875, -1.6962890625, -1.397705078125, -1.09912109375, -0.800537109375, -0.501953125, -0.203369140625, 0.09521484375, 0.393798828125, 0.6923828125, 0.990966796875, 1.28955078125, 1.588134765625, 1.88671875, 2.185302734375, 2.48388671875, 2.782470703125, 3.0810546875, 3.379638671875, 3.67822265625, 3.976806640625, 4.275390625, 4.573974609375, 4.87255859375, 5.171142578125, 5.4697265625, 5.768310546875, 6.06689453125, 6.365478515625, 6.6640625]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 11.0, 8.0, 8.0, 24.0, 24.0, 31.0, 48.0, 84.0, 80.0, 146.0, 213.0, 334.0, 444.0, 880.0, 1419.0, 2652.0, 5552.0, 12786.0, 34345.0, 125610.0, 593395.0, 193671.0, 46069.0, 16346.0, 6723.0, 3282.0, 1689.0, 969.0, 605.0, 367.0, 220.0, 147.0, 100.0, 77.0, 48.0, 46.0, 25.0, 17.0, 14.0, 12.0, 9.0, 3.0, 7.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.265625, -8.9901123046875, -8.714599609375, -8.4390869140625, -8.16357421875, -7.8880615234375, -7.612548828125, -7.3370361328125, -7.0615234375, -6.7860107421875, -6.510498046875, -6.2349853515625, -5.95947265625, -5.6839599609375, -5.408447265625, -5.1329345703125, -4.857421875, -4.5819091796875, -4.306396484375, -4.0308837890625, -3.75537109375, -3.4798583984375, -3.204345703125, -2.9288330078125, -2.6533203125, -2.3778076171875, -2.102294921875, -1.8267822265625, -1.55126953125, -1.2757568359375, -1.000244140625, -0.7247314453125, -0.44921875, -0.1737060546875, 0.101806640625, 0.3773193359375, 0.65283203125, 0.9283447265625, 1.203857421875, 1.4793701171875, 1.7548828125, 2.0303955078125, 2.305908203125, 2.5814208984375, 2.85693359375, 3.1324462890625, 3.407958984375, 3.6834716796875, 3.958984375, 4.2344970703125, 4.510009765625, 4.7855224609375, 5.06103515625, 5.3365478515625, 5.612060546875, 5.8875732421875, 6.1630859375, 6.4385986328125, 6.714111328125, 6.9896240234375, 7.26513671875, 7.5406494140625, 7.816162109375, 8.0916748046875, 8.3671875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 4.0, 6.0, 5.0, 5.0, 10.0, 16.0, 15.0, 14.0, 26.0, 30.0, 21.0, 24.0, 23.0, 40.0, 38.0, 39.0, 36.0, 49.0, 62.0, 93.0, 273.0, 1604.0, 139.0, 71.0, 50.0, 47.0, 32.0, 38.0, 44.0, 31.0, 35.0, 21.0, 11.0, 17.0, 17.0, 14.0, 11.0, 8.0, 9.0, 9.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.34375, -23.537109375, -22.73046875, -21.923828125, -21.1171875, -20.310546875, -19.50390625, -18.697265625, -17.890625, -17.083984375, -16.27734375, -15.470703125, -14.6640625, -13.857421875, -13.05078125, -12.244140625, -11.4375, -10.630859375, -9.82421875, -9.017578125, -8.2109375, -7.404296875, -6.59765625, -5.791015625, -4.984375, -4.177734375, -3.37109375, -2.564453125, -1.7578125, -0.951171875, -0.14453125, 0.662109375, 1.46875, 2.275390625, 3.08203125, 3.888671875, 4.6953125, 5.501953125, 6.30859375, 7.115234375, 7.921875, 8.728515625, 9.53515625, 10.341796875, 11.1484375, 11.955078125, 12.76171875, 13.568359375, 14.375, 15.181640625, 15.98828125, 16.794921875, 17.6015625, 18.408203125, 19.21484375, 20.021484375, 20.828125, 21.634765625, 22.44140625, 23.248046875, 24.0546875, 24.861328125, 25.66796875, 26.474609375, 27.28125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 6.0, 6.0, 5.0, 11.0, 12.0, 14.0, 14.0, 29.0, 40.0, 48.0, 61.0, 101.0, 144.0, 183.0, 327.0, 668.0, 3667.0, 2815211.0, 321461.0, 2161.0, 569.0, 288.0, 173.0, 137.0, 87.0, 74.0, 59.0, 41.0, 35.0, 24.0, 12.0, 18.0, 10.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0], "bins": [-102.6875, -100.17724609375, -97.6669921875, -95.15673828125, -92.646484375, -90.13623046875, -87.6259765625, -85.11572265625, -82.60546875, -80.09521484375, -77.5849609375, -75.07470703125, -72.564453125, -70.05419921875, -67.5439453125, -65.03369140625, -62.5234375, -60.01318359375, -57.5029296875, -54.99267578125, -52.482421875, -49.97216796875, -47.4619140625, -44.95166015625, -42.44140625, -39.93115234375, -37.4208984375, -34.91064453125, -32.400390625, -29.89013671875, -27.3798828125, -24.86962890625, -22.359375, -19.84912109375, -17.3388671875, -14.82861328125, -12.318359375, -9.80810546875, -7.2978515625, -4.78759765625, -2.27734375, 0.23291015625, 2.7431640625, 5.25341796875, 7.763671875, 10.27392578125, 12.7841796875, 15.29443359375, 17.8046875, 20.31494140625, 22.8251953125, 25.33544921875, 27.845703125, 30.35595703125, 32.8662109375, 35.37646484375, 37.88671875, 40.39697265625, 42.9072265625, 45.41748046875, 47.927734375, 50.43798828125, 52.9482421875, 55.45849609375, 57.96875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [4.0, 18.0, 365.0, 617.0, 18.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.727123260498047, -17.595252990722656, -9.463380813598633, -1.3315086364746094, 6.800361633300781, 14.932231903076172, 23.064105987548828, 31.19597625732422, 39.32784652709961, 47.459716796875, 55.591590881347656, 63.72346115112305, 71.85533142089844, 79.98719787597656, 88.11907958984375, 96.25094604492188, 104.3828125, 112.51468658447266, 120.64655303955078, 128.77842712402344, 136.91029357910156, 145.04217529296875, 153.17404174804688, 161.305908203125, 169.4377899169922, 177.5696563720703, 185.7015380859375, 193.83340454101562, 201.96527099609375, 210.09713745117188, 218.22901916503906, 226.3608856201172, 234.49273681640625, 242.62460327148438, 250.75648498535156, 258.88836669921875, 267.0202331542969, 275.152099609375, 283.2839660644531, 291.41583251953125, 299.5476989746094, 307.6795654296875, 315.8114318847656, 323.94329833984375, 332.0751953125, 340.2070617675781, 348.33892822265625, 356.4707946777344, 364.6026611328125, 372.7345275878906, 380.86639404296875, 388.998291015625, 397.1301574707031, 405.26202392578125, 413.3938903808594, 421.5257568359375, 429.65765380859375, 437.7895202636719, 445.92138671875, 454.05328369140625, 462.1851501464844, 470.3170166015625, 478.4488830566406, 486.58074951171875, 494.7126159667969]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 6.0, 5.0, 14.0, 6.0, 6.0, 14.0, 13.0, 18.0, 21.0, 23.0, 27.0, 31.0, 34.0, 44.0, 21.0, 30.0, 29.0, 38.0, 32.0, 41.0, 43.0, 28.0, 45.0, 36.0, 39.0, 31.0, 34.0, 28.0, 28.0, 38.0, 27.0, 24.0, 20.0, 14.0, 21.0, 10.0, 15.0, 7.0, 8.0, 10.0, 2.0, 9.0, 3.0, 3.0, 3.0, 6.0, 4.0, 4.0, 0.0, 3.0], "bins": [-75.50237274169922, -73.35677337646484, -71.21117401123047, -69.0655746459961, -66.91996765136719, -64.77436828613281, -62.62876892089844, -60.48316955566406, -58.33757019042969, -56.19197082519531, -54.04637145996094, -51.9007682800293, -49.75516891479492, -47.60956954956055, -45.463966369628906, -43.31836700439453, -41.172767639160156, -39.02716827392578, -36.881568908691406, -34.735965728759766, -32.59036636352539, -30.444766998291016, -28.299165725708008, -26.153564453125, -24.007965087890625, -21.86236572265625, -19.716764450073242, -17.571163177490234, -15.42556381225586, -13.279963493347168, -11.134363174438477, -8.988762855529785, -6.843158721923828, -4.697558403015137, -2.5519580841064453, -0.4063577651977539, 1.7392425537109375, 3.884842872619629, 6.03044319152832, 8.176043510437012, 10.321643829345703, 12.467244148254395, 14.612844467163086, 16.758445739746094, 18.90404510498047, 21.049644470214844, 23.19524574279785, 25.34084701538086, 27.486446380615234, 29.63204574584961, 31.777647018432617, 33.923248291015625, 36.06884765625, 38.214447021484375, 40.36004638671875, 42.50564956665039, 44.651248931884766, 46.79684829711914, 48.94245147705078, 51.088050842285156, 53.23365020751953, 55.379249572753906, 57.52484893798828, 59.67045211791992, 61.8160514831543]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 5.0, 5.0, 7.0, 14.0, 14.0, 13.0, 23.0, 26.0, 21.0, 34.0, 41.0, 40.0, 37.0, 41.0, 45.0, 49.0, 56.0, 57.0, 43.0, 54.0, 56.0, 54.0, 42.0, 38.0, 38.0, 32.0, 30.0, 22.0, 8.0, 12.0, 9.0, 5.0, 8.0, 11.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-13.1953125, -12.86639404296875, -12.5374755859375, -12.20855712890625, -11.879638671875, -11.55072021484375, -11.2218017578125, -10.89288330078125, -10.56396484375, -10.23504638671875, -9.9061279296875, -9.57720947265625, -9.248291015625, -8.91937255859375, -8.5904541015625, -8.26153564453125, -7.9326171875, -7.60369873046875, -7.2747802734375, -6.94586181640625, -6.616943359375, -6.28802490234375, -5.9591064453125, -5.63018798828125, -5.30126953125, -4.97235107421875, -4.6434326171875, -4.31451416015625, -3.985595703125, -3.65667724609375, -3.3277587890625, -2.99884033203125, -2.669921875, -2.34100341796875, -2.0120849609375, -1.68316650390625, -1.354248046875, -1.02532958984375, -0.6964111328125, -0.36749267578125, -0.03857421875, 0.29034423828125, 0.6192626953125, 0.94818115234375, 1.277099609375, 1.60601806640625, 1.9349365234375, 2.26385498046875, 2.5927734375, 2.92169189453125, 3.2506103515625, 3.57952880859375, 3.908447265625, 4.23736572265625, 4.5662841796875, 4.89520263671875, 5.22412109375, 5.55303955078125, 5.8819580078125, 6.21087646484375, 6.539794921875, 6.86871337890625, 7.1976318359375, 7.52655029296875, 7.85546875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 4.0, 4.0, 7.0, 11.0, 11.0, 16.0, 23.0, 20.0, 29.0, 37.0, 39.0, 46.0, 50.0, 185.0, 668.0, 4039.0, 82936.0, 3574762.0, 520338.0, 9383.0, 1099.0, 215.0, 89.0, 56.0, 32.0, 38.0, 36.0, 23.0, 24.0, 9.0, 10.0, 11.0, 7.0, 7.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-44.0, -42.8623046875, -41.724609375, -40.5869140625, -39.44921875, -38.3115234375, -37.173828125, -36.0361328125, -34.8984375, -33.7607421875, -32.623046875, -31.4853515625, -30.34765625, -29.2099609375, -28.072265625, -26.9345703125, -25.796875, -24.6591796875, -23.521484375, -22.3837890625, -21.24609375, -20.1083984375, -18.970703125, -17.8330078125, -16.6953125, -15.5576171875, -14.419921875, -13.2822265625, -12.14453125, -11.0068359375, -9.869140625, -8.7314453125, -7.59375, -6.4560546875, -5.318359375, -4.1806640625, -3.04296875, -1.9052734375, -0.767578125, 0.3701171875, 1.5078125, 2.6455078125, 3.783203125, 4.9208984375, 6.05859375, 7.1962890625, 8.333984375, 9.4716796875, 10.609375, 11.7470703125, 12.884765625, 14.0224609375, 15.16015625, 16.2978515625, 17.435546875, 18.5732421875, 19.7109375, 20.8486328125, 21.986328125, 23.1240234375, 24.26171875, 25.3994140625, 26.537109375, 27.6748046875, 28.8125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 6.0, 11.0, 3.0, 15.0, 28.0, 36.0, 43.0, 60.0, 84.0, 130.0, 180.0, 280.0, 446.0, 568.0, 604.0, 520.0, 319.0, 231.0, 172.0, 106.0, 59.0, 48.0, 41.0, 21.0, 17.0, 11.0, 10.0, 8.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.25, -22.607177734375, -21.96435546875, -21.321533203125, -20.6787109375, -20.035888671875, -19.39306640625, -18.750244140625, -18.107421875, -17.464599609375, -16.82177734375, -16.178955078125, -15.5361328125, -14.893310546875, -14.25048828125, -13.607666015625, -12.96484375, -12.322021484375, -11.67919921875, -11.036376953125, -10.3935546875, -9.750732421875, -9.10791015625, -8.465087890625, -7.822265625, -7.179443359375, -6.53662109375, -5.893798828125, -5.2509765625, -4.608154296875, -3.96533203125, -3.322509765625, -2.6796875, -2.036865234375, -1.39404296875, -0.751220703125, -0.1083984375, 0.534423828125, 1.17724609375, 1.820068359375, 2.462890625, 3.105712890625, 3.74853515625, 4.391357421875, 5.0341796875, 5.677001953125, 6.31982421875, 6.962646484375, 7.60546875, 8.248291015625, 8.89111328125, 9.533935546875, 10.1767578125, 10.819580078125, 11.46240234375, 12.105224609375, 12.748046875, 13.390869140625, 14.03369140625, 14.676513671875, 15.3193359375, 15.962158203125, 16.60498046875, 17.247802734375, 17.890625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 7.0, 14.0, 19.0, 14.0, 20.0, 28.0, 43.0, 66.0, 67.0, 106.0, 127.0, 183.0, 274.0, 398.0, 825.0, 5208.0, 728649.0, 3441728.0, 13957.0, 1038.0, 429.0, 279.0, 213.0, 146.0, 99.0, 80.0, 64.0, 56.0, 37.0, 24.0, 21.0, 19.0, 5.0, 4.0, 5.0, 10.0, 3.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.4375, -58.36328125, -56.2890625, -54.21484375, -52.140625, -50.06640625, -47.9921875, -45.91796875, -43.84375, -41.76953125, -39.6953125, -37.62109375, -35.546875, -33.47265625, -31.3984375, -29.32421875, -27.25, -25.17578125, -23.1015625, -21.02734375, -18.953125, -16.87890625, -14.8046875, -12.73046875, -10.65625, -8.58203125, -6.5078125, -4.43359375, -2.359375, -0.28515625, 1.7890625, 3.86328125, 5.9375, 8.01171875, 10.0859375, 12.16015625, 14.234375, 16.30859375, 18.3828125, 20.45703125, 22.53125, 24.60546875, 26.6796875, 28.75390625, 30.828125, 32.90234375, 34.9765625, 37.05078125, 39.125, 41.19921875, 43.2734375, 45.34765625, 47.421875, 49.49609375, 51.5703125, 53.64453125, 55.71875, 57.79296875, 59.8671875, 61.94140625, 64.015625, 66.08984375, 68.1640625, 70.23828125, 72.3125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 47.0, 238.0, 423.0, 256.0, 40.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.61260986328125, -80.15702056884766, -71.70143127441406, -63.24584197998047, -54.790252685546875, -46.33466339111328, -37.87907409667969, -29.423484802246094, -20.9678955078125, -12.512306213378906, -4.0567169189453125, 4.398872375488281, 12.854461669921875, 21.31005096435547, 29.765640258789062, 38.221229553222656, 46.67681884765625, 55.132408142089844, 63.58799743652344, 72.04358673095703, 80.49917602539062, 88.95476531982422, 97.41035461425781, 105.8659439086914, 114.321533203125, 122.7771224975586, 131.2327117919922, 139.68829345703125, 148.14389038085938, 156.5994873046875, 165.05506896972656, 173.51065063476562, 181.96624755859375, 190.42184448242188, 198.87742614746094, 207.3330078125, 215.78860473632812, 224.24420166015625, 232.6997833251953, 241.15536499023438, 249.6109619140625, 258.0665588378906, 266.52215576171875, 274.97772216796875, 283.4333190917969, 291.888916015625, 300.344482421875, 308.8000793457031, 317.25567626953125, 325.7112731933594, 334.1668701171875, 342.6224365234375, 351.0780334472656, 359.53363037109375, 367.98919677734375, 376.4447937011719, 384.900390625, 393.3559875488281, 401.81158447265625, 410.26715087890625, 418.7227478027344, 427.1783447265625, 435.6339111328125, 444.0895080566406, 452.54510498046875]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 8.0, 3.0, 4.0, 10.0, 9.0, 13.0, 9.0, 12.0, 21.0, 23.0, 22.0, 19.0, 25.0, 40.0, 41.0, 37.0, 47.0, 45.0, 44.0, 45.0, 30.0, 43.0, 51.0, 37.0, 43.0, 46.0, 34.0, 35.0, 40.0, 31.0, 20.0, 16.0, 19.0, 9.0, 16.0, 8.0, 17.0, 9.0, 8.0, 4.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.903717041015625, -50.103485107421875, -48.30325698852539, -46.50302505493164, -44.702796936035156, -42.902565002441406, -41.102333068847656, -39.302101135253906, -37.50187301635742, -35.70164108276367, -33.90141296386719, -32.10118103027344, -30.30095100402832, -28.500720977783203, -26.700489044189453, -24.900259017944336, -23.10002899169922, -21.2997989654541, -19.499568939208984, -17.699337005615234, -15.899106979370117, -14.098876953125, -12.298645973205566, -10.498414993286133, -8.698184967041016, -6.89795446395874, -5.097723960876465, -3.2974934577941895, -1.497262954711914, 0.3029670715332031, 2.1031980514526367, 3.9034290313720703, 5.703662872314453, 7.5038933753967285, 9.304123878479004, 11.104354858398438, 12.904584884643555, 14.704814910888672, 16.505046844482422, 18.30527687072754, 20.105506896972656, 21.905736923217773, 23.70596694946289, 25.50619888305664, 27.306428909301758, 29.106658935546875, 30.906890869140625, 32.707122802734375, 34.50735092163086, 36.30758285522461, 38.107810974121094, 39.908042907714844, 41.708274841308594, 43.50850296020508, 45.30873489379883, 47.10896301269531, 48.90919494628906, 50.70942687988281, 52.5096549987793, 54.30988693237305, 56.11011505126953, 57.91034698486328, 59.71057891845703, 61.51081085205078, 63.311038970947266]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 1.0, 5.0, 8.0, 12.0, 13.0, 17.0, 24.0, 19.0, 16.0, 29.0, 29.0, 39.0, 34.0, 33.0, 46.0, 38.0, 40.0, 47.0, 61.0, 44.0, 63.0, 31.0, 40.0, 45.0, 36.0, 34.0, 29.0, 39.0, 26.0, 22.0, 19.0, 15.0, 8.0, 6.0, 6.0, 9.0, 10.0, 1.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.453125, -10.1597900390625, -9.866455078125, -9.5731201171875, -9.27978515625, -8.9864501953125, -8.693115234375, -8.3997802734375, -8.1064453125, -7.8131103515625, -7.519775390625, -7.2264404296875, -6.93310546875, -6.6397705078125, -6.346435546875, -6.0531005859375, -5.759765625, -5.4664306640625, -5.173095703125, -4.8797607421875, -4.58642578125, -4.2930908203125, -3.999755859375, -3.7064208984375, -3.4130859375, -3.1197509765625, -2.826416015625, -2.5330810546875, -2.23974609375, -1.9464111328125, -1.653076171875, -1.3597412109375, -1.06640625, -0.7730712890625, -0.479736328125, -0.1864013671875, 0.10693359375, 0.4002685546875, 0.693603515625, 0.9869384765625, 1.2802734375, 1.5736083984375, 1.866943359375, 2.1602783203125, 2.45361328125, 2.7469482421875, 3.040283203125, 3.3336181640625, 3.626953125, 3.9202880859375, 4.213623046875, 4.5069580078125, 4.80029296875, 5.0936279296875, 5.386962890625, 5.6802978515625, 5.9736328125, 6.2669677734375, 6.560302734375, 6.8536376953125, 7.14697265625, 7.4403076171875, 7.733642578125, 8.0269775390625, 8.3203125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 5.0, 3.0, 11.0, 9.0, 12.0, 18.0, 19.0, 38.0, 51.0, 62.0, 113.0, 166.0, 257.0, 362.0, 510.0, 881.0, 1196.0, 1844.0, 2817.0, 4131.0, 6175.0, 9380.0, 14076.0, 20975.0, 32177.0, 48405.0, 74260.0, 111812.0, 155229.0, 167756.0, 132470.0, 89447.0, 58828.0, 38954.0, 25523.0, 17043.0, 10969.0, 7559.0, 5003.0, 3368.0, 2101.0, 1496.0, 986.0, 687.0, 489.0, 277.0, 204.0, 132.0, 82.0, 62.0, 39.0, 34.0, 18.0, 11.0, 11.0, 10.0, 4.0, 7.0, 1.0, 1.0, 2.0], "bins": [-0.794921875, -0.7702560424804688, -0.7455902099609375, -0.7209243774414062, -0.696258544921875, -0.6715927124023438, -0.6469268798828125, -0.6222610473632812, -0.59759521484375, -0.5729293823242188, -0.5482635498046875, -0.5235977172851562, -0.498931884765625, -0.47426605224609375, -0.4496002197265625, -0.42493438720703125, -0.4002685546875, -0.37560272216796875, -0.3509368896484375, -0.32627105712890625, -0.301605224609375, -0.27693939208984375, -0.2522735595703125, -0.22760772705078125, -0.20294189453125, -0.17827606201171875, -0.1536102294921875, -0.12894439697265625, -0.104278564453125, -0.07961273193359375, -0.0549468994140625, -0.03028106689453125, -0.005615234375, 0.01905059814453125, 0.0437164306640625, 0.06838226318359375, 0.093048095703125, 0.11771392822265625, 0.1423797607421875, 0.16704559326171875, 0.19171142578125, 0.21637725830078125, 0.2410430908203125, 0.26570892333984375, 0.290374755859375, 0.31504058837890625, 0.3397064208984375, 0.36437225341796875, 0.3890380859375, 0.41370391845703125, 0.4383697509765625, 0.46303558349609375, 0.487701416015625, 0.5123672485351562, 0.5370330810546875, 0.5616989135742188, 0.58636474609375, 0.6110305786132812, 0.6356964111328125, 0.6603622436523438, 0.685028076171875, 0.7096939086914062, 0.7343597412109375, 0.7590255737304688, 0.78369140625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 7.0, 7.0, 3.0, 13.0, 9.0, 14.0, 15.0, 10.0, 14.0, 24.0, 15.0, 34.0, 26.0, 32.0, 34.0, 36.0, 26.0, 46.0, 34.0, 43.0, 45.0, 1064.0, 52.0, 45.0, 34.0, 35.0, 39.0, 27.0, 37.0, 26.0, 24.0, 20.0, 20.0, 15.0, 25.0, 12.0, 10.0, 13.0, 11.0, 5.0, 6.0, 6.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0], "bins": [-5.46875, -5.30584716796875, -5.1429443359375, -4.98004150390625, -4.817138671875, -4.65423583984375, -4.4913330078125, -4.32843017578125, -4.16552734375, -4.00262451171875, -3.8397216796875, -3.67681884765625, -3.513916015625, -3.35101318359375, -3.1881103515625, -3.02520751953125, -2.8623046875, -2.69940185546875, -2.5364990234375, -2.37359619140625, -2.210693359375, -2.04779052734375, -1.8848876953125, -1.72198486328125, -1.55908203125, -1.39617919921875, -1.2332763671875, -1.07037353515625, -0.907470703125, -0.74456787109375, -0.5816650390625, -0.41876220703125, -0.255859375, -0.09295654296875, 0.0699462890625, 0.23284912109375, 0.395751953125, 0.55865478515625, 0.7215576171875, 0.88446044921875, 1.04736328125, 1.21026611328125, 1.3731689453125, 1.53607177734375, 1.698974609375, 1.86187744140625, 2.0247802734375, 2.18768310546875, 2.3505859375, 2.51348876953125, 2.6763916015625, 2.83929443359375, 3.002197265625, 3.16510009765625, 3.3280029296875, 3.49090576171875, 3.65380859375, 3.81671142578125, 3.9796142578125, 4.14251708984375, 4.305419921875, 4.46832275390625, 4.6312255859375, 4.79412841796875, 4.95703125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 5.0, 6.0, 5.0, 14.0, 21.0, 29.0, 38.0, 54.0, 72.0, 110.0, 144.0, 222.0, 311.0, 466.0, 577.0, 839.0, 1239.0, 1781.0, 2678.0, 3907.0, 5598.0, 8073.0, 11749.0, 17233.0, 25317.0, 37222.0, 55322.0, 83131.0, 123285.0, 1211242.0, 157534.0, 114123.0, 76025.0, 50585.0, 34188.0, 23248.0, 15615.0, 10875.0, 7370.0, 5195.0, 3519.0, 2447.0, 1767.0, 1230.0, 844.0, 572.0, 433.0, 261.0, 209.0, 128.0, 83.0, 62.0, 40.0, 37.0, 24.0, 16.0, 4.0, 11.0, 5.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.6591796875, -0.6378402709960938, -0.6165008544921875, -0.5951614379882812, -0.573822021484375, -0.5524826049804688, -0.5311431884765625, -0.5098037719726562, -0.48846435546875, -0.46712493896484375, -0.4457855224609375, -0.42444610595703125, -0.403106689453125, -0.38176727294921875, -0.3604278564453125, -0.33908843994140625, -0.3177490234375, -0.29640960693359375, -0.2750701904296875, -0.25373077392578125, -0.232391357421875, -0.21105194091796875, -0.1897125244140625, -0.16837310791015625, -0.14703369140625, -0.12569427490234375, -0.1043548583984375, -0.08301544189453125, -0.061676025390625, -0.04033660888671875, -0.0189971923828125, 0.00234222412109375, 0.023681640625, 0.04502105712890625, 0.0663604736328125, 0.08769989013671875, 0.109039306640625, 0.13037872314453125, 0.1517181396484375, 0.17305755615234375, 0.19439697265625, 0.21573638916015625, 0.2370758056640625, 0.25841522216796875, 0.279754638671875, 0.30109405517578125, 0.3224334716796875, 0.34377288818359375, 0.3651123046875, 0.38645172119140625, 0.4077911376953125, 0.42913055419921875, 0.450469970703125, 0.47180938720703125, 0.4931488037109375, 0.5144882202148438, 0.53582763671875, 0.5571670532226562, 0.5785064697265625, 0.5998458862304688, 0.621185302734375, 0.6425247192382812, 0.6638641357421875, 0.6852035522460938, 0.70654296875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 3.0, 5.0, 8.0, 10.0, 16.0, 12.0, 13.0, 16.0, 22.0, 27.0, 22.0, 34.0, 31.0, 47.0, 41.0, 53.0, 52.0, 44.0, 57.0, 55.0, 56.0, 67.0, 40.0, 48.0, 32.0, 24.0, 29.0, 16.0, 24.0, 14.0, 18.0, 14.0, 2.0, 2.0, 6.0, 8.0, 12.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001895904541015625, -0.0018367916345596313, -0.0017776787281036377, -0.001718565821647644, -0.0016594529151916504, -0.0016003400087356567, -0.001541227102279663, -0.0014821141958236694, -0.0014230012893676758, -0.0013638883829116821, -0.0013047754764556885, -0.0012456625699996948, -0.0011865496635437012, -0.0011274367570877075, -0.0010683238506317139, -0.0010092109441757202, -0.0009500980377197266, -0.0008909851312637329, -0.0008318722248077393, -0.0007727593183517456, -0.000713646411895752, -0.0006545335054397583, -0.0005954205989837646, -0.000536307692527771, -0.00047719478607177734, -0.0004180818796157837, -0.00035896897315979004, -0.0002998560667037964, -0.00024074316024780273, -0.00018163025379180908, -0.00012251734733581543, -6.340444087982178e-05, -4.291534423828125e-06, 5.482137203216553e-05, 0.00011393427848815918, 0.00017304718494415283, 0.00023216009140014648, 0.00029127299785614014, 0.0003503859043121338, 0.00040949881076812744, 0.0004686117172241211, 0.0005277246236801147, 0.0005868375301361084, 0.000645950436592102, 0.0007050633430480957, 0.0007641762495040894, 0.000823289155960083, 0.0008824020624160767, 0.0009415149688720703, 0.001000627875328064, 0.0010597407817840576, 0.0011188536882400513, 0.001177966594696045, 0.0012370795011520386, 0.0012961924076080322, 0.0013553053140640259, 0.0014144182205200195, 0.0014735311269760132, 0.0015326440334320068, 0.0015917569398880005, 0.0016508698463439941, 0.0017099827527999878, 0.0017690956592559814, 0.001828208565711975, 0.0018873214721679688]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 6.0, 7.0, 7.0, 11.0, 12.0, 8.0, 7.0, 22.0, 29.0, 27.0, 29.0, 53.0, 61.0, 97.0, 149.0, 295.0, 704.0, 6118.0, 1028880.0, 10457.0, 755.0, 290.0, 146.0, 94.0, 70.0, 39.0, 35.0, 27.0, 33.0, 10.0, 13.0, 14.0, 8.0, 11.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.047760009765625, -0.04629230499267578, -0.04482460021972656, -0.043356895446777344, -0.041889190673828125, -0.040421485900878906, -0.03895378112792969, -0.03748607635498047, -0.03601837158203125, -0.03455066680908203, -0.03308296203613281, -0.031615257263183594, -0.030147552490234375, -0.028679847717285156, -0.027212142944335938, -0.02574443817138672, -0.0242767333984375, -0.02280902862548828, -0.021341323852539062, -0.019873619079589844, -0.018405914306640625, -0.016938209533691406, -0.015470504760742188, -0.014002799987792969, -0.01253509521484375, -0.011067390441894531, -0.009599685668945312, -0.008131980895996094, -0.006664276123046875, -0.005196571350097656, -0.0037288665771484375, -0.0022611618041992188, -0.00079345703125, 0.0006742477416992188, 0.0021419525146484375, 0.0036096572875976562, 0.005077362060546875, 0.006545066833496094, 0.008012771606445312, 0.009480476379394531, 0.01094818115234375, 0.012415885925292969, 0.013883590698242188, 0.015351295471191406, 0.016819000244140625, 0.018286705017089844, 0.019754409790039062, 0.02122211456298828, 0.0226898193359375, 0.02415752410888672, 0.025625228881835938, 0.027092933654785156, 0.028560638427734375, 0.030028343200683594, 0.03149604797363281, 0.03296375274658203, 0.03443145751953125, 0.03589916229248047, 0.03736686706542969, 0.038834571838378906, 0.040302276611328125, 0.041769981384277344, 0.04323768615722656, 0.04470539093017578, 0.046173095703125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 24.0, 670.0, 311.0, 10.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003945305943489075, -0.0035799741744995117, -0.0032146424055099487, -0.0028493106365203857, -0.0024839788675308228, -0.0021186470985412598, -0.0017533150967210531, -0.0013879833277314901, -0.0010226515587419271, -0.0006573197897523642, -0.00029198796255514026, 7.334386464208364e-05, 0.00043867563363164663, 0.0008040074026212096, 0.0011693392880260944, 0.0015346710570156574, 0.0019000028260052204, 0.0022653345949947834, 0.0026306663639843464, 0.0029959981329739094, 0.0033613299019634724, 0.0037266616709530354, 0.004091993905603886, 0.004457325674593449, 0.004822657443583012, 0.005187989212572575, 0.005553320981562138, 0.005918652750551701, 0.006283984519541264, 0.006649316288530827, 0.0070146480575203896, 0.0073799798265099525, 0.0077453115954995155, 0.008110643364489079, 0.008475975133478642, 0.008841306902468204, 0.009206638671457767, 0.00957197044044733, 0.009937302209436893, 0.010302633978426456, 0.01066796574741602, 0.011033297516405582, 0.011398629285395145, 0.011763961054384708, 0.012129292823374271, 0.012494624592363834, 0.012859956361353397, 0.01322528813034296, 0.013590620830655098, 0.013955952599644661, 0.014321284368634224, 0.014686616137623787, 0.01505194790661335, 0.015417279675602913, 0.015782611444592476, 0.01614794321358204, 0.016513274982571602, 0.016878606751561165, 0.017243938520550728, 0.01760927028954029, 0.017974602058529854, 0.018339933827519417, 0.01870526559650898, 0.019070597365498543, 0.019435929134488106]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 6.0, 3.0, 5.0, 11.0, 8.0, 6.0, 13.0, 11.0, 21.0, 13.0, 19.0, 26.0, 20.0, 27.0, 34.0, 26.0, 37.0, 37.0, 26.0, 46.0, 53.0, 32.0, 44.0, 50.0, 48.0, 43.0, 34.0, 20.0, 25.0, 35.0, 32.0, 25.0, 24.0, 16.0, 23.0, 18.0, 11.0, 16.0, 10.0, 11.0, 6.0, 7.0, 10.0, 4.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009354948997497559, -0.0009026201441884041, -0.0008697453886270523, -0.0008368706330657005, -0.0008039958775043488, -0.000771121121942997, -0.0007382463663816452, -0.0007053716108202934, -0.0006724968552589417, -0.0006396220996975899, -0.0006067473441362381, -0.0005738725885748863, -0.0005409978330135345, -0.0005081230774521828, -0.000475248321890831, -0.0004423735663294792, -0.00040949881076812744, -0.00037662405520677567, -0.0003437492996454239, -0.0003108745440840721, -0.00027799978852272034, -0.00024512503296136856, -0.00021225027740001678, -0.000179375521838665, -0.00014650076627731323, -0.00011362601071596146, -8.075125515460968e-05, -4.7876499593257904e-05, -1.5001744031906128e-05, 1.7873011529445648e-05, 5.0747767090797424e-05, 8.36225226521492e-05, 0.00011649727821350098, 0.00014937203377485275, 0.00018224678933620453, 0.0002151215448975563, 0.0002479963004589081, 0.00028087105602025986, 0.00031374581158161163, 0.0003466205671429634, 0.0003794953227043152, 0.00041237007826566696, 0.00044524483382701874, 0.0004781195893883705, 0.0005109943449497223, 0.0005438691005110741, 0.0005767438560724258, 0.0006096186116337776, 0.0006424933671951294, 0.0006753681227564812, 0.000708242878317833, 0.0007411176338791847, 0.0007739923894405365, 0.0008068671450018883, 0.00083974190056324, 0.0008726166561245918, 0.0009054914116859436, 0.0009383661672472954, 0.0009712409228086472, 0.001004115678369999, 0.0010369904339313507, 0.0010698651894927025, 0.0011027399450540543, 0.001135614700615406, 0.0011684894561767578]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 1.0, 5.0, 8.0, 12.0, 13.0, 17.0, 24.0, 19.0, 16.0, 29.0, 29.0, 39.0, 34.0, 33.0, 46.0, 38.0, 40.0, 47.0, 61.0, 44.0, 63.0, 31.0, 40.0, 45.0, 36.0, 34.0, 29.0, 39.0, 26.0, 22.0, 19.0, 15.0, 8.0, 6.0, 6.0, 9.0, 10.0, 1.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.453125, -10.1597900390625, -9.866455078125, -9.5731201171875, -9.27978515625, -8.9864501953125, -8.693115234375, -8.3997802734375, -8.1064453125, -7.8131103515625, -7.519775390625, -7.2264404296875, -6.93310546875, -6.6397705078125, -6.346435546875, -6.0531005859375, -5.759765625, -5.4664306640625, -5.173095703125, -4.8797607421875, -4.58642578125, -4.2930908203125, -3.999755859375, -3.7064208984375, -3.4130859375, -3.1197509765625, -2.826416015625, -2.5330810546875, -2.23974609375, -1.9464111328125, -1.653076171875, -1.3597412109375, -1.06640625, -0.7730712890625, -0.479736328125, -0.1864013671875, 0.10693359375, 0.4002685546875, 0.693603515625, 0.9869384765625, 1.2802734375, 1.5736083984375, 1.866943359375, 2.1602783203125, 2.45361328125, 2.7469482421875, 3.040283203125, 3.3336181640625, 3.626953125, 3.9202880859375, 4.213623046875, 4.5069580078125, 4.80029296875, 5.0936279296875, 5.386962890625, 5.6802978515625, 5.9736328125, 6.2669677734375, 6.560302734375, 6.8536376953125, 7.14697265625, 7.4403076171875, 7.733642578125, 8.0269775390625, 8.3203125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 13.0, 12.0, 16.0, 18.0, 39.0, 61.0, 115.0, 165.0, 303.0, 540.0, 1101.0, 2347.0, 5620.0, 15639.0, 63605.0, 480117.0, 399507.0, 55380.0, 14283.0, 5324.0, 2154.0, 1027.0, 494.0, 276.0, 154.0, 89.0, 47.0, 42.0, 34.0, 9.0, 10.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7578125, -10.46673583984375, -10.1756591796875, -9.88458251953125, -9.593505859375, -9.30242919921875, -9.0113525390625, -8.72027587890625, -8.42919921875, -8.13812255859375, -7.8470458984375, -7.55596923828125, -7.264892578125, -6.97381591796875, -6.6827392578125, -6.39166259765625, -6.1005859375, -5.80950927734375, -5.5184326171875, -5.22735595703125, -4.936279296875, -4.64520263671875, -4.3541259765625, -4.06304931640625, -3.77197265625, -3.48089599609375, -3.1898193359375, -2.89874267578125, -2.607666015625, -2.31658935546875, -2.0255126953125, -1.73443603515625, -1.443359375, -1.15228271484375, -0.8612060546875, -0.57012939453125, -0.279052734375, 0.01202392578125, 0.3031005859375, 0.59417724609375, 0.88525390625, 1.17633056640625, 1.4674072265625, 1.75848388671875, 2.049560546875, 2.34063720703125, 2.6317138671875, 2.92279052734375, 3.2138671875, 3.50494384765625, 3.7960205078125, 4.08709716796875, 4.378173828125, 4.66925048828125, 4.9603271484375, 5.25140380859375, 5.54248046875, 5.83355712890625, 6.1246337890625, 6.41571044921875, 6.706787109375, 6.99786376953125, 7.2889404296875, 7.58001708984375, 7.87109375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 4.0, 11.0, 8.0, 5.0, 16.0, 23.0, 29.0, 15.0, 19.0, 31.0, 31.0, 26.0, 43.0, 53.0, 44.0, 68.0, 68.0, 128.0, 1693.0, 210.0, 85.0, 54.0, 52.0, 37.0, 40.0, 25.0, 34.0, 32.0, 18.0, 27.0, 18.0, 21.0, 13.0, 7.0, 6.0, 1.0, 12.0, 5.0, 4.0, 5.0, 7.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-27.25, -26.4404296875, -25.630859375, -24.8212890625, -24.01171875, -23.2021484375, -22.392578125, -21.5830078125, -20.7734375, -19.9638671875, -19.154296875, -18.3447265625, -17.53515625, -16.7255859375, -15.916015625, -15.1064453125, -14.296875, -13.4873046875, -12.677734375, -11.8681640625, -11.05859375, -10.2490234375, -9.439453125, -8.6298828125, -7.8203125, -7.0107421875, -6.201171875, -5.3916015625, -4.58203125, -3.7724609375, -2.962890625, -2.1533203125, -1.34375, -0.5341796875, 0.275390625, 1.0849609375, 1.89453125, 2.7041015625, 3.513671875, 4.3232421875, 5.1328125, 5.9423828125, 6.751953125, 7.5615234375, 8.37109375, 9.1806640625, 9.990234375, 10.7998046875, 11.609375, 12.4189453125, 13.228515625, 14.0380859375, 14.84765625, 15.6572265625, 16.466796875, 17.2763671875, 18.0859375, 18.8955078125, 19.705078125, 20.5146484375, 21.32421875, 22.1337890625, 22.943359375, 23.7529296875, 24.5625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 5.0, 10.0, 14.0, 13.0, 32.0, 20.0, 44.0, 76.0, 105.0, 148.0, 234.0, 388.0, 993.0, 35687.0, 3103280.0, 3160.0, 544.0, 319.0, 200.0, 151.0, 74.0, 79.0, 31.0, 29.0, 17.0, 13.0, 7.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-91.6875, -88.6572265625, -85.626953125, -82.5966796875, -79.56640625, -76.5361328125, -73.505859375, -70.4755859375, -67.4453125, -64.4150390625, -61.384765625, -58.3544921875, -55.32421875, -52.2939453125, -49.263671875, -46.2333984375, -43.203125, -40.1728515625, -37.142578125, -34.1123046875, -31.08203125, -28.0517578125, -25.021484375, -21.9912109375, -18.9609375, -15.9306640625, -12.900390625, -9.8701171875, -6.83984375, -3.8095703125, -0.779296875, 2.2509765625, 5.28125, 8.3115234375, 11.341796875, 14.3720703125, 17.40234375, 20.4326171875, 23.462890625, 26.4931640625, 29.5234375, 32.5537109375, 35.583984375, 38.6142578125, 41.64453125, 44.6748046875, 47.705078125, 50.7353515625, 53.765625, 56.7958984375, 59.826171875, 62.8564453125, 65.88671875, 68.9169921875, 71.947265625, 74.9775390625, 78.0078125, 81.0380859375, 84.068359375, 87.0986328125, 90.12890625, 93.1591796875, 96.189453125, 99.2197265625, 102.25]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 12.0, 920.0, 86.0, 0.0, 0.0, 1.0], "bins": [-576.9747314453125, -567.3026733398438, -557.6305541992188, -547.95849609375, -538.286376953125, -528.6143188476562, -518.9421997070312, -509.2701416015625, -499.5980529785156, -489.92596435546875, -480.2538757324219, -470.581787109375, -460.9096984863281, -451.23760986328125, -441.5655517578125, -431.8934631347656, -422.22137451171875, -412.5492858886719, -402.877197265625, -393.2051086425781, -383.53302001953125, -373.8609619140625, -364.1888427734375, -354.51678466796875, -344.84466552734375, -335.1725769042969, -325.50048828125, -315.8283996582031, -306.15631103515625, -296.4842529296875, -286.8121337890625, -277.14007568359375, -267.4679870605469, -257.7958984375, -248.12380981445312, -238.45172119140625, -228.77964782714844, -219.10755920410156, -209.4354705810547, -199.76339721679688, -190.09130859375, -180.41921997070312, -170.74713134765625, -161.07504272460938, -151.40296936035156, -141.7308807373047, -132.0587921142578, -122.38671112060547, -112.71463012695312, -103.04254150390625, -93.3704605102539, -83.69837188720703, -74.02629089355469, -64.35420227050781, -54.68211364746094, -45.010032653808594, -35.33794021606445, -25.665855407714844, -15.993768692016602, -6.321681976318359, 3.35040283203125, 13.02248764038086, 22.694576263427734, 32.36665725708008, 42.03874588012695]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 2.0, 5.0, 3.0, 3.0, 15.0, 6.0, 12.0, 17.0, 20.0, 19.0, 13.0, 19.0, 25.0, 32.0, 31.0, 26.0, 44.0, 36.0, 30.0, 29.0, 39.0, 53.0, 46.0, 48.0, 48.0, 38.0, 42.0, 43.0, 36.0, 33.0, 16.0, 27.0, 26.0, 20.0, 11.0, 21.0, 13.0, 12.0, 7.0, 11.0, 11.0, 4.0, 7.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.64562225341797, -58.309566497802734, -55.973506927490234, -53.637451171875, -51.3013916015625, -48.965335845947266, -46.62928009033203, -44.29322052001953, -41.9571647644043, -39.62110900878906, -37.28504943847656, -34.94899368286133, -32.612937927246094, -30.276878356933594, -27.94082260131836, -25.604764938354492, -23.268707275390625, -20.932649612426758, -18.59659194946289, -16.260536193847656, -13.924478530883789, -11.588420867919922, -9.252364158630371, -6.91630744934082, -4.580249786376953, -2.244192600250244, 0.09186458587646484, 2.427921772003174, 4.763978958129883, 7.10003662109375, 9.4360933303833, 11.772150039672852, 14.108207702636719, 16.444265365600586, 18.780323028564453, 21.116378784179688, 23.452436447143555, 25.788494110107422, 28.124549865722656, 30.460607528686523, 32.79666519165039, 35.132720947265625, 37.468780517578125, 39.80483627319336, 42.140892028808594, 44.476951599121094, 46.81300735473633, 49.14906311035156, 51.48512268066406, 53.8211784362793, 56.1572380065918, 58.49329376220703, 60.82935333251953, 63.165409088134766, 65.50146484375, 67.8375244140625, 70.173583984375, 72.5096435546875, 74.84569549560547, 77.18175506591797, 79.51781463623047, 81.85386657714844, 84.18992614746094, 86.52598571777344, 88.8620376586914]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 8.0, 8.0, 15.0, 14.0, 19.0, 12.0, 32.0, 20.0, 32.0, 27.0, 38.0, 35.0, 37.0, 44.0, 36.0, 57.0, 46.0, 51.0, 56.0, 39.0, 45.0, 38.0, 33.0, 40.0, 37.0, 34.0, 28.0, 20.0, 21.0, 19.0, 17.0, 9.0, 6.0, 6.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.0546875, -10.7486572265625, -10.442626953125, -10.1365966796875, -9.83056640625, -9.5245361328125, -9.218505859375, -8.9124755859375, -8.6064453125, -8.3004150390625, -7.994384765625, -7.6883544921875, -7.38232421875, -7.0762939453125, -6.770263671875, -6.4642333984375, -6.158203125, -5.8521728515625, -5.546142578125, -5.2401123046875, -4.93408203125, -4.6280517578125, -4.322021484375, -4.0159912109375, -3.7099609375, -3.4039306640625, -3.097900390625, -2.7918701171875, -2.48583984375, -2.1798095703125, -1.873779296875, -1.5677490234375, -1.26171875, -0.9556884765625, -0.649658203125, -0.3436279296875, -0.03759765625, 0.2684326171875, 0.574462890625, 0.8804931640625, 1.1865234375, 1.4925537109375, 1.798583984375, 2.1046142578125, 2.41064453125, 2.7166748046875, 3.022705078125, 3.3287353515625, 3.634765625, 3.9407958984375, 4.246826171875, 4.5528564453125, 4.85888671875, 5.1649169921875, 5.470947265625, 5.7769775390625, 6.0830078125, 6.3890380859375, 6.695068359375, 7.0010986328125, 7.30712890625, 7.6131591796875, 7.919189453125, 8.2252197265625, 8.53125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 7.0, 6.0, 16.0, 5.0, 17.0, 15.0, 19.0, 28.0, 38.0, 50.0, 77.0, 127.0, 273.0, 571.0, 1705.0, 7054.0, 69904.0, 1668997.0, 2310311.0, 121656.0, 10023.0, 2020.0, 671.0, 238.0, 145.0, 71.0, 47.0, 42.0, 29.0, 24.0, 26.0, 21.0, 11.0, 7.0, 2.0, 7.0, 4.0, 6.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.03125, -23.304931640625, -22.57861328125, -21.852294921875, -21.1259765625, -20.399658203125, -19.67333984375, -18.947021484375, -18.220703125, -17.494384765625, -16.76806640625, -16.041748046875, -15.3154296875, -14.589111328125, -13.86279296875, -13.136474609375, -12.41015625, -11.683837890625, -10.95751953125, -10.231201171875, -9.5048828125, -8.778564453125, -8.05224609375, -7.325927734375, -6.599609375, -5.873291015625, -5.14697265625, -4.420654296875, -3.6943359375, -2.968017578125, -2.24169921875, -1.515380859375, -0.7890625, -0.062744140625, 0.66357421875, 1.389892578125, 2.1162109375, 2.842529296875, 3.56884765625, 4.295166015625, 5.021484375, 5.747802734375, 6.47412109375, 7.200439453125, 7.9267578125, 8.653076171875, 9.37939453125, 10.105712890625, 10.83203125, 11.558349609375, 12.28466796875, 13.010986328125, 13.7373046875, 14.463623046875, 15.18994140625, 15.916259765625, 16.642578125, 17.368896484375, 18.09521484375, 18.821533203125, 19.5478515625, 20.274169921875, 21.00048828125, 21.726806640625, 22.453125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 14.0, 16.0, 14.0, 21.0, 25.0, 32.0, 65.0, 95.0, 114.0, 206.0, 290.0, 427.0, 619.0, 679.0, 462.0, 337.0, 206.0, 151.0, 86.0, 62.0, 47.0, 35.0, 20.0, 20.0, 10.0, 9.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.90625, -19.265869140625, -18.62548828125, -17.985107421875, -17.3447265625, -16.704345703125, -16.06396484375, -15.423583984375, -14.783203125, -14.142822265625, -13.50244140625, -12.862060546875, -12.2216796875, -11.581298828125, -10.94091796875, -10.300537109375, -9.66015625, -9.019775390625, -8.37939453125, -7.739013671875, -7.0986328125, -6.458251953125, -5.81787109375, -5.177490234375, -4.537109375, -3.896728515625, -3.25634765625, -2.615966796875, -1.9755859375, -1.335205078125, -0.69482421875, -0.054443359375, 0.5859375, 1.226318359375, 1.86669921875, 2.507080078125, 3.1474609375, 3.787841796875, 4.42822265625, 5.068603515625, 5.708984375, 6.349365234375, 6.98974609375, 7.630126953125, 8.2705078125, 8.910888671875, 9.55126953125, 10.191650390625, 10.83203125, 11.472412109375, 12.11279296875, 12.753173828125, 13.3935546875, 14.033935546875, 14.67431640625, 15.314697265625, 15.955078125, 16.595458984375, 17.23583984375, 17.876220703125, 18.5166015625, 19.156982421875, 19.79736328125, 20.437744140625, 21.078125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 9.0, 17.0, 20.0, 30.0, 35.0, 55.0, 59.0, 89.0, 104.0, 162.0, 231.0, 365.0, 711.0, 6156.0, 3262922.0, 918459.0, 3181.0, 571.0, 304.0, 238.0, 145.0, 88.0, 97.0, 49.0, 40.0, 36.0, 36.0, 20.0, 19.0, 11.0, 9.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-73.5, -71.1220703125, -68.744140625, -66.3662109375, -63.98828125, -61.6103515625, -59.232421875, -56.8544921875, -54.4765625, -52.0986328125, -49.720703125, -47.3427734375, -44.96484375, -42.5869140625, -40.208984375, -37.8310546875, -35.453125, -33.0751953125, -30.697265625, -28.3193359375, -25.94140625, -23.5634765625, -21.185546875, -18.8076171875, -16.4296875, -14.0517578125, -11.673828125, -9.2958984375, -6.91796875, -4.5400390625, -2.162109375, 0.2158203125, 2.59375, 4.9716796875, 7.349609375, 9.7275390625, 12.10546875, 14.4833984375, 16.861328125, 19.2392578125, 21.6171875, 23.9951171875, 26.373046875, 28.7509765625, 31.12890625, 33.5068359375, 35.884765625, 38.2626953125, 40.640625, 43.0185546875, 45.396484375, 47.7744140625, 50.15234375, 52.5302734375, 54.908203125, 57.2861328125, 59.6640625, 62.0419921875, 64.419921875, 66.7978515625, 69.17578125, 71.5537109375, 73.931640625, 76.3095703125, 78.6875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 46.0, 280.0, 436.0, 212.0, 32.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-399.6208801269531, -391.9922180175781, -384.3635559082031, -376.7348937988281, -369.1062316894531, -361.4775695800781, -353.8489074707031, -346.2202453613281, -338.5915832519531, -330.9629211425781, -323.3342590332031, -315.7055969238281, -308.0769348144531, -300.4482727050781, -292.8196105957031, -285.1909484863281, -277.5622863769531, -269.9336242675781, -262.3049621582031, -254.67630004882812, -247.04763793945312, -239.41897583007812, -231.79031372070312, -224.16165161132812, -216.5330047607422, -208.9043426513672, -201.2756805419922, -193.6470184326172, -186.0183563232422, -178.3896942138672, -170.7610321044922, -163.1323699951172, -155.50372314453125, -147.87506103515625, -140.24639892578125, -132.61773681640625, -124.98907470703125, -117.36041259765625, -109.73175048828125, -102.10308837890625, -94.47442626953125, -86.84576416015625, -79.21710205078125, -71.58843994140625, -63.95977783203125, -56.331119537353516, -48.702457427978516, -41.073795318603516, -33.44512939453125, -25.81646728515625, -18.18780517578125, -10.559144973754883, -2.930482864379883, 4.698177337646484, 12.326839447021484, 19.955501556396484, 27.584163665771484, 35.212825775146484, 42.841487884521484, 50.47014617919922, 58.09880828857422, 65.72747039794922, 73.35613250732422, 80.98479461669922, 88.61345672607422]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 7.0, 3.0, 8.0, 5.0, 9.0, 10.0, 18.0, 19.0, 24.0, 30.0, 18.0, 28.0, 31.0, 33.0, 30.0, 40.0, 49.0, 45.0, 33.0, 42.0, 32.0, 40.0, 34.0, 47.0, 36.0, 42.0, 38.0, 29.0, 27.0, 24.0, 29.0, 13.0, 18.0, 16.0, 17.0, 15.0, 10.0, 14.0, 4.0, 8.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-49.75926971435547, -48.253604888916016, -46.74794387817383, -45.242279052734375, -43.73661804199219, -42.230953216552734, -40.72528839111328, -39.219627380371094, -37.71396255493164, -36.20829772949219, -34.70263671875, -33.19697189331055, -31.691308975219727, -30.185646057128906, -28.679981231689453, -27.174318313598633, -25.668655395507812, -24.162992477416992, -22.657329559326172, -21.15166473388672, -19.6460018157959, -18.140338897705078, -16.634674072265625, -15.129011154174805, -13.623348236083984, -12.117685317993164, -10.612021446228027, -9.10635757446289, -7.60069465637207, -6.095031261444092, -4.589367866516113, -3.0837039947509766, -1.5780410766601562, -0.07237768173217773, 1.4332857131958008, 2.9389491081237793, 4.444612503051758, 5.950275897979736, 7.455939292907715, 8.961603164672852, 10.467266082763672, 11.972929000854492, 13.478592872619629, 14.984256744384766, 16.489919662475586, 17.995582580566406, 19.50124740600586, 21.00691032409668, 22.5125732421875, 24.01823616027832, 25.52389907836914, 27.029563903808594, 28.535226821899414, 30.040889739990234, 31.546554565429688, 33.052215576171875, 34.55788040161133, 36.06354522705078, 37.56920623779297, 39.07487106323242, 40.580535888671875, 42.08619689941406, 43.591861724853516, 45.09752655029297, 46.603187561035156]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 9.0, 2.0, 8.0, 14.0, 13.0, 24.0, 21.0, 35.0, 22.0, 25.0, 35.0, 51.0, 39.0, 50.0, 52.0, 53.0, 71.0, 51.0, 50.0, 38.0, 57.0, 38.0, 37.0, 41.0, 30.0, 28.0, 31.0, 21.0, 14.0, 6.0, 8.0, 10.0, 3.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3671875, -12.037841796875, -11.70849609375, -11.379150390625, -11.0498046875, -10.720458984375, -10.39111328125, -10.061767578125, -9.732421875, -9.403076171875, -9.07373046875, -8.744384765625, -8.4150390625, -8.085693359375, -7.75634765625, -7.427001953125, -7.09765625, -6.768310546875, -6.43896484375, -6.109619140625, -5.7802734375, -5.450927734375, -5.12158203125, -4.792236328125, -4.462890625, -4.133544921875, -3.80419921875, -3.474853515625, -3.1455078125, -2.816162109375, -2.48681640625, -2.157470703125, -1.828125, -1.498779296875, -1.16943359375, -0.840087890625, -0.5107421875, -0.181396484375, 0.14794921875, 0.477294921875, 0.806640625, 1.135986328125, 1.46533203125, 1.794677734375, 2.1240234375, 2.453369140625, 2.78271484375, 3.112060546875, 3.44140625, 3.770751953125, 4.10009765625, 4.429443359375, 4.7587890625, 5.088134765625, 5.41748046875, 5.746826171875, 6.076171875, 6.405517578125, 6.73486328125, 7.064208984375, 7.3935546875, 7.722900390625, 8.05224609375, 8.381591796875, 8.7109375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 4.0, 9.0, 7.0, 20.0, 18.0, 27.0, 42.0, 51.0, 104.0, 138.0, 211.0, 309.0, 489.0, 707.0, 1051.0, 1596.0, 2252.0, 3431.0, 5138.0, 7520.0, 11412.0, 17477.0, 26758.0, 41633.0, 64439.0, 100973.0, 152105.0, 183307.0, 148195.0, 98740.0, 63275.0, 40418.0, 25705.0, 17042.0, 11193.0, 7534.0, 5008.0, 3341.0, 2256.0, 1459.0, 1060.0, 743.0, 456.0, 294.0, 210.0, 137.0, 88.0, 60.0, 45.0, 29.0, 18.0, 12.0, 13.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.77392578125, -0.7485275268554688, -0.7231292724609375, -0.6977310180664062, -0.672332763671875, -0.6469345092773438, -0.6215362548828125, -0.5961380004882812, -0.57073974609375, -0.5453414916992188, -0.5199432373046875, -0.49454498291015625, -0.469146728515625, -0.44374847412109375, -0.4183502197265625, -0.39295196533203125, -0.3675537109375, -0.34215545654296875, -0.3167572021484375, -0.29135894775390625, -0.265960693359375, -0.24056243896484375, -0.2151641845703125, -0.18976593017578125, -0.16436767578125, -0.13896942138671875, -0.1135711669921875, -0.08817291259765625, -0.062774658203125, -0.03737640380859375, -0.0119781494140625, 0.01342010498046875, 0.038818359375, 0.06421661376953125, 0.0896148681640625, 0.11501312255859375, 0.140411376953125, 0.16580963134765625, 0.1912078857421875, 0.21660614013671875, 0.24200439453125, 0.26740264892578125, 0.2928009033203125, 0.31819915771484375, 0.343597412109375, 0.36899566650390625, 0.3943939208984375, 0.41979217529296875, 0.4451904296875, 0.47058868408203125, 0.4959869384765625, 0.5213851928710938, 0.546783447265625, 0.5721817016601562, 0.5975799560546875, 0.6229782104492188, 0.64837646484375, 0.6737747192382812, 0.6991729736328125, 0.7245712280273438, 0.749969482421875, 0.7753677368164062, 0.8007659912109375, 0.8261642456054688, 0.8515625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 7.0, 7.0, 5.0, 11.0, 17.0, 11.0, 12.0, 23.0, 22.0, 22.0, 28.0, 31.0, 37.0, 31.0, 38.0, 31.0, 39.0, 47.0, 39.0, 35.0, 1062.0, 36.0, 31.0, 42.0, 31.0, 41.0, 37.0, 31.0, 32.0, 28.0, 33.0, 16.0, 21.0, 19.0, 9.0, 15.0, 14.0, 6.0, 9.0, 5.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.921875, -5.75604248046875, -5.5902099609375, -5.42437744140625, -5.258544921875, -5.09271240234375, -4.9268798828125, -4.76104736328125, -4.59521484375, -4.42938232421875, -4.2635498046875, -4.09771728515625, -3.931884765625, -3.76605224609375, -3.6002197265625, -3.43438720703125, -3.2685546875, -3.10272216796875, -2.9368896484375, -2.77105712890625, -2.605224609375, -2.43939208984375, -2.2735595703125, -2.10772705078125, -1.94189453125, -1.77606201171875, -1.6102294921875, -1.44439697265625, -1.278564453125, -1.11273193359375, -0.9468994140625, -0.78106689453125, -0.615234375, -0.44940185546875, -0.2835693359375, -0.11773681640625, 0.048095703125, 0.21392822265625, 0.3797607421875, 0.54559326171875, 0.71142578125, 0.87725830078125, 1.0430908203125, 1.20892333984375, 1.374755859375, 1.54058837890625, 1.7064208984375, 1.87225341796875, 2.0380859375, 2.20391845703125, 2.3697509765625, 2.53558349609375, 2.701416015625, 2.86724853515625, 3.0330810546875, 3.19891357421875, 3.36474609375, 3.53057861328125, 3.6964111328125, 3.86224365234375, 4.028076171875, 4.19390869140625, 4.3597412109375, 4.52557373046875, 4.69140625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 13.0, 27.0, 40.0, 39.0, 52.0, 105.0, 141.0, 266.0, 398.0, 579.0, 887.0, 1394.0, 2166.0, 3338.0, 5260.0, 8325.0, 13004.0, 21006.0, 33568.0, 54573.0, 88209.0, 140089.0, 1240271.0, 175137.0, 117018.0, 72530.0, 43960.0, 27432.0, 17222.0, 10950.0, 6821.0, 4389.0, 2913.0, 1754.0, 1130.0, 768.0, 500.0, 297.0, 201.0, 116.0, 90.0, 50.0, 32.0, 26.0, 19.0, 8.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8037109375, -0.7776107788085938, -0.7515106201171875, -0.7254104614257812, -0.699310302734375, -0.6732101440429688, -0.6471099853515625, -0.6210098266601562, -0.59490966796875, -0.5688095092773438, -0.5427093505859375, -0.5166091918945312, -0.490509033203125, -0.46440887451171875, -0.4383087158203125, -0.41220855712890625, -0.3861083984375, -0.36000823974609375, -0.3339080810546875, -0.30780792236328125, -0.281707763671875, -0.25560760498046875, -0.2295074462890625, -0.20340728759765625, -0.17730712890625, -0.15120697021484375, -0.1251068115234375, -0.09900665283203125, -0.072906494140625, -0.04680633544921875, -0.0207061767578125, 0.00539398193359375, 0.031494140625, 0.05759429931640625, 0.0836944580078125, 0.10979461669921875, 0.135894775390625, 0.16199493408203125, 0.1880950927734375, 0.21419525146484375, 0.24029541015625, 0.26639556884765625, 0.2924957275390625, 0.31859588623046875, 0.344696044921875, 0.37079620361328125, 0.3968963623046875, 0.42299652099609375, 0.4490966796875, 0.47519683837890625, 0.5012969970703125, 0.5273971557617188, 0.553497314453125, 0.5795974731445312, 0.6056976318359375, 0.6317977905273438, 0.65789794921875, 0.6839981079101562, 0.7100982666015625, 0.7361984252929688, 0.762298583984375, 0.7883987426757812, 0.8144989013671875, 0.8405990600585938, 0.86669921875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 4.0, 5.0, 13.0, 6.0, 12.0, 9.0, 20.0, 18.0, 20.0, 25.0, 26.0, 34.0, 40.0, 45.0, 48.0, 45.0, 58.0, 57.0, 59.0, 67.0, 60.0, 59.0, 37.0, 41.0, 37.0, 29.0, 24.0, 25.0, 12.0, 10.0, 11.0, 7.0, 6.0, 7.0, 2.0, 2.0, 7.0, 7.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0023441314697265625, -0.0022732317447662354, -0.002202332019805908, -0.002131432294845581, -0.002060532569885254, -0.0019896328449249268, -0.0019187331199645996, -0.0018478333950042725, -0.0017769336700439453, -0.0017060339450836182, -0.001635134220123291, -0.0015642344951629639, -0.0014933347702026367, -0.0014224350452423096, -0.0013515353202819824, -0.0012806355953216553, -0.0012097358703613281, -0.001138836145401001, -0.0010679364204406738, -0.0009970366954803467, -0.0009261369705200195, -0.0008552372455596924, -0.0007843375205993652, -0.0007134377956390381, -0.0006425380706787109, -0.0005716383457183838, -0.0005007386207580566, -0.0004298388957977295, -0.00035893917083740234, -0.0002880394458770752, -0.00021713972091674805, -0.0001462399959564209, -7.534027099609375e-05, -4.4405460357666016e-06, 6.645917892456055e-05, 0.0001373589038848877, 0.00020825862884521484, 0.000279158353805542, 0.00035005807876586914, 0.0004209578037261963, 0.0004918575286865234, 0.0005627572536468506, 0.0006336569786071777, 0.0007045567035675049, 0.000775456428527832, 0.0008463561534881592, 0.0009172558784484863, 0.0009881556034088135, 0.0010590553283691406, 0.0011299550533294678, 0.001200854778289795, 0.001271754503250122, 0.0013426542282104492, 0.0014135539531707764, 0.0014844536781311035, 0.0015553534030914307, 0.0016262531280517578, 0.001697152853012085, 0.0017680525779724121, 0.0018389523029327393, 0.0019098520278930664, 0.0019807517528533936, 0.0020516514778137207, 0.002122551202774048, 0.002193450927734375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 2.0, 3.0, 9.0, 9.0, 7.0, 15.0, 14.0, 18.0, 27.0, 35.0, 50.0, 66.0, 72.0, 126.0, 238.0, 464.0, 1897.0, 900455.0, 142934.0, 1112.0, 353.0, 176.0, 114.0, 77.0, 59.0, 49.0, 37.0, 28.0, 21.0, 15.0, 15.0, 9.0, 12.0, 12.0, 3.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0489501953125, -0.047310829162597656, -0.04567146301269531, -0.04403209686279297, -0.042392730712890625, -0.04075336456298828, -0.03911399841308594, -0.037474632263183594, -0.03583526611328125, -0.034195899963378906, -0.03255653381347656, -0.03091716766357422, -0.029277801513671875, -0.02763843536376953, -0.025999069213867188, -0.024359703063964844, -0.0227203369140625, -0.021080970764160156, -0.019441604614257812, -0.01780223846435547, -0.016162872314453125, -0.014523506164550781, -0.012884140014648438, -0.011244773864746094, -0.00960540771484375, -0.007966041564941406, -0.0063266754150390625, -0.004687309265136719, -0.003047943115234375, -0.0014085769653320312, 0.0002307891845703125, 0.0018701553344726562, 0.003509521484375, 0.005148887634277344, 0.0067882537841796875, 0.008427619934082031, 0.010066986083984375, 0.011706352233886719, 0.013345718383789062, 0.014985084533691406, 0.01662445068359375, 0.018263816833496094, 0.019903182983398438, 0.02154254913330078, 0.023181915283203125, 0.02482128143310547, 0.026460647583007812, 0.028100013732910156, 0.0297393798828125, 0.031378746032714844, 0.03301811218261719, 0.03465747833251953, 0.036296844482421875, 0.03793621063232422, 0.03957557678222656, 0.041214942932128906, 0.04285430908203125, 0.044493675231933594, 0.04613304138183594, 0.04777240753173828, 0.049411773681640625, 0.05105113983154297, 0.05269050598144531, 0.054329872131347656, 0.05596923828125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 38.0, 103.0, 247.0, 281.0, 194.0, 96.0, 31.0, 10.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022013718262314796, -0.00209377845749259, -0.001986185321584344, -0.0018785919528454542, -0.0017709988169372082, -0.0016634054481983185, -0.0015558121958747506, -0.0014482189435511827, -0.0013406256912276149, -0.001233032438904047, -0.0011254391865804791, -0.0010178459342569113, -0.0009102526237256825, -0.0008026593714021146, -0.0006950660608708858, -0.000587472808547318, -0.0004798795562237501, -0.00037228630390018225, -0.0002646930224727839, -0.0001570997410453856, -4.950648872181773e-05, 5.8086763601750135e-05, 0.00016568007413297892, 0.0002732733264565468, 0.00038086657878011465, 0.0004884598311036825, 0.0005960530834272504, 0.0007036463939584792, 0.000811239646282047, 0.0009188328986056149, 0.0010264262091368437, 0.0011340194614604115, 0.0012416127137839794, 0.0013492059661075473, 0.0014567992184311152, 0.0015643925871700048, 0.0016719857230782509, 0.0017795790918171406, 0.0018871723441407084, 0.0019947655964642763, 0.0021023587323725224, 0.002209952101111412, 0.002317545237019658, 0.0024251386057585478, 0.002532731741666794, 0.0026403251104056835, 0.002747918479144573, 0.0028555116150528193, 0.002963104983791709, 0.0030706983525305986, 0.0031782914884388447, 0.0032858848571777344, 0.0033934779930859804, 0.00350107136182487, 0.003608664497733116, 0.003716257866472006, 0.0038238512352108955, 0.003931444603949785, 0.004039037972688675, 0.004146630875766277, 0.004254224244505167, 0.004361817613244057, 0.004469410981982946, 0.004577004350721836, 0.0046845972537994385]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 9.0, 6.0, 4.0, 9.0, 6.0, 15.0, 17.0, 16.0, 20.0, 19.0, 21.0, 25.0, 31.0, 39.0, 28.0, 44.0, 48.0, 39.0, 35.0, 33.0, 43.0, 47.0, 53.0, 49.0, 32.0, 28.0, 41.0, 28.0, 33.0, 41.0, 21.0, 28.0, 26.0, 14.0, 13.0, 10.0, 11.0, 7.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0013148784637451172, -0.0012751724570989609, -0.0012354664504528046, -0.0011957604438066483, -0.001156054437160492, -0.0011163484305143356, -0.0010766424238681793, -0.001036936417222023, -0.0009972304105758667, -0.0009575244039297104, -0.0009178183972835541, -0.0008781123906373978, -0.0008384063839912415, -0.0007987003773450851, -0.0007589943706989288, -0.0007192883640527725, -0.0006795823574066162, -0.0006398763507604599, -0.0006001703441143036, -0.0005604643374681473, -0.000520758330821991, -0.00048105232417583466, -0.00044134631752967834, -0.00040164031088352203, -0.0003619343042373657, -0.0003222282975912094, -0.0002825222909450531, -0.0002428162842988968, -0.00020311027765274048, -0.00016340427100658417, -0.00012369826436042786, -8.399225771427155e-05, -4.4286251068115234e-05, -4.580244421958923e-06, 3.512576222419739e-05, 7.48317688703537e-05, 0.00011453777551651001, 0.00015424378216266632, 0.00019394978880882263, 0.00023365579545497894, 0.00027336180210113525, 0.00031306780874729156, 0.0003527738153934479, 0.0003924798220396042, 0.0004321858286857605, 0.0004718918353319168, 0.0005115978419780731, 0.0005513038486242294, 0.0005910098552703857, 0.000630715861916542, 0.0006704218685626984, 0.0007101278752088547, 0.000749833881855011, 0.0007895398885011673, 0.0008292458951473236, 0.0008689519017934799, 0.0009086579084396362, 0.0009483639150857925, 0.0009880699217319489, 0.0010277759283781052, 0.0010674819350242615, 0.0011071879416704178, 0.001146893948316574, 0.0011865999549627304, 0.0012263059616088867]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 9.0, 2.0, 8.0, 14.0, 13.0, 24.0, 21.0, 35.0, 22.0, 25.0, 35.0, 51.0, 39.0, 50.0, 52.0, 53.0, 71.0, 51.0, 50.0, 38.0, 57.0, 38.0, 37.0, 41.0, 30.0, 28.0, 31.0, 21.0, 14.0, 6.0, 8.0, 10.0, 3.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3671875, -12.037841796875, -11.70849609375, -11.379150390625, -11.0498046875, -10.720458984375, -10.39111328125, -10.061767578125, -9.732421875, -9.403076171875, -9.07373046875, -8.744384765625, -8.4150390625, -8.085693359375, -7.75634765625, -7.427001953125, -7.09765625, -6.768310546875, -6.43896484375, -6.109619140625, -5.7802734375, -5.450927734375, -5.12158203125, -4.792236328125, -4.462890625, -4.133544921875, -3.80419921875, -3.474853515625, -3.1455078125, -2.816162109375, -2.48681640625, -2.157470703125, -1.828125, -1.498779296875, -1.16943359375, -0.840087890625, -0.5107421875, -0.181396484375, 0.14794921875, 0.477294921875, 0.806640625, 1.135986328125, 1.46533203125, 1.794677734375, 2.1240234375, 2.453369140625, 2.78271484375, 3.112060546875, 3.44140625, 3.770751953125, 4.10009765625, 4.429443359375, 4.7587890625, 5.088134765625, 5.41748046875, 5.746826171875, 6.076171875, 6.405517578125, 6.73486328125, 7.064208984375, 7.3935546875, 7.722900390625, 8.05224609375, 8.381591796875, 8.7109375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 9.0, 10.0, 2.0, 13.0, 17.0, 22.0, 40.0, 57.0, 92.0, 113.0, 224.0, 409.0, 865.0, 2123.0, 5590.0, 18117.0, 108393.0, 744584.0, 136378.0, 20911.0, 6142.0, 2367.0, 955.0, 455.0, 261.0, 140.0, 79.0, 62.0, 44.0, 23.0, 15.0, 12.0, 10.0, 4.0, 10.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.0234375, -11.7032470703125, -11.383056640625, -11.0628662109375, -10.74267578125, -10.4224853515625, -10.102294921875, -9.7821044921875, -9.4619140625, -9.1417236328125, -8.821533203125, -8.5013427734375, -8.18115234375, -7.8609619140625, -7.540771484375, -7.2205810546875, -6.900390625, -6.5802001953125, -6.260009765625, -5.9398193359375, -5.61962890625, -5.2994384765625, -4.979248046875, -4.6590576171875, -4.3388671875, -4.0186767578125, -3.698486328125, -3.3782958984375, -3.05810546875, -2.7379150390625, -2.417724609375, -2.0975341796875, -1.77734375, -1.4571533203125, -1.136962890625, -0.8167724609375, -0.49658203125, -0.1763916015625, 0.143798828125, 0.4639892578125, 0.7841796875, 1.1043701171875, 1.424560546875, 1.7447509765625, 2.06494140625, 2.3851318359375, 2.705322265625, 3.0255126953125, 3.345703125, 3.6658935546875, 3.986083984375, 4.3062744140625, 4.62646484375, 4.9466552734375, 5.266845703125, 5.5870361328125, 5.9072265625, 6.2274169921875, 6.547607421875, 6.8677978515625, 7.18798828125, 7.5081787109375, 7.828369140625, 8.1485595703125, 8.46875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 9.0, 5.0, 10.0, 7.0, 18.0, 10.0, 12.0, 15.0, 21.0, 22.0, 38.0, 29.0, 13.0, 28.0, 34.0, 29.0, 43.0, 30.0, 43.0, 55.0, 1608.0, 454.0, 69.0, 42.0, 45.0, 38.0, 41.0, 30.0, 30.0, 32.0, 20.0, 27.0, 22.0, 23.0, 9.0, 19.0, 14.0, 9.0, 5.0, 9.0, 5.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-24.5, -23.708984375, -22.91796875, -22.126953125, -21.3359375, -20.544921875, -19.75390625, -18.962890625, -18.171875, -17.380859375, -16.58984375, -15.798828125, -15.0078125, -14.216796875, -13.42578125, -12.634765625, -11.84375, -11.052734375, -10.26171875, -9.470703125, -8.6796875, -7.888671875, -7.09765625, -6.306640625, -5.515625, -4.724609375, -3.93359375, -3.142578125, -2.3515625, -1.560546875, -0.76953125, 0.021484375, 0.8125, 1.603515625, 2.39453125, 3.185546875, 3.9765625, 4.767578125, 5.55859375, 6.349609375, 7.140625, 7.931640625, 8.72265625, 9.513671875, 10.3046875, 11.095703125, 11.88671875, 12.677734375, 13.46875, 14.259765625, 15.05078125, 15.841796875, 16.6328125, 17.423828125, 18.21484375, 19.005859375, 19.796875, 20.587890625, 21.37890625, 22.169921875, 22.9609375, 23.751953125, 24.54296875, 25.333984375, 26.125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 2.0, 12.0, 5.0, 6.0, 10.0, 11.0, 9.0, 24.0, 20.0, 35.0, 40.0, 50.0, 62.0, 95.0, 135.0, 185.0, 256.0, 491.0, 2019.0, 280150.0, 2857714.0, 2801.0, 532.0, 270.0, 200.0, 124.0, 98.0, 74.0, 64.0, 50.0, 27.0, 21.0, 25.0, 17.0, 11.0, 11.0, 8.0, 10.0, 10.0, 4.0, 3.0, 3.0, 0.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-60.65625, -58.56982421875, -56.4833984375, -54.39697265625, -52.310546875, -50.22412109375, -48.1376953125, -46.05126953125, -43.96484375, -41.87841796875, -39.7919921875, -37.70556640625, -35.619140625, -33.53271484375, -31.4462890625, -29.35986328125, -27.2734375, -25.18701171875, -23.1005859375, -21.01416015625, -18.927734375, -16.84130859375, -14.7548828125, -12.66845703125, -10.58203125, -8.49560546875, -6.4091796875, -4.32275390625, -2.236328125, -0.14990234375, 1.9365234375, 4.02294921875, 6.109375, 8.19580078125, 10.2822265625, 12.36865234375, 14.455078125, 16.54150390625, 18.6279296875, 20.71435546875, 22.80078125, 24.88720703125, 26.9736328125, 29.06005859375, 31.146484375, 33.23291015625, 35.3193359375, 37.40576171875, 39.4921875, 41.57861328125, 43.6650390625, 45.75146484375, 47.837890625, 49.92431640625, 52.0107421875, 54.09716796875, 56.18359375, 58.27001953125, 60.3564453125, 62.44287109375, 64.529296875, 66.61572265625, 68.7021484375, 70.78857421875, 72.875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 21.0, 360.0, 549.0, 83.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.2611312866211, -123.26496887207031, -120.26880645751953, -117.27264404296875, -114.2764892578125, -111.28032684326172, -108.28416442871094, -105.28800201416016, -102.29183959960938, -99.2956771850586, -96.29951477050781, -93.30335998535156, -90.30719757080078, -87.31103515625, -84.31487274169922, -81.31871032714844, -78.32255554199219, -75.3263931274414, -72.33023071289062, -69.33407592773438, -66.3379135131836, -63.34175109863281, -60.34558868408203, -57.34942626953125, -54.353267669677734, -51.35710525512695, -48.36094665527344, -45.364784240722656, -42.368621826171875, -39.37246322631836, -36.37630081176758, -33.38014221191406, -30.383987426757812, -27.387826919555664, -24.391666412353516, -21.395503997802734, -18.399343490600586, -15.403182983398438, -12.407020568847656, -9.410860061645508, -6.414699554443359, -3.4185385704040527, -0.4223775863647461, 2.5737838745117188, 5.569944381713867, 8.566104888916016, 11.562267303466797, 14.558427810668945, 17.554588317871094, 20.550748825073242, 23.54690933227539, 26.543071746826172, 29.53923225402832, 32.53539276123047, 35.53155517578125, 38.52771759033203, 41.52387619018555, 44.52003860473633, 47.516197204589844, 50.512359619140625, 53.508522033691406, 56.50468063354492, 59.5008430480957, 62.49700164794922, 65.4931640625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 4.0, 8.0, 11.0, 10.0, 17.0, 16.0, 24.0, 14.0, 22.0, 24.0, 29.0, 24.0, 35.0, 38.0, 40.0, 49.0, 34.0, 48.0, 46.0, 56.0, 54.0, 37.0, 32.0, 52.0, 40.0, 37.0, 23.0, 34.0, 18.0, 33.0, 9.0, 15.0, 7.0, 9.0, 15.0, 10.0, 5.0, 4.0, 6.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-89.28374481201172, -86.85139465332031, -84.4190444946289, -81.98670196533203, -79.55435180664062, -77.12200164794922, -74.68965148925781, -72.2573013305664, -69.824951171875, -67.3926010131836, -64.96025085449219, -62.52790451049805, -60.095558166503906, -57.6632080078125, -55.230857849121094, -52.79850769042969, -50.36616516113281, -47.933815002441406, -45.501468658447266, -43.06911849975586, -40.63677215576172, -38.20442199707031, -35.772071838378906, -33.3397216796875, -30.90737533569336, -28.475027084350586, -26.042678833007812, -23.610328674316406, -21.177980422973633, -18.74563217163086, -16.313282012939453, -13.88093376159668, -11.448593139648438, -9.016244888305664, -6.583895683288574, -4.151546955108643, -1.719198226928711, 0.7131500244140625, 3.1454992294311523, 5.577848434448242, 8.010196685791016, 10.442544937133789, 12.874894142150879, 15.307243347167969, 17.739591598510742, 20.171939849853516, 22.604290008544922, 25.036638259887695, 27.46898651123047, 29.901334762573242, 32.333683013916016, 34.76603317260742, 37.19837951660156, 39.63072967529297, 42.063079833984375, 44.49542999267578, 46.92777633666992, 49.36012649536133, 51.79247283935547, 54.224822998046875, 56.65717315673828, 59.08951950073242, 61.52186965942383, 63.95421600341797, 66.38656616210938]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 6.0, 16.0, 14.0, 16.0, 22.0, 34.0, 25.0, 31.0, 34.0, 42.0, 47.0, 43.0, 59.0, 54.0, 63.0, 50.0, 47.0, 49.0, 44.0, 41.0, 47.0, 42.0, 29.0, 37.0, 15.0, 16.0, 18.0, 11.0, 11.0, 11.0, 4.0, 6.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4375, -12.0985107421875, -11.759521484375, -11.4205322265625, -11.08154296875, -10.7425537109375, -10.403564453125, -10.0645751953125, -9.7255859375, -9.3865966796875, -9.047607421875, -8.7086181640625, -8.36962890625, -8.0306396484375, -7.691650390625, -7.3526611328125, -7.013671875, -6.6746826171875, -6.335693359375, -5.9967041015625, -5.65771484375, -5.3187255859375, -4.979736328125, -4.6407470703125, -4.3017578125, -3.9627685546875, -3.623779296875, -3.2847900390625, -2.94580078125, -2.6068115234375, -2.267822265625, -1.9288330078125, -1.58984375, -1.2508544921875, -0.911865234375, -0.5728759765625, -0.23388671875, 0.1051025390625, 0.444091796875, 0.7830810546875, 1.1220703125, 1.4610595703125, 1.800048828125, 2.1390380859375, 2.47802734375, 2.8170166015625, 3.156005859375, 3.4949951171875, 3.833984375, 4.1729736328125, 4.511962890625, 4.8509521484375, 5.18994140625, 5.5289306640625, 5.867919921875, 6.2069091796875, 6.5458984375, 6.8848876953125, 7.223876953125, 7.5628662109375, 7.90185546875, 8.2408447265625, 8.579833984375, 8.9188232421875, 9.2578125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 12.0, 10.0, 11.0, 16.0, 15.0, 22.0, 48.0, 47.0, 52.0, 68.0, 105.0, 154.0, 301.0, 555.0, 1409.0, 5881.0, 70634.0, 2029030.0, 2005048.0, 71924.0, 6141.0, 1433.0, 529.0, 254.0, 136.0, 100.0, 77.0, 65.0, 51.0, 31.0, 30.0, 22.0, 17.0, 13.0, 13.0, 7.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.203125, -25.432373046875, -24.66162109375, -23.890869140625, -23.1201171875, -22.349365234375, -21.57861328125, -20.807861328125, -20.037109375, -19.266357421875, -18.49560546875, -17.724853515625, -16.9541015625, -16.183349609375, -15.41259765625, -14.641845703125, -13.87109375, -13.100341796875, -12.32958984375, -11.558837890625, -10.7880859375, -10.017333984375, -9.24658203125, -8.475830078125, -7.705078125, -6.934326171875, -6.16357421875, -5.392822265625, -4.6220703125, -3.851318359375, -3.08056640625, -2.309814453125, -1.5390625, -0.768310546875, 0.00244140625, 0.773193359375, 1.5439453125, 2.314697265625, 3.08544921875, 3.856201171875, 4.626953125, 5.397705078125, 6.16845703125, 6.939208984375, 7.7099609375, 8.480712890625, 9.25146484375, 10.022216796875, 10.79296875, 11.563720703125, 12.33447265625, 13.105224609375, 13.8759765625, 14.646728515625, 15.41748046875, 16.188232421875, 16.958984375, 17.729736328125, 18.50048828125, 19.271240234375, 20.0419921875, 20.812744140625, 21.58349609375, 22.354248046875, 23.125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 17.0, 17.0, 26.0, 37.0, 36.0, 58.0, 81.0, 136.0, 184.0, 291.0, 426.0, 601.0, 568.0, 542.0, 342.0, 236.0, 159.0, 110.0, 55.0, 31.0, 31.0, 21.0, 13.0, 11.0, 9.0, 5.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.34375, -13.75048828125, -13.1572265625, -12.56396484375, -11.970703125, -11.37744140625, -10.7841796875, -10.19091796875, -9.59765625, -9.00439453125, -8.4111328125, -7.81787109375, -7.224609375, -6.63134765625, -6.0380859375, -5.44482421875, -4.8515625, -4.25830078125, -3.6650390625, -3.07177734375, -2.478515625, -1.88525390625, -1.2919921875, -0.69873046875, -0.10546875, 0.48779296875, 1.0810546875, 1.67431640625, 2.267578125, 2.86083984375, 3.4541015625, 4.04736328125, 4.640625, 5.23388671875, 5.8271484375, 6.42041015625, 7.013671875, 7.60693359375, 8.2001953125, 8.79345703125, 9.38671875, 9.97998046875, 10.5732421875, 11.16650390625, 11.759765625, 12.35302734375, 12.9462890625, 13.53955078125, 14.1328125, 14.72607421875, 15.3193359375, 15.91259765625, 16.505859375, 17.09912109375, 17.6923828125, 18.28564453125, 18.87890625, 19.47216796875, 20.0654296875, 20.65869140625, 21.251953125, 21.84521484375, 22.4384765625, 23.03173828125, 23.625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 7.0, 10.0, 8.0, 11.0, 15.0, 10.0, 32.0, 38.0, 75.0, 80.0, 132.0, 192.0, 266.0, 387.0, 792.0, 18153.0, 4141942.0, 30049.0, 799.0, 384.0, 269.0, 172.0, 123.0, 108.0, 68.0, 48.0, 31.0, 34.0, 18.0, 8.0, 9.0, 7.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0], "bins": [-117.4375, -114.6103515625, -111.783203125, -108.9560546875, -106.12890625, -103.3017578125, -100.474609375, -97.6474609375, -94.8203125, -91.9931640625, -89.166015625, -86.3388671875, -83.51171875, -80.6845703125, -77.857421875, -75.0302734375, -72.203125, -69.3759765625, -66.548828125, -63.7216796875, -60.89453125, -58.0673828125, -55.240234375, -52.4130859375, -49.5859375, -46.7587890625, -43.931640625, -41.1044921875, -38.27734375, -35.4501953125, -32.623046875, -29.7958984375, -26.96875, -24.1416015625, -21.314453125, -18.4873046875, -15.66015625, -12.8330078125, -10.005859375, -7.1787109375, -4.3515625, -1.5244140625, 1.302734375, 4.1298828125, 6.95703125, 9.7841796875, 12.611328125, 15.4384765625, 18.265625, 21.0927734375, 23.919921875, 26.7470703125, 29.57421875, 32.4013671875, 35.228515625, 38.0556640625, 40.8828125, 43.7099609375, 46.537109375, 49.3642578125, 52.19140625, 55.0185546875, 57.845703125, 60.6728515625, 63.5]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 247.0, 715.0, 52.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-721.3583374023438, -706.7285766601562, -692.098876953125, -677.4691162109375, -662.83935546875, -648.2095947265625, -633.5798950195312, -618.9501342773438, -604.3203735351562, -589.6906127929688, -575.0609130859375, -560.43115234375, -545.8013916015625, -531.171630859375, -516.5419311523438, -501.91217041015625, -487.2824401855469, -472.6527099609375, -458.02294921875, -443.3932189941406, -428.7634582519531, -414.13372802734375, -399.50396728515625, -384.8742370605469, -370.2445068359375, -355.6147766113281, -340.9850158691406, -326.35528564453125, -311.72552490234375, -297.0957946777344, -282.466064453125, -267.8363037109375, -253.20652770996094, -238.5767822265625, -223.94703674316406, -209.31729125976562, -194.68756103515625, -180.05780029296875, -165.42807006835938, -150.79832458496094, -136.1685791015625, -121.53883361816406, -106.90908813476562, -92.27935028076172, -77.64960479736328, -63.019859313964844, -48.39012145996094, -33.7603759765625, -19.130630493164062, -4.500886917114258, 10.128856658935547, 24.75859832763672, 39.388343811035156, 54.018089294433594, 68.6478271484375, 83.27757263183594, 97.90731811523438, 112.53706359863281, 127.16680908203125, 141.79653930664062, 156.42630004882812, 171.0560302734375, 185.68577575683594, 200.31552124023438, 214.9452667236328]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 7.0, 7.0, 6.0, 4.0, 8.0, 15.0, 16.0, 12.0, 25.0, 18.0, 25.0, 22.0, 21.0, 23.0, 24.0, 35.0, 48.0, 36.0, 26.0, 45.0, 31.0, 34.0, 47.0, 49.0, 35.0, 33.0, 40.0, 37.0, 19.0, 33.0, 25.0, 30.0, 21.0, 25.0, 23.0, 15.0, 14.0, 13.0, 11.0, 5.0, 6.0, 5.0, 1.0, 4.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-43.380027770996094, -41.955596923828125, -40.53116989135742, -39.10673904418945, -37.68231201171875, -36.25788116455078, -34.83345031738281, -33.40902328491211, -31.984594345092773, -30.560165405273438, -29.1357364654541, -27.711307525634766, -26.286876678466797, -24.862449645996094, -23.438018798828125, -22.01358985900879, -20.589160919189453, -19.164731979370117, -17.74030303955078, -16.315872192382812, -14.891444206237793, -13.467015266418457, -12.042585372924805, -10.618156433105469, -9.193727493286133, -7.769298553466797, -6.344869136810303, -4.920439720153809, -3.4960107803344727, -2.0715818405151367, -0.6471519470214844, 0.7772769927978516, 2.201709747314453, 3.626138925552368, 5.050568103790283, 6.474997520446777, 7.899426460266113, 9.32385540008545, 10.748285293579102, 12.172714233398438, 13.597143173217773, 15.02157211303711, 16.446001052856445, 17.87042999267578, 19.29486083984375, 20.719287872314453, 22.143718719482422, 23.568147659301758, 24.992576599121094, 26.41700553894043, 27.841434478759766, 29.265865325927734, 30.690292358398438, 32.114723205566406, 33.539154052734375, 34.96358108520508, 36.38800811767578, 37.81243896484375, 39.23686599731445, 40.66129684448242, 42.085723876953125, 43.510154724121094, 44.93458557128906, 46.359012603759766, 47.783443450927734]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 0.0, 10.0, 6.0, 9.0, 8.0, 17.0, 22.0, 19.0, 11.0, 19.0, 24.0, 32.0, 36.0, 43.0, 47.0, 39.0, 49.0, 47.0, 56.0, 43.0, 45.0, 39.0, 41.0, 31.0, 46.0, 42.0, 37.0, 29.0, 33.0, 22.0, 20.0, 10.0, 10.0, 16.0, 5.0, 8.0, 12.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.8671875, -10.574951171875, -10.28271484375, -9.990478515625, -9.6982421875, -9.406005859375, -9.11376953125, -8.821533203125, -8.529296875, -8.237060546875, -7.94482421875, -7.652587890625, -7.3603515625, -7.068115234375, -6.77587890625, -6.483642578125, -6.19140625, -5.899169921875, -5.60693359375, -5.314697265625, -5.0224609375, -4.730224609375, -4.43798828125, -4.145751953125, -3.853515625, -3.561279296875, -3.26904296875, -2.976806640625, -2.6845703125, -2.392333984375, -2.10009765625, -1.807861328125, -1.515625, -1.223388671875, -0.93115234375, -0.638916015625, -0.3466796875, -0.054443359375, 0.23779296875, 0.530029296875, 0.822265625, 1.114501953125, 1.40673828125, 1.698974609375, 1.9912109375, 2.283447265625, 2.57568359375, 2.867919921875, 3.16015625, 3.452392578125, 3.74462890625, 4.036865234375, 4.3291015625, 4.621337890625, 4.91357421875, 5.205810546875, 5.498046875, 5.790283203125, 6.08251953125, 6.374755859375, 6.6669921875, 6.959228515625, 7.25146484375, 7.543701171875, 7.8359375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 5.0, 10.0, 14.0, 29.0, 52.0, 67.0, 95.0, 175.0, 205.0, 372.0, 521.0, 762.0, 1165.0, 1750.0, 2519.0, 3929.0, 5793.0, 9085.0, 13711.0, 21173.0, 32767.0, 50526.0, 78261.0, 120433.0, 168774.0, 173694.0, 126777.0, 83248.0, 53464.0, 34422.0, 22446.0, 14520.0, 9314.0, 6253.0, 4044.0, 2700.0, 1799.0, 1198.0, 803.0, 538.0, 387.0, 256.0, 171.0, 128.0, 60.0, 48.0, 43.0, 18.0, 14.0, 10.0, 2.0, 4.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.78515625, -0.7598800659179688, -0.7346038818359375, -0.7093276977539062, -0.684051513671875, -0.6587753295898438, -0.6334991455078125, -0.6082229614257812, -0.58294677734375, -0.5576705932617188, -0.5323944091796875, -0.5071182250976562, -0.481842041015625, -0.45656585693359375, -0.4312896728515625, -0.40601348876953125, -0.3807373046875, -0.35546112060546875, -0.3301849365234375, -0.30490875244140625, -0.279632568359375, -0.25435638427734375, -0.2290802001953125, -0.20380401611328125, -0.17852783203125, -0.15325164794921875, -0.1279754638671875, -0.10269927978515625, -0.077423095703125, -0.05214691162109375, -0.0268707275390625, -0.00159454345703125, 0.023681640625, 0.04895782470703125, 0.0742340087890625, 0.09951019287109375, 0.124786376953125, 0.15006256103515625, 0.1753387451171875, 0.20061492919921875, 0.22589111328125, 0.25116729736328125, 0.2764434814453125, 0.30171966552734375, 0.326995849609375, 0.35227203369140625, 0.3775482177734375, 0.40282440185546875, 0.4281005859375, 0.45337677001953125, 0.4786529541015625, 0.5039291381835938, 0.529205322265625, 0.5544815063476562, 0.5797576904296875, 0.6050338745117188, 0.63031005859375, 0.6555862426757812, 0.6808624267578125, 0.7061386108398438, 0.731414794921875, 0.7566909790039062, 0.7819671630859375, 0.8072433471679688, 0.83251953125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 3.0, 3.0, 7.0, 17.0, 9.0, 14.0, 22.0, 26.0, 23.0, 27.0, 25.0, 28.0, 38.0, 47.0, 33.0, 39.0, 46.0, 53.0, 1061.0, 53.0, 52.0, 50.0, 38.0, 44.0, 39.0, 22.0, 37.0, 30.0, 22.0, 20.0, 16.0, 14.0, 19.0, 15.0, 6.0, 6.0, 4.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-7.43359375, -7.24468994140625, -7.0557861328125, -6.86688232421875, -6.677978515625, -6.48907470703125, -6.3001708984375, -6.11126708984375, -5.92236328125, -5.73345947265625, -5.5445556640625, -5.35565185546875, -5.166748046875, -4.97784423828125, -4.7889404296875, -4.60003662109375, -4.4111328125, -4.22222900390625, -4.0333251953125, -3.84442138671875, -3.655517578125, -3.46661376953125, -3.2777099609375, -3.08880615234375, -2.89990234375, -2.71099853515625, -2.5220947265625, -2.33319091796875, -2.144287109375, -1.95538330078125, -1.7664794921875, -1.57757568359375, -1.388671875, -1.19976806640625, -1.0108642578125, -0.82196044921875, -0.633056640625, -0.44415283203125, -0.2552490234375, -0.06634521484375, 0.12255859375, 0.31146240234375, 0.5003662109375, 0.68927001953125, 0.878173828125, 1.06707763671875, 1.2559814453125, 1.44488525390625, 1.6337890625, 1.82269287109375, 2.0115966796875, 2.20050048828125, 2.389404296875, 2.57830810546875, 2.7672119140625, 2.95611572265625, 3.14501953125, 3.33392333984375, 3.5228271484375, 3.71173095703125, 3.900634765625, 4.08953857421875, 4.2784423828125, 4.46734619140625, 4.65625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 8.0, 5.0, 7.0, 17.0, 13.0, 28.0, 38.0, 58.0, 71.0, 98.0, 158.0, 207.0, 305.0, 444.0, 625.0, 962.0, 1397.0, 1989.0, 2836.0, 4285.0, 6394.0, 9401.0, 13719.0, 20235.0, 30587.0, 46061.0, 69553.0, 104928.0, 150089.0, 1219859.0, 135701.0, 92065.0, 61058.0, 40333.0, 27138.0, 17828.0, 12018.0, 8200.0, 5741.0, 3949.0, 2631.0, 1869.0, 1280.0, 907.0, 652.0, 430.0, 282.0, 222.0, 139.0, 95.0, 75.0, 50.0, 36.0, 22.0, 21.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0], "bins": [-0.68408203125, -0.6622543334960938, -0.6404266357421875, -0.6185989379882812, -0.596771240234375, -0.5749435424804688, -0.5531158447265625, -0.5312881469726562, -0.50946044921875, -0.48763275146484375, -0.4658050537109375, -0.44397735595703125, -0.422149658203125, -0.40032196044921875, -0.3784942626953125, -0.35666656494140625, -0.3348388671875, -0.31301116943359375, -0.2911834716796875, -0.26935577392578125, -0.247528076171875, -0.22570037841796875, -0.2038726806640625, -0.18204498291015625, -0.16021728515625, -0.13838958740234375, -0.1165618896484375, -0.09473419189453125, -0.072906494140625, -0.05107879638671875, -0.0292510986328125, -0.00742340087890625, 0.014404296875, 0.03623199462890625, 0.0580596923828125, 0.07988739013671875, 0.101715087890625, 0.12354278564453125, 0.1453704833984375, 0.16719818115234375, 0.18902587890625, 0.21085357666015625, 0.2326812744140625, 0.25450897216796875, 0.276336669921875, 0.29816436767578125, 0.3199920654296875, 0.34181976318359375, 0.3636474609375, 0.38547515869140625, 0.4073028564453125, 0.42913055419921875, 0.450958251953125, 0.47278594970703125, 0.4946136474609375, 0.5164413452148438, 0.53826904296875, 0.5600967407226562, 0.5819244384765625, 0.6037521362304688, 0.625579833984375, 0.6474075317382812, 0.6692352294921875, 0.6910629272460938, 0.712890625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 2.0, 4.0, 8.0, 7.0, 9.0, 21.0, 23.0, 29.0, 42.0, 37.0, 51.0, 75.0, 75.0, 83.0, 59.0, 72.0, 73.0, 62.0, 47.0, 47.0, 38.0, 36.0, 19.0, 19.0, 12.0, 10.0, 11.0, 7.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025119781494140625, -0.00243493914604187, -0.0023579001426696777, -0.0022808611392974854, -0.002203822135925293, -0.0021267831325531006, -0.002049744129180908, -0.001972705125808716, -0.0018956661224365234, -0.001818627119064331, -0.0017415881156921387, -0.0016645491123199463, -0.001587510108947754, -0.0015104711055755615, -0.0014334321022033691, -0.0013563930988311768, -0.0012793540954589844, -0.001202315092086792, -0.0011252760887145996, -0.0010482370853424072, -0.0009711980819702148, -0.0008941590785980225, -0.0008171200752258301, -0.0007400810718536377, -0.0006630420684814453, -0.0005860030651092529, -0.0005089640617370605, -0.00043192505836486816, -0.0003548860549926758, -0.0002778470516204834, -0.00020080804824829102, -0.00012376904487609863, -4.673004150390625e-05, 3.0308961868286133e-05, 0.00010734796524047852, 0.0001843869686126709, 0.0002614259719848633, 0.00033846497535705566, 0.00041550397872924805, 0.0004925429821014404, 0.0005695819854736328, 0.0006466209888458252, 0.0007236599922180176, 0.00080069899559021, 0.0008777379989624023, 0.0009547770023345947, 0.0010318160057067871, 0.0011088550090789795, 0.0011858940124511719, 0.0012629330158233643, 0.0013399720191955566, 0.001417011022567749, 0.0014940500259399414, 0.0015710890293121338, 0.0016481280326843262, 0.0017251670360565186, 0.001802206039428711, 0.0018792450428009033, 0.0019562840461730957, 0.002033323049545288, 0.0021103620529174805, 0.002187401056289673, 0.0022644400596618652, 0.0023414790630340576, 0.00241851806640625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 8.0, 8.0, 9.0, 16.0, 13.0, 30.0, 34.0, 42.0, 61.0, 104.0, 150.0, 272.0, 776.0, 67168.0, 977405.0, 1524.0, 322.0, 188.0, 123.0, 83.0, 57.0, 36.0, 23.0, 24.0, 19.0, 12.0, 10.0, 8.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054779052734375, -0.05302238464355469, -0.051265716552734375, -0.04950904846191406, -0.04775238037109375, -0.04599571228027344, -0.044239044189453125, -0.04248237609863281, -0.0407257080078125, -0.03896903991699219, -0.037212371826171875, -0.03545570373535156, -0.03369903564453125, -0.03194236755371094, -0.030185699462890625, -0.028429031372070312, -0.02667236328125, -0.024915695190429688, -0.023159027099609375, -0.021402359008789062, -0.01964569091796875, -0.017889022827148438, -0.016132354736328125, -0.014375686645507812, -0.0126190185546875, -0.010862350463867188, -0.009105682373046875, -0.0073490142822265625, -0.00559234619140625, -0.0038356781005859375, -0.002079010009765625, -0.0003223419189453125, 0.001434326171875, 0.0031909942626953125, 0.004947662353515625, 0.0067043304443359375, 0.00846099853515625, 0.010217666625976562, 0.011974334716796875, 0.013731002807617188, 0.0154876708984375, 0.017244338989257812, 0.019001007080078125, 0.020757675170898438, 0.02251434326171875, 0.024271011352539062, 0.026027679443359375, 0.027784347534179688, 0.029541015625, 0.03129768371582031, 0.033054351806640625, 0.03481101989746094, 0.03656768798828125, 0.03832435607910156, 0.040081024169921875, 0.04183769226074219, 0.0435943603515625, 0.04535102844238281, 0.047107696533203125, 0.04886436462402344, 0.05062103271484375, 0.05237770080566406, 0.054134368896484375, 0.05589103698730469, 0.057647705078125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 63.0, 484.0, 424.0, 39.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005947385914623737, -0.005717841908335686, -0.005488297902047634, -0.00525875436142087, -0.005029210355132818, -0.004799666348844767, -0.004570122808218002, -0.004340578801929951, -0.004111034795641899, -0.0038814907893538475, -0.0036519470158964396, -0.0034224032424390316, -0.00319285923615098, -0.0029633152298629284, -0.0027337714564055204, -0.0025042276829481125, -0.002274683676660061, -0.0020451396703720093, -0.0018155958969146013, -0.0015860520070418715, -0.0013565081171691418, -0.001126964227296412, -0.0008974203374236822, -0.0006678764475509524, -0.00043833255767822266, -0.00020878866780549288, 2.07552220672369e-05, 0.0002502991119399667, 0.00047984300181269646, 0.0007093868916854262, 0.000938930781558156, 0.0011684746714308858, 0.0013980185613036156, 0.0016275624511763453, 0.0018571063410490751, 0.002086650114506483, 0.0023161941207945347, 0.0025457381270825863, 0.0027752819005399942, 0.003004825673997402, 0.003234369680285454, 0.0034639136865735054, 0.0036934574600309134, 0.003923001233488321, 0.004152545239776373, 0.0043820892460644245, 0.004611632786691189, 0.00484117679297924, 0.005070720799267292, 0.005300264805555344, 0.005529808811843395, 0.0057593523524701595, 0.005988896358758211, 0.006218440365046263, 0.006447983905673027, 0.006677527911961079, 0.00690707191824913, 0.007136615924537182, 0.0073661599308252335, 0.007595703471451998, 0.007825247943401337, 0.008054791018366814, 0.008284335024654865, 0.008513879030942917, 0.008743423037230968]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 4.0, 8.0, 4.0, 10.0, 8.0, 10.0, 14.0, 22.0, 17.0, 20.0, 25.0, 32.0, 35.0, 35.0, 44.0, 29.0, 44.0, 43.0, 43.0, 49.0, 49.0, 40.0, 52.0, 39.0, 39.0, 34.0, 34.0, 27.0, 32.0, 25.0, 26.0, 25.0, 12.0, 17.0, 10.0, 10.0, 8.0, 11.0, 4.0, 5.0, 4.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010339617729187012, -0.0009990474209189415, -0.0009641330689191818, -0.0009292187169194221, -0.0008943043649196625, -0.0008593900129199028, -0.0008244756609201431, -0.0007895613089203835, -0.0007546469569206238, -0.0007197326049208641, -0.0006848182529211044, -0.0006499039009213448, -0.0006149895489215851, -0.0005800751969218254, -0.0005451608449220657, -0.0005102464929223061, -0.0004753321409225464, -0.0004404177889227867, -0.00040550343692302704, -0.00037058908492326736, -0.0003356747329235077, -0.000300760380923748, -0.00026584602892398834, -0.00023093167692422867, -0.000196017324924469, -0.00016110297292470932, -0.00012618862092494965, -9.127426892518997e-05, -5.63599169254303e-05, -2.1445564925670624e-05, 1.346878707408905e-05, 4.8383139073848724e-05, 8.32974910736084e-05, 0.00011821184307336807, 0.00015312619507312775, 0.00018804054707288742, 0.0002229548990726471, 0.00025786925107240677, 0.00029278360307216644, 0.0003276979550719261, 0.0003626123070716858, 0.00039752665907144547, 0.00043244101107120514, 0.0004673553630709648, 0.0005022697150707245, 0.0005371840670704842, 0.0005720984190702438, 0.0006070127710700035, 0.0006419271230697632, 0.0006768414750695229, 0.0007117558270692825, 0.0007466701790690422, 0.0007815845310688019, 0.0008164988830685616, 0.0008514132350683212, 0.0008863275870680809, 0.0009212419390678406, 0.0009561562910676003, 0.00099107064306736, 0.0010259849950671196, 0.0010608993470668793, 0.001095813699066639, 0.0011307280510663986, 0.0011656424030661583, 0.001200556755065918]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 0.0, 10.0, 6.0, 9.0, 8.0, 17.0, 22.0, 19.0, 11.0, 19.0, 24.0, 32.0, 36.0, 43.0, 47.0, 39.0, 49.0, 47.0, 56.0, 43.0, 45.0, 39.0, 41.0, 31.0, 46.0, 42.0, 37.0, 29.0, 33.0, 22.0, 20.0, 10.0, 10.0, 16.0, 5.0, 8.0, 12.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.8671875, -10.574951171875, -10.28271484375, -9.990478515625, -9.6982421875, -9.406005859375, -9.11376953125, -8.821533203125, -8.529296875, -8.237060546875, -7.94482421875, -7.652587890625, -7.3603515625, -7.068115234375, -6.77587890625, -6.483642578125, -6.19140625, -5.899169921875, -5.60693359375, -5.314697265625, -5.0224609375, -4.730224609375, -4.43798828125, -4.145751953125, -3.853515625, -3.561279296875, -3.26904296875, -2.976806640625, -2.6845703125, -2.392333984375, -2.10009765625, -1.807861328125, -1.515625, -1.223388671875, -0.93115234375, -0.638916015625, -0.3466796875, -0.054443359375, 0.23779296875, 0.530029296875, 0.822265625, 1.114501953125, 1.40673828125, 1.698974609375, 1.9912109375, 2.283447265625, 2.57568359375, 2.867919921875, 3.16015625, 3.452392578125, 3.74462890625, 4.036865234375, 4.3291015625, 4.621337890625, 4.91357421875, 5.205810546875, 5.498046875, 5.790283203125, 6.08251953125, 6.374755859375, 6.6669921875, 6.959228515625, 7.25146484375, 7.543701171875, 7.8359375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 8.0, 6.0, 5.0, 6.0, 10.0, 19.0, 21.0, 33.0, 43.0, 108.0, 165.0, 440.0, 1222.0, 3790.0, 12271.0, 44508.0, 210941.0, 601654.0, 129598.0, 30557.0, 8802.0, 2752.0, 891.0, 329.0, 136.0, 87.0, 45.0, 26.0, 28.0, 16.0, 11.0, 13.0, 8.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-10.9375, -10.66650390625, -10.3955078125, -10.12451171875, -9.853515625, -9.58251953125, -9.3115234375, -9.04052734375, -8.76953125, -8.49853515625, -8.2275390625, -7.95654296875, -7.685546875, -7.41455078125, -7.1435546875, -6.87255859375, -6.6015625, -6.33056640625, -6.0595703125, -5.78857421875, -5.517578125, -5.24658203125, -4.9755859375, -4.70458984375, -4.43359375, -4.16259765625, -3.8916015625, -3.62060546875, -3.349609375, -3.07861328125, -2.8076171875, -2.53662109375, -2.265625, -1.99462890625, -1.7236328125, -1.45263671875, -1.181640625, -0.91064453125, -0.6396484375, -0.36865234375, -0.09765625, 0.17333984375, 0.4443359375, 0.71533203125, 0.986328125, 1.25732421875, 1.5283203125, 1.79931640625, 2.0703125, 2.34130859375, 2.6123046875, 2.88330078125, 3.154296875, 3.42529296875, 3.6962890625, 3.96728515625, 4.23828125, 4.50927734375, 4.7802734375, 5.05126953125, 5.322265625, 5.59326171875, 5.8642578125, 6.13525390625, 6.40625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 1.0, 2.0, 4.0, 11.0, 14.0, 12.0, 27.0, 24.0, 23.0, 28.0, 31.0, 42.0, 39.0, 50.0, 58.0, 75.0, 216.0, 1809.0, 107.0, 72.0, 54.0, 50.0, 42.0, 48.0, 36.0, 30.0, 34.0, 26.0, 15.0, 22.0, 11.0, 15.0, 7.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.59375, -31.4423828125, -30.291015625, -29.1396484375, -27.98828125, -26.8369140625, -25.685546875, -24.5341796875, -23.3828125, -22.2314453125, -21.080078125, -19.9287109375, -18.77734375, -17.6259765625, -16.474609375, -15.3232421875, -14.171875, -13.0205078125, -11.869140625, -10.7177734375, -9.56640625, -8.4150390625, -7.263671875, -6.1123046875, -4.9609375, -3.8095703125, -2.658203125, -1.5068359375, -0.35546875, 0.7958984375, 1.947265625, 3.0986328125, 4.25, 5.4013671875, 6.552734375, 7.7041015625, 8.85546875, 10.0068359375, 11.158203125, 12.3095703125, 13.4609375, 14.6123046875, 15.763671875, 16.9150390625, 18.06640625, 19.2177734375, 20.369140625, 21.5205078125, 22.671875, 23.8232421875, 24.974609375, 26.1259765625, 27.27734375, 28.4287109375, 29.580078125, 30.7314453125, 31.8828125, 33.0341796875, 34.185546875, 35.3369140625, 36.48828125, 37.6396484375, 38.791015625, 39.9423828125, 41.09375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 5.0, 6.0, 20.0, 20.0, 26.0, 35.0, 64.0, 92.0, 127.0, 140.0, 290.0, 347.0, 1037.0, 183220.0, 2957658.0, 1450.0, 383.0, 244.0, 174.0, 107.0, 66.0, 59.0, 36.0, 33.0, 16.0, 19.0, 7.0, 2.0, 4.0, 7.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-131.625, -128.341796875, -125.05859375, -121.775390625, -118.4921875, -115.208984375, -111.92578125, -108.642578125, -105.359375, -102.076171875, -98.79296875, -95.509765625, -92.2265625, -88.943359375, -85.66015625, -82.376953125, -79.09375, -75.810546875, -72.52734375, -69.244140625, -65.9609375, -62.677734375, -59.39453125, -56.111328125, -52.828125, -49.544921875, -46.26171875, -42.978515625, -39.6953125, -36.412109375, -33.12890625, -29.845703125, -26.5625, -23.279296875, -19.99609375, -16.712890625, -13.4296875, -10.146484375, -6.86328125, -3.580078125, -0.296875, 2.986328125, 6.26953125, 9.552734375, 12.8359375, 16.119140625, 19.40234375, 22.685546875, 25.96875, 29.251953125, 32.53515625, 35.818359375, 39.1015625, 42.384765625, 45.66796875, 48.951171875, 52.234375, 55.517578125, 58.80078125, 62.083984375, 65.3671875, 68.650390625, 71.93359375, 75.216796875, 78.5]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 16.0, 993.0, 8.0, 0.0, 0.0, 0.0, 1.0], "bins": [-706.4120483398438, -694.3201293945312, -682.2281494140625, -670.13623046875, -658.0442504882812, -645.9523315429688, -633.8603515625, -621.7684326171875, -609.6764526367188, -597.5845336914062, -585.4925537109375, -573.400634765625, -561.3086547851562, -549.2167358398438, -537.124755859375, -525.0328369140625, -512.9408569335938, -500.8489074707031, -488.7569580078125, -476.6650085449219, -464.57305908203125, -452.4811096191406, -440.38916015625, -428.2972106933594, -416.2052917480469, -404.11334228515625, -392.0213928222656, -379.929443359375, -367.8374938964844, -355.74554443359375, -343.6535949707031, -331.5616455078125, -319.46966552734375, -307.3777160644531, -295.2857666015625, -283.1938171386719, -271.10186767578125, -259.0099182128906, -246.91796875, -234.82601928710938, -222.7340850830078, -210.6421356201172, -198.55018615722656, -186.45823669433594, -174.3662872314453, -162.2743377685547, -150.18240356445312, -138.0904541015625, -125.99849700927734, -113.90654754638672, -101.8145980834961, -89.72265625, -77.63070678710938, -65.53875732421875, -53.446807861328125, -41.3548583984375, -29.262908935546875, -17.17095947265625, -5.079011917114258, 7.012935638427734, 19.10488510131836, 31.196834564208984, 43.288780212402344, 55.38072967529297, 67.4726791381836]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 8.0, 5.0, 5.0, 8.0, 10.0, 16.0, 19.0, 17.0, 14.0, 17.0, 20.0, 27.0, 28.0, 26.0, 37.0, 38.0, 39.0, 38.0, 30.0, 34.0, 27.0, 38.0, 38.0, 37.0, 42.0, 52.0, 35.0, 30.0, 28.0, 29.0, 27.0, 19.0, 26.0, 18.0, 17.0, 13.0, 9.0, 19.0, 11.0, 12.0, 9.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-77.07290649414062, -74.66583251953125, -72.2587661743164, -69.85169219970703, -67.44462585449219, -65.03755187988281, -62.6304817199707, -60.223411560058594, -57.816341400146484, -55.409271240234375, -53.002201080322266, -50.595130920410156, -48.18805694580078, -45.78099060058594, -43.37391662597656, -40.96684646606445, -38.559776306152344, -36.152706146240234, -33.745635986328125, -31.338563919067383, -28.931493759155273, -26.524423599243164, -24.117351531982422, -21.710281372070312, -19.303211212158203, -16.896141052246094, -14.489069938659668, -12.081998825073242, -9.674928665161133, -7.267858505249023, -4.860787391662598, -2.453716278076172, -0.04665374755859375, 2.360416889190674, 4.767487525939941, 7.174558162689209, 9.581628799438477, 11.988698959350586, 14.395770072937012, 16.802841186523438, 19.209911346435547, 21.616981506347656, 24.024051666259766, 26.431123733520508, 28.838193893432617, 31.245264053344727, 33.65233612060547, 36.05940628051758, 38.46647644042969, 40.8735466003418, 43.280616760253906, 45.687686920166016, 48.094757080078125, 50.5018310546875, 52.90890121459961, 55.31597137451172, 57.72304153442383, 60.13011169433594, 62.53718185424805, 64.94425201416016, 67.35132598876953, 69.75839233398438, 72.16546630859375, 74.57254028320312, 76.97960662841797]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 3.0, 10.0, 11.0, 14.0, 24.0, 11.0, 18.0, 21.0, 27.0, 27.0, 45.0, 43.0, 37.0, 52.0, 39.0, 54.0, 47.0, 49.0, 36.0, 36.0, 36.0, 42.0, 40.0, 43.0, 43.0, 27.0, 27.0, 30.0, 14.0, 10.0, 14.0, 10.0, 10.0, 10.0, 10.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.2421875, -10.9398193359375, -10.637451171875, -10.3350830078125, -10.03271484375, -9.7303466796875, -9.427978515625, -9.1256103515625, -8.8232421875, -8.5208740234375, -8.218505859375, -7.9161376953125, -7.61376953125, -7.3114013671875, -7.009033203125, -6.7066650390625, -6.404296875, -6.1019287109375, -5.799560546875, -5.4971923828125, -5.19482421875, -4.8924560546875, -4.590087890625, -4.2877197265625, -3.9853515625, -3.6829833984375, -3.380615234375, -3.0782470703125, -2.77587890625, -2.4735107421875, -2.171142578125, -1.8687744140625, -1.56640625, -1.2640380859375, -0.961669921875, -0.6593017578125, -0.35693359375, -0.0545654296875, 0.247802734375, 0.5501708984375, 0.8525390625, 1.1549072265625, 1.457275390625, 1.7596435546875, 2.06201171875, 2.3643798828125, 2.666748046875, 2.9691162109375, 3.271484375, 3.5738525390625, 3.876220703125, 4.1785888671875, 4.48095703125, 4.7833251953125, 5.085693359375, 5.3880615234375, 5.6904296875, 5.9927978515625, 6.295166015625, 6.5975341796875, 6.89990234375, 7.2022705078125, 7.504638671875, 7.8070068359375, 8.109375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 8.0, 9.0, 3.0, 8.0, 7.0, 22.0, 18.0, 22.0, 20.0, 19.0, 42.0, 60.0, 79.0, 116.0, 270.0, 607.0, 1925.0, 13924.0, 899529.0, 3193408.0, 78079.0, 4199.0, 1010.0, 343.0, 189.0, 77.0, 67.0, 48.0, 29.0, 29.0, 22.0, 15.0, 16.0, 16.0, 9.0, 4.0, 9.0, 8.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-35.6875, -34.70263671875, -33.7177734375, -32.73291015625, -31.748046875, -30.76318359375, -29.7783203125, -28.79345703125, -27.80859375, -26.82373046875, -25.8388671875, -24.85400390625, -23.869140625, -22.88427734375, -21.8994140625, -20.91455078125, -19.9296875, -18.94482421875, -17.9599609375, -16.97509765625, -15.990234375, -15.00537109375, -14.0205078125, -13.03564453125, -12.05078125, -11.06591796875, -10.0810546875, -9.09619140625, -8.111328125, -7.12646484375, -6.1416015625, -5.15673828125, -4.171875, -3.18701171875, -2.2021484375, -1.21728515625, -0.232421875, 0.75244140625, 1.7373046875, 2.72216796875, 3.70703125, 4.69189453125, 5.6767578125, 6.66162109375, 7.646484375, 8.63134765625, 9.6162109375, 10.60107421875, 11.5859375, 12.57080078125, 13.5556640625, 14.54052734375, 15.525390625, 16.51025390625, 17.4951171875, 18.47998046875, 19.46484375, 20.44970703125, 21.4345703125, 22.41943359375, 23.404296875, 24.38916015625, 25.3740234375, 26.35888671875, 27.34375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 8.0, 18.0, 9.0, 23.0, 20.0, 29.0, 64.0, 72.0, 119.0, 159.0, 235.0, 398.0, 546.0, 653.0, 506.0, 368.0, 269.0, 178.0, 121.0, 76.0, 45.0, 43.0, 35.0, 23.0, 13.0, 10.0, 6.0, 3.0, 8.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-23.25, -22.67578125, -22.1015625, -21.52734375, -20.953125, -20.37890625, -19.8046875, -19.23046875, -18.65625, -18.08203125, -17.5078125, -16.93359375, -16.359375, -15.78515625, -15.2109375, -14.63671875, -14.0625, -13.48828125, -12.9140625, -12.33984375, -11.765625, -11.19140625, -10.6171875, -10.04296875, -9.46875, -8.89453125, -8.3203125, -7.74609375, -7.171875, -6.59765625, -6.0234375, -5.44921875, -4.875, -4.30078125, -3.7265625, -3.15234375, -2.578125, -2.00390625, -1.4296875, -0.85546875, -0.28125, 0.29296875, 0.8671875, 1.44140625, 2.015625, 2.58984375, 3.1640625, 3.73828125, 4.3125, 4.88671875, 5.4609375, 6.03515625, 6.609375, 7.18359375, 7.7578125, 8.33203125, 8.90625, 9.48046875, 10.0546875, 10.62890625, 11.203125, 11.77734375, 12.3515625, 12.92578125, 13.5]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 9.0, 8.0, 18.0, 15.0, 28.0, 50.0, 62.0, 86.0, 143.0, 195.0, 296.0, 532.0, 1439.0, 302329.0, 3884525.0, 2921.0, 620.0, 310.0, 224.0, 148.0, 99.0, 67.0, 51.0, 34.0, 29.0, 20.0, 8.0, 10.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-112.5, -109.2998046875, -106.099609375, -102.8994140625, -99.69921875, -96.4990234375, -93.298828125, -90.0986328125, -86.8984375, -83.6982421875, -80.498046875, -77.2978515625, -74.09765625, -70.8974609375, -67.697265625, -64.4970703125, -61.296875, -58.0966796875, -54.896484375, -51.6962890625, -48.49609375, -45.2958984375, -42.095703125, -38.8955078125, -35.6953125, -32.4951171875, -29.294921875, -26.0947265625, -22.89453125, -19.6943359375, -16.494140625, -13.2939453125, -10.09375, -6.8935546875, -3.693359375, -0.4931640625, 2.70703125, 5.9072265625, 9.107421875, 12.3076171875, 15.5078125, 18.7080078125, 21.908203125, 25.1083984375, 28.30859375, 31.5087890625, 34.708984375, 37.9091796875, 41.109375, 44.3095703125, 47.509765625, 50.7099609375, 53.91015625, 57.1103515625, 60.310546875, 63.5107421875, 66.7109375, 69.9111328125, 73.111328125, 76.3115234375, 79.51171875, 82.7119140625, 85.912109375, 89.1123046875, 92.3125]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 41.0, 478.0, 459.0, 38.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-548.2899169921875, -536.8585815429688, -525.4273071289062, -513.9959716796875, -502.56463623046875, -491.1333312988281, -479.7020263671875, -468.27069091796875, -456.83935546875, -445.4080505371094, -433.9767150878906, -422.54541015625, -411.11407470703125, -399.6827697753906, -388.25146484375, -376.82012939453125, -365.3888244628906, -353.95751953125, -342.52618408203125, -331.0948791503906, -319.6635437011719, -308.23223876953125, -296.8009033203125, -285.3695983886719, -273.93829345703125, -262.5069885253906, -251.07565307617188, -239.64434814453125, -228.2130126953125, -216.78170776367188, -205.3503875732422, -193.9190673828125, -182.48770141601562, -171.05638122558594, -159.62506103515625, -148.19375610351562, -136.76242065429688, -125.33110809326172, -113.89979553222656, -102.46847534179688, -91.03715515136719, -79.6058349609375, -68.17451477050781, -56.743202209472656, -45.31188201904297, -33.88056182861328, -22.449249267578125, -11.017929077148438, 0.41339111328125, 11.844709396362305, 23.27602767944336, 34.70734405517578, 46.13866424560547, 57.569984436035156, 69.00129699707031, 80.4326171875, 91.86393737792969, 103.29525756835938, 114.72657775878906, 126.15789031982422, 137.58920288085938, 149.02053833007812, 160.45184326171875, 171.88316345214844, 183.31448364257812]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 4.0, 5.0, 6.0, 15.0, 4.0, 9.0, 10.0, 18.0, 14.0, 27.0, 20.0, 27.0, 31.0, 33.0, 33.0, 35.0, 35.0, 38.0, 36.0, 39.0, 39.0, 41.0, 45.0, 38.0, 36.0, 35.0, 35.0, 31.0, 24.0, 26.0, 29.0, 29.0, 22.0, 26.0, 15.0, 11.0, 10.0, 12.0, 9.0, 8.0, 7.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-47.519779205322266, -46.01433181762695, -44.50888442993164, -43.00343322753906, -41.49798583984375, -39.99253845214844, -38.487091064453125, -36.98164367675781, -35.476192474365234, -33.97074508666992, -32.46529769897461, -30.959848403930664, -29.45439910888672, -27.948951721191406, -26.443504333496094, -24.93805503845215, -23.432607650756836, -21.927160263061523, -20.421710968017578, -18.916263580322266, -17.41081428527832, -15.905366897583008, -14.399918556213379, -12.89447021484375, -11.389021873474121, -9.883573532104492, -8.378125190734863, -6.872677326202393, -5.367228984832764, -3.8617806434631348, -2.356332778930664, -0.8508844375610352, 0.6545639038085938, 2.1600122451782227, 3.6654603481292725, 5.170908451080322, 6.676356792449951, 8.181804656982422, 9.68725299835205, 11.19270133972168, 12.698149681091309, 14.203598022460938, 15.709046363830566, 17.214494705200195, 18.719942092895508, 20.225391387939453, 21.730838775634766, 23.236286163330078, 24.741735458374023, 26.247182846069336, 27.75263214111328, 29.258079528808594, 30.76352882385254, 32.268978118896484, 33.7744255065918, 35.27987289428711, 36.78532028198242, 38.290767669677734, 39.79621505737305, 41.301666259765625, 42.80711364746094, 44.31256103515625, 45.81800842285156, 47.323455810546875, 48.82890701293945]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 5.0, 6.0, 4.0, 9.0, 5.0, 12.0, 11.0, 13.0, 14.0, 17.0, 17.0, 23.0, 40.0, 21.0, 24.0, 20.0, 33.0, 40.0, 48.0, 28.0, 38.0, 45.0, 37.0, 36.0, 39.0, 43.0, 40.0, 29.0, 29.0, 35.0, 31.0, 22.0, 26.0, 24.0, 25.0, 18.0, 15.0, 11.0, 15.0, 10.0, 11.0, 2.0, 8.0, 7.0, 8.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.2890625, -8.03533935546875, -7.7816162109375, -7.52789306640625, -7.274169921875, -7.02044677734375, -6.7667236328125, -6.51300048828125, -6.25927734375, -6.00555419921875, -5.7518310546875, -5.49810791015625, -5.244384765625, -4.99066162109375, -4.7369384765625, -4.48321533203125, -4.2294921875, -3.97576904296875, -3.7220458984375, -3.46832275390625, -3.214599609375, -2.96087646484375, -2.7071533203125, -2.45343017578125, -2.19970703125, -1.94598388671875, -1.6922607421875, -1.43853759765625, -1.184814453125, -0.93109130859375, -0.6773681640625, -0.42364501953125, -0.169921875, 0.08380126953125, 0.3375244140625, 0.59124755859375, 0.844970703125, 1.09869384765625, 1.3524169921875, 1.60614013671875, 1.85986328125, 2.11358642578125, 2.3673095703125, 2.62103271484375, 2.874755859375, 3.12847900390625, 3.3822021484375, 3.63592529296875, 3.8896484375, 4.14337158203125, 4.3970947265625, 4.65081787109375, 4.904541015625, 5.15826416015625, 5.4119873046875, 5.66571044921875, 5.91943359375, 6.17315673828125, 6.4268798828125, 6.68060302734375, 6.934326171875, 7.18804931640625, 7.4417724609375, 7.69549560546875, 7.94921875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 12.0, 9.0, 15.0, 25.0, 37.0, 50.0, 69.0, 113.0, 174.0, 272.0, 427.0, 647.0, 947.0, 1578.0, 2429.0, 3896.0, 6270.0, 10045.0, 16406.0, 27306.0, 45798.0, 77153.0, 126702.0, 191402.0, 196663.0, 134442.0, 81793.0, 48392.0, 29322.0, 17583.0, 10804.0, 6525.0, 4065.0, 2592.0, 1628.0, 1049.0, 664.0, 421.0, 291.0, 188.0, 114.0, 73.0, 59.0, 32.0, 24.0, 16.0, 10.0, 6.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.99755859375, -0.9673843383789062, -0.9372100830078125, -0.9070358276367188, -0.876861572265625, -0.8466873168945312, -0.8165130615234375, -0.7863388061523438, -0.75616455078125, -0.7259902954101562, -0.6958160400390625, -0.6656417846679688, -0.635467529296875, -0.6052932739257812, -0.5751190185546875, -0.5449447631835938, -0.5147705078125, -0.48459625244140625, -0.4544219970703125, -0.42424774169921875, -0.394073486328125, -0.36389923095703125, -0.3337249755859375, -0.30355072021484375, -0.27337646484375, -0.24320220947265625, -0.2130279541015625, -0.18285369873046875, -0.152679443359375, -0.12250518798828125, -0.0923309326171875, -0.06215667724609375, -0.031982421875, -0.00180816650390625, 0.0283660888671875, 0.05854034423828125, 0.088714599609375, 0.11888885498046875, 0.1490631103515625, 0.17923736572265625, 0.20941162109375, 0.23958587646484375, 0.2697601318359375, 0.29993438720703125, 0.330108642578125, 0.36028289794921875, 0.3904571533203125, 0.42063140869140625, 0.4508056640625, 0.48097991943359375, 0.5111541748046875, 0.5413284301757812, 0.571502685546875, 0.6016769409179688, 0.6318511962890625, 0.6620254516601562, 0.69219970703125, 0.7223739624023438, 0.7525482177734375, 0.7827224731445312, 0.812896728515625, 0.8430709838867188, 0.8732452392578125, 0.9034194946289062, 0.93359375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 9.0, 7.0, 10.0, 15.0, 10.0, 18.0, 22.0, 25.0, 18.0, 24.0, 27.0, 31.0, 47.0, 31.0, 43.0, 35.0, 40.0, 54.0, 1066.0, 43.0, 26.0, 42.0, 45.0, 33.0, 35.0, 36.0, 33.0, 31.0, 25.0, 28.0, 15.0, 18.0, 16.0, 18.0, 6.0, 10.0, 4.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.58203125, -5.40301513671875, -5.2239990234375, -5.04498291015625, -4.865966796875, -4.68695068359375, -4.5079345703125, -4.32891845703125, -4.14990234375, -3.97088623046875, -3.7918701171875, -3.61285400390625, -3.433837890625, -3.25482177734375, -3.0758056640625, -2.89678955078125, -2.7177734375, -2.53875732421875, -2.3597412109375, -2.18072509765625, -2.001708984375, -1.82269287109375, -1.6436767578125, -1.46466064453125, -1.28564453125, -1.10662841796875, -0.9276123046875, -0.74859619140625, -0.569580078125, -0.39056396484375, -0.2115478515625, -0.03253173828125, 0.146484375, 0.32550048828125, 0.5045166015625, 0.68353271484375, 0.862548828125, 1.04156494140625, 1.2205810546875, 1.39959716796875, 1.57861328125, 1.75762939453125, 1.9366455078125, 2.11566162109375, 2.294677734375, 2.47369384765625, 2.6527099609375, 2.83172607421875, 3.0107421875, 3.18975830078125, 3.3687744140625, 3.54779052734375, 3.726806640625, 3.90582275390625, 4.0848388671875, 4.26385498046875, 4.44287109375, 4.62188720703125, 4.8009033203125, 4.97991943359375, 5.158935546875, 5.33795166015625, 5.5169677734375, 5.69598388671875, 5.875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 7.0, 15.0, 21.0, 29.0, 36.0, 59.0, 80.0, 144.0, 193.0, 261.0, 385.0, 614.0, 902.0, 1301.0, 1901.0, 2905.0, 4299.0, 6345.0, 9574.0, 13775.0, 20653.0, 30893.0, 46546.0, 68724.0, 101030.0, 141583.0, 1212443.0, 136101.0, 96562.0, 66061.0, 44023.0, 29218.0, 19790.0, 13092.0, 8991.0, 5907.0, 4123.0, 2686.0, 1837.0, 1299.0, 942.0, 569.0, 407.0, 269.0, 173.0, 121.0, 103.0, 50.0, 28.0, 28.0, 13.0, 8.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.73974609375, -0.7169418334960938, -0.6941375732421875, -0.6713333129882812, -0.648529052734375, -0.6257247924804688, -0.6029205322265625, -0.5801162719726562, -0.55731201171875, -0.5345077514648438, -0.5117034912109375, -0.48889923095703125, -0.466094970703125, -0.44329071044921875, -0.4204864501953125, -0.39768218994140625, -0.3748779296875, -0.35207366943359375, -0.3292694091796875, -0.30646514892578125, -0.283660888671875, -0.26085662841796875, -0.2380523681640625, -0.21524810791015625, -0.19244384765625, -0.16963958740234375, -0.1468353271484375, -0.12403106689453125, -0.101226806640625, -0.07842254638671875, -0.0556182861328125, -0.03281402587890625, -0.010009765625, 0.01279449462890625, 0.0355987548828125, 0.05840301513671875, 0.081207275390625, 0.10401153564453125, 0.1268157958984375, 0.14962005615234375, 0.17242431640625, 0.19522857666015625, 0.2180328369140625, 0.24083709716796875, 0.263641357421875, 0.28644561767578125, 0.3092498779296875, 0.33205413818359375, 0.3548583984375, 0.37766265869140625, 0.4004669189453125, 0.42327117919921875, 0.446075439453125, 0.46887969970703125, 0.4916839599609375, 0.5144882202148438, 0.53729248046875, 0.5600967407226562, 0.5829010009765625, 0.6057052612304688, 0.628509521484375, 0.6513137817382812, 0.6741180419921875, 0.6969223022460938, 0.7197265625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 8.0, 5.0, 7.0, 10.0, 10.0, 12.0, 19.0, 12.0, 15.0, 27.0, 42.0, 31.0, 40.0, 38.0, 45.0, 46.0, 53.0, 46.0, 59.0, 64.0, 60.0, 47.0, 44.0, 39.0, 31.0, 32.0, 23.0, 16.0, 19.0, 14.0, 13.0, 12.0, 11.0, 8.0, 8.0, 13.0, 4.0, 6.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002109527587890625, -0.002036869525909424, -0.0019642114639282227, -0.0018915534019470215, -0.0018188953399658203, -0.0017462372779846191, -0.001673579216003418, -0.0016009211540222168, -0.0015282630920410156, -0.0014556050300598145, -0.0013829469680786133, -0.0013102889060974121, -0.001237630844116211, -0.0011649727821350098, -0.0010923147201538086, -0.0010196566581726074, -0.0009469985961914062, -0.0008743405342102051, -0.0008016824722290039, -0.0007290244102478027, -0.0006563663482666016, -0.0005837082862854004, -0.0005110502243041992, -0.00043839216232299805, -0.0003657341003417969, -0.0002930760383605957, -0.00022041797637939453, -0.00014775991439819336, -7.510185241699219e-05, -2.4437904357910156e-06, 7.021427154541016e-05, 0.00014287233352661133, 0.0002155303955078125, 0.00028818845748901367, 0.00036084651947021484, 0.000433504581451416, 0.0005061626434326172, 0.0005788207054138184, 0.0006514787673950195, 0.0007241368293762207, 0.0007967948913574219, 0.000869452953338623, 0.0009421110153198242, 0.0010147690773010254, 0.0010874271392822266, 0.0011600852012634277, 0.001232743263244629, 0.00130540132522583, 0.0013780593872070312, 0.0014507174491882324, 0.0015233755111694336, 0.0015960335731506348, 0.001668691635131836, 0.0017413496971130371, 0.0018140077590942383, 0.0018866658210754395, 0.0019593238830566406, 0.002031981945037842, 0.002104640007019043, 0.002177298069000244, 0.0022499561309814453, 0.0023226141929626465, 0.0023952722549438477, 0.002467930316925049, 0.00254058837890625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 3.0, 6.0, 12.0, 10.0, 12.0, 6.0, 19.0, 11.0, 22.0, 29.0, 40.0, 39.0, 63.0, 67.0, 90.0, 123.0, 331.0, 778.0, 12916.0, 1030115.0, 2564.0, 571.0, 213.0, 129.0, 80.0, 68.0, 60.0, 34.0, 25.0, 20.0, 29.0, 11.0, 10.0, 12.0, 8.0, 4.0, 5.0, 3.0, 6.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.060791015625, -0.0590214729309082, -0.057251930236816406, -0.05548238754272461, -0.05371284484863281, -0.051943302154541016, -0.05017375946044922, -0.04840421676635742, -0.046634674072265625, -0.04486513137817383, -0.04309558868408203, -0.041326045989990234, -0.03955650329589844, -0.03778696060180664, -0.036017417907714844, -0.03424787521362305, -0.03247833251953125, -0.030708789825439453, -0.028939247131347656, -0.02716970443725586, -0.025400161743164062, -0.023630619049072266, -0.02186107635498047, -0.020091533660888672, -0.018321990966796875, -0.016552448272705078, -0.014782905578613281, -0.013013362884521484, -0.011243820190429688, -0.00947427749633789, -0.007704734802246094, -0.005935192108154297, -0.0041656494140625, -0.002396106719970703, -0.0006265640258789062, 0.0011429786682128906, 0.0029125213623046875, 0.004682064056396484, 0.006451606750488281, 0.008221149444580078, 0.009990692138671875, 0.011760234832763672, 0.013529777526855469, 0.015299320220947266, 0.017068862915039062, 0.01883840560913086, 0.020607948303222656, 0.022377490997314453, 0.02414703369140625, 0.025916576385498047, 0.027686119079589844, 0.02945566177368164, 0.031225204467773438, 0.032994747161865234, 0.03476428985595703, 0.03653383255004883, 0.038303375244140625, 0.04007291793823242, 0.04184246063232422, 0.043612003326416016, 0.04538154602050781, 0.04715108871459961, 0.048920631408691406, 0.0506901741027832, 0.052459716796875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 85.0, 731.0, 198.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002768824575468898, -0.0024477990809828043, -0.002126773353666067, -0.0018057478591799736, -0.00148472236469388, -0.0011636968702077866, -0.0008426712593063712, -0.0005216456484049559, -0.00020062015391886234, 0.00012040539877489209, 0.0004414309514686465, 0.000762456504162401, 0.0010834820568561554, 0.001404507551342249, 0.0017255331622436643, 0.0020465587731450796, 0.002367584267631173, 0.0026886097621172667, 0.003009635489434004, 0.0033306609839200974, 0.003651686478406191, 0.003972711972892284, 0.004293737467378378, 0.0046147629618644714, 0.004935788922011852, 0.005256814416497946, 0.005577839910984039, 0.005898865405470133, 0.006219890899956226, 0.006540916860103607, 0.006861942354589701, 0.007182967849075794, 0.007503993809223175, 0.007825019769370556, 0.008146044798195362, 0.008467070758342743, 0.00878809578716755, 0.00910912174731493, 0.009430146776139736, 0.009751172736287117, 0.010072197765111923, 0.010393223725259304, 0.01071424875408411, 0.011035274714231491, 0.011356299743056297, 0.011677325703203678, 0.011998350732028484, 0.012319376692175865, 0.012640402652323246, 0.012961428612470627, 0.013282453641295433, 0.013603479601442814, 0.01392450463026762, 0.014245530590415001, 0.014566555619239807, 0.014887581579387188, 0.015208607539534569, 0.01552963349968195, 0.01585065945982933, 0.016171684488654137, 0.016492709517478943, 0.01681373454630375, 0.017134761437773705, 0.01745578646659851, 0.017776811495423317]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 11.0, 9.0, 14.0, 11.0, 12.0, 17.0, 18.0, 14.0, 19.0, 24.0, 19.0, 32.0, 30.0, 36.0, 38.0, 44.0, 46.0, 39.0, 42.0, 42.0, 49.0, 37.0, 37.0, 36.0, 32.0, 35.0, 32.0, 31.0, 33.0, 25.0, 15.0, 18.0, 13.0, 12.0, 11.0, 12.0, 12.0, 8.0, 6.0, 5.0, 5.0, 3.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0], "bins": [-0.0013791322708129883, -0.0013384316116571426, -0.001297730952501297, -0.0012570302933454514, -0.0012163296341896057, -0.00117562897503376, -0.0011349283158779144, -0.0010942276567220688, -0.0010535269975662231, -0.0010128263384103775, -0.0009721256792545319, -0.0009314250200986862, -0.0008907243609428406, -0.0008500237017869949, -0.0008093230426311493, -0.0007686223834753036, -0.000727921724319458, -0.0006872210651636124, -0.0006465204060077667, -0.0006058197468519211, -0.0005651190876960754, -0.0005244184285402298, -0.00048371776938438416, -0.0004430171102285385, -0.00040231645107269287, -0.00036161579191684723, -0.0003209151327610016, -0.00028021447360515594, -0.0002395138144493103, -0.00019881315529346466, -0.00015811249613761902, -0.00011741183698177338, -7.671117782592773e-05, -3.601051867008209e-05, 4.69014048576355e-06, 4.539079964160919e-05, 8.609145879745483e-05, 0.00012679211795330048, 0.00016749277710914612, 0.00020819343626499176, 0.0002488940954208374, 0.00028959475457668304, 0.0003302954137325287, 0.00037099607288837433, 0.00041169673204421997, 0.0004523973912000656, 0.0004930980503559113, 0.0005337987095117569, 0.0005744993686676025, 0.0006152000278234482, 0.0006559006869792938, 0.0006966013461351395, 0.0007373020052909851, 0.0007780026644468307, 0.0008187033236026764, 0.000859403982758522, 0.0009001046419143677, 0.0009408053010702133, 0.000981505960226059, 0.0010222066193819046, 0.0010629072785377502, 0.0011036079376935959, 0.0011443085968494415, 0.0011850092560052872, 0.0012257099151611328]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 5.0, 6.0, 4.0, 9.0, 5.0, 12.0, 11.0, 13.0, 14.0, 17.0, 17.0, 23.0, 40.0, 21.0, 24.0, 20.0, 32.0, 41.0, 48.0, 28.0, 38.0, 45.0, 37.0, 36.0, 39.0, 43.0, 40.0, 29.0, 29.0, 35.0, 31.0, 22.0, 26.0, 24.0, 25.0, 18.0, 15.0, 11.0, 15.0, 10.0, 11.0, 2.0, 8.0, 7.0, 8.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.2890625, -8.03533935546875, -7.7816162109375, -7.52789306640625, -7.274169921875, -7.02044677734375, -6.7667236328125, -6.51300048828125, -6.25927734375, -6.00555419921875, -5.7518310546875, -5.49810791015625, -5.244384765625, -4.99066162109375, -4.7369384765625, -4.48321533203125, -4.2294921875, -3.97576904296875, -3.7220458984375, -3.46832275390625, -3.214599609375, -2.96087646484375, -2.7071533203125, -2.45343017578125, -2.19970703125, -1.94598388671875, -1.6922607421875, -1.43853759765625, -1.184814453125, -0.93109130859375, -0.6773681640625, -0.42364501953125, -0.169921875, 0.08380126953125, 0.3375244140625, 0.59124755859375, 0.844970703125, 1.09869384765625, 1.3524169921875, 1.60614013671875, 1.85986328125, 2.11358642578125, 2.3673095703125, 2.62103271484375, 2.874755859375, 3.12847900390625, 3.3822021484375, 3.63592529296875, 3.8896484375, 4.14337158203125, 4.3970947265625, 4.65081787109375, 4.904541015625, 5.15826416015625, 5.4119873046875, 5.66571044921875, 5.91943359375, 6.17315673828125, 6.4268798828125, 6.68060302734375, 6.934326171875, 7.18804931640625, 7.4417724609375, 7.69549560546875, 7.94921875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 7.0, 13.0, 6.0, 11.0, 17.0, 17.0, 19.0, 30.0, 42.0, 40.0, 64.0, 70.0, 92.0, 147.0, 158.0, 295.0, 439.0, 855.0, 2062.0, 5889.0, 18609.0, 63836.0, 266626.0, 516654.0, 122753.0, 33249.0, 10093.0, 3398.0, 1273.0, 554.0, 359.0, 210.0, 154.0, 108.0, 92.0, 68.0, 51.0, 40.0, 34.0, 24.0, 28.0, 9.0, 20.0, 15.0, 9.0, 5.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.0390625, -7.78173828125, -7.5244140625, -7.26708984375, -7.009765625, -6.75244140625, -6.4951171875, -6.23779296875, -5.98046875, -5.72314453125, -5.4658203125, -5.20849609375, -4.951171875, -4.69384765625, -4.4365234375, -4.17919921875, -3.921875, -3.66455078125, -3.4072265625, -3.14990234375, -2.892578125, -2.63525390625, -2.3779296875, -2.12060546875, -1.86328125, -1.60595703125, -1.3486328125, -1.09130859375, -0.833984375, -0.57666015625, -0.3193359375, -0.06201171875, 0.1953125, 0.45263671875, 0.7099609375, 0.96728515625, 1.224609375, 1.48193359375, 1.7392578125, 1.99658203125, 2.25390625, 2.51123046875, 2.7685546875, 3.02587890625, 3.283203125, 3.54052734375, 3.7978515625, 4.05517578125, 4.3125, 4.56982421875, 4.8271484375, 5.08447265625, 5.341796875, 5.59912109375, 5.8564453125, 6.11376953125, 6.37109375, 6.62841796875, 6.8857421875, 7.14306640625, 7.400390625, 7.65771484375, 7.9150390625, 8.17236328125, 8.4296875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 3.0, 7.0, 6.0, 10.0, 9.0, 11.0, 16.0, 21.0, 26.0, 28.0, 24.0, 36.0, 30.0, 33.0, 48.0, 49.0, 84.0, 130.0, 1684.0, 309.0, 104.0, 48.0, 50.0, 37.0, 22.0, 37.0, 24.0, 27.0, 26.0, 20.0, 15.0, 15.0, 20.0, 7.0, 9.0, 6.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.71875, -32.750244140625, -31.78173828125, -30.813232421875, -29.8447265625, -28.876220703125, -27.90771484375, -26.939208984375, -25.970703125, -25.002197265625, -24.03369140625, -23.065185546875, -22.0966796875, -21.128173828125, -20.15966796875, -19.191162109375, -18.22265625, -17.254150390625, -16.28564453125, -15.317138671875, -14.3486328125, -13.380126953125, -12.41162109375, -11.443115234375, -10.474609375, -9.506103515625, -8.53759765625, -7.569091796875, -6.6005859375, -5.632080078125, -4.66357421875, -3.695068359375, -2.7265625, -1.758056640625, -0.78955078125, 0.178955078125, 1.1474609375, 2.115966796875, 3.08447265625, 4.052978515625, 5.021484375, 5.989990234375, 6.95849609375, 7.927001953125, 8.8955078125, 9.864013671875, 10.83251953125, 11.801025390625, 12.76953125, 13.738037109375, 14.70654296875, 15.675048828125, 16.6435546875, 17.612060546875, 18.58056640625, 19.549072265625, 20.517578125, 21.486083984375, 22.45458984375, 23.423095703125, 24.3916015625, 25.360107421875, 26.32861328125, 27.297119140625, 28.265625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 8.0, 10.0, 13.0, 18.0, 28.0, 34.0, 35.0, 43.0, 73.0, 89.0, 126.0, 142.0, 258.0, 414.0, 1191.0, 74281.0, 3064335.0, 2929.0, 563.0, 312.0, 193.0, 151.0, 98.0, 91.0, 63.0, 55.0, 31.0, 29.0, 23.0, 18.0, 13.0, 9.0, 5.0, 7.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.875, -56.62890625, -54.3828125, -52.13671875, -49.890625, -47.64453125, -45.3984375, -43.15234375, -40.90625, -38.66015625, -36.4140625, -34.16796875, -31.921875, -29.67578125, -27.4296875, -25.18359375, -22.9375, -20.69140625, -18.4453125, -16.19921875, -13.953125, -11.70703125, -9.4609375, -7.21484375, -4.96875, -2.72265625, -0.4765625, 1.76953125, 4.015625, 6.26171875, 8.5078125, 10.75390625, 13.0, 15.24609375, 17.4921875, 19.73828125, 21.984375, 24.23046875, 26.4765625, 28.72265625, 30.96875, 33.21484375, 35.4609375, 37.70703125, 39.953125, 42.19921875, 44.4453125, 46.69140625, 48.9375, 51.18359375, 53.4296875, 55.67578125, 57.921875, 60.16796875, 62.4140625, 64.66015625, 66.90625, 69.15234375, 71.3984375, 73.64453125, 75.890625, 78.13671875, 80.3828125, 82.62890625, 84.875]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 69.0, 410.0, 457.0, 69.0, 8.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.95025634765625, -153.871826171875, -150.7934112548828, -147.71498107910156, -144.63656616210938, -141.55813598632812, -138.47972106933594, -135.4012908935547, -132.3228759765625, -129.24444580078125, -126.16603088378906, -123.08760833740234, -120.00918579101562, -116.9307632446289, -113.85234069824219, -110.77391052246094, -107.69548797607422, -104.6170654296875, -101.53864288330078, -98.46022033691406, -95.38179779052734, -92.30337524414062, -89.22494506835938, -86.14653015136719, -83.06809997558594, -79.98967742919922, -76.9112548828125, -73.83283233642578, -70.75440979003906, -67.67598724365234, -64.59756469726562, -61.51913833618164, -58.44072341918945, -55.362300872802734, -52.283878326416016, -49.20545196533203, -46.12702941894531, -43.048606872558594, -39.970184326171875, -36.891761779785156, -33.81333923339844, -30.73491668701172, -27.656494140625, -24.57806968688965, -21.49964714050293, -18.42122459411621, -15.34280014038086, -12.26437759399414, -9.185955047607422, -6.107532024383545, -3.029109001159668, 0.04931449890136719, 3.127737045288086, 6.206159591674805, 9.284584045410156, 12.363006591796875, 15.441429138183594, 18.519851684570312, 21.59827423095703, 24.676698684692383, 27.7551212310791, 30.83354377746582, 33.91196823120117, 36.99039077758789, 40.06881332397461]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 8.0, 4.0, 3.0, 4.0, 5.0, 2.0, 7.0, 9.0, 11.0, 7.0, 18.0, 11.0, 16.0, 22.0, 21.0, 23.0, 16.0, 35.0, 36.0, 37.0, 35.0, 38.0, 40.0, 43.0, 45.0, 50.0, 46.0, 44.0, 49.0, 29.0, 42.0, 37.0, 21.0, 34.0, 32.0, 23.0, 15.0, 16.0, 13.0, 16.0, 6.0, 6.0, 11.0, 1.0, 5.0, 3.0, 1.0, 8.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-87.60235595703125, -85.01819610595703, -82.43404388427734, -79.84988403320312, -77.26573181152344, -74.68157196044922, -72.09741973876953, -69.51325988769531, -66.92910766601562, -64.3449478149414, -61.76079559326172, -59.176639556884766, -56.59248352050781, -54.008323669433594, -51.42416763305664, -48.84001159667969, -46.25585174560547, -43.671695709228516, -41.08753967285156, -38.50338363647461, -35.919227600097656, -33.33506774902344, -30.750911712646484, -28.16675567626953, -25.582599639892578, -22.998443603515625, -20.414287567138672, -17.830129623413086, -15.245973587036133, -12.66181755065918, -10.07766056060791, -7.493503570556641, -4.909355163574219, -2.3251986503601074, 0.2589578628540039, 2.8431143760681152, 5.427270889282227, 8.01142692565918, 10.59558391571045, 13.179740905761719, 15.763896942138672, 18.348052978515625, 20.932209014892578, 23.516366958618164, 26.100522994995117, 28.68467903137207, 31.268836975097656, 33.85299301147461, 36.43714904785156, 39.021305084228516, 41.60546112060547, 44.18961715698242, 46.773773193359375, 49.357933044433594, 51.94208908081055, 54.5262451171875, 57.11040115356445, 59.694557189941406, 62.27871322631836, 64.86286926269531, 67.44702911376953, 70.03118133544922, 72.61534118652344, 75.19949340820312, 77.78365325927734]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 3.0, 10.0, 3.0, 8.0, 9.0, 12.0, 12.0, 14.0, 16.0, 17.0, 17.0, 25.0, 33.0, 35.0, 19.0, 41.0, 37.0, 35.0, 42.0, 40.0, 33.0, 30.0, 44.0, 48.0, 28.0, 39.0, 34.0, 31.0, 29.0, 23.0, 29.0, 34.0, 28.0, 17.0, 19.0, 18.0, 15.0, 14.0, 7.0, 9.0, 8.0, 9.0, 5.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.9375, -8.67333984375, -8.4091796875, -8.14501953125, -7.880859375, -7.61669921875, -7.3525390625, -7.08837890625, -6.82421875, -6.56005859375, -6.2958984375, -6.03173828125, -5.767578125, -5.50341796875, -5.2392578125, -4.97509765625, -4.7109375, -4.44677734375, -4.1826171875, -3.91845703125, -3.654296875, -3.39013671875, -3.1259765625, -2.86181640625, -2.59765625, -2.33349609375, -2.0693359375, -1.80517578125, -1.541015625, -1.27685546875, -1.0126953125, -0.74853515625, -0.484375, -0.22021484375, 0.0439453125, 0.30810546875, 0.572265625, 0.83642578125, 1.1005859375, 1.36474609375, 1.62890625, 1.89306640625, 2.1572265625, 2.42138671875, 2.685546875, 2.94970703125, 3.2138671875, 3.47802734375, 3.7421875, 4.00634765625, 4.2705078125, 4.53466796875, 4.798828125, 5.06298828125, 5.3271484375, 5.59130859375, 5.85546875, 6.11962890625, 6.3837890625, 6.64794921875, 6.912109375, 7.17626953125, 7.4404296875, 7.70458984375, 7.96875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 5.0, 7.0, 5.0, 17.0, 10.0, 9.0, 19.0, 18.0, 21.0, 51.0, 58.0, 49.0, 93.0, 97.0, 165.0, 241.0, 467.0, 1118.0, 3896.0, 33551.0, 1599407.0, 2486005.0, 61120.0, 5080.0, 1283.0, 528.0, 259.0, 170.0, 129.0, 71.0, 77.0, 51.0, 41.0, 30.0, 27.0, 20.0, 22.0, 12.0, 12.0, 5.0, 2.0, 6.0, 5.0, 8.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-29.0, -28.12353515625, -27.2470703125, -26.37060546875, -25.494140625, -24.61767578125, -23.7412109375, -22.86474609375, -21.98828125, -21.11181640625, -20.2353515625, -19.35888671875, -18.482421875, -17.60595703125, -16.7294921875, -15.85302734375, -14.9765625, -14.10009765625, -13.2236328125, -12.34716796875, -11.470703125, -10.59423828125, -9.7177734375, -8.84130859375, -7.96484375, -7.08837890625, -6.2119140625, -5.33544921875, -4.458984375, -3.58251953125, -2.7060546875, -1.82958984375, -0.953125, -0.07666015625, 0.7998046875, 1.67626953125, 2.552734375, 3.42919921875, 4.3056640625, 5.18212890625, 6.05859375, 6.93505859375, 7.8115234375, 8.68798828125, 9.564453125, 10.44091796875, 11.3173828125, 12.19384765625, 13.0703125, 13.94677734375, 14.8232421875, 15.69970703125, 16.576171875, 17.45263671875, 18.3291015625, 19.20556640625, 20.08203125, 20.95849609375, 21.8349609375, 22.71142578125, 23.587890625, 24.46435546875, 25.3408203125, 26.21728515625, 27.09375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 11.0, 25.0, 16.0, 43.0, 65.0, 138.0, 244.0, 413.0, 711.0, 853.0, 697.0, 349.0, 197.0, 131.0, 68.0, 40.0, 29.0, 15.0, 9.0, 3.0, 5.0, 1.0, 5.0, 3.0], "bins": [-40.71875, -39.8955078125, -39.072265625, -38.2490234375, -37.42578125, -36.6025390625, -35.779296875, -34.9560546875, -34.1328125, -33.3095703125, -32.486328125, -31.6630859375, -30.83984375, -30.0166015625, -29.193359375, -28.3701171875, -27.546875, -26.7236328125, -25.900390625, -25.0771484375, -24.25390625, -23.4306640625, -22.607421875, -21.7841796875, -20.9609375, -20.1376953125, -19.314453125, -18.4912109375, -17.66796875, -16.8447265625, -16.021484375, -15.1982421875, -14.375, -13.5517578125, -12.728515625, -11.9052734375, -11.08203125, -10.2587890625, -9.435546875, -8.6123046875, -7.7890625, -6.9658203125, -6.142578125, -5.3193359375, -4.49609375, -3.6728515625, -2.849609375, -2.0263671875, -1.203125, -0.3798828125, 0.443359375, 1.2666015625, 2.08984375, 2.9130859375, 3.736328125, 4.5595703125, 5.3828125, 6.2060546875, 7.029296875, 7.8525390625, 8.67578125, 9.4990234375, 10.322265625, 11.1455078125, 11.96875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 15.0, 5.0, 22.0, 27.0, 62.0, 112.0, 170.0, 277.0, 475.0, 2025.0, 4129175.0, 60112.0, 822.0, 409.0, 241.0, 151.0, 77.0, 45.0, 24.0, 24.0, 2.0, 8.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.9375, -66.1337890625, -61.330078125, -56.5263671875, -51.72265625, -46.9189453125, -42.115234375, -37.3115234375, -32.5078125, -27.7041015625, -22.900390625, -18.0966796875, -13.29296875, -8.4892578125, -3.685546875, 1.1181640625, 5.921875, 10.7255859375, 15.529296875, 20.3330078125, 25.13671875, 29.9404296875, 34.744140625, 39.5478515625, 44.3515625, 49.1552734375, 53.958984375, 58.7626953125, 63.56640625, 68.3701171875, 73.173828125, 77.9775390625, 82.78125, 87.5849609375, 92.388671875, 97.1923828125, 101.99609375, 106.7998046875, 111.603515625, 116.4072265625, 121.2109375, 126.0146484375, 130.818359375, 135.6220703125, 140.42578125, 145.2294921875, 150.033203125, 154.8369140625, 159.640625, 164.4443359375, 169.248046875, 174.0517578125, 178.85546875, 183.6591796875, 188.462890625, 193.2666015625, 198.0703125, 202.8740234375, 207.677734375, 212.4814453125, 217.28515625, 222.0888671875, 226.892578125, 231.6962890625, 236.5]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 13.0, 19.0, 34.0, 62.0, 116.0, 161.0, 130.0, 164.0, 139.0, 78.0, 45.0, 19.0, 11.0, 5.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-52.40932083129883, -50.007816314697266, -47.60630798339844, -45.204803466796875, -42.80329895019531, -40.401790618896484, -38.00028610229492, -35.598777770996094, -33.19727325439453, -30.795766830444336, -28.39426040649414, -25.992755889892578, -23.591249465942383, -21.189743041992188, -18.788238525390625, -16.38673210144043, -13.985225677490234, -11.583719253540039, -9.18221378326416, -6.780707836151123, -4.379201889038086, -1.9776954650878906, 0.4238100051879883, 2.825315475463867, 5.2268218994140625, 7.6283278465271, 10.029833793640137, 12.431339263916016, 14.832845687866211, 17.234352111816406, 19.63585662841797, 22.037363052368164, 24.438873291015625, 26.84037971496582, 29.241886138916016, 31.643390655517578, 34.044898986816406, 36.44640350341797, 38.84790802001953, 41.249412536621094, 43.65092086791992, 46.052425384521484, 48.45393371582031, 50.855438232421875, 53.25694274902344, 55.658451080322266, 58.05995559692383, 60.461463928222656, 62.86296844482422, 65.26447296142578, 67.66597747802734, 70.06748962402344, 72.468994140625, 74.87049865722656, 77.27200317382812, 79.67350769042969, 82.07501220703125, 84.47651672363281, 86.87802124023438, 89.27953338623047, 91.68103790283203, 94.0825424194336, 96.48404693603516, 98.88555145263672, 101.28706359863281]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 6.0, 9.0, 5.0, 8.0, 7.0, 15.0, 17.0, 24.0, 20.0, 21.0, 34.0, 27.0, 36.0, 39.0, 36.0, 42.0, 41.0, 43.0, 38.0, 49.0, 35.0, 36.0, 44.0, 37.0, 39.0, 32.0, 41.0, 23.0, 26.0, 29.0, 17.0, 28.0, 14.0, 18.0, 13.0, 14.0, 7.0, 10.0, 4.0, 6.0, 2.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.11839294433594, -44.52022933959961, -42.92206573486328, -41.32390213012695, -39.725738525390625, -38.1275749206543, -36.52941131591797, -34.93124771118164, -33.33308410644531, -31.734920501708984, -30.136756896972656, -28.538593292236328, -26.9404296875, -25.342266082763672, -23.744102478027344, -22.145938873291016, -20.547775268554688, -18.94961166381836, -17.35144805908203, -15.753284454345703, -14.155120849609375, -12.556957244873047, -10.958793640136719, -9.36063003540039, -7.7624664306640625, -6.164302825927734, -4.566139221191406, -2.967975616455078, -1.36981201171875, 0.22835159301757812, 1.8265151977539062, 3.4246788024902344, 5.0228424072265625, 6.621006011962891, 8.219169616699219, 9.817333221435547, 11.415496826171875, 13.013660430908203, 14.611824035644531, 16.20998764038086, 17.808151245117188, 19.406314849853516, 21.004478454589844, 22.602642059326172, 24.2008056640625, 25.798969268798828, 27.397132873535156, 28.995296478271484, 30.593460083007812, 32.19162368774414, 33.78978729248047, 35.3879508972168, 36.986114501953125, 38.58427810668945, 40.18244171142578, 41.78060531616211, 43.37876892089844, 44.976932525634766, 46.575096130371094, 48.17325973510742, 49.77142333984375, 51.36958694458008, 52.967750549316406, 54.565914154052734, 56.16407775878906]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 6.0, 11.0, 11.0, 11.0, 25.0, 15.0, 16.0, 26.0, 26.0, 27.0, 30.0, 48.0, 35.0, 39.0, 43.0, 44.0, 46.0, 50.0, 39.0, 48.0, 46.0, 31.0, 37.0, 29.0, 24.0, 35.0, 24.0, 25.0, 24.0, 26.0, 23.0, 12.0, 15.0, 13.0, 6.0, 7.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.8828125, -9.5882568359375, -9.293701171875, -8.9991455078125, -8.70458984375, -8.4100341796875, -8.115478515625, -7.8209228515625, -7.5263671875, -7.2318115234375, -6.937255859375, -6.6427001953125, -6.34814453125, -6.0535888671875, -5.759033203125, -5.4644775390625, -5.169921875, -4.8753662109375, -4.580810546875, -4.2862548828125, -3.99169921875, -3.6971435546875, -3.402587890625, -3.1080322265625, -2.8134765625, -2.5189208984375, -2.224365234375, -1.9298095703125, -1.63525390625, -1.3406982421875, -1.046142578125, -0.7515869140625, -0.45703125, -0.1624755859375, 0.132080078125, 0.4266357421875, 0.72119140625, 1.0157470703125, 1.310302734375, 1.6048583984375, 1.8994140625, 2.1939697265625, 2.488525390625, 2.7830810546875, 3.07763671875, 3.3721923828125, 3.666748046875, 3.9613037109375, 4.255859375, 4.5504150390625, 4.844970703125, 5.1395263671875, 5.43408203125, 5.7286376953125, 6.023193359375, 6.3177490234375, 6.6123046875, 6.9068603515625, 7.201416015625, 7.4959716796875, 7.79052734375, 8.0850830078125, 8.379638671875, 8.6741943359375, 8.96875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 12.0, 22.0, 17.0, 27.0, 48.0, 71.0, 89.0, 160.0, 194.0, 343.0, 511.0, 684.0, 985.0, 1531.0, 2279.0, 3502.0, 5148.0, 7760.0, 12200.0, 18601.0, 29577.0, 46390.0, 74663.0, 116828.0, 170651.0, 183648.0, 134077.0, 86708.0, 54625.0, 34365.0, 21825.0, 14043.0, 8999.0, 5948.0, 4036.0, 2641.0, 1742.0, 1183.0, 791.0, 511.0, 343.0, 264.0, 153.0, 137.0, 83.0, 51.0, 29.0, 20.0, 12.0, 19.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.88623046875, -0.8577957153320312, -0.8293609619140625, -0.8009262084960938, -0.772491455078125, -0.7440567016601562, -0.7156219482421875, -0.6871871948242188, -0.65875244140625, -0.6303176879882812, -0.6018829345703125, -0.5734481811523438, -0.545013427734375, -0.5165786743164062, -0.4881439208984375, -0.45970916748046875, -0.4312744140625, -0.40283966064453125, -0.3744049072265625, -0.34597015380859375, -0.317535400390625, -0.28910064697265625, -0.2606658935546875, -0.23223114013671875, -0.20379638671875, -0.17536163330078125, -0.1469268798828125, -0.11849212646484375, -0.090057373046875, -0.06162261962890625, -0.0331878662109375, -0.00475311279296875, 0.023681640625, 0.05211639404296875, 0.0805511474609375, 0.10898590087890625, 0.137420654296875, 0.16585540771484375, 0.1942901611328125, 0.22272491455078125, 0.25115966796875, 0.27959442138671875, 0.3080291748046875, 0.33646392822265625, 0.364898681640625, 0.39333343505859375, 0.4217681884765625, 0.45020294189453125, 0.4786376953125, 0.5070724487304688, 0.5355072021484375, 0.5639419555664062, 0.592376708984375, 0.6208114624023438, 0.6492462158203125, 0.6776809692382812, 0.70611572265625, 0.7345504760742188, 0.7629852294921875, 0.7914199829101562, 0.819854736328125, 0.8482894897460938, 0.8767242431640625, 0.9051589965820312, 0.93359375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 2.0, 8.0, 12.0, 8.0, 9.0, 12.0, 20.0, 14.0, 24.0, 27.0, 29.0, 16.0, 28.0, 23.0, 46.0, 43.0, 32.0, 30.0, 46.0, 28.0, 1063.0, 43.0, 37.0, 31.0, 37.0, 37.0, 33.0, 24.0, 38.0, 26.0, 30.0, 32.0, 19.0, 20.0, 20.0, 12.0, 4.0, 10.0, 12.0, 8.0, 5.0, 4.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.5625, -5.39666748046875, -5.2308349609375, -5.06500244140625, -4.899169921875, -4.73333740234375, -4.5675048828125, -4.40167236328125, -4.23583984375, -4.07000732421875, -3.9041748046875, -3.73834228515625, -3.572509765625, -3.40667724609375, -3.2408447265625, -3.07501220703125, -2.9091796875, -2.74334716796875, -2.5775146484375, -2.41168212890625, -2.245849609375, -2.08001708984375, -1.9141845703125, -1.74835205078125, -1.58251953125, -1.41668701171875, -1.2508544921875, -1.08502197265625, -0.919189453125, -0.75335693359375, -0.5875244140625, -0.42169189453125, -0.255859375, -0.09002685546875, 0.0758056640625, 0.24163818359375, 0.407470703125, 0.57330322265625, 0.7391357421875, 0.90496826171875, 1.07080078125, 1.23663330078125, 1.4024658203125, 1.56829833984375, 1.734130859375, 1.89996337890625, 2.0657958984375, 2.23162841796875, 2.3974609375, 2.56329345703125, 2.7291259765625, 2.89495849609375, 3.060791015625, 3.22662353515625, 3.3924560546875, 3.55828857421875, 3.72412109375, 3.88995361328125, 4.0557861328125, 4.22161865234375, 4.387451171875, 4.55328369140625, 4.7191162109375, 4.88494873046875, 5.05078125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 4.0, 10.0, 14.0, 22.0, 33.0, 41.0, 72.0, 77.0, 113.0, 168.0, 240.0, 312.0, 459.0, 707.0, 914.0, 1237.0, 1779.0, 2562.0, 3622.0, 4968.0, 6925.0, 9732.0, 13827.0, 19379.0, 27663.0, 39790.0, 56925.0, 81763.0, 113800.0, 1138875.0, 194193.0, 110783.0, 79187.0, 55626.0, 38747.0, 26958.0, 18962.0, 13295.0, 9610.0, 6802.0, 4793.0, 3458.0, 2510.0, 1681.0, 1275.0, 942.0, 627.0, 461.0, 381.0, 256.0, 160.0, 106.0, 99.0, 66.0, 44.0, 29.0, 29.0, 9.0, 10.0, 8.0, 1.0], "bins": [-0.705078125, -0.683685302734375, -0.66229248046875, -0.640899658203125, -0.6195068359375, -0.598114013671875, -0.57672119140625, -0.555328369140625, -0.533935546875, -0.512542724609375, -0.49114990234375, -0.469757080078125, -0.4483642578125, -0.426971435546875, -0.40557861328125, -0.384185791015625, -0.36279296875, -0.341400146484375, -0.32000732421875, -0.298614501953125, -0.2772216796875, -0.255828857421875, -0.23443603515625, -0.213043212890625, -0.191650390625, -0.170257568359375, -0.14886474609375, -0.127471923828125, -0.1060791015625, -0.084686279296875, -0.06329345703125, -0.041900634765625, -0.0205078125, 0.000885009765625, 0.02227783203125, 0.043670654296875, 0.0650634765625, 0.086456298828125, 0.10784912109375, 0.129241943359375, 0.150634765625, 0.172027587890625, 0.19342041015625, 0.214813232421875, 0.2362060546875, 0.257598876953125, 0.27899169921875, 0.300384521484375, 0.32177734375, 0.343170166015625, 0.36456298828125, 0.385955810546875, 0.4073486328125, 0.428741455078125, 0.45013427734375, 0.471527099609375, 0.492919921875, 0.514312744140625, 0.53570556640625, 0.557098388671875, 0.5784912109375, 0.599884033203125, 0.62127685546875, 0.642669677734375, 0.6640625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 3.0, 4.0, 3.0, 11.0, 12.0, 13.0, 11.0, 16.0, 21.0, 31.0, 38.0, 33.0, 32.0, 44.0, 58.0, 59.0, 61.0, 76.0, 58.0, 48.0, 49.0, 45.0, 40.0, 44.0, 32.0, 26.0, 27.0, 18.0, 14.0, 9.0, 8.0, 8.0, 12.0, 6.0, 8.0, 6.0, 3.0, 1.0, 3.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002246856689453125, -0.002174675464630127, -0.002102494239807129, -0.002030313014984131, -0.001958131790161133, -0.0018859505653381348, -0.0018137693405151367, -0.0017415881156921387, -0.0016694068908691406, -0.0015972256660461426, -0.0015250444412231445, -0.0014528632164001465, -0.0013806819915771484, -0.0013085007667541504, -0.0012363195419311523, -0.0011641383171081543, -0.0010919570922851562, -0.0010197758674621582, -0.0009475946426391602, -0.0008754134178161621, -0.0008032321929931641, -0.000731050968170166, -0.000658869743347168, -0.0005866885185241699, -0.0005145072937011719, -0.00044232606887817383, -0.0003701448440551758, -0.00029796361923217773, -0.0002257823944091797, -0.00015360116958618164, -8.14199447631836e-05, -9.238719940185547e-06, 6.29425048828125e-05, 0.00013512372970581055, 0.0002073049545288086, 0.00027948617935180664, 0.0003516674041748047, 0.00042384862899780273, 0.0004960298538208008, 0.0005682110786437988, 0.0006403923034667969, 0.0007125735282897949, 0.000784754753112793, 0.000856935977935791, 0.0009291172027587891, 0.0010012984275817871, 0.0010734796524047852, 0.0011456608772277832, 0.0012178421020507812, 0.0012900233268737793, 0.0013622045516967773, 0.0014343857765197754, 0.0015065670013427734, 0.0015787482261657715, 0.0016509294509887695, 0.0017231106758117676, 0.0017952919006347656, 0.0018674731254577637, 0.0019396543502807617, 0.0020118355751037598, 0.002084016799926758, 0.002156198024749756, 0.002228379249572754, 0.002300560474395752, 0.00237274169921875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 3.0, 4.0, 6.0, 5.0, 8.0, 10.0, 15.0, 11.0, 8.0, 15.0, 20.0, 16.0, 25.0, 40.0, 42.0, 69.0, 90.0, 117.0, 188.0, 427.0, 1383.0, 798009.0, 245838.0, 1108.0, 389.0, 181.0, 128.0, 91.0, 69.0, 57.0, 37.0, 32.0, 27.0, 14.0, 17.0, 9.0, 14.0, 11.0, 11.0, 6.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.053680419921875, -0.05204963684082031, -0.050418853759765625, -0.04878807067871094, -0.04715728759765625, -0.04552650451660156, -0.043895721435546875, -0.04226493835449219, -0.0406341552734375, -0.03900337219238281, -0.037372589111328125, -0.03574180603027344, -0.03411102294921875, -0.03248023986816406, -0.030849456787109375, -0.029218673706054688, -0.027587890625, -0.025957107543945312, -0.024326324462890625, -0.022695541381835938, -0.02106475830078125, -0.019433975219726562, -0.017803192138671875, -0.016172409057617188, -0.0145416259765625, -0.012910842895507812, -0.011280059814453125, -0.009649276733398438, -0.00801849365234375, -0.0063877105712890625, -0.004756927490234375, -0.0031261444091796875, -0.001495361328125, 0.0001354217529296875, 0.001766204833984375, 0.0033969879150390625, 0.00502777099609375, 0.0066585540771484375, 0.008289337158203125, 0.009920120239257812, 0.0115509033203125, 0.013181686401367188, 0.014812469482421875, 0.016443252563476562, 0.01807403564453125, 0.019704818725585938, 0.021335601806640625, 0.022966384887695312, 0.02459716796875, 0.026227951049804688, 0.027858734130859375, 0.029489517211914062, 0.03112030029296875, 0.03275108337402344, 0.034381866455078125, 0.03601264953613281, 0.0376434326171875, 0.03927421569824219, 0.040904998779296875, 0.04253578186035156, 0.04416656494140625, 0.04579734802246094, 0.047428131103515625, 0.04905891418457031, 0.050689697265625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 45.0, 115.0, 169.0, 248.0, 218.0, 133.0, 42.0, 30.0, 7.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004393134266138077, -0.004306461662054062, -0.004219789523631334, -0.004133117385208607, -0.004046444781124592, -0.003959772177040577, -0.0038731000386178493, -0.003786427667364478, -0.003699755296111107, -0.0036130829248577356, -0.0035264105536043644, -0.003439738182350993, -0.003353065811097622, -0.0032663934398442507, -0.0031797210685908794, -0.003093048697337508, -0.003006376326084137, -0.0029197039548307657, -0.0028330315835773945, -0.0027463592123240232, -0.002659686841070652, -0.0025730144698172808, -0.0024863420985639095, -0.0023996697273105383, -0.002312997356057167, -0.002226324984803796, -0.0021396526135504246, -0.0020529802422970533, -0.001966307871043682, -0.0018796354997903109, -0.0017929631285369396, -0.0017062907572835684, -0.001619618502445519, -0.0015329461311921477, -0.0014462737599387765, -0.0013596013886854053, -0.001272929017432034, -0.0011862566461786628, -0.0010995842749252915, -0.0010129119036719203, -0.0009262395324185491, -0.0008395671611651778, -0.0007528947899118066, -0.0006662224186584353, -0.0005795500474050641, -0.0004928776761516929, -0.00040620530489832163, -0.0003195329336449504, -0.00023286056239157915, -0.0001461881911382079, -5.9515819884836674e-05, 2.7156551368534565e-05, 0.0001138289226219058, 0.00020050129387527704, 0.0002871736651286483, 0.0003738460363820195, 0.00046051840763539076, 0.000547190778888762, 0.0006338631501421332, 0.0007205355213955045, 0.0008072078926488757, 0.000893880263902247, 0.0009805526351556182, 0.0010672250064089894, 0.0011538973776623607]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 8.0, 7.0, 4.0, 8.0, 13.0, 12.0, 16.0, 13.0, 26.0, 28.0, 24.0, 35.0, 33.0, 39.0, 40.0, 50.0, 51.0, 50.0, 51.0, 44.0, 43.0, 37.0, 43.0, 35.0, 43.0, 34.0, 37.0, 39.0, 23.0, 19.0, 15.0, 14.0, 16.0, 6.0, 15.0, 11.0, 5.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012528300285339355, -0.0012106718495488167, -0.0011685136705636978, -0.001126355491578579, -0.00108419731259346, -0.0010420391336083412, -0.0009998809546232224, -0.0009577227756381035, -0.0009155645966529846, -0.0008734064176678658, -0.0008312482386827469, -0.000789090059697628, -0.0007469318807125092, -0.0007047737017273903, -0.0006626155227422714, -0.0006204573437571526, -0.0005782991647720337, -0.0005361409857869148, -0.000493982806801796, -0.0004518246278166771, -0.00040966644883155823, -0.00036750826984643936, -0.0003253500908613205, -0.00028319191187620163, -0.00024103373289108276, -0.0001988755539059639, -0.00015671737492084503, -0.00011455919593572617, -7.24010169506073e-05, -3.0242837965488434e-05, 1.1915341019630432e-05, 5.40735200047493e-05, 9.623169898986816e-05, 0.00013838987797498703, 0.0001805480569601059, 0.00022270623594522476, 0.00026486441493034363, 0.0003070225939154625, 0.00034918077290058136, 0.0003913389518857002, 0.0004334971308708191, 0.00047565530985593796, 0.0005178134888410568, 0.0005599716678261757, 0.0006021298468112946, 0.0006442880257964134, 0.0006864462047815323, 0.0007286043837666512, 0.00077076256275177, 0.0008129207417368889, 0.0008550789207220078, 0.0008972370997071266, 0.0009393952786922455, 0.0009815534576773643, 0.0010237116366624832, 0.001065869815647602, 0.001108027994632721, 0.0011501861736178398, 0.0011923443526029587, 0.0012345025315880775, 0.0012766607105731964, 0.0013188188895583153, 0.0013609770685434341, 0.001403135247528553, 0.0014452934265136719]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 6.0, 11.0, 11.0, 11.0, 25.0, 15.0, 16.0, 26.0, 26.0, 27.0, 30.0, 48.0, 35.0, 39.0, 43.0, 44.0, 46.0, 50.0, 39.0, 48.0, 46.0, 31.0, 37.0, 29.0, 24.0, 35.0, 24.0, 25.0, 24.0, 26.0, 23.0, 12.0, 15.0, 13.0, 6.0, 7.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.8828125, -9.5882568359375, -9.293701171875, -8.9991455078125, -8.70458984375, -8.4100341796875, -8.115478515625, -7.8209228515625, -7.5263671875, -7.2318115234375, -6.937255859375, -6.6427001953125, -6.34814453125, -6.0535888671875, -5.759033203125, -5.4644775390625, -5.169921875, -4.8753662109375, -4.580810546875, -4.2862548828125, -3.99169921875, -3.6971435546875, -3.402587890625, -3.1080322265625, -2.8134765625, -2.5189208984375, -2.224365234375, -1.9298095703125, -1.63525390625, -1.3406982421875, -1.046142578125, -0.7515869140625, -0.45703125, -0.1624755859375, 0.132080078125, 0.4266357421875, 0.72119140625, 1.0157470703125, 1.310302734375, 1.6048583984375, 1.8994140625, 2.1939697265625, 2.488525390625, 2.7830810546875, 3.07763671875, 3.3721923828125, 3.666748046875, 3.9613037109375, 4.255859375, 4.5504150390625, 4.844970703125, 5.1395263671875, 5.43408203125, 5.7286376953125, 6.023193359375, 6.3177490234375, 6.6123046875, 6.9068603515625, 7.201416015625, 7.4959716796875, 7.79052734375, 8.0850830078125, 8.379638671875, 8.6741943359375, 8.96875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 10.0, 9.0, 11.0, 14.0, 12.0, 19.0, 38.0, 33.0, 55.0, 59.0, 91.0, 129.0, 198.0, 301.0, 508.0, 873.0, 1921.0, 8916.0, 107212.0, 845232.0, 72031.0, 7032.0, 1683.0, 780.0, 438.0, 262.0, 160.0, 145.0, 85.0, 77.0, 50.0, 48.0, 35.0, 19.0, 19.0, 13.0, 11.0, 7.0, 7.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.21875, -17.673828125, -17.12890625, -16.583984375, -16.0390625, -15.494140625, -14.94921875, -14.404296875, -13.859375, -13.314453125, -12.76953125, -12.224609375, -11.6796875, -11.134765625, -10.58984375, -10.044921875, -9.5, -8.955078125, -8.41015625, -7.865234375, -7.3203125, -6.775390625, -6.23046875, -5.685546875, -5.140625, -4.595703125, -4.05078125, -3.505859375, -2.9609375, -2.416015625, -1.87109375, -1.326171875, -0.78125, -0.236328125, 0.30859375, 0.853515625, 1.3984375, 1.943359375, 2.48828125, 3.033203125, 3.578125, 4.123046875, 4.66796875, 5.212890625, 5.7578125, 6.302734375, 6.84765625, 7.392578125, 7.9375, 8.482421875, 9.02734375, 9.572265625, 10.1171875, 10.662109375, 11.20703125, 11.751953125, 12.296875, 12.841796875, 13.38671875, 13.931640625, 14.4765625, 15.021484375, 15.56640625, 16.111328125, 16.65625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 8.0, 7.0, 5.0, 7.0, 9.0, 11.0, 14.0, 11.0, 26.0, 24.0, 33.0, 39.0, 41.0, 37.0, 61.0, 59.0, 108.0, 1584.0, 434.0, 105.0, 66.0, 59.0, 58.0, 45.0, 37.0, 37.0, 27.0, 17.0, 23.0, 20.0, 17.0, 7.0, 5.0, 7.0, 2.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.71875, -38.61474609375, -37.5107421875, -36.40673828125, -35.302734375, -34.19873046875, -33.0947265625, -31.99072265625, -30.88671875, -29.78271484375, -28.6787109375, -27.57470703125, -26.470703125, -25.36669921875, -24.2626953125, -23.15869140625, -22.0546875, -20.95068359375, -19.8466796875, -18.74267578125, -17.638671875, -16.53466796875, -15.4306640625, -14.32666015625, -13.22265625, -12.11865234375, -11.0146484375, -9.91064453125, -8.806640625, -7.70263671875, -6.5986328125, -5.49462890625, -4.390625, -3.28662109375, -2.1826171875, -1.07861328125, 0.025390625, 1.12939453125, 2.2333984375, 3.33740234375, 4.44140625, 5.54541015625, 6.6494140625, 7.75341796875, 8.857421875, 9.96142578125, 11.0654296875, 12.16943359375, 13.2734375, 14.37744140625, 15.4814453125, 16.58544921875, 17.689453125, 18.79345703125, 19.8974609375, 21.00146484375, 22.10546875, 23.20947265625, 24.3134765625, 25.41748046875, 26.521484375, 27.62548828125, 28.7294921875, 29.83349609375, 30.9375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 4.0, 8.0, 3.0, 11.0, 25.0, 17.0, 29.0, 20.0, 38.0, 49.0, 55.0, 76.0, 145.0, 260.0, 583.0, 4022.0, 3133843.0, 5252.0, 536.0, 255.0, 137.0, 82.0, 63.0, 42.0, 29.0, 28.0, 16.0, 14.0, 13.0, 12.0, 10.0, 6.0, 4.0, 8.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.125, -89.861328125, -86.59765625, -83.333984375, -80.0703125, -76.806640625, -73.54296875, -70.279296875, -67.015625, -63.751953125, -60.48828125, -57.224609375, -53.9609375, -50.697265625, -47.43359375, -44.169921875, -40.90625, -37.642578125, -34.37890625, -31.115234375, -27.8515625, -24.587890625, -21.32421875, -18.060546875, -14.796875, -11.533203125, -8.26953125, -5.005859375, -1.7421875, 1.521484375, 4.78515625, 8.048828125, 11.3125, 14.576171875, 17.83984375, 21.103515625, 24.3671875, 27.630859375, 30.89453125, 34.158203125, 37.421875, 40.685546875, 43.94921875, 47.212890625, 50.4765625, 53.740234375, 57.00390625, 60.267578125, 63.53125, 66.794921875, 70.05859375, 73.322265625, 76.5859375, 79.849609375, 83.11328125, 86.376953125, 89.640625, 92.904296875, 96.16796875, 99.431640625, 102.6953125, 105.958984375, 109.22265625, 112.486328125, 115.75]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 52.0, 309.0, 462.0, 171.0, 16.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.937437057495117, -29.34268569946289, -26.747934341430664, -24.153182983398438, -21.558429718017578, -18.963680267333984, -16.368927001953125, -13.774175643920898, -11.179424285888672, -8.584672927856445, -5.9899210929870605, -3.395169258117676, -0.8004179000854492, 1.7943334579467773, 4.38908576965332, 6.983837127685547, 9.578588485717773, 12.17333984375, 14.768091201782227, 17.362842559814453, 19.957595825195312, 22.552345275878906, 25.147098541259766, 27.741849899291992, 30.33660125732422, 32.93135452270508, 35.52610397338867, 38.12085723876953, 40.715606689453125, 43.310359954833984, 45.905113220214844, 48.49986267089844, 51.09461212158203, 53.68936538696289, 56.284114837646484, 58.878868103027344, 61.47361755371094, 64.06836700439453, 66.66312408447266, 69.25787353515625, 71.85262298583984, 74.44737243652344, 77.04212951660156, 79.63687896728516, 82.23162841796875, 84.82637786865234, 87.42113494873047, 90.01588439941406, 92.61064147949219, 95.20539093017578, 97.8001480102539, 100.3948974609375, 102.9896469116211, 105.58439636230469, 108.17915344238281, 110.7739028930664, 113.36865234375, 115.9634017944336, 118.55815887451172, 121.15290832519531, 123.7476577758789, 126.3424072265625, 128.93716430664062, 131.53192138671875, 134.1266632080078]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 6.0, 6.0, 14.0, 14.0, 17.0, 21.0, 20.0, 22.0, 17.0, 21.0, 31.0, 37.0, 28.0, 32.0, 58.0, 43.0, 45.0, 42.0, 46.0, 32.0, 47.0, 27.0, 40.0, 45.0, 24.0, 27.0, 26.0, 33.0, 25.0, 15.0, 23.0, 18.0, 20.0, 23.0, 9.0, 8.0, 7.0, 5.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.18292999267578, -84.43472290039062, -81.68651580810547, -78.93831634521484, -76.19010925292969, -73.44190216064453, -70.69369506835938, -67.94549560546875, -65.1972885131836, -62.44908142089844, -59.70087814331055, -56.95267105102539, -54.2044677734375, -51.456260681152344, -48.70805358886719, -45.9598503112793, -43.21164321899414, -40.463436126708984, -37.715232849121094, -34.96702575683594, -32.21882247924805, -29.47061538696289, -26.722410202026367, -23.974205017089844, -21.22599983215332, -18.477794647216797, -15.729589462280273, -12.981383323669434, -10.23317813873291, -7.484972953796387, -4.736766815185547, -1.9885616302490234, 0.7596435546875, 3.5078489780426025, 6.256054401397705, 9.004260063171387, 11.75246524810791, 14.500670433044434, 17.248876571655273, 19.997081756591797, 22.74528694152832, 25.493492126464844, 28.241697311401367, 30.98990249633789, 33.73810958862305, 36.48631286621094, 39.234519958496094, 41.98272705078125, 44.73093032836914, 47.4791374206543, 50.22734069824219, 52.975547790527344, 55.723751068115234, 58.47195816040039, 61.22016143798828, 63.96836853027344, 66.7165756225586, 69.46478271484375, 72.2129898071289, 74.96118927001953, 77.70939636230469, 80.45760345458984, 83.205810546875, 85.95401000976562, 88.70221710205078]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 6.0, 5.0, 9.0, 20.0, 21.0, 17.0, 11.0, 21.0, 20.0, 22.0, 35.0, 40.0, 42.0, 36.0, 37.0, 30.0, 50.0, 44.0, 45.0, 41.0, 44.0, 38.0, 44.0, 30.0, 22.0, 34.0, 34.0, 30.0, 18.0, 15.0, 18.0, 26.0, 12.0, 17.0, 12.0, 11.0, 7.0, 8.0, 8.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.2109375, -9.9134521484375, -9.615966796875, -9.3184814453125, -9.02099609375, -8.7235107421875, -8.426025390625, -8.1285400390625, -7.8310546875, -7.5335693359375, -7.236083984375, -6.9385986328125, -6.64111328125, -6.3436279296875, -6.046142578125, -5.7486572265625, -5.451171875, -5.1536865234375, -4.856201171875, -4.5587158203125, -4.26123046875, -3.9637451171875, -3.666259765625, -3.3687744140625, -3.0712890625, -2.7738037109375, -2.476318359375, -2.1788330078125, -1.88134765625, -1.5838623046875, -1.286376953125, -0.9888916015625, -0.69140625, -0.3939208984375, -0.096435546875, 0.2010498046875, 0.49853515625, 0.7960205078125, 1.093505859375, 1.3909912109375, 1.6884765625, 1.9859619140625, 2.283447265625, 2.5809326171875, 2.87841796875, 3.1759033203125, 3.473388671875, 3.7708740234375, 4.068359375, 4.3658447265625, 4.663330078125, 4.9608154296875, 5.25830078125, 5.5557861328125, 5.853271484375, 6.1507568359375, 6.4482421875, 6.7457275390625, 7.043212890625, 7.3406982421875, 7.63818359375, 7.9356689453125, 8.233154296875, 8.5306396484375, 8.828125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 6.0, 5.0, 11.0, 21.0, 19.0, 18.0, 30.0, 40.0, 63.0, 75.0, 95.0, 173.0, 248.0, 380.0, 690.0, 1284.0, 2798.0, 6946.0, 21690.0, 105291.0, 590439.0, 1709696.0, 1337448.0, 334739.0, 58393.0, 14060.0, 4857.0, 2147.0, 1044.0, 538.0, 328.0, 201.0, 134.0, 89.0, 59.0, 57.0, 35.0, 35.0, 25.0, 16.0, 16.0, 13.0, 8.0, 7.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.0078125, -11.6182861328125, -11.228759765625, -10.8392333984375, -10.44970703125, -10.0601806640625, -9.670654296875, -9.2811279296875, -8.8916015625, -8.5020751953125, -8.112548828125, -7.7230224609375, -7.33349609375, -6.9439697265625, -6.554443359375, -6.1649169921875, -5.775390625, -5.3858642578125, -4.996337890625, -4.6068115234375, -4.21728515625, -3.8277587890625, -3.438232421875, -3.0487060546875, -2.6591796875, -2.2696533203125, -1.880126953125, -1.4906005859375, -1.10107421875, -0.7115478515625, -0.322021484375, 0.0675048828125, 0.45703125, 0.8465576171875, 1.236083984375, 1.6256103515625, 2.01513671875, 2.4046630859375, 2.794189453125, 3.1837158203125, 3.5732421875, 3.9627685546875, 4.352294921875, 4.7418212890625, 5.13134765625, 5.5208740234375, 5.910400390625, 6.2999267578125, 6.689453125, 7.0789794921875, 7.468505859375, 7.8580322265625, 8.24755859375, 8.6370849609375, 9.026611328125, 9.4161376953125, 9.8056640625, 10.1951904296875, 10.584716796875, 10.9742431640625, 11.36376953125, 11.7532958984375, 12.142822265625, 12.5323486328125, 12.921875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 11.0, 21.0, 26.0, 46.0, 72.0, 130.0, 180.0, 266.0, 415.0, 575.0, 657.0, 583.0, 366.0, 262.0, 149.0, 122.0, 58.0, 41.0, 31.0, 20.0, 9.0, 13.0, 7.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.8671875, -15.1260986328125, -14.385009765625, -13.6439208984375, -12.90283203125, -12.1617431640625, -11.420654296875, -10.6795654296875, -9.9384765625, -9.1973876953125, -8.456298828125, -7.7152099609375, -6.97412109375, -6.2330322265625, -5.491943359375, -4.7508544921875, -4.009765625, -3.2686767578125, -2.527587890625, -1.7864990234375, -1.04541015625, -0.3043212890625, 0.436767578125, 1.1778564453125, 1.9189453125, 2.6600341796875, 3.401123046875, 4.1422119140625, 4.88330078125, 5.6243896484375, 6.365478515625, 7.1065673828125, 7.84765625, 8.5887451171875, 9.329833984375, 10.0709228515625, 10.81201171875, 11.5531005859375, 12.294189453125, 13.0352783203125, 13.7763671875, 14.5174560546875, 15.258544921875, 15.9996337890625, 16.74072265625, 17.4818115234375, 18.222900390625, 18.9639892578125, 19.705078125, 20.4461669921875, 21.187255859375, 21.9283447265625, 22.66943359375, 23.4105224609375, 24.151611328125, 24.8927001953125, 25.6337890625, 26.3748779296875, 27.115966796875, 27.8570556640625, 28.59814453125, 29.3392333984375, 30.080322265625, 30.8214111328125, 31.5625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 9.0, 17.0, 18.0, 25.0, 43.0, 64.0, 91.0, 140.0, 164.0, 228.0, 362.0, 607.0, 1508.0, 14892.0, 4027129.0, 143923.0, 2840.0, 790.0, 456.0, 285.0, 214.0, 146.0, 113.0, 73.0, 44.0, 26.0, 23.0, 11.0, 12.0, 12.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-105.1875, -102.60302734375, -100.0185546875, -97.43408203125, -94.849609375, -92.26513671875, -89.6806640625, -87.09619140625, -84.51171875, -81.92724609375, -79.3427734375, -76.75830078125, -74.173828125, -71.58935546875, -69.0048828125, -66.42041015625, -63.8359375, -61.25146484375, -58.6669921875, -56.08251953125, -53.498046875, -50.91357421875, -48.3291015625, -45.74462890625, -43.16015625, -40.57568359375, -37.9912109375, -35.40673828125, -32.822265625, -30.23779296875, -27.6533203125, -25.06884765625, -22.484375, -19.89990234375, -17.3154296875, -14.73095703125, -12.146484375, -9.56201171875, -6.9775390625, -4.39306640625, -1.80859375, 0.77587890625, 3.3603515625, 5.94482421875, 8.529296875, 11.11376953125, 13.6982421875, 16.28271484375, 18.8671875, 21.45166015625, 24.0361328125, 26.62060546875, 29.205078125, 31.78955078125, 34.3740234375, 36.95849609375, 39.54296875, 42.12744140625, 44.7119140625, 47.29638671875, 49.880859375, 52.46533203125, 55.0498046875, 57.63427734375, 60.21875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 327.0, 688.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-666.4459838867188, -633.261474609375, -600.076904296875, -566.8923950195312, -533.7078857421875, -500.5233154296875, -467.33880615234375, -434.1542663574219, -400.9697265625, -367.7851867675781, -334.60064697265625, -301.4161376953125, -268.2315979003906, -235.04705810546875, -201.86253356933594, -168.67800903320312, -135.49346923828125, -102.3089370727539, -69.12440490722656, -35.93987274169922, -2.755340576171875, 30.42919921875, 63.61372375488281, 96.79824829101562, 129.9827880859375, 163.16732788085938, 196.3518524169922, 229.536376953125, 262.7209167480469, 295.90545654296875, 329.0899658203125, 362.2745056152344, 395.458984375, 428.6435241699219, 461.82806396484375, 495.0125732421875, 528.1971435546875, 561.3816528320312, 594.566162109375, 627.750732421875, 660.9352416992188, 694.1197509765625, 727.3043212890625, 760.4888305664062, 793.67333984375, 826.85791015625, 860.0424194335938, 893.2269287109375, 926.4114990234375, 959.5960083007812, 992.7805786132812, 1025.965087890625, 1059.149658203125, 1092.334228515625, 1125.5186767578125, 1158.7032470703125, 1191.8876953125, 1225.072265625, 1258.2567138671875, 1291.4412841796875, 1324.6258544921875, 1357.810302734375, 1390.994873046875, 1424.179443359375, 1457.364013671875]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 10.0, 7.0, 13.0, 14.0, 19.0, 17.0, 23.0, 20.0, 29.0, 42.0, 38.0, 40.0, 62.0, 52.0, 55.0, 58.0, 55.0, 64.0, 52.0, 48.0, 36.0, 44.0, 38.0, 32.0, 25.0, 21.0, 17.0, 16.0, 14.0, 12.0, 9.0, 4.0, 7.0, 2.0, 5.0, 0.0, 4.0, 6.0], "bins": [-95.39794921875, -93.1355209350586, -90.87309265136719, -88.61066436767578, -86.34823608398438, -84.08580780029297, -81.82337951660156, -79.56094360351562, -77.29852294921875, -75.03609466552734, -72.77366638183594, -70.51123809814453, -68.24880981445312, -65.98638153076172, -63.72394943237305, -61.46152114868164, -59.19908905029297, -56.93666076660156, -54.674232482910156, -52.41180419921875, -50.149375915527344, -47.88694763183594, -45.624515533447266, -43.36208724975586, -41.09965896606445, -38.83723068237305, -36.57480239868164, -34.312374114990234, -32.04994201660156, -29.78751564025879, -27.52508544921875, -25.262657165527344, -23.000221252441406, -20.73779296875, -18.475364685058594, -16.212934494018555, -13.950506210327148, -11.688077926635742, -9.42564868927002, -7.163219451904297, -4.900791168212891, -2.638362407684326, -0.3759336471557617, 1.8864951133728027, 4.148923873901367, 6.411352157592773, 8.673781394958496, 10.936210632324219, 13.198638916015625, 15.461067199707031, 17.723495483398438, 19.985925674438477, 22.248353958129883, 24.51078224182129, 26.773212432861328, 29.035640716552734, 31.29806900024414, 33.56049728393555, 35.82292556762695, 38.08535385131836, 40.34778594970703, 42.61021423339844, 44.872642517089844, 47.13507080078125, 49.397499084472656]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 8.0, 4.0, 4.0, 12.0, 10.0, 6.0, 16.0, 13.0, 17.0, 20.0, 20.0, 26.0, 33.0, 30.0, 30.0, 43.0, 26.0, 34.0, 34.0, 58.0, 43.0, 49.0, 48.0, 28.0, 37.0, 33.0, 26.0, 31.0, 28.0, 28.0, 30.0, 25.0, 28.0, 13.0, 15.0, 13.0, 22.0, 20.0, 9.0, 5.0, 7.0, 8.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8203125, -8.5406494140625, -8.260986328125, -7.9813232421875, -7.70166015625, -7.4219970703125, -7.142333984375, -6.8626708984375, -6.5830078125, -6.3033447265625, -6.023681640625, -5.7440185546875, -5.46435546875, -5.1846923828125, -4.905029296875, -4.6253662109375, -4.345703125, -4.0660400390625, -3.786376953125, -3.5067138671875, -3.22705078125, -2.9473876953125, -2.667724609375, -2.3880615234375, -2.1083984375, -1.8287353515625, -1.549072265625, -1.2694091796875, -0.98974609375, -0.7100830078125, -0.430419921875, -0.1507568359375, 0.12890625, 0.4085693359375, 0.688232421875, 0.9678955078125, 1.24755859375, 1.5272216796875, 1.806884765625, 2.0865478515625, 2.3662109375, 2.6458740234375, 2.925537109375, 3.2052001953125, 3.48486328125, 3.7645263671875, 4.044189453125, 4.3238525390625, 4.603515625, 4.8831787109375, 5.162841796875, 5.4425048828125, 5.72216796875, 6.0018310546875, 6.281494140625, 6.5611572265625, 6.8408203125, 7.1204833984375, 7.400146484375, 7.6798095703125, 7.95947265625, 8.2391357421875, 8.518798828125, 8.7984619140625, 9.078125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 6.0, 3.0, 12.0, 12.0, 21.0, 36.0, 38.0, 58.0, 80.0, 138.0, 187.0, 280.0, 381.0, 585.0, 812.0, 1194.0, 1853.0, 2675.0, 4162.0, 6135.0, 9025.0, 13441.0, 19604.0, 29346.0, 43626.0, 65839.0, 99460.0, 143671.0, 172424.0, 141536.0, 97265.0, 64200.0, 42949.0, 28478.0, 18920.0, 13126.0, 8931.0, 5859.0, 3909.0, 2680.0, 1803.0, 1229.0, 834.0, 560.0, 372.0, 244.0, 180.0, 124.0, 97.0, 58.0, 29.0, 32.0, 22.0, 7.0, 5.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.8251953125, -0.7989730834960938, -0.7727508544921875, -0.7465286254882812, -0.720306396484375, -0.6940841674804688, -0.6678619384765625, -0.6416397094726562, -0.61541748046875, -0.5891952514648438, -0.5629730224609375, -0.5367507934570312, -0.510528564453125, -0.48430633544921875, -0.4580841064453125, -0.43186187744140625, -0.4056396484375, -0.37941741943359375, -0.3531951904296875, -0.32697296142578125, -0.300750732421875, -0.27452850341796875, -0.2483062744140625, -0.22208404541015625, -0.19586181640625, -0.16963958740234375, -0.1434173583984375, -0.11719512939453125, -0.090972900390625, -0.06475067138671875, -0.0385284423828125, -0.01230621337890625, 0.013916015625, 0.04013824462890625, 0.0663604736328125, 0.09258270263671875, 0.118804931640625, 0.14502716064453125, 0.1712493896484375, 0.19747161865234375, 0.22369384765625, 0.24991607666015625, 0.2761383056640625, 0.30236053466796875, 0.328582763671875, 0.35480499267578125, 0.3810272216796875, 0.40724945068359375, 0.4334716796875, 0.45969390869140625, 0.4859161376953125, 0.5121383666992188, 0.538360595703125, 0.5645828247070312, 0.5908050537109375, 0.6170272827148438, 0.64324951171875, 0.6694717407226562, 0.6956939697265625, 0.7219161987304688, 0.748138427734375, 0.7743606567382812, 0.8005828857421875, 0.8268051147460938, 0.85302734375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 4.0, 1.0, 11.0, 13.0, 11.0, 15.0, 20.0, 20.0, 26.0, 23.0, 30.0, 32.0, 20.0, 42.0, 33.0, 46.0, 32.0, 42.0, 44.0, 1065.0, 47.0, 37.0, 36.0, 46.0, 34.0, 33.0, 31.0, 28.0, 27.0, 34.0, 19.0, 30.0, 12.0, 15.0, 17.0, 8.0, 10.0, 11.0, 7.0, 1.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.68359375, -5.4986572265625, -5.313720703125, -5.1287841796875, -4.94384765625, -4.7589111328125, -4.573974609375, -4.3890380859375, -4.2041015625, -4.0191650390625, -3.834228515625, -3.6492919921875, -3.46435546875, -3.2794189453125, -3.094482421875, -2.9095458984375, -2.724609375, -2.5396728515625, -2.354736328125, -2.1697998046875, -1.98486328125, -1.7999267578125, -1.614990234375, -1.4300537109375, -1.2451171875, -1.0601806640625, -0.875244140625, -0.6903076171875, -0.50537109375, -0.3204345703125, -0.135498046875, 0.0494384765625, 0.234375, 0.4193115234375, 0.604248046875, 0.7891845703125, 0.97412109375, 1.1590576171875, 1.343994140625, 1.5289306640625, 1.7138671875, 1.8988037109375, 2.083740234375, 2.2686767578125, 2.45361328125, 2.6385498046875, 2.823486328125, 3.0084228515625, 3.193359375, 3.3782958984375, 3.563232421875, 3.7481689453125, 3.93310546875, 4.1180419921875, 4.302978515625, 4.4879150390625, 4.6728515625, 4.8577880859375, 5.042724609375, 5.2276611328125, 5.41259765625, 5.5975341796875, 5.782470703125, 5.9674072265625, 6.15234375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 13.0, 15.0, 13.0, 33.0, 35.0, 61.0, 95.0, 137.0, 207.0, 294.0, 433.0, 578.0, 869.0, 1210.0, 1759.0, 2633.0, 3828.0, 5489.0, 7796.0, 11316.0, 16229.0, 23909.0, 34829.0, 51371.0, 77088.0, 112197.0, 152724.0, 1205132.0, 122623.0, 84101.0, 57130.0, 38502.0, 26430.0, 17719.0, 12407.0, 8544.0, 5927.0, 4044.0, 2840.0, 2061.0, 1355.0, 970.0, 682.0, 478.0, 316.0, 205.0, 165.0, 106.0, 76.0, 50.0, 48.0, 13.0, 18.0, 13.0, 11.0, 5.0, 4.0, 2.0], "bins": [-0.77001953125, -0.7467727661132812, -0.7235260009765625, -0.7002792358398438, -0.677032470703125, -0.6537857055664062, -0.6305389404296875, -0.6072921752929688, -0.58404541015625, -0.5607986450195312, -0.5375518798828125, -0.5143051147460938, -0.491058349609375, -0.46781158447265625, -0.4445648193359375, -0.42131805419921875, -0.3980712890625, -0.37482452392578125, -0.3515777587890625, -0.32833099365234375, -0.305084228515625, -0.28183746337890625, -0.2585906982421875, -0.23534393310546875, -0.21209716796875, -0.18885040283203125, -0.1656036376953125, -0.14235687255859375, -0.119110107421875, -0.09586334228515625, -0.0726165771484375, -0.04936981201171875, -0.026123046875, -0.00287628173828125, 0.0203704833984375, 0.04361724853515625, 0.066864013671875, 0.09011077880859375, 0.1133575439453125, 0.13660430908203125, 0.15985107421875, 0.18309783935546875, 0.2063446044921875, 0.22959136962890625, 0.252838134765625, 0.27608489990234375, 0.2993316650390625, 0.32257843017578125, 0.3458251953125, 0.36907196044921875, 0.3923187255859375, 0.41556549072265625, 0.438812255859375, 0.46205902099609375, 0.4853057861328125, 0.5085525512695312, 0.53179931640625, 0.5550460815429688, 0.5782928466796875, 0.6015396118164062, 0.624786376953125, 0.6480331420898438, 0.6712799072265625, 0.6945266723632812, 0.7177734375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 1.0, 2.0, 8.0, 10.0, 20.0, 8.0, 15.0, 23.0, 30.0, 37.0, 43.0, 53.0, 59.0, 60.0, 57.0, 59.0, 59.0, 59.0, 68.0, 62.0, 42.0, 43.0, 26.0, 37.0, 30.0, 17.0, 13.0, 15.0, 13.0, 10.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026111602783203125, -0.0025269389152526855, -0.0024427175521850586, -0.0023584961891174316, -0.0022742748260498047, -0.0021900534629821777, -0.0021058320999145508, -0.002021610736846924, -0.0019373893737792969, -0.00185316801071167, -0.001768946647644043, -0.001684725284576416, -0.001600503921508789, -0.0015162825584411621, -0.0014320611953735352, -0.0013478398323059082, -0.0012636184692382812, -0.0011793971061706543, -0.0010951757431030273, -0.0010109543800354004, -0.0009267330169677734, -0.0008425116539001465, -0.0007582902908325195, -0.0006740689277648926, -0.0005898475646972656, -0.0005056262016296387, -0.0004214048385620117, -0.00033718347549438477, -0.0002529621124267578, -0.00016874074935913086, -8.45193862915039e-05, -2.980232238769531e-07, 8.392333984375e-05, 0.00016814470291137695, 0.0002523660659790039, 0.00033658742904663086, 0.0004208087921142578, 0.0005050301551818848, 0.0005892515182495117, 0.0006734728813171387, 0.0007576942443847656, 0.0008419156074523926, 0.0009261369705200195, 0.0010103583335876465, 0.0010945796966552734, 0.0011788010597229004, 0.0012630224227905273, 0.0013472437858581543, 0.0014314651489257812, 0.0015156865119934082, 0.0015999078750610352, 0.0016841292381286621, 0.001768350601196289, 0.001852571964263916, 0.001936793327331543, 0.00202101469039917, 0.002105236053466797, 0.002189457416534424, 0.0022736787796020508, 0.0023579001426696777, 0.0024421215057373047, 0.0025263428688049316, 0.0026105642318725586, 0.0026947855949401855, 0.0027790069580078125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 9.0, 8.0, 8.0, 21.0, 17.0, 31.0, 42.0, 54.0, 59.0, 106.0, 133.0, 240.0, 801.0, 38364.0, 1006375.0, 1340.0, 370.0, 164.0, 114.0, 89.0, 47.0, 39.0, 28.0, 26.0, 15.0, 13.0, 11.0, 2.0, 3.0, 8.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.07403564453125, -0.07193183898925781, -0.06982803344726562, -0.06772422790527344, -0.06562042236328125, -0.06351661682128906, -0.061412811279296875, -0.05930900573730469, -0.0572052001953125, -0.05510139465332031, -0.052997589111328125, -0.05089378356933594, -0.04878997802734375, -0.04668617248535156, -0.044582366943359375, -0.04247856140136719, -0.040374755859375, -0.03827095031738281, -0.036167144775390625, -0.03406333923339844, -0.03195953369140625, -0.029855728149414062, -0.027751922607421875, -0.025648117065429688, -0.0235443115234375, -0.021440505981445312, -0.019336700439453125, -0.017232894897460938, -0.01512908935546875, -0.013025283813476562, -0.010921478271484375, -0.008817672729492188, -0.0067138671875, -0.0046100616455078125, -0.002506256103515625, -0.0004024505615234375, 0.00170135498046875, 0.0038051605224609375, 0.005908966064453125, 0.008012771606445312, 0.0101165771484375, 0.012220382690429688, 0.014324188232421875, 0.016427993774414062, 0.01853179931640625, 0.020635604858398438, 0.022739410400390625, 0.024843215942382812, 0.026947021484375, 0.029050827026367188, 0.031154632568359375, 0.03325843811035156, 0.03536224365234375, 0.03746604919433594, 0.039569854736328125, 0.04167366027832031, 0.0437774658203125, 0.04588127136230469, 0.047985076904296875, 0.05008888244628906, 0.05219268798828125, 0.05429649353027344, 0.056400299072265625, 0.05850410461425781, 0.06060791015625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 961.0, 56.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026387255638837814, -0.0019234810024499893, -0.0012082364410161972, -0.0004929918795824051, 0.00022225268185138702, 0.0009374972432851791, 0.0016527418047189713, 0.0023679863661527634, 0.0030832309275865555, 0.0037984754890203476, 0.00451372005045414, 0.005228964611887932, 0.005944209173321724, 0.006659453734755516, 0.007374698296189308, 0.0080899428576231, 0.008805187419056892, 0.009520431980490685, 0.010235676541924477, 0.010950921103358269, 0.01166616566479206, 0.012381410226225853, 0.013096654787659645, 0.013811899349093437, 0.01452714391052723, 0.015242388471961021, 0.015957633033394814, 0.016672877594828606, 0.017388122156262398, 0.01810336671769619, 0.018818611279129982, 0.019533855840563774, 0.020249098539352417, 0.02096434310078621, 0.02167958766222, 0.022394832223653793, 0.023110076785087585, 0.023825321346521378, 0.02454056590795517, 0.025255810469388962, 0.025971055030822754, 0.026686299592256546, 0.027401544153690338, 0.02811678871512413, 0.028832033276557922, 0.029547277837991714, 0.030262522399425507, 0.0309777669608593, 0.03169301152229309, 0.03240825608372688, 0.033123500645160675, 0.03383874520659447, 0.03455398976802826, 0.03526923432946205, 0.035984478890895844, 0.036699723452329636, 0.03741496801376343, 0.03813021257519722, 0.03884545713663101, 0.039560701698064804, 0.040275946259498596, 0.04099119082093239, 0.04170643538236618, 0.04242167994379997, 0.043136924505233765]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 2.0, 2.0, 8.0, 9.0, 10.0, 13.0, 21.0, 18.0, 23.0, 27.0, 31.0, 29.0, 41.0, 40.0, 45.0, 48.0, 54.0, 43.0, 49.0, 50.0, 51.0, 52.0, 34.0, 62.0, 47.0, 26.0, 30.0, 40.0, 19.0, 18.0, 16.0, 9.0, 9.0, 7.0, 6.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0017737150192260742, -0.00172490905970335, -0.001676103100180626, -0.0016272971406579018, -0.0015784911811351776, -0.0015296852216124535, -0.0014808792620897293, -0.0014320733025670052, -0.001383267343044281, -0.0013344613835215569, -0.0012856554239988327, -0.0012368494644761086, -0.0011880435049533844, -0.0011392375454306602, -0.001090431585907936, -0.001041625626385212, -0.0009928196668624878, -0.0009440137073397636, -0.0008952077478170395, -0.0008464017882943153, -0.0007975958287715912, -0.000748789869248867, -0.0006999839097261429, -0.0006511779502034187, -0.0006023719906806946, -0.0005535660311579704, -0.0005047600716352463, -0.0004559541121125221, -0.000407148152589798, -0.0003583421930670738, -0.00030953623354434967, -0.0002607302740216255, -0.00021192431449890137, -0.00016311835497617722, -0.00011431239545345306, -6.550643593072891e-05, -1.670047640800476e-05, 3.210548311471939e-05, 8.091144263744354e-05, 0.0001297174021601677, 0.00017852336168289185, 0.000227329321205616, 0.00027613528072834015, 0.0003249412402510643, 0.00037374719977378845, 0.0004225531592965126, 0.00047135911881923676, 0.0005201650783419609, 0.0005689710378646851, 0.0006177769973874092, 0.0006665829569101334, 0.0007153889164328575, 0.0007641948759555817, 0.0008130008354783058, 0.00086180679500103, 0.0009106127545237541, 0.0009594187140464783, 0.0010082246735692024, 0.0010570306330919266, 0.0011058365926146507, 0.0011546425521373749, 0.001203448511660099, 0.0012522544711828232, 0.0013010604307055473, 0.0013498663902282715]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 8.0, 4.0, 4.0, 12.0, 10.0, 6.0, 16.0, 13.0, 17.0, 20.0, 20.0, 26.0, 33.0, 30.0, 30.0, 43.0, 26.0, 34.0, 34.0, 58.0, 43.0, 49.0, 48.0, 28.0, 37.0, 33.0, 26.0, 31.0, 28.0, 28.0, 30.0, 25.0, 28.0, 13.0, 15.0, 13.0, 22.0, 20.0, 9.0, 5.0, 7.0, 8.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8203125, -8.5406494140625, -8.260986328125, -7.9813232421875, -7.70166015625, -7.4219970703125, -7.142333984375, -6.8626708984375, -6.5830078125, -6.3033447265625, -6.023681640625, -5.7440185546875, -5.46435546875, -5.1846923828125, -4.905029296875, -4.6253662109375, -4.345703125, -4.0660400390625, -3.786376953125, -3.5067138671875, -3.22705078125, -2.9473876953125, -2.667724609375, -2.3880615234375, -2.1083984375, -1.8287353515625, -1.549072265625, -1.2694091796875, -0.98974609375, -0.7100830078125, -0.430419921875, -0.1507568359375, 0.12890625, 0.4085693359375, 0.688232421875, 0.9678955078125, 1.24755859375, 1.5272216796875, 1.806884765625, 2.0865478515625, 2.3662109375, 2.6458740234375, 2.925537109375, 3.2052001953125, 3.48486328125, 3.7645263671875, 4.044189453125, 4.3238525390625, 4.603515625, 4.8831787109375, 5.162841796875, 5.4425048828125, 5.72216796875, 6.0018310546875, 6.281494140625, 6.5611572265625, 6.8408203125, 7.1204833984375, 7.400146484375, 7.6798095703125, 7.95947265625, 8.2391357421875, 8.518798828125, 8.7984619140625, 9.078125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 13.0, 8.0, 14.0, 15.0, 20.0, 29.0, 39.0, 57.0, 74.0, 120.0, 229.0, 446.0, 906.0, 1890.0, 4313.0, 10792.0, 28282.0, 81771.0, 257101.0, 426321.0, 154089.0, 50994.0, 18148.0, 7105.0, 2958.0, 1336.0, 622.0, 333.0, 155.0, 121.0, 62.0, 49.0, 40.0, 31.0, 16.0, 15.0, 7.0, 8.0, 7.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.65625, -8.3795166015625, -8.102783203125, -7.8260498046875, -7.54931640625, -7.2725830078125, -6.995849609375, -6.7191162109375, -6.4423828125, -6.1656494140625, -5.888916015625, -5.6121826171875, -5.33544921875, -5.0587158203125, -4.781982421875, -4.5052490234375, -4.228515625, -3.9517822265625, -3.675048828125, -3.3983154296875, -3.12158203125, -2.8448486328125, -2.568115234375, -2.2913818359375, -2.0146484375, -1.7379150390625, -1.461181640625, -1.1844482421875, -0.90771484375, -0.6309814453125, -0.354248046875, -0.0775146484375, 0.19921875, 0.4759521484375, 0.752685546875, 1.0294189453125, 1.30615234375, 1.5828857421875, 1.859619140625, 2.1363525390625, 2.4130859375, 2.6898193359375, 2.966552734375, 3.2432861328125, 3.52001953125, 3.7967529296875, 4.073486328125, 4.3502197265625, 4.626953125, 4.9036865234375, 5.180419921875, 5.4571533203125, 5.73388671875, 6.0106201171875, 6.287353515625, 6.5640869140625, 6.8408203125, 7.1175537109375, 7.394287109375, 7.6710205078125, 7.94775390625, 8.2244873046875, 8.501220703125, 8.7779541015625, 9.0546875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 13.0, 10.0, 9.0, 15.0, 29.0, 17.0, 30.0, 14.0, 30.0, 45.0, 44.0, 49.0, 40.0, 55.0, 169.0, 1621.0, 326.0, 89.0, 70.0, 45.0, 43.0, 44.0, 33.0, 28.0, 25.0, 21.0, 25.0, 14.0, 14.0, 16.0, 9.0, 13.0, 7.0, 6.0, 4.0, 3.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-34.40625, -33.386474609375, -32.36669921875, -31.346923828125, -30.3271484375, -29.307373046875, -28.28759765625, -27.267822265625, -26.248046875, -25.228271484375, -24.20849609375, -23.188720703125, -22.1689453125, -21.149169921875, -20.12939453125, -19.109619140625, -18.08984375, -17.070068359375, -16.05029296875, -15.030517578125, -14.0107421875, -12.990966796875, -11.97119140625, -10.951416015625, -9.931640625, -8.911865234375, -7.89208984375, -6.872314453125, -5.8525390625, -4.832763671875, -3.81298828125, -2.793212890625, -1.7734375, -0.753662109375, 0.26611328125, 1.285888671875, 2.3056640625, 3.325439453125, 4.34521484375, 5.364990234375, 6.384765625, 7.404541015625, 8.42431640625, 9.444091796875, 10.4638671875, 11.483642578125, 12.50341796875, 13.523193359375, 14.54296875, 15.562744140625, 16.58251953125, 17.602294921875, 18.6220703125, 19.641845703125, 20.66162109375, 21.681396484375, 22.701171875, 23.720947265625, 24.74072265625, 25.760498046875, 26.7802734375, 27.800048828125, 28.81982421875, 29.839599609375, 30.859375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 3.0, 6.0, 5.0, 10.0, 11.0, 11.0, 16.0, 24.0, 27.0, 42.0, 36.0, 80.0, 68.0, 98.0, 158.0, 184.0, 326.0, 611.0, 2556.0, 266435.0, 2865546.0, 7401.0, 836.0, 386.0, 218.0, 148.0, 106.0, 73.0, 50.0, 55.0, 39.0, 40.0, 18.0, 23.0, 11.0, 11.0, 10.0, 6.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.71875, -49.03759765625, -47.3564453125, -45.67529296875, -43.994140625, -42.31298828125, -40.6318359375, -38.95068359375, -37.26953125, -35.58837890625, -33.9072265625, -32.22607421875, -30.544921875, -28.86376953125, -27.1826171875, -25.50146484375, -23.8203125, -22.13916015625, -20.4580078125, -18.77685546875, -17.095703125, -15.41455078125, -13.7333984375, -12.05224609375, -10.37109375, -8.68994140625, -7.0087890625, -5.32763671875, -3.646484375, -1.96533203125, -0.2841796875, 1.39697265625, 3.078125, 4.75927734375, 6.4404296875, 8.12158203125, 9.802734375, 11.48388671875, 13.1650390625, 14.84619140625, 16.52734375, 18.20849609375, 19.8896484375, 21.57080078125, 23.251953125, 24.93310546875, 26.6142578125, 28.29541015625, 29.9765625, 31.65771484375, 33.3388671875, 35.02001953125, 36.701171875, 38.38232421875, 40.0634765625, 41.74462890625, 43.42578125, 45.10693359375, 46.7880859375, 48.46923828125, 50.150390625, 51.83154296875, 53.5126953125, 55.19384765625, 56.875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 109.0, 861.0, 51.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-464.9685974121094, -456.86767578125, -448.7667541503906, -440.6658630371094, -432.56494140625, -424.4640197753906, -416.36309814453125, -408.26220703125, -400.1612854003906, -392.06036376953125, -383.9594421386719, -375.8585510253906, -367.75762939453125, -359.6567077636719, -351.5557861328125, -343.45489501953125, -335.35394287109375, -327.2530212402344, -319.152099609375, -311.05120849609375, -302.9502868652344, -294.849365234375, -286.7484436035156, -278.64752197265625, -270.546630859375, -262.4457092285156, -254.3448028564453, -246.24388122558594, -238.14297485351562, -230.04205322265625, -221.94113159179688, -213.84022521972656, -205.7393341064453, -197.63841247558594, -189.53750610351562, -181.43658447265625, -173.33567810058594, -165.23475646972656, -157.13385009765625, -149.03292846679688, -140.93202209472656, -132.8311004638672, -124.73019409179688, -116.6292724609375, -108.52836608886719, -100.42744445800781, -92.32653045654297, -84.22561645507812, -76.12469482421875, -68.0237808227539, -59.92286682128906, -51.82194900512695, -43.72103500366211, -35.620121002197266, -27.519203186035156, -19.418289184570312, -11.317378997802734, -3.216464042663574, 4.884450912475586, 12.985366821289062, 21.086280822753906, 29.18719482421875, 37.28811264038086, 45.3890266418457, 53.48994064331055]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 5.0, 6.0, 3.0, 4.0, 10.0, 11.0, 9.0, 17.0, 23.0, 20.0, 21.0, 19.0, 23.0, 35.0, 36.0, 29.0, 44.0, 45.0, 40.0, 47.0, 46.0, 38.0, 47.0, 48.0, 36.0, 37.0, 40.0, 33.0, 35.0, 37.0, 24.0, 24.0, 18.0, 19.0, 16.0, 10.0, 10.0, 7.0, 11.0, 6.0, 7.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.4904556274414, -78.79129791259766, -76.09214782714844, -73.39299011230469, -70.69384002685547, -67.99468231201172, -65.2955322265625, -62.59637451171875, -59.897220611572266, -57.19806671142578, -54.4989128112793, -51.79975891113281, -49.10060119628906, -46.401451110839844, -43.702293395996094, -41.00313949584961, -38.303985595703125, -35.60483169555664, -32.905677795410156, -30.20652198791504, -27.507368087768555, -24.80821418762207, -22.109058380126953, -19.40990447998047, -16.710750579833984, -14.0115966796875, -11.3124418258667, -8.613286972045898, -5.914133071899414, -3.2149791717529297, -0.5158233642578125, 2.183330535888672, 4.882476806640625, 7.581631183624268, 10.28078556060791, 12.979940414428711, 15.679094314575195, 18.37824821472168, 21.077404022216797, 23.77655792236328, 26.475711822509766, 29.17486572265625, 31.874019622802734, 34.57317352294922, 37.27233123779297, 39.97148132324219, 42.67063903808594, 45.36979293823242, 48.068946838378906, 50.76810073852539, 53.467254638671875, 56.166412353515625, 58.865562438964844, 61.564720153808594, 64.26387023925781, 66.96302795410156, 69.66218566894531, 72.36134338378906, 75.06049346923828, 77.75965118408203, 80.45880126953125, 83.157958984375, 85.85711669921875, 88.55626678466797, 91.25541687011719]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 6.0, 4.0, 8.0, 5.0, 10.0, 4.0, 15.0, 15.0, 14.0, 13.0, 21.0, 20.0, 29.0, 27.0, 27.0, 34.0, 31.0, 34.0, 45.0, 36.0, 37.0, 50.0, 42.0, 39.0, 29.0, 42.0, 36.0, 23.0, 23.0, 27.0, 33.0, 28.0, 25.0, 18.0, 21.0, 27.0, 11.0, 22.0, 11.0, 11.0, 9.0, 6.0, 10.0, 7.0, 8.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.0, -8.7259521484375, -8.451904296875, -8.1778564453125, -7.90380859375, -7.6297607421875, -7.355712890625, -7.0816650390625, -6.8076171875, -6.5335693359375, -6.259521484375, -5.9854736328125, -5.71142578125, -5.4373779296875, -5.163330078125, -4.8892822265625, -4.615234375, -4.3411865234375, -4.067138671875, -3.7930908203125, -3.51904296875, -3.2449951171875, -2.970947265625, -2.6968994140625, -2.4228515625, -2.1488037109375, -1.874755859375, -1.6007080078125, -1.32666015625, -1.0526123046875, -0.778564453125, -0.5045166015625, -0.23046875, 0.0435791015625, 0.317626953125, 0.5916748046875, 0.86572265625, 1.1397705078125, 1.413818359375, 1.6878662109375, 1.9619140625, 2.2359619140625, 2.510009765625, 2.7840576171875, 3.05810546875, 3.3321533203125, 3.606201171875, 3.8802490234375, 4.154296875, 4.4283447265625, 4.702392578125, 4.9764404296875, 5.25048828125, 5.5245361328125, 5.798583984375, 6.0726318359375, 6.3466796875, 6.6207275390625, 6.894775390625, 7.1688232421875, 7.44287109375, 7.7169189453125, 7.990966796875, 8.2650146484375, 8.5390625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 4.0, 4.0, 7.0, 10.0, 13.0, 20.0, 17.0, 21.0, 25.0, 21.0, 36.0, 50.0, 59.0, 78.0, 100.0, 186.0, 416.0, 1463.0, 8485.0, 195077.0, 3492779.0, 478650.0, 13594.0, 1957.0, 473.0, 220.0, 100.0, 64.0, 64.0, 46.0, 41.0, 34.0, 26.0, 23.0, 19.0, 13.0, 15.0, 10.0, 9.0, 12.0, 10.0, 10.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-31.203125, -30.24609375, -29.2890625, -28.33203125, -27.375, -26.41796875, -25.4609375, -24.50390625, -23.546875, -22.58984375, -21.6328125, -20.67578125, -19.71875, -18.76171875, -17.8046875, -16.84765625, -15.890625, -14.93359375, -13.9765625, -13.01953125, -12.0625, -11.10546875, -10.1484375, -9.19140625, -8.234375, -7.27734375, -6.3203125, -5.36328125, -4.40625, -3.44921875, -2.4921875, -1.53515625, -0.578125, 0.37890625, 1.3359375, 2.29296875, 3.25, 4.20703125, 5.1640625, 6.12109375, 7.078125, 8.03515625, 8.9921875, 9.94921875, 10.90625, 11.86328125, 12.8203125, 13.77734375, 14.734375, 15.69140625, 16.6484375, 17.60546875, 18.5625, 19.51953125, 20.4765625, 21.43359375, 22.390625, 23.34765625, 24.3046875, 25.26171875, 26.21875, 27.17578125, 28.1328125, 29.08984375, 30.046875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 9.0, 11.0, 11.0, 14.0, 24.0, 31.0, 36.0, 51.0, 64.0, 117.0, 113.0, 171.0, 197.0, 336.0, 464.0, 492.0, 465.0, 392.0, 286.0, 195.0, 162.0, 88.0, 86.0, 69.0, 41.0, 31.0, 27.0, 21.0, 17.0, 17.0, 13.0, 3.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.3671875, -13.8841552734375, -13.401123046875, -12.9180908203125, -12.43505859375, -11.9520263671875, -11.468994140625, -10.9859619140625, -10.5029296875, -10.0198974609375, -9.536865234375, -9.0538330078125, -8.57080078125, -8.0877685546875, -7.604736328125, -7.1217041015625, -6.638671875, -6.1556396484375, -5.672607421875, -5.1895751953125, -4.70654296875, -4.2235107421875, -3.740478515625, -3.2574462890625, -2.7744140625, -2.2913818359375, -1.808349609375, -1.3253173828125, -0.84228515625, -0.3592529296875, 0.123779296875, 0.6068115234375, 1.08984375, 1.5728759765625, 2.055908203125, 2.5389404296875, 3.02197265625, 3.5050048828125, 3.988037109375, 4.4710693359375, 4.9541015625, 5.4371337890625, 5.920166015625, 6.4031982421875, 6.88623046875, 7.3692626953125, 7.852294921875, 8.3353271484375, 8.818359375, 9.3013916015625, 9.784423828125, 10.2674560546875, 10.75048828125, 11.2335205078125, 11.716552734375, 12.1995849609375, 12.6826171875, 13.1656494140625, 13.648681640625, 14.1317138671875, 14.61474609375, 15.0977783203125, 15.580810546875, 16.0638427734375, 16.546875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 7.0, 5.0, 9.0, 12.0, 19.0, 18.0, 27.0, 47.0, 45.0, 56.0, 90.0, 112.0, 168.0, 224.0, 335.0, 616.0, 3462.0, 190387.0, 3968339.0, 27490.0, 1379.0, 399.0, 223.0, 179.0, 144.0, 109.0, 99.0, 67.0, 55.0, 38.0, 27.0, 28.0, 17.0, 10.0, 12.0, 8.0, 9.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.25, -62.8603515625, -60.470703125, -58.0810546875, -55.69140625, -53.3017578125, -50.912109375, -48.5224609375, -46.1328125, -43.7431640625, -41.353515625, -38.9638671875, -36.57421875, -34.1845703125, -31.794921875, -29.4052734375, -27.015625, -24.6259765625, -22.236328125, -19.8466796875, -17.45703125, -15.0673828125, -12.677734375, -10.2880859375, -7.8984375, -5.5087890625, -3.119140625, -0.7294921875, 1.66015625, 4.0498046875, 6.439453125, 8.8291015625, 11.21875, 13.6083984375, 15.998046875, 18.3876953125, 20.77734375, 23.1669921875, 25.556640625, 27.9462890625, 30.3359375, 32.7255859375, 35.115234375, 37.5048828125, 39.89453125, 42.2841796875, 44.673828125, 47.0634765625, 49.453125, 51.8427734375, 54.232421875, 56.6220703125, 59.01171875, 61.4013671875, 63.791015625, 66.1806640625, 68.5703125, 70.9599609375, 73.349609375, 75.7392578125, 78.12890625, 80.5185546875, 82.908203125, 85.2978515625, 87.6875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 401.0, 605.0, 8.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-630.762451171875, -611.0979614257812, -591.4334716796875, -571.76904296875, -552.1045532226562, -532.4400634765625, -512.775634765625, -493.11114501953125, -473.4466552734375, -453.78216552734375, -434.1177062988281, -414.4532470703125, -394.78875732421875, -375.124267578125, -355.4598083496094, -335.79534912109375, -316.130859375, -296.46636962890625, -276.8019104003906, -257.137451171875, -237.47296142578125, -217.80848693847656, -198.14401245117188, -178.4795379638672, -158.8150634765625, -139.1505889892578, -119.48611450195312, -99.82164001464844, -80.15716552734375, -60.49269104003906, -40.828216552734375, -21.163742065429688, -1.499267578125, 18.165206909179688, 37.829681396484375, 57.49415588378906, 77.15863037109375, 96.82310485839844, 116.48757934570312, 136.1520538330078, 155.8165283203125, 175.4810028076172, 195.14547729492188, 214.80995178222656, 234.47442626953125, 254.13890075683594, 273.8033752441406, 293.46783447265625, 313.13232421875, 332.79681396484375, 352.4612731933594, 372.125732421875, 391.79022216796875, 411.4547119140625, 431.1191711425781, 450.78363037109375, 470.4481201171875, 490.11260986328125, 509.7770690917969, 529.4415283203125, 549.1060180664062, 568.7705078125, 588.4349365234375, 608.0994262695312, 627.763916015625]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 6.0, 8.0, 4.0, 5.0, 12.0, 19.0, 14.0, 18.0, 15.0, 15.0, 21.0, 22.0, 27.0, 32.0, 31.0, 38.0, 23.0, 28.0, 38.0, 42.0, 38.0, 25.0, 47.0, 32.0, 25.0, 33.0, 33.0, 42.0, 34.0, 28.0, 26.0, 27.0, 26.0, 23.0, 23.0, 12.0, 15.0, 15.0, 18.0, 17.0, 9.0, 5.0, 5.0, 8.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-46.48933792114258, -44.93326950073242, -43.377197265625, -41.821128845214844, -40.26505661010742, -38.708988189697266, -37.152915954589844, -35.59684753417969, -34.04077911376953, -32.484710693359375, -30.928638458251953, -29.372570037841797, -27.816497802734375, -26.26042938232422, -24.70435905456543, -23.14828872680664, -21.59221649169922, -20.03614616394043, -18.48007583618164, -16.924007415771484, -15.367936134338379, -13.81186580657959, -12.255796432495117, -10.699726104736328, -9.143655776977539, -7.58758544921875, -6.031515598297119, -4.475445747375488, -2.919375419616699, -1.3633050918579102, 0.1927642822265625, 1.7488346099853516, 3.304901123046875, 4.860971450805664, 6.417041301727295, 7.973111152648926, 9.529181480407715, 11.085251808166504, 12.641321182250977, 14.197391510009766, 15.753461837768555, 17.309532165527344, 18.865602493286133, 20.421672821044922, 21.977741241455078, 23.5338134765625, 25.089881896972656, 26.645952224731445, 28.202022552490234, 29.758092880249023, 31.314163208007812, 32.87023162841797, 34.42630386352539, 35.98237228393555, 37.53844451904297, 39.094512939453125, 40.65058135986328, 42.20664978027344, 43.76272201538086, 45.318790435791016, 46.87486267089844, 48.430931091308594, 49.98699951171875, 51.54307174682617, 53.099143981933594]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 3.0, 6.0, 7.0, 7.0, 5.0, 10.0, 4.0, 8.0, 16.0, 18.0, 18.0, 28.0, 26.0, 17.0, 23.0, 23.0, 31.0, 31.0, 36.0, 36.0, 28.0, 45.0, 38.0, 33.0, 32.0, 43.0, 27.0, 42.0, 30.0, 31.0, 20.0, 25.0, 29.0, 20.0, 27.0, 22.0, 11.0, 16.0, 13.0, 21.0, 10.0, 13.0, 9.0, 11.0, 8.0, 15.0, 4.0, 12.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0], "bins": [-8.265625, -8.0174560546875, -7.769287109375, -7.5211181640625, -7.27294921875, -7.0247802734375, -6.776611328125, -6.5284423828125, -6.2802734375, -6.0321044921875, -5.783935546875, -5.5357666015625, -5.28759765625, -5.0394287109375, -4.791259765625, -4.5430908203125, -4.294921875, -4.0467529296875, -3.798583984375, -3.5504150390625, -3.30224609375, -3.0540771484375, -2.805908203125, -2.5577392578125, -2.3095703125, -2.0614013671875, -1.813232421875, -1.5650634765625, -1.31689453125, -1.0687255859375, -0.820556640625, -0.5723876953125, -0.32421875, -0.0760498046875, 0.172119140625, 0.4202880859375, 0.66845703125, 0.9166259765625, 1.164794921875, 1.4129638671875, 1.6611328125, 1.9093017578125, 2.157470703125, 2.4056396484375, 2.65380859375, 2.9019775390625, 3.150146484375, 3.3983154296875, 3.646484375, 3.8946533203125, 4.142822265625, 4.3909912109375, 4.63916015625, 4.8873291015625, 5.135498046875, 5.3836669921875, 5.6318359375, 5.8800048828125, 6.128173828125, 6.3763427734375, 6.62451171875, 6.8726806640625, 7.120849609375, 7.3690185546875, 7.6171875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 8.0, 4.0, 33.0, 35.0, 47.0, 78.0, 91.0, 144.0, 223.0, 328.0, 526.0, 740.0, 1139.0, 1665.0, 2386.0, 3719.0, 5579.0, 8449.0, 12905.0, 19915.0, 30649.0, 46773.0, 73201.0, 113608.0, 162511.0, 178476.0, 134677.0, 87874.0, 56958.0, 36270.0, 23742.0, 15706.0, 10193.0, 6520.0, 4395.0, 2979.0, 1996.0, 1331.0, 873.0, 602.0, 402.0, 240.0, 206.0, 132.0, 66.0, 76.0, 38.0, 22.0, 18.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.86083984375, -0.8332595825195312, -0.8056793212890625, -0.7780990600585938, -0.750518798828125, -0.7229385375976562, -0.6953582763671875, -0.6677780151367188, -0.64019775390625, -0.6126174926757812, -0.5850372314453125, -0.5574569702148438, -0.529876708984375, -0.5022964477539062, -0.4747161865234375, -0.44713592529296875, -0.4195556640625, -0.39197540283203125, -0.3643951416015625, -0.33681488037109375, -0.309234619140625, -0.28165435791015625, -0.2540740966796875, -0.22649383544921875, -0.19891357421875, -0.17133331298828125, -0.1437530517578125, -0.11617279052734375, -0.088592529296875, -0.06101226806640625, -0.0334320068359375, -0.00585174560546875, 0.021728515625, 0.04930877685546875, 0.0768890380859375, 0.10446929931640625, 0.132049560546875, 0.15962982177734375, 0.1872100830078125, 0.21479034423828125, 0.24237060546875, 0.26995086669921875, 0.2975311279296875, 0.32511138916015625, 0.352691650390625, 0.38027191162109375, 0.4078521728515625, 0.43543243408203125, 0.4630126953125, 0.49059295654296875, 0.5181732177734375, 0.5457534790039062, 0.573333740234375, 0.6009140014648438, 0.6284942626953125, 0.6560745239257812, 0.68365478515625, 0.7112350463867188, 0.7388153076171875, 0.7663955688476562, 0.793975830078125, 0.8215560913085938, 0.8491363525390625, 0.8767166137695312, 0.904296875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 7.0, 9.0, 6.0, 17.0, 11.0, 22.0, 18.0, 22.0, 23.0, 31.0, 21.0, 36.0, 30.0, 36.0, 45.0, 37.0, 38.0, 43.0, 48.0, 1065.0, 52.0, 36.0, 35.0, 35.0, 30.0, 35.0, 37.0, 20.0, 25.0, 18.0, 19.0, 25.0, 22.0, 13.0, 14.0, 9.0, 8.0, 5.0, 6.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.00390625, -5.81048583984375, -5.6170654296875, -5.42364501953125, -5.230224609375, -5.03680419921875, -4.8433837890625, -4.64996337890625, -4.45654296875, -4.26312255859375, -4.0697021484375, -3.87628173828125, -3.682861328125, -3.48944091796875, -3.2960205078125, -3.10260009765625, -2.9091796875, -2.71575927734375, -2.5223388671875, -2.32891845703125, -2.135498046875, -1.94207763671875, -1.7486572265625, -1.55523681640625, -1.36181640625, -1.16839599609375, -0.9749755859375, -0.78155517578125, -0.588134765625, -0.39471435546875, -0.2012939453125, -0.00787353515625, 0.185546875, 0.37896728515625, 0.5723876953125, 0.76580810546875, 0.959228515625, 1.15264892578125, 1.3460693359375, 1.53948974609375, 1.73291015625, 1.92633056640625, 2.1197509765625, 2.31317138671875, 2.506591796875, 2.70001220703125, 2.8934326171875, 3.08685302734375, 3.2802734375, 3.47369384765625, 3.6671142578125, 3.86053466796875, 4.053955078125, 4.24737548828125, 4.4407958984375, 4.63421630859375, 4.82763671875, 5.02105712890625, 5.2144775390625, 5.40789794921875, 5.601318359375, 5.79473876953125, 5.9881591796875, 6.18157958984375, 6.375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 16.0, 14.0, 23.0, 32.0, 52.0, 83.0, 119.0, 188.0, 240.0, 383.0, 524.0, 867.0, 1222.0, 1822.0, 2812.0, 4146.0, 6245.0, 9623.0, 14691.0, 22651.0, 35042.0, 54366.0, 85298.0, 131261.0, 1224715.0, 168852.0, 117010.0, 76650.0, 48772.0, 31003.0, 19998.0, 13069.0, 8516.0, 5705.0, 3730.0, 2446.0, 1682.0, 1111.0, 675.0, 477.0, 321.0, 229.0, 136.0, 114.0, 55.0, 42.0, 39.0, 15.0, 18.0, 10.0, 10.0, 4.0, 1.0, 5.0, 1.0], "bins": [-0.89794921875, -0.8714370727539062, -0.8449249267578125, -0.8184127807617188, -0.791900634765625, -0.7653884887695312, -0.7388763427734375, -0.7123641967773438, -0.68585205078125, -0.6593399047851562, -0.6328277587890625, -0.6063156127929688, -0.579803466796875, -0.5532913208007812, -0.5267791748046875, -0.5002670288085938, -0.4737548828125, -0.44724273681640625, -0.4207305908203125, -0.39421844482421875, -0.367706298828125, -0.34119415283203125, -0.3146820068359375, -0.28816986083984375, -0.26165771484375, -0.23514556884765625, -0.2086334228515625, -0.18212127685546875, -0.155609130859375, -0.12909698486328125, -0.1025848388671875, -0.07607269287109375, -0.049560546875, -0.02304840087890625, 0.0034637451171875, 0.02997589111328125, 0.056488037109375, 0.08300018310546875, 0.1095123291015625, 0.13602447509765625, 0.16253662109375, 0.18904876708984375, 0.2155609130859375, 0.24207305908203125, 0.268585205078125, 0.29509735107421875, 0.3216094970703125, 0.34812164306640625, 0.3746337890625, 0.40114593505859375, 0.4276580810546875, 0.45417022705078125, 0.480682373046875, 0.5071945190429688, 0.5337066650390625, 0.5602188110351562, 0.58673095703125, 0.6132431030273438, 0.6397552490234375, 0.6662673950195312, 0.692779541015625, 0.7192916870117188, 0.7458038330078125, 0.7723159790039062, 0.798828125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 6.0, 9.0, 5.0, 7.0, 11.0, 23.0, 18.0, 15.0, 22.0, 31.0, 38.0, 42.0, 55.0, 53.0, 64.0, 75.0, 83.0, 70.0, 68.0, 54.0, 51.0, 36.0, 31.0, 27.0, 22.0, 19.0, 20.0, 11.0, 8.0, 9.0, 1.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0031871795654296875, -0.003093928098678589, -0.0030006766319274902, -0.0029074251651763916, -0.002814173698425293, -0.0027209222316741943, -0.0026276707649230957, -0.002534419298171997, -0.0024411678314208984, -0.0023479163646698, -0.002254664897918701, -0.0021614134311676025, -0.002068161964416504, -0.0019749104976654053, -0.0018816590309143066, -0.001788407564163208, -0.0016951560974121094, -0.0016019046306610107, -0.0015086531639099121, -0.0014154016971588135, -0.0013221502304077148, -0.0012288987636566162, -0.0011356472969055176, -0.001042395830154419, -0.0009491443634033203, -0.0008558928966522217, -0.000762641429901123, -0.0006693899631500244, -0.0005761384963989258, -0.00048288702964782715, -0.0003896355628967285, -0.0002963840961456299, -0.00020313262939453125, -0.00010988116264343262, -1.6629695892333984e-05, 7.662177085876465e-05, 0.00016987323760986328, 0.0002631247043609619, 0.00035637617111206055, 0.0004496276378631592, 0.0005428791046142578, 0.0006361305713653564, 0.0007293820381164551, 0.0008226335048675537, 0.0009158849716186523, 0.001009136438369751, 0.0011023879051208496, 0.0011956393718719482, 0.0012888908386230469, 0.0013821423053741455, 0.0014753937721252441, 0.0015686452388763428, 0.0016618967056274414, 0.00175514817237854, 0.0018483996391296387, 0.0019416511058807373, 0.002034902572631836, 0.0021281540393829346, 0.002221405506134033, 0.002314656972885132, 0.0024079084396362305, 0.002501159906387329, 0.0025944113731384277, 0.0026876628398895264, 0.002780914306640625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 5.0, 2.0, 8.0, 9.0, 5.0, 21.0, 17.0, 26.0, 38.0, 47.0, 44.0, 84.0, 113.0, 177.0, 385.0, 1128.0, 823255.0, 221347.0, 897.0, 345.0, 167.0, 122.0, 70.0, 56.0, 50.0, 28.0, 16.0, 19.0, 18.0, 18.0, 12.0, 5.0, 4.0, 5.0, 2.0, 2.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06488037109375, -0.06278228759765625, -0.0606842041015625, -0.05858612060546875, -0.056488037109375, -0.05438995361328125, -0.0522918701171875, -0.05019378662109375, -0.048095703125, -0.04599761962890625, -0.0438995361328125, -0.04180145263671875, -0.039703369140625, -0.03760528564453125, -0.0355072021484375, -0.03340911865234375, -0.03131103515625, -0.02921295166015625, -0.0271148681640625, -0.02501678466796875, -0.022918701171875, -0.02082061767578125, -0.0187225341796875, -0.01662445068359375, -0.0145263671875, -0.01242828369140625, -0.0103302001953125, -0.00823211669921875, -0.006134033203125, -0.00403594970703125, -0.0019378662109375, 0.00016021728515625, 0.00225830078125, 0.00435638427734375, 0.0064544677734375, 0.00855255126953125, 0.010650634765625, 0.01274871826171875, 0.0148468017578125, 0.01694488525390625, 0.01904296875, 0.02114105224609375, 0.0232391357421875, 0.02533721923828125, 0.027435302734375, 0.02953338623046875, 0.0316314697265625, 0.03372955322265625, 0.03582763671875, 0.03792572021484375, 0.0400238037109375, 0.04212188720703125, 0.044219970703125, 0.04631805419921875, 0.0484161376953125, 0.05051422119140625, 0.0526123046875, 0.05471038818359375, 0.0568084716796875, 0.05890655517578125, 0.061004638671875, 0.06310272216796875, 0.0652008056640625, 0.06729888916015625, 0.06939697265625]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 99.0, 454.0, 358.0, 76.0, 15.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0074713705107569695, -0.007284095976501703, -0.007096821442246437, -0.006909547373652458, -0.006722272839397192, -0.006534998305141926, -0.006347724236547947, -0.006160449702292681, -0.0059731751680374146, -0.005785900633782148, -0.005598626099526882, -0.005411352030932903, -0.005224077496677637, -0.005036802962422371, -0.004849528893828392, -0.004662254359573126, -0.00447497982531786, -0.0042877052910625935, -0.004100430756807327, -0.003913156688213348, -0.003725882153958082, -0.003538607619702816, -0.0033513333182781935, -0.003164059016853571, -0.0029767844825983047, -0.0027895099483430386, -0.002602235646918416, -0.0024149613454937935, -0.0022276868112385273, -0.002040412276983261, -0.0018531379755586386, -0.0016658635577186942, -0.0014785896055400372, -0.0012913151877000928, -0.0011040407698601484, -0.0009167663520202041, -0.0007294919341802597, -0.0005422175163403153, -0.000354943098500371, -0.00016766868066042662, 1.9605737179517746e-05, 0.0002068801550194621, 0.00039415457285940647, 0.0005814289906993508, 0.0007687034085392952, 0.0009559778263792396, 0.001143252244219184, 0.0013305266620591283, 0.0015178010798990726, 0.001705075497739017, 0.0018923499155789614, 0.002079624217003584, 0.00226689875125885, 0.0024541732855141163, 0.002641447586938739, 0.0028287218883633614, 0.0030159964226186275, 0.0032032709568738937, 0.0033905452582985163, 0.003577819559723139, 0.003765094093978405, 0.003952368628233671, 0.004139643162488937, 0.004326917231082916, 0.0045141917653381824]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 3.0, 3.0, 7.0, 14.0, 8.0, 6.0, 16.0, 18.0, 22.0, 16.0, 19.0, 31.0, 35.0, 29.0, 30.0, 34.0, 36.0, 34.0, 35.0, 45.0, 34.0, 37.0, 41.0, 38.0, 35.0, 34.0, 30.0, 22.0, 21.0, 22.0, 36.0, 28.0, 24.0, 18.0, 17.0, 15.0, 15.0, 11.0, 21.0, 6.0, 13.0, 8.0, 8.0, 5.0, 1.0, 5.0, 3.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0012064576148986816, -0.0011669304221868515, -0.0011274032294750214, -0.0010878760367631912, -0.001048348844051361, -0.001008821651339531, -0.0009692944586277008, -0.0009297672659158707, -0.0008902400732040405, -0.0008507128804922104, -0.0008111856877803802, -0.0007716584950685501, -0.00073213130235672, -0.0006926041096448898, -0.0006530769169330597, -0.0006135497242212296, -0.0005740225315093994, -0.0005344953387975693, -0.0004949681460857391, -0.000455440953373909, -0.00041591376066207886, -0.0003763865679502487, -0.0003368593752384186, -0.00029733218252658844, -0.0002578049898147583, -0.00021827779710292816, -0.00017875060439109802, -0.00013922341167926788, -9.969621896743774e-05, -6.0169026255607605e-05, -2.0641833543777466e-05, 1.8885359168052673e-05, 5.841255187988281e-05, 9.793974459171295e-05, 0.0001374669373035431, 0.00017699413001537323, 0.00021652132272720337, 0.0002560485154390335, 0.00029557570815086365, 0.0003351029008626938, 0.0003746300935745239, 0.00041415728628635406, 0.0004536844789981842, 0.0004932116717100143, 0.0005327388644218445, 0.0005722660571336746, 0.0006117932498455048, 0.0006513204425573349, 0.000690847635269165, 0.0007303748279809952, 0.0007699020206928253, 0.0008094292134046555, 0.0008489564061164856, 0.0008884835988283157, 0.0009280107915401459, 0.000967537984251976, 0.0010070651769638062, 0.0010465923696756363, 0.0010861195623874664, 0.0011256467550992966, 0.0011651739478111267, 0.0012047011405229568, 0.001244228333234787, 0.0012837555259466171, 0.0013232827186584473]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 3.0, 6.0, 7.0, 7.0, 5.0, 10.0, 4.0, 8.0, 16.0, 18.0, 18.0, 28.0, 26.0, 17.0, 23.0, 23.0, 31.0, 31.0, 36.0, 36.0, 28.0, 45.0, 38.0, 33.0, 32.0, 43.0, 27.0, 42.0, 30.0, 31.0, 20.0, 25.0, 29.0, 20.0, 27.0, 22.0, 11.0, 16.0, 13.0, 21.0, 10.0, 13.0, 9.0, 11.0, 8.0, 15.0, 4.0, 12.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0], "bins": [-8.265625, -8.0174560546875, -7.769287109375, -7.5211181640625, -7.27294921875, -7.0247802734375, -6.776611328125, -6.5284423828125, -6.2802734375, -6.0321044921875, -5.783935546875, -5.5357666015625, -5.28759765625, -5.0394287109375, -4.791259765625, -4.5430908203125, -4.294921875, -4.0467529296875, -3.798583984375, -3.5504150390625, -3.30224609375, -3.0540771484375, -2.805908203125, -2.5577392578125, -2.3095703125, -2.0614013671875, -1.813232421875, -1.5650634765625, -1.31689453125, -1.0687255859375, -0.820556640625, -0.5723876953125, -0.32421875, -0.0760498046875, 0.172119140625, 0.4202880859375, 0.66845703125, 0.9166259765625, 1.164794921875, 1.4129638671875, 1.6611328125, 1.9093017578125, 2.157470703125, 2.4056396484375, 2.65380859375, 2.9019775390625, 3.150146484375, 3.3983154296875, 3.646484375, 3.8946533203125, 4.142822265625, 4.3909912109375, 4.63916015625, 4.8873291015625, 5.135498046875, 5.3836669921875, 5.6318359375, 5.8800048828125, 6.128173828125, 6.3763427734375, 6.62451171875, 6.8726806640625, 7.120849609375, 7.3690185546875, 7.6171875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 5.0, 8.0, 6.0, 7.0, 12.0, 5.0, 13.0, 19.0, 33.0, 38.0, 45.0, 53.0, 69.0, 81.0, 130.0, 131.0, 216.0, 262.0, 465.0, 1071.0, 3749.0, 20867.0, 173732.0, 719681.0, 108448.0, 14260.0, 2757.0, 860.0, 413.0, 262.0, 212.0, 142.0, 111.0, 83.0, 62.0, 41.0, 34.0, 29.0, 24.0, 18.0, 15.0, 11.0, 14.0, 7.0, 17.0, 4.0, 14.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0], "bins": [-16.421875, -15.93017578125, -15.4384765625, -14.94677734375, -14.455078125, -13.96337890625, -13.4716796875, -12.97998046875, -12.48828125, -11.99658203125, -11.5048828125, -11.01318359375, -10.521484375, -10.02978515625, -9.5380859375, -9.04638671875, -8.5546875, -8.06298828125, -7.5712890625, -7.07958984375, -6.587890625, -6.09619140625, -5.6044921875, -5.11279296875, -4.62109375, -4.12939453125, -3.6376953125, -3.14599609375, -2.654296875, -2.16259765625, -1.6708984375, -1.17919921875, -0.6875, -0.19580078125, 0.2958984375, 0.78759765625, 1.279296875, 1.77099609375, 2.2626953125, 2.75439453125, 3.24609375, 3.73779296875, 4.2294921875, 4.72119140625, 5.212890625, 5.70458984375, 6.1962890625, 6.68798828125, 7.1796875, 7.67138671875, 8.1630859375, 8.65478515625, 9.146484375, 9.63818359375, 10.1298828125, 10.62158203125, 11.11328125, 11.60498046875, 12.0966796875, 12.58837890625, 13.080078125, 13.57177734375, 14.0634765625, 14.55517578125, 15.046875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 7.0, 14.0, 7.0, 12.0, 12.0, 17.0, 19.0, 28.0, 30.0, 34.0, 50.0, 44.0, 40.0, 50.0, 61.0, 104.0, 495.0, 1482.0, 108.0, 67.0, 47.0, 55.0, 37.0, 35.0, 26.0, 29.0, 24.0, 23.0, 15.0, 18.0, 12.0, 3.0, 9.0, 6.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.09375, -31.05859375, -30.0234375, -28.98828125, -27.953125, -26.91796875, -25.8828125, -24.84765625, -23.8125, -22.77734375, -21.7421875, -20.70703125, -19.671875, -18.63671875, -17.6015625, -16.56640625, -15.53125, -14.49609375, -13.4609375, -12.42578125, -11.390625, -10.35546875, -9.3203125, -8.28515625, -7.25, -6.21484375, -5.1796875, -4.14453125, -3.109375, -2.07421875, -1.0390625, -0.00390625, 1.03125, 2.06640625, 3.1015625, 4.13671875, 5.171875, 6.20703125, 7.2421875, 8.27734375, 9.3125, 10.34765625, 11.3828125, 12.41796875, 13.453125, 14.48828125, 15.5234375, 16.55859375, 17.59375, 18.62890625, 19.6640625, 20.69921875, 21.734375, 22.76953125, 23.8046875, 24.83984375, 25.875, 26.91015625, 27.9453125, 28.98046875, 30.015625, 31.05078125, 32.0859375, 33.12109375, 34.15625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 8.0, 5.0, 8.0, 7.0, 9.0, 18.0, 16.0, 23.0, 35.0, 37.0, 46.0, 49.0, 95.0, 139.0, 227.0, 504.0, 2042.0, 595453.0, 2543059.0, 2563.0, 543.0, 237.0, 142.0, 117.0, 73.0, 62.0, 46.0, 26.0, 22.0, 11.0, 17.0, 14.0, 14.0, 9.0, 7.0, 5.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-79.6875, -77.2763671875, -74.865234375, -72.4541015625, -70.04296875, -67.6318359375, -65.220703125, -62.8095703125, -60.3984375, -57.9873046875, -55.576171875, -53.1650390625, -50.75390625, -48.3427734375, -45.931640625, -43.5205078125, -41.109375, -38.6982421875, -36.287109375, -33.8759765625, -31.46484375, -29.0537109375, -26.642578125, -24.2314453125, -21.8203125, -19.4091796875, -16.998046875, -14.5869140625, -12.17578125, -9.7646484375, -7.353515625, -4.9423828125, -2.53125, -0.1201171875, 2.291015625, 4.7021484375, 7.11328125, 9.5244140625, 11.935546875, 14.3466796875, 16.7578125, 19.1689453125, 21.580078125, 23.9912109375, 26.40234375, 28.8134765625, 31.224609375, 33.6357421875, 36.046875, 38.4580078125, 40.869140625, 43.2802734375, 45.69140625, 48.1025390625, 50.513671875, 52.9248046875, 55.3359375, 57.7470703125, 60.158203125, 62.5693359375, 64.98046875, 67.3916015625, 69.802734375, 72.2138671875, 74.625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 16.0, 51.0, 159.0, 276.0, 302.0, 146.0, 46.0, 15.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.62635803222656, -73.73023986816406, -71.83411407470703, -69.93798828125, -68.0418701171875, -66.145751953125, -64.24962615966797, -62.3535041809082, -60.45738220214844, -58.56126022338867, -56.665138244628906, -54.76901626586914, -52.872894287109375, -50.97677230834961, -49.080650329589844, -47.18452835083008, -45.28840637207031, -43.39228439331055, -41.49616241455078, -39.600040435791016, -37.70391845703125, -35.807796478271484, -33.91167449951172, -32.01555252075195, -30.119430541992188, -28.223308563232422, -26.327186584472656, -24.43106460571289, -22.534942626953125, -20.63882064819336, -18.742698669433594, -16.846576690673828, -14.950458526611328, -13.054336547851562, -11.158214569091797, -9.262092590332031, -7.365970611572266, -5.4698486328125, -3.5737266540527344, -1.6776046752929688, 0.21851730346679688, 2.1146392822265625, 4.010761260986328, 5.906883239746094, 7.803005218505859, 9.699127197265625, 11.59524917602539, 13.491371154785156, 15.387493133544922, 17.283615112304688, 19.179737091064453, 21.07585906982422, 22.971981048583984, 24.86810302734375, 26.764225006103516, 28.66034698486328, 30.556468963623047, 32.45259094238281, 34.34871292114258, 36.244834899902344, 38.14095687866211, 40.037078857421875, 41.93320083618164, 43.829322814941406, 45.72544479370117]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 5.0, 5.0, 10.0, 9.0, 10.0, 12.0, 17.0, 16.0, 11.0, 13.0, 17.0, 25.0, 27.0, 23.0, 36.0, 46.0, 45.0, 44.0, 35.0, 40.0, 43.0, 52.0, 38.0, 39.0, 43.0, 45.0, 33.0, 33.0, 40.0, 31.0, 32.0, 25.0, 14.0, 13.0, 18.0, 13.0, 10.0, 10.0, 6.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0], "bins": [-91.76187896728516, -89.16018676757812, -86.5584945678711, -83.95680236816406, -81.35511016845703, -78.75341796875, -76.15172576904297, -73.55003356933594, -70.94833374023438, -68.34664154052734, -65.74494934082031, -63.14325714111328, -60.54156494140625, -57.93987274169922, -55.33817672729492, -52.73648452758789, -50.134796142578125, -47.533103942871094, -44.93141174316406, -42.32971954345703, -39.72802734375, -37.12633514404297, -34.52463912963867, -31.92294692993164, -29.32125473022461, -26.719562530517578, -24.117870330810547, -21.516176223754883, -18.91448402404785, -16.31279182434082, -13.711098670959473, -11.109405517578125, -8.507720947265625, -5.9060282707214355, -3.304335594177246, -0.7026429176330566, 1.8990497589111328, 4.500741958618164, 7.102435111999512, 9.70412826538086, 12.30582046508789, 14.907512664794922, 17.509204864501953, 20.110898971557617, 22.71259117126465, 25.31428337097168, 27.915977478027344, 30.517669677734375, 33.119361877441406, 35.72105407714844, 38.32274627685547, 40.9244384765625, 43.52613067626953, 46.12782287597656, 48.72951889038086, 51.33121109008789, 53.93290328979492, 56.53459548950195, 59.136287689208984, 61.737979888916016, 64.33967590332031, 66.94136810302734, 69.54306030273438, 72.1447525024414, 74.74644470214844]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 6.0, 8.0, 6.0, 8.0, 15.0, 17.0, 18.0, 19.0, 21.0, 25.0, 19.0, 32.0, 45.0, 36.0, 31.0, 37.0, 46.0, 46.0, 44.0, 49.0, 37.0, 40.0, 28.0, 34.0, 40.0, 27.0, 30.0, 25.0, 27.0, 18.0, 20.0, 16.0, 17.0, 18.0, 13.0, 13.0, 14.0, 8.0, 19.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.265625, -8.97216796875, -8.6787109375, -8.38525390625, -8.091796875, -7.79833984375, -7.5048828125, -7.21142578125, -6.91796875, -6.62451171875, -6.3310546875, -6.03759765625, -5.744140625, -5.45068359375, -5.1572265625, -4.86376953125, -4.5703125, -4.27685546875, -3.9833984375, -3.68994140625, -3.396484375, -3.10302734375, -2.8095703125, -2.51611328125, -2.22265625, -1.92919921875, -1.6357421875, -1.34228515625, -1.048828125, -0.75537109375, -0.4619140625, -0.16845703125, 0.125, 0.41845703125, 0.7119140625, 1.00537109375, 1.298828125, 1.59228515625, 1.8857421875, 2.17919921875, 2.47265625, 2.76611328125, 3.0595703125, 3.35302734375, 3.646484375, 3.93994140625, 4.2333984375, 4.52685546875, 4.8203125, 5.11376953125, 5.4072265625, 5.70068359375, 5.994140625, 6.28759765625, 6.5810546875, 6.87451171875, 7.16796875, 7.46142578125, 7.7548828125, 8.04833984375, 8.341796875, 8.63525390625, 8.9287109375, 9.22216796875, 9.515625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 10.0, 5.0, 4.0, 13.0, 4.0, 10.0, 9.0, 10.0, 20.0, 22.0, 21.0, 24.0, 36.0, 38.0, 54.0, 115.0, 193.0, 336.0, 711.0, 1930.0, 6430.0, 35634.0, 726897.0, 3054176.0, 338379.0, 21965.0, 4446.0, 1435.0, 577.0, 262.0, 135.0, 77.0, 61.0, 41.0, 33.0, 26.0, 21.0, 15.0, 20.0, 13.0, 13.0, 11.0, 13.0, 15.0, 9.0, 0.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.328125, -23.576904296875, -22.82568359375, -22.074462890625, -21.3232421875, -20.572021484375, -19.82080078125, -19.069580078125, -18.318359375, -17.567138671875, -16.81591796875, -16.064697265625, -15.3134765625, -14.562255859375, -13.81103515625, -13.059814453125, -12.30859375, -11.557373046875, -10.80615234375, -10.054931640625, -9.3037109375, -8.552490234375, -7.80126953125, -7.050048828125, -6.298828125, -5.547607421875, -4.79638671875, -4.045166015625, -3.2939453125, -2.542724609375, -1.79150390625, -1.040283203125, -0.2890625, 0.462158203125, 1.21337890625, 1.964599609375, 2.7158203125, 3.467041015625, 4.21826171875, 4.969482421875, 5.720703125, 6.471923828125, 7.22314453125, 7.974365234375, 8.7255859375, 9.476806640625, 10.22802734375, 10.979248046875, 11.73046875, 12.481689453125, 13.23291015625, 13.984130859375, 14.7353515625, 15.486572265625, 16.23779296875, 16.989013671875, 17.740234375, 18.491455078125, 19.24267578125, 19.993896484375, 20.7451171875, 21.496337890625, 22.24755859375, 22.998779296875, 23.75]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 8.0, 7.0, 20.0, 22.0, 18.0, 36.0, 52.0, 86.0, 96.0, 166.0, 213.0, 255.0, 440.0, 574.0, 591.0, 457.0, 336.0, 239.0, 137.0, 90.0, 66.0, 44.0, 33.0, 22.0, 23.0, 9.0, 5.0, 7.0, 4.0, 8.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.15625, -18.593505859375, -18.03076171875, -17.468017578125, -16.9052734375, -16.342529296875, -15.77978515625, -15.217041015625, -14.654296875, -14.091552734375, -13.52880859375, -12.966064453125, -12.4033203125, -11.840576171875, -11.27783203125, -10.715087890625, -10.15234375, -9.589599609375, -9.02685546875, -8.464111328125, -7.9013671875, -7.338623046875, -6.77587890625, -6.213134765625, -5.650390625, -5.087646484375, -4.52490234375, -3.962158203125, -3.3994140625, -2.836669921875, -2.27392578125, -1.711181640625, -1.1484375, -0.585693359375, -0.02294921875, 0.539794921875, 1.1025390625, 1.665283203125, 2.22802734375, 2.790771484375, 3.353515625, 3.916259765625, 4.47900390625, 5.041748046875, 5.6044921875, 6.167236328125, 6.72998046875, 7.292724609375, 7.85546875, 8.418212890625, 8.98095703125, 9.543701171875, 10.1064453125, 10.669189453125, 11.23193359375, 11.794677734375, 12.357421875, 12.920166015625, 13.48291015625, 14.045654296875, 14.6083984375, 15.171142578125, 15.73388671875, 16.296630859375, 16.859375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 7.0, 7.0, 8.0, 3.0, 9.0, 18.0, 11.0, 28.0, 35.0, 42.0, 59.0, 78.0, 85.0, 112.0, 149.0, 264.0, 450.0, 1371.0, 8341.0, 257012.0, 3866813.0, 53539.0, 3857.0, 774.0, 340.0, 210.0, 135.0, 109.0, 84.0, 69.0, 50.0, 38.0, 35.0, 35.0, 23.0, 22.0, 10.0, 8.0, 15.0, 6.0, 9.0, 4.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.3125, -51.494140625, -49.67578125, -47.857421875, -46.0390625, -44.220703125, -42.40234375, -40.583984375, -38.765625, -36.947265625, -35.12890625, -33.310546875, -31.4921875, -29.673828125, -27.85546875, -26.037109375, -24.21875, -22.400390625, -20.58203125, -18.763671875, -16.9453125, -15.126953125, -13.30859375, -11.490234375, -9.671875, -7.853515625, -6.03515625, -4.216796875, -2.3984375, -0.580078125, 1.23828125, 3.056640625, 4.875, 6.693359375, 8.51171875, 10.330078125, 12.1484375, 13.966796875, 15.78515625, 17.603515625, 19.421875, 21.240234375, 23.05859375, 24.876953125, 26.6953125, 28.513671875, 30.33203125, 32.150390625, 33.96875, 35.787109375, 37.60546875, 39.423828125, 41.2421875, 43.060546875, 44.87890625, 46.697265625, 48.515625, 50.333984375, 52.15234375, 53.970703125, 55.7890625, 57.607421875, 59.42578125, 61.244140625, 63.0625]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 76.0, 577.0, 330.0, 29.0, 4.0, 2.0], "bins": [-610.7935180664062, -600.5831298828125, -590.3727416992188, -580.162353515625, -569.951904296875, -559.7415161132812, -549.5311279296875, -539.3207397460938, -529.1103515625, -518.8999633789062, -508.6895446777344, -498.4791564941406, -488.2687683105469, -478.0583801269531, -467.84796142578125, -457.6375732421875, -447.42718505859375, -437.216796875, -427.0063781738281, -416.7959899902344, -406.5856018066406, -396.3752136230469, -386.164794921875, -375.95440673828125, -365.7439880371094, -355.5335998535156, -345.32318115234375, -335.11279296875, -324.90240478515625, -314.6920166015625, -304.4815979003906, -294.2712097167969, -284.06085205078125, -273.8504638671875, -263.6400451660156, -253.42965698242188, -243.21926879882812, -233.0088653564453, -222.7984619140625, -212.58807373046875, -202.37767028808594, -192.16726684570312, -181.95687866210938, -171.74647521972656, -161.5360870361328, -151.32568359375, -141.11529541015625, -130.90489196777344, -120.69449615478516, -110.48410034179688, -100.2737045288086, -90.06330871582031, -79.8529052734375, -69.64251708984375, -59.43211364746094, -49.221717834472656, -39.011322021484375, -28.800926208496094, -18.59052848815918, -8.380130767822266, 1.8302650451660156, 12.040660858154297, 22.251060485839844, 32.461456298828125, 42.671852111816406]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 5.0, 3.0, 1.0, 5.0, 6.0, 4.0, 7.0, 7.0, 7.0, 10.0, 14.0, 8.0, 17.0, 29.0, 24.0, 26.0, 24.0, 31.0, 34.0, 31.0, 36.0, 52.0, 38.0, 46.0, 44.0, 52.0, 40.0, 32.0, 46.0, 30.0, 35.0, 22.0, 33.0, 25.0, 34.0, 25.0, 29.0, 20.0, 19.0, 14.0, 15.0, 9.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-44.81871032714844, -43.24138641357422, -41.6640625, -40.08673858642578, -38.50941467285156, -36.932090759277344, -35.354766845703125, -33.777442932128906, -32.20011901855469, -30.62279510498047, -29.04547119140625, -27.46814727783203, -25.890823364257812, -24.313499450683594, -22.736173629760742, -21.158849716186523, -19.581523895263672, -18.004199981689453, -16.426876068115234, -14.8495512008667, -13.27222728729248, -11.694903373718262, -10.117578506469727, -8.540254592895508, -6.962930679321289, -5.38560676574707, -3.8082823753356934, -2.2309579849243164, -0.6536340713500977, 0.9236898422241211, 2.5010147094726562, 4.078338623046875, 5.655662536621094, 7.2329864501953125, 8.810310363769531, 10.387635231018066, 11.964959144592285, 13.542283058166504, 15.119607925415039, 16.696931838989258, 18.274255752563477, 19.851579666137695, 21.428903579711914, 23.006229400634766, 24.583553314208984, 26.160877227783203, 27.738201141357422, 29.31552505493164, 30.89284896850586, 32.47017288208008, 34.0474967956543, 35.624820709228516, 37.202144622802734, 38.77946853637695, 40.35679626464844, 41.934120178222656, 43.511444091796875, 45.088768005371094, 46.66609191894531, 48.24341583251953, 49.82073974609375, 51.39806365966797, 52.97538757324219, 54.552711486816406, 56.130035400390625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 6.0, 1.0, 4.0, 7.0, 8.0, 10.0, 12.0, 4.0, 14.0, 16.0, 16.0, 17.0, 26.0, 34.0, 22.0, 38.0, 32.0, 33.0, 41.0, 33.0, 36.0, 35.0, 44.0, 30.0, 41.0, 43.0, 53.0, 37.0, 32.0, 36.0, 24.0, 26.0, 19.0, 31.0, 24.0, 22.0, 18.0, 11.0, 13.0, 10.0, 11.0, 10.0, 8.0, 5.0, 7.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.844482421875, -7.54833984375, -7.252197265625, -6.9560546875, -6.659912109375, -6.36376953125, -6.067626953125, -5.771484375, -5.475341796875, -5.17919921875, -4.883056640625, -4.5869140625, -4.290771484375, -3.99462890625, -3.698486328125, -3.40234375, -3.106201171875, -2.81005859375, -2.513916015625, -2.2177734375, -1.921630859375, -1.62548828125, -1.329345703125, -1.033203125, -0.737060546875, -0.44091796875, -0.144775390625, 0.1513671875, 0.447509765625, 0.74365234375, 1.039794921875, 1.3359375, 1.632080078125, 1.92822265625, 2.224365234375, 2.5205078125, 2.816650390625, 3.11279296875, 3.408935546875, 3.705078125, 4.001220703125, 4.29736328125, 4.593505859375, 4.8896484375, 5.185791015625, 5.48193359375, 5.778076171875, 6.07421875, 6.370361328125, 6.66650390625, 6.962646484375, 7.2587890625, 7.554931640625, 7.85107421875, 8.147216796875, 8.443359375, 8.739501953125, 9.03564453125, 9.331787109375, 9.6279296875, 9.924072265625, 10.22021484375, 10.516357421875, 10.8125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 10.0, 7.0, 12.0, 24.0, 27.0, 45.0, 64.0, 91.0, 135.0, 228.0, 338.0, 460.0, 711.0, 1047.0, 1626.0, 2473.0, 3692.0, 5787.0, 8791.0, 13717.0, 21027.0, 32548.0, 50874.0, 78703.0, 120221.0, 168069.0, 173407.0, 127925.0, 83494.0, 54136.0, 34849.0, 22410.0, 14516.0, 9310.0, 6148.0, 3813.0, 2601.0, 1667.0, 1206.0, 755.0, 461.0, 361.0, 252.0, 161.0, 109.0, 80.0, 66.0, 29.0, 31.0, 21.0, 11.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0], "bins": [-1.0087890625, -0.9782867431640625, -0.947784423828125, -0.9172821044921875, -0.88677978515625, -0.8562774658203125, -0.825775146484375, -0.7952728271484375, -0.7647705078125, -0.7342681884765625, -0.703765869140625, -0.6732635498046875, -0.64276123046875, -0.6122589111328125, -0.581756591796875, -0.5512542724609375, -0.520751953125, -0.4902496337890625, -0.459747314453125, -0.4292449951171875, -0.39874267578125, -0.3682403564453125, -0.337738037109375, -0.3072357177734375, -0.2767333984375, -0.2462310791015625, -0.215728759765625, -0.1852264404296875, -0.15472412109375, -0.1242218017578125, -0.093719482421875, -0.0632171630859375, -0.03271484375, -0.0022125244140625, 0.028289794921875, 0.0587921142578125, 0.08929443359375, 0.1197967529296875, 0.150299072265625, 0.1808013916015625, 0.2113037109375, 0.2418060302734375, 0.272308349609375, 0.3028106689453125, 0.33331298828125, 0.3638153076171875, 0.394317626953125, 0.4248199462890625, 0.455322265625, 0.4858245849609375, 0.516326904296875, 0.5468292236328125, 0.57733154296875, 0.6078338623046875, 0.638336181640625, 0.6688385009765625, 0.6993408203125, 0.7298431396484375, 0.760345458984375, 0.7908477783203125, 0.82135009765625, 0.8518524169921875, 0.882354736328125, 0.9128570556640625, 0.943359375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 5.0, 11.0, 8.0, 12.0, 10.0, 9.0, 12.0, 14.0, 26.0, 23.0, 20.0, 35.0, 31.0, 33.0, 27.0, 38.0, 37.0, 39.0, 43.0, 37.0, 1066.0, 44.0, 49.0, 35.0, 39.0, 34.0, 41.0, 20.0, 18.0, 17.0, 35.0, 26.0, 15.0, 21.0, 11.0, 15.0, 14.0, 13.0, 5.0, 10.0, 6.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-6.0546875, -5.87408447265625, -5.6934814453125, -5.51287841796875, -5.332275390625, -5.15167236328125, -4.9710693359375, -4.79046630859375, -4.60986328125, -4.42926025390625, -4.2486572265625, -4.06805419921875, -3.887451171875, -3.70684814453125, -3.5262451171875, -3.34564208984375, -3.1650390625, -2.98443603515625, -2.8038330078125, -2.62322998046875, -2.442626953125, -2.26202392578125, -2.0814208984375, -1.90081787109375, -1.72021484375, -1.53961181640625, -1.3590087890625, -1.17840576171875, -0.997802734375, -0.81719970703125, -0.6365966796875, -0.45599365234375, -0.275390625, -0.09478759765625, 0.0858154296875, 0.26641845703125, 0.447021484375, 0.62762451171875, 0.8082275390625, 0.98883056640625, 1.16943359375, 1.35003662109375, 1.5306396484375, 1.71124267578125, 1.891845703125, 2.07244873046875, 2.2530517578125, 2.43365478515625, 2.6142578125, 2.79486083984375, 2.9754638671875, 3.15606689453125, 3.336669921875, 3.51727294921875, 3.6978759765625, 3.87847900390625, 4.05908203125, 4.23968505859375, 4.4202880859375, 4.60089111328125, 4.781494140625, 4.96209716796875, 5.1427001953125, 5.32330322265625, 5.50390625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 9.0, 22.0, 23.0, 43.0, 46.0, 74.0, 118.0, 163.0, 294.0, 426.0, 625.0, 956.0, 1433.0, 2258.0, 3442.0, 5619.0, 8137.0, 12948.0, 19374.0, 30075.0, 47462.0, 75948.0, 121207.0, 178579.0, 1228821.0, 131280.0, 82436.0, 51496.0, 32769.0, 21301.0, 13672.0, 9109.0, 5890.0, 3885.0, 2537.0, 1598.0, 1093.0, 703.0, 446.0, 307.0, 187.0, 113.0, 67.0, 54.0, 30.0, 24.0, 15.0, 8.0, 5.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.89794921875, -0.8690643310546875, -0.840179443359375, -0.8112945556640625, -0.78240966796875, -0.7535247802734375, -0.724639892578125, -0.6957550048828125, -0.6668701171875, -0.6379852294921875, -0.609100341796875, -0.5802154541015625, -0.55133056640625, -0.5224456787109375, -0.493560791015625, -0.4646759033203125, -0.435791015625, -0.4069061279296875, -0.378021240234375, -0.3491363525390625, -0.32025146484375, -0.2913665771484375, -0.262481689453125, -0.2335968017578125, -0.2047119140625, -0.1758270263671875, -0.146942138671875, -0.1180572509765625, -0.08917236328125, -0.0602874755859375, -0.031402587890625, -0.0025177001953125, 0.0263671875, 0.0552520751953125, 0.084136962890625, 0.1130218505859375, 0.14190673828125, 0.1707916259765625, 0.199676513671875, 0.2285614013671875, 0.2574462890625, 0.2863311767578125, 0.315216064453125, 0.3441009521484375, 0.37298583984375, 0.4018707275390625, 0.430755615234375, 0.4596405029296875, 0.488525390625, 0.5174102783203125, 0.546295166015625, 0.5751800537109375, 0.60406494140625, 0.6329498291015625, 0.661834716796875, 0.6907196044921875, 0.7196044921875, 0.7484893798828125, 0.777374267578125, 0.8062591552734375, 0.83514404296875, 0.8640289306640625, 0.892913818359375, 0.9217987060546875, 0.95068359375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 8.0, 4.0, 6.0, 5.0, 15.0, 10.0, 12.0, 22.0, 19.0, 18.0, 30.0, 37.0, 41.0, 49.0, 46.0, 53.0, 55.0, 61.0, 67.0, 50.0, 55.0, 58.0, 42.0, 31.0, 30.0, 24.0, 29.0, 19.0, 18.0, 22.0, 14.0, 9.0, 10.0, 4.0, 6.0, 4.0, 4.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0027790069580078125, -0.0027035772800445557, -0.002628147602081299, -0.002552717924118042, -0.002477288246154785, -0.0024018585681915283, -0.0023264288902282715, -0.0022509992122650146, -0.002175569534301758, -0.002100139856338501, -0.002024710178375244, -0.0019492805004119873, -0.0018738508224487305, -0.0017984211444854736, -0.0017229914665222168, -0.00164756178855896, -0.0015721321105957031, -0.0014967024326324463, -0.0014212727546691895, -0.0013458430767059326, -0.0012704133987426758, -0.001194983720779419, -0.0011195540428161621, -0.0010441243648529053, -0.0009686946868896484, -0.0008932650089263916, -0.0008178353309631348, -0.0007424056529998779, -0.0006669759750366211, -0.0005915462970733643, -0.0005161166191101074, -0.0004406869411468506, -0.00036525726318359375, -0.0002898275852203369, -0.00021439790725708008, -0.00013896822929382324, -6.35385513305664e-05, 1.189112663269043e-05, 8.732080459594727e-05, 0.0001627504825592041, 0.00023818016052246094, 0.0003136098384857178, 0.0003890395164489746, 0.00046446919441223145, 0.0005398988723754883, 0.0006153285503387451, 0.000690758228302002, 0.0007661879062652588, 0.0008416175842285156, 0.0009170472621917725, 0.0009924769401550293, 0.0010679066181182861, 0.001143336296081543, 0.0012187659740447998, 0.0012941956520080566, 0.0013696253299713135, 0.0014450550079345703, 0.0015204846858978271, 0.001595914363861084, 0.0016713440418243408, 0.0017467737197875977, 0.0018222033977508545, 0.0018976330757141113, 0.001973062753677368, 0.002048492431640625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 5.0, 8.0, 12.0, 9.0, 11.0, 25.0, 34.0, 32.0, 38.0, 46.0, 64.0, 67.0, 102.0, 171.0, 303.0, 707.0, 5342.0, 1033843.0, 6060.0, 703.0, 303.0, 184.0, 108.0, 75.0, 77.0, 39.0, 34.0, 32.0, 15.0, 25.0, 21.0, 7.0, 9.0, 4.0, 4.0, 7.0, 6.0, 3.0, 7.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0435791015625, -0.04193544387817383, -0.040291786193847656, -0.038648128509521484, -0.03700447082519531, -0.03536081314086914, -0.03371715545654297, -0.0320734977722168, -0.030429840087890625, -0.028786182403564453, -0.02714252471923828, -0.02549886703491211, -0.023855209350585938, -0.022211551666259766, -0.020567893981933594, -0.018924236297607422, -0.01728057861328125, -0.015636920928955078, -0.013993263244628906, -0.012349605560302734, -0.010705947875976562, -0.00906229019165039, -0.007418632507324219, -0.005774974822998047, -0.004131317138671875, -0.002487659454345703, -0.0008440017700195312, 0.0007996559143066406, 0.0024433135986328125, 0.004086971282958984, 0.005730628967285156, 0.007374286651611328, 0.0090179443359375, 0.010661602020263672, 0.012305259704589844, 0.013948917388916016, 0.015592575073242188, 0.01723623275756836, 0.01887989044189453, 0.020523548126220703, 0.022167205810546875, 0.023810863494873047, 0.02545452117919922, 0.02709817886352539, 0.028741836547851562, 0.030385494232177734, 0.032029151916503906, 0.03367280960083008, 0.03531646728515625, 0.03696012496948242, 0.038603782653808594, 0.040247440338134766, 0.04189109802246094, 0.04353475570678711, 0.04517841339111328, 0.04682207107543945, 0.048465728759765625, 0.0501093864440918, 0.05175304412841797, 0.05339670181274414, 0.05504035949707031, 0.056684017181396484, 0.058327674865722656, 0.05997133255004883, 0.061614990234375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 149.0, 855.0, 15.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021074225660413504, -0.0016216511139646173, -0.0011358796618878841, -0.0006501083262264729, -0.00016433687414973974, 0.00032143457792699337, 0.0008072059135884047, 0.0012929774820804596, 0.0017787488177418709, 0.002264520153403282, 0.002750291721895337, 0.0032360630575567484, 0.0037218346260488033, 0.004207605961710215, 0.004693377297371626, 0.0051791490986943245, 0.005664920434355736, 0.006150691770017147, 0.006636463105678558, 0.00712223444133997, 0.007608006242662668, 0.008093778043985367, 0.008579548448324203, 0.00906532071530819, 0.009551091119647026, 0.010036862455308437, 0.010522633790969849, 0.01100840512663126, 0.011494176462292671, 0.011979948729276657, 0.012465719133615494, 0.01295149140059948, 0.013437262736260891, 0.013923034071922302, 0.014408805407583714, 0.014894576743245125, 0.015380348078906536, 0.015866119414567947, 0.016351891681551933, 0.01683766208589077, 0.017323434352874756, 0.017809206619858742, 0.01829497702419758, 0.018780749291181564, 0.0192665196955204, 0.019752291962504387, 0.020238062366843224, 0.02072383463382721, 0.021209605038166046, 0.021695377305150032, 0.02218114770948887, 0.022666919976472855, 0.02315269038081169, 0.023638462647795677, 0.024124233052134514, 0.0246100053191185, 0.025095777586102486, 0.02558154985308647, 0.026067320257425308, 0.026553092524409294, 0.02703886292874813, 0.027524635195732117, 0.028010405600070953, 0.02849617786705494, 0.028981948271393776]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 9.0, 5.0, 9.0, 12.0, 16.0, 13.0, 23.0, 15.0, 35.0, 29.0, 32.0, 28.0, 41.0, 41.0, 38.0, 48.0, 39.0, 51.0, 43.0, 47.0, 42.0, 39.0, 40.0, 30.0, 32.0, 28.0, 36.0, 32.0, 21.0, 29.0, 15.0, 16.0, 14.0, 6.0, 11.0, 8.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0013304352760314941, -0.0012877611443400383, -0.0012450870126485825, -0.0012024128809571266, -0.0011597387492656708, -0.001117064617574215, -0.001074390485882759, -0.0010317163541913033, -0.0009890422224998474, -0.0009463680908083916, -0.0009036939591169357, -0.0008610198274254799, -0.000818345695734024, -0.0007756715640425682, -0.0007329974323511124, -0.0006903233006596565, -0.0006476491689682007, -0.0006049750372767448, -0.000562300905585289, -0.0005196267738938332, -0.0004769526422023773, -0.0004342785105109215, -0.00039160437881946564, -0.0003489302471280098, -0.00030625611543655396, -0.0002635819837450981, -0.00022090785205364227, -0.00017823372036218643, -0.0001355595886707306, -9.288545697927475e-05, -5.021132528781891e-05, -7.537193596363068e-06, 3.5136938095092773e-05, 7.781106978654861e-05, 0.00012048520147800446, 0.0001631593331694603, 0.00020583346486091614, 0.000248507596552372, 0.0002911817282438278, 0.00033385585993528366, 0.0003765299916267395, 0.00041920412331819534, 0.0004618782550096512, 0.000504552386701107, 0.0005472265183925629, 0.0005899006500840187, 0.0006325747817754745, 0.0006752489134669304, 0.0007179230451583862, 0.0007605971768498421, 0.0008032713085412979, 0.0008459454402327538, 0.0008886195719242096, 0.0009312937036156654, 0.0009739678353071213, 0.0010166419669985771, 0.001059316098690033, 0.0011019902303814888, 0.0011446643620729446, 0.0011873384937644005, 0.0012300126254558563, 0.0012726867571473122, 0.001315360888838768, 0.0013580350205302238, 0.0014007091522216797]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 6.0, 1.0, 4.0, 7.0, 8.0, 10.0, 12.0, 4.0, 14.0, 16.0, 16.0, 17.0, 26.0, 34.0, 22.0, 38.0, 32.0, 33.0, 41.0, 33.0, 36.0, 35.0, 44.0, 30.0, 41.0, 43.0, 53.0, 37.0, 32.0, 36.0, 24.0, 26.0, 19.0, 31.0, 24.0, 22.0, 18.0, 11.0, 13.0, 10.0, 11.0, 10.0, 8.0, 5.0, 7.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.844482421875, -7.54833984375, -7.252197265625, -6.9560546875, -6.659912109375, -6.36376953125, -6.067626953125, -5.771484375, -5.475341796875, -5.17919921875, -4.883056640625, -4.5869140625, -4.290771484375, -3.99462890625, -3.698486328125, -3.40234375, -3.106201171875, -2.81005859375, -2.513916015625, -2.2177734375, -1.921630859375, -1.62548828125, -1.329345703125, -1.033203125, -0.737060546875, -0.44091796875, -0.144775390625, 0.1513671875, 0.447509765625, 0.74365234375, 1.039794921875, 1.3359375, 1.632080078125, 1.92822265625, 2.224365234375, 2.5205078125, 2.816650390625, 3.11279296875, 3.408935546875, 3.705078125, 4.001220703125, 4.29736328125, 4.593505859375, 4.8896484375, 5.185791015625, 5.48193359375, 5.778076171875, 6.07421875, 6.370361328125, 6.66650390625, 6.962646484375, 7.2587890625, 7.554931640625, 7.85107421875, 8.147216796875, 8.443359375, 8.739501953125, 9.03564453125, 9.331787109375, 9.6279296875, 9.924072265625, 10.22021484375, 10.516357421875, 10.8125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 8.0, 13.0, 13.0, 17.0, 23.0, 21.0, 28.0, 35.0, 50.0, 71.0, 96.0, 147.0, 172.0, 251.0, 302.0, 439.0, 530.0, 805.0, 1744.0, 7713.0, 72975.0, 860184.0, 89043.0, 8852.0, 1867.0, 884.0, 553.0, 440.0, 286.0, 233.0, 179.0, 158.0, 95.0, 86.0, 47.0, 32.0, 35.0, 25.0, 19.0, 19.0, 13.0, 16.0, 8.0, 10.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.625, -19.8759765625, -19.126953125, -18.3779296875, -17.62890625, -16.8798828125, -16.130859375, -15.3818359375, -14.6328125, -13.8837890625, -13.134765625, -12.3857421875, -11.63671875, -10.8876953125, -10.138671875, -9.3896484375, -8.640625, -7.8916015625, -7.142578125, -6.3935546875, -5.64453125, -4.8955078125, -4.146484375, -3.3974609375, -2.6484375, -1.8994140625, -1.150390625, -0.4013671875, 0.34765625, 1.0966796875, 1.845703125, 2.5947265625, 3.34375, 4.0927734375, 4.841796875, 5.5908203125, 6.33984375, 7.0888671875, 7.837890625, 8.5869140625, 9.3359375, 10.0849609375, 10.833984375, 11.5830078125, 12.33203125, 13.0810546875, 13.830078125, 14.5791015625, 15.328125, 16.0771484375, 16.826171875, 17.5751953125, 18.32421875, 19.0732421875, 19.822265625, 20.5712890625, 21.3203125, 22.0693359375, 22.818359375, 23.5673828125, 24.31640625, 25.0654296875, 25.814453125, 26.5634765625, 27.3125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 5.0, 7.0, 8.0, 7.0, 6.0, 9.0, 7.0, 30.0, 30.0, 23.0, 35.0, 22.0, 25.0, 36.0, 38.0, 57.0, 50.0, 66.0, 278.0, 1714.0, 142.0, 58.0, 48.0, 49.0, 34.0, 43.0, 34.0, 30.0, 21.0, 22.0, 19.0, 17.0, 20.0, 12.0, 11.0, 8.0, 5.0, 2.0, 8.0, 2.0, 4.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.65625, -31.731201171875, -30.80615234375, -29.881103515625, -28.9560546875, -28.031005859375, -27.10595703125, -26.180908203125, -25.255859375, -24.330810546875, -23.40576171875, -22.480712890625, -21.5556640625, -20.630615234375, -19.70556640625, -18.780517578125, -17.85546875, -16.930419921875, -16.00537109375, -15.080322265625, -14.1552734375, -13.230224609375, -12.30517578125, -11.380126953125, -10.455078125, -9.530029296875, -8.60498046875, -7.679931640625, -6.7548828125, -5.829833984375, -4.90478515625, -3.979736328125, -3.0546875, -2.129638671875, -1.20458984375, -0.279541015625, 0.6455078125, 1.570556640625, 2.49560546875, 3.420654296875, 4.345703125, 5.270751953125, 6.19580078125, 7.120849609375, 8.0458984375, 8.970947265625, 9.89599609375, 10.821044921875, 11.74609375, 12.671142578125, 13.59619140625, 14.521240234375, 15.4462890625, 16.371337890625, 17.29638671875, 18.221435546875, 19.146484375, 20.071533203125, 20.99658203125, 21.921630859375, 22.8466796875, 23.771728515625, 24.69677734375, 25.621826171875, 26.546875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 8.0, 10.0, 7.0, 19.0, 18.0, 17.0, 22.0, 26.0, 31.0, 33.0, 49.0, 64.0, 72.0, 139.0, 282.0, 802.0, 16897.0, 3119895.0, 6008.0, 575.0, 238.0, 112.0, 75.0, 48.0, 40.0, 30.0, 37.0, 33.0, 27.0, 23.0, 6.0, 10.0, 7.0, 8.0, 5.0, 7.0, 5.0, 4.0, 6.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.5, -70.912109375, -68.32421875, -65.736328125, -63.1484375, -60.560546875, -57.97265625, -55.384765625, -52.796875, -50.208984375, -47.62109375, -45.033203125, -42.4453125, -39.857421875, -37.26953125, -34.681640625, -32.09375, -29.505859375, -26.91796875, -24.330078125, -21.7421875, -19.154296875, -16.56640625, -13.978515625, -11.390625, -8.802734375, -6.21484375, -3.626953125, -1.0390625, 1.548828125, 4.13671875, 6.724609375, 9.3125, 11.900390625, 14.48828125, 17.076171875, 19.6640625, 22.251953125, 24.83984375, 27.427734375, 30.015625, 32.603515625, 35.19140625, 37.779296875, 40.3671875, 42.955078125, 45.54296875, 48.130859375, 50.71875, 53.306640625, 55.89453125, 58.482421875, 61.0703125, 63.658203125, 66.24609375, 68.833984375, 71.421875, 74.009765625, 76.59765625, 79.185546875, 81.7734375, 84.361328125, 86.94921875, 89.537109375, 92.125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 11.0, 23.0, 52.0, 88.0, 132.0, 141.0, 157.0, 150.0, 119.0, 62.0, 33.0, 28.0, 7.0, 4.0, 1.0, 2.0], "bins": [-46.33613967895508, -45.478797912597656, -44.62145233154297, -43.76411056518555, -42.906768798828125, -42.0494270324707, -41.19208526611328, -40.334739685058594, -39.47739791870117, -38.62005615234375, -37.76271057128906, -36.90536880493164, -36.04802703857422, -35.1906852722168, -34.333343505859375, -33.47599792480469, -32.618656158447266, -31.761314392089844, -30.90397071838379, -30.046627044677734, -29.189285278320312, -28.33194351196289, -27.474599838256836, -26.61725616455078, -25.75991439819336, -24.902572631835938, -24.045228958129883, -23.187885284423828, -22.330543518066406, -21.473201751708984, -20.61585807800293, -19.758514404296875, -18.901172637939453, -18.04383087158203, -17.186487197875977, -16.329143524169922, -15.4718017578125, -14.614459037780762, -13.757116317749023, -12.899773597717285, -12.04242992401123, -11.185087203979492, -10.327744483947754, -9.470401763916016, -8.613059043884277, -7.755716323852539, -6.898373603820801, -6.0410308837890625, -5.183688163757324, -4.326345443725586, -3.4690027236938477, -2.6116600036621094, -1.754317283630371, -0.8969745635986328, -0.03963184356689453, 0.8177108764648438, 1.675053596496582, 2.5323963165283203, 3.3897390365600586, 4.247081756591797, 5.104424476623535, 5.961767196655273, 6.819109916687012, 7.67645263671875, 8.533795356750488]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 5.0, 15.0, 10.0, 7.0, 17.0, 9.0, 20.0, 10.0, 16.0, 19.0, 34.0, 24.0, 18.0, 29.0, 27.0, 21.0, 30.0, 43.0, 28.0, 44.0, 55.0, 33.0, 45.0, 41.0, 34.0, 29.0, 39.0, 27.0, 36.0, 26.0, 28.0, 24.0, 17.0, 25.0, 13.0, 16.0, 16.0, 11.0, 10.0, 8.0, 9.0, 4.0, 9.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-63.99790573120117, -61.894683837890625, -59.79146194458008, -57.68824005126953, -55.585018157958984, -53.48179626464844, -51.37857437133789, -49.275352478027344, -47.1721305847168, -45.06890869140625, -42.9656867980957, -40.862464904785156, -38.75924301147461, -36.65602111816406, -34.552799224853516, -32.44957733154297, -30.346355438232422, -28.243133544921875, -26.139911651611328, -24.03668975830078, -21.933467864990234, -19.830245971679688, -17.72702407836914, -15.623802185058594, -13.520580291748047, -11.4173583984375, -9.314136505126953, -7.210914611816406, -5.107692718505859, -3.0044708251953125, -0.9012489318847656, 1.2019729614257812, 3.3051910400390625, 5.408412933349609, 7.511634826660156, 9.614856719970703, 11.71807861328125, 13.821300506591797, 15.924522399902344, 18.02774429321289, 20.130966186523438, 22.234188079833984, 24.33740997314453, 26.440631866455078, 28.543853759765625, 30.647075653076172, 32.75029754638672, 34.853519439697266, 36.95674133300781, 39.05996322631836, 41.163185119628906, 43.26640701293945, 45.36962890625, 47.47285079956055, 49.576072692871094, 51.67929458618164, 53.78251647949219, 55.885738372802734, 57.98896026611328, 60.09218215942383, 62.195404052734375, 64.29862976074219, 66.40184783935547, 68.50506591796875, 70.60829162597656]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 4.0, 11.0, 10.0, 7.0, 14.0, 22.0, 13.0, 24.0, 22.0, 25.0, 30.0, 35.0, 26.0, 37.0, 52.0, 49.0, 35.0, 38.0, 45.0, 33.0, 44.0, 42.0, 49.0, 44.0, 26.0, 26.0, 30.0, 22.0, 27.0, 22.0, 27.0, 20.0, 14.0, 13.0, 14.0, 6.0, 13.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.1702880859375, -7.856201171875, -7.5421142578125, -7.22802734375, -6.9139404296875, -6.599853515625, -6.2857666015625, -5.9716796875, -5.6575927734375, -5.343505859375, -5.0294189453125, -4.71533203125, -4.4012451171875, -4.087158203125, -3.7730712890625, -3.458984375, -3.1448974609375, -2.830810546875, -2.5167236328125, -2.20263671875, -1.8885498046875, -1.574462890625, -1.2603759765625, -0.9462890625, -0.6322021484375, -0.318115234375, -0.0040283203125, 0.31005859375, 0.6241455078125, 0.938232421875, 1.2523193359375, 1.56640625, 1.8804931640625, 2.194580078125, 2.5086669921875, 2.82275390625, 3.1368408203125, 3.450927734375, 3.7650146484375, 4.0791015625, 4.3931884765625, 4.707275390625, 5.0213623046875, 5.33544921875, 5.6495361328125, 5.963623046875, 6.2777099609375, 6.591796875, 6.9058837890625, 7.219970703125, 7.5340576171875, 7.84814453125, 8.1622314453125, 8.476318359375, 8.7904052734375, 9.1044921875, 9.4185791015625, 9.732666015625, 10.0467529296875, 10.36083984375, 10.6749267578125, 10.989013671875, 11.3031005859375, 11.6171875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 2.0, 10.0, 12.0, 6.0, 11.0, 12.0, 27.0, 30.0, 39.0, 30.0, 55.0, 61.0, 103.0, 113.0, 152.0, 219.0, 327.0, 485.0, 842.0, 1566.0, 3464.0, 9640.0, 43461.0, 500337.0, 2586618.0, 947649.0, 76388.0, 13443.0, 4419.0, 1971.0, 949.0, 541.0, 369.0, 217.0, 170.0, 123.0, 69.0, 94.0, 66.0, 49.0, 32.0, 25.0, 19.0, 19.0, 14.0, 11.0, 10.0, 8.0, 3.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -15.90869140625, -15.3330078125, -14.75732421875, -14.181640625, -13.60595703125, -13.0302734375, -12.45458984375, -11.87890625, -11.30322265625, -10.7275390625, -10.15185546875, -9.576171875, -9.00048828125, -8.4248046875, -7.84912109375, -7.2734375, -6.69775390625, -6.1220703125, -5.54638671875, -4.970703125, -4.39501953125, -3.8193359375, -3.24365234375, -2.66796875, -2.09228515625, -1.5166015625, -0.94091796875, -0.365234375, 0.21044921875, 0.7861328125, 1.36181640625, 1.9375, 2.51318359375, 3.0888671875, 3.66455078125, 4.240234375, 4.81591796875, 5.3916015625, 5.96728515625, 6.54296875, 7.11865234375, 7.6943359375, 8.27001953125, 8.845703125, 9.42138671875, 9.9970703125, 10.57275390625, 11.1484375, 11.72412109375, 12.2998046875, 12.87548828125, 13.451171875, 14.02685546875, 14.6025390625, 15.17822265625, 15.75390625, 16.32958984375, 16.9052734375, 17.48095703125, 18.056640625, 18.63232421875, 19.2080078125, 19.78369140625, 20.359375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 5.0, 6.0, 10.0, 11.0, 46.0, 50.0, 76.0, 139.0, 250.0, 457.0, 785.0, 902.0, 602.0, 333.0, 173.0, 100.0, 53.0, 40.0, 17.0, 12.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.203125, -27.403076171875, -26.60302734375, -25.802978515625, -25.0029296875, -24.202880859375, -23.40283203125, -22.602783203125, -21.802734375, -21.002685546875, -20.20263671875, -19.402587890625, -18.6025390625, -17.802490234375, -17.00244140625, -16.202392578125, -15.40234375, -14.602294921875, -13.80224609375, -13.002197265625, -12.2021484375, -11.402099609375, -10.60205078125, -9.802001953125, -9.001953125, -8.201904296875, -7.40185546875, -6.601806640625, -5.8017578125, -5.001708984375, -4.20166015625, -3.401611328125, -2.6015625, -1.801513671875, -1.00146484375, -0.201416015625, 0.5986328125, 1.398681640625, 2.19873046875, 2.998779296875, 3.798828125, 4.598876953125, 5.39892578125, 6.198974609375, 6.9990234375, 7.799072265625, 8.59912109375, 9.399169921875, 10.19921875, 10.999267578125, 11.79931640625, 12.599365234375, 13.3994140625, 14.199462890625, 14.99951171875, 15.799560546875, 16.599609375, 17.399658203125, 18.19970703125, 18.999755859375, 19.7998046875, 20.599853515625, 21.39990234375, 22.199951171875, 23.0]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 6.0, 10.0, 14.0, 15.0, 23.0, 60.0, 62.0, 134.0, 193.0, 426.0, 1291.0, 7700.0, 719192.0, 3448249.0, 14039.0, 1583.0, 559.0, 241.0, 156.0, 114.0, 68.0, 41.0, 34.0, 19.0, 14.0, 10.0, 7.0, 8.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-56.0625, -53.7373046875, -51.412109375, -49.0869140625, -46.76171875, -44.4365234375, -42.111328125, -39.7861328125, -37.4609375, -35.1357421875, -32.810546875, -30.4853515625, -28.16015625, -25.8349609375, -23.509765625, -21.1845703125, -18.859375, -16.5341796875, -14.208984375, -11.8837890625, -9.55859375, -7.2333984375, -4.908203125, -2.5830078125, -0.2578125, 2.0673828125, 4.392578125, 6.7177734375, 9.04296875, 11.3681640625, 13.693359375, 16.0185546875, 18.34375, 20.6689453125, 22.994140625, 25.3193359375, 27.64453125, 29.9697265625, 32.294921875, 34.6201171875, 36.9453125, 39.2705078125, 41.595703125, 43.9208984375, 46.24609375, 48.5712890625, 50.896484375, 53.2216796875, 55.546875, 57.8720703125, 60.197265625, 62.5224609375, 64.84765625, 67.1728515625, 69.498046875, 71.8232421875, 74.1484375, 76.4736328125, 78.798828125, 81.1240234375, 83.44921875, 85.7744140625, 88.099609375, 90.4248046875, 92.75]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 180.0, 752.0, 76.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-683.9979858398438, -670.9443359375, -657.890625, -644.8369750976562, -631.7832641601562, -618.7296142578125, -605.6759033203125, -592.6222534179688, -579.568603515625, -566.5149536132812, -553.4612426757812, -540.4075927734375, -527.3538818359375, -514.3002319335938, -501.2465515136719, -488.19287109375, -475.1391906738281, -462.08551025390625, -449.0318298339844, -435.9781494140625, -422.92449951171875, -409.8708190917969, -396.817138671875, -383.7634582519531, -370.70977783203125, -357.6560974121094, -344.6024169921875, -331.54876708984375, -318.4950866699219, -305.44140625, -292.3877258300781, -279.33404541015625, -266.2803955078125, -253.22671508789062, -240.1730499267578, -227.11936950683594, -214.06570434570312, -201.01202392578125, -187.95834350585938, -174.9046630859375, -161.8509979248047, -148.7973175048828, -135.74365234375, -122.68997192382812, -109.63629913330078, -96.58262634277344, -83.52894592285156, -70.47527313232422, -57.421600341796875, -44.36792755126953, -31.314250946044922, -18.260574340820312, -5.206901550292969, 7.846771240234375, 20.90045166015625, 33.954124450683594, 47.00779724121094, 60.06147003173828, 73.11514282226562, 86.1688232421875, 99.22249603271484, 112.27616882324219, 125.32984924316406, 138.38351440429688, 151.43719482421875]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 7.0, 2.0, 1.0, 5.0, 5.0, 8.0, 7.0, 15.0, 16.0, 14.0, 19.0, 26.0, 35.0, 29.0, 32.0, 36.0, 32.0, 42.0, 40.0, 47.0, 50.0, 35.0, 43.0, 44.0, 38.0, 34.0, 44.0, 35.0, 34.0, 30.0, 30.0, 33.0, 18.0, 19.0, 17.0, 13.0, 15.0, 8.0, 9.0, 9.0, 3.0, 6.0, 9.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-51.77858352661133, -50.225223541259766, -48.6718635559082, -47.11850357055664, -45.56514358520508, -44.011783599853516, -42.45842361450195, -40.90506362915039, -39.35170364379883, -37.798343658447266, -36.2449836730957, -34.69162368774414, -33.13826370239258, -31.584903717041016, -30.031543731689453, -28.47818374633789, -26.92482566833496, -25.3714656829834, -23.818105697631836, -22.264745712280273, -20.71138572692871, -19.15802574157715, -17.60466766357422, -16.051307678222656, -14.497946739196777, -12.944586753845215, -11.391226768493652, -9.837867736816406, -8.284507751464844, -6.731147289276123, -5.177787780761719, -3.6244277954101562, -2.0710678100585938, -0.5177079439163208, 1.0356519222259521, 2.5890116691589355, 4.142371654510498, 5.6957316398620605, 7.249091148376465, 8.802451133728027, 10.35581111907959, 11.909171104431152, 13.462531089782715, 15.015890121459961, 16.569250106811523, 18.122610092163086, 19.67597007751465, 21.22933006286621, 22.782690048217773, 24.336050033569336, 25.8894100189209, 27.44277000427246, 28.996129989624023, 30.549489974975586, 32.102848052978516, 33.65620803833008, 35.20956802368164, 36.7629280090332, 38.316287994384766, 39.86964797973633, 41.42300796508789, 42.97636795043945, 44.529727935791016, 46.08308792114258, 47.63644790649414]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 8.0, 7.0, 13.0, 15.0, 8.0, 14.0, 9.0, 21.0, 21.0, 19.0, 30.0, 30.0, 25.0, 30.0, 32.0, 48.0, 47.0, 35.0, 45.0, 47.0, 40.0, 30.0, 36.0, 35.0, 44.0, 27.0, 33.0, 30.0, 25.0, 22.0, 30.0, 27.0, 22.0, 15.0, 16.0, 6.0, 12.0, 9.0, 7.0, 8.0, 8.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.1640625, -9.865478515625, -9.56689453125, -9.268310546875, -8.9697265625, -8.671142578125, -8.37255859375, -8.073974609375, -7.775390625, -7.476806640625, -7.17822265625, -6.879638671875, -6.5810546875, -6.282470703125, -5.98388671875, -5.685302734375, -5.38671875, -5.088134765625, -4.78955078125, -4.490966796875, -4.1923828125, -3.893798828125, -3.59521484375, -3.296630859375, -2.998046875, -2.699462890625, -2.40087890625, -2.102294921875, -1.8037109375, -1.505126953125, -1.20654296875, -0.907958984375, -0.609375, -0.310791015625, -0.01220703125, 0.286376953125, 0.5849609375, 0.883544921875, 1.18212890625, 1.480712890625, 1.779296875, 2.077880859375, 2.37646484375, 2.675048828125, 2.9736328125, 3.272216796875, 3.57080078125, 3.869384765625, 4.16796875, 4.466552734375, 4.76513671875, 5.063720703125, 5.3623046875, 5.660888671875, 5.95947265625, 6.258056640625, 6.556640625, 6.855224609375, 7.15380859375, 7.452392578125, 7.7509765625, 8.049560546875, 8.34814453125, 8.646728515625, 8.9453125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 2.0, 7.0, 10.0, 13.0, 20.0, 48.0, 59.0, 99.0, 110.0, 195.0, 257.0, 428.0, 618.0, 916.0, 1286.0, 1884.0, 2621.0, 3750.0, 5081.0, 7450.0, 10639.0, 15289.0, 21966.0, 32344.0, 48215.0, 73785.0, 110547.0, 152624.0, 164521.0, 127848.0, 86406.0, 57312.0, 38060.0, 25666.0, 17734.0, 12158.0, 8554.0, 5911.0, 4166.0, 3050.0, 2126.0, 1479.0, 1089.0, 696.0, 530.0, 312.0, 223.0, 170.0, 104.0, 67.0, 35.0, 33.0, 22.0, 11.0, 11.0, 8.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8662109375, -0.8384475708007812, -0.8106842041015625, -0.7829208374023438, -0.755157470703125, -0.7273941040039062, -0.6996307373046875, -0.6718673706054688, -0.64410400390625, -0.6163406372070312, -0.5885772705078125, -0.5608139038085938, -0.533050537109375, -0.5052871704101562, -0.4775238037109375, -0.44976043701171875, -0.4219970703125, -0.39423370361328125, -0.3664703369140625, -0.33870697021484375, -0.310943603515625, -0.28318023681640625, -0.2554168701171875, -0.22765350341796875, -0.19989013671875, -0.17212677001953125, -0.1443634033203125, -0.11660003662109375, -0.088836669921875, -0.06107330322265625, -0.0333099365234375, -0.00554656982421875, 0.022216796875, 0.04998016357421875, 0.0777435302734375, 0.10550689697265625, 0.133270263671875, 0.16103363037109375, 0.1887969970703125, 0.21656036376953125, 0.24432373046875, 0.27208709716796875, 0.2998504638671875, 0.32761383056640625, 0.355377197265625, 0.38314056396484375, 0.4109039306640625, 0.43866729736328125, 0.4664306640625, 0.49419403076171875, 0.5219573974609375, 0.5497207641601562, 0.577484130859375, 0.6052474975585938, 0.6330108642578125, 0.6607742309570312, 0.68853759765625, 0.7163009643554688, 0.7440643310546875, 0.7718276977539062, 0.799591064453125, 0.8273544311523438, 0.8551177978515625, 0.8828811645507812, 0.91064453125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 10.0, 9.0, 16.0, 12.0, 8.0, 12.0, 14.0, 18.0, 16.0, 32.0, 26.0, 41.0, 35.0, 39.0, 37.0, 55.0, 44.0, 58.0, 1067.0, 40.0, 47.0, 44.0, 42.0, 37.0, 36.0, 28.0, 41.0, 23.0, 27.0, 23.0, 25.0, 15.0, 14.0, 5.0, 13.0, 7.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.28515625, -7.06842041015625, -6.8516845703125, -6.63494873046875, -6.418212890625, -6.20147705078125, -5.9847412109375, -5.76800537109375, -5.55126953125, -5.33453369140625, -5.1177978515625, -4.90106201171875, -4.684326171875, -4.46759033203125, -4.2508544921875, -4.03411865234375, -3.8173828125, -3.60064697265625, -3.3839111328125, -3.16717529296875, -2.950439453125, -2.73370361328125, -2.5169677734375, -2.30023193359375, -2.08349609375, -1.86676025390625, -1.6500244140625, -1.43328857421875, -1.216552734375, -0.99981689453125, -0.7830810546875, -0.56634521484375, -0.349609375, -0.13287353515625, 0.0838623046875, 0.30059814453125, 0.517333984375, 0.73406982421875, 0.9508056640625, 1.16754150390625, 1.38427734375, 1.60101318359375, 1.8177490234375, 2.03448486328125, 2.251220703125, 2.46795654296875, 2.6846923828125, 2.90142822265625, 3.1181640625, 3.33489990234375, 3.5516357421875, 3.76837158203125, 3.985107421875, 4.20184326171875, 4.4185791015625, 4.63531494140625, 4.85205078125, 5.06878662109375, 5.2855224609375, 5.50225830078125, 5.718994140625, 5.93572998046875, 6.1524658203125, 6.36920166015625, 6.5859375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 6.0, 10.0, 22.0, 20.0, 34.0, 60.0, 87.0, 126.0, 164.0, 267.0, 411.0, 629.0, 912.0, 1352.0, 1972.0, 3116.0, 4775.0, 7019.0, 10929.0, 16659.0, 26045.0, 41049.0, 66522.0, 106707.0, 164790.0, 1241124.0, 148066.0, 92873.0, 57819.0, 36381.0, 23308.0, 14964.0, 9854.0, 6374.0, 4317.0, 2907.0, 1838.0, 1211.0, 848.0, 537.0, 341.0, 226.0, 148.0, 98.0, 70.0, 54.0, 28.0, 25.0, 22.0, 10.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.025390625, -0.9946517944335938, -0.9639129638671875, -0.9331741333007812, -0.902435302734375, -0.8716964721679688, -0.8409576416015625, -0.8102188110351562, -0.77947998046875, -0.7487411499023438, -0.7180023193359375, -0.6872634887695312, -0.656524658203125, -0.6257858276367188, -0.5950469970703125, -0.5643081665039062, -0.5335693359375, -0.5028305053710938, -0.4720916748046875, -0.44135284423828125, -0.410614013671875, -0.37987518310546875, -0.3491363525390625, -0.31839752197265625, -0.28765869140625, -0.25691986083984375, -0.2261810302734375, -0.19544219970703125, -0.164703369140625, -0.13396453857421875, -0.1032257080078125, -0.07248687744140625, -0.041748046875, -0.01100921630859375, 0.0197296142578125, 0.05046844482421875, 0.081207275390625, 0.11194610595703125, 0.1426849365234375, 0.17342376708984375, 0.20416259765625, 0.23490142822265625, 0.2656402587890625, 0.29637908935546875, 0.327117919921875, 0.35785675048828125, 0.3885955810546875, 0.41933441162109375, 0.4500732421875, 0.48081207275390625, 0.5115509033203125, 0.5422897338867188, 0.573028564453125, 0.6037673950195312, 0.6345062255859375, 0.6652450561523438, 0.69598388671875, 0.7267227172851562, 0.7574615478515625, 0.7882003784179688, 0.818939208984375, 0.8496780395507812, 0.8804168701171875, 0.9111557006835938, 0.94189453125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 9.0, 8.0, 7.0, 12.0, 14.0, 18.0, 20.0, 24.0, 28.0, 43.0, 63.0, 61.0, 66.0, 71.0, 78.0, 67.0, 79.0, 62.0, 57.0, 43.0, 35.0, 46.0, 28.0, 22.0, 16.0, 6.0, 12.0, 4.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027618408203125, -0.0026692748069763184, -0.0025767087936401367, -0.002484142780303955, -0.0023915767669677734, -0.002299010753631592, -0.00220644474029541, -0.0021138787269592285, -0.002021312713623047, -0.0019287467002868652, -0.0018361806869506836, -0.001743614673614502, -0.0016510486602783203, -0.0015584826469421387, -0.001465916633605957, -0.0013733506202697754, -0.0012807846069335938, -0.0011882185935974121, -0.0010956525802612305, -0.0010030865669250488, -0.0009105205535888672, -0.0008179545402526855, -0.0007253885269165039, -0.0006328225135803223, -0.0005402565002441406, -0.000447690486907959, -0.00035512447357177734, -0.0002625584602355957, -0.00016999244689941406, -7.742643356323242e-05, 1.5139579772949219e-05, 0.00010770559310913086, 0.0002002716064453125, 0.00029283761978149414, 0.0003854036331176758, 0.0004779696464538574, 0.0005705356597900391, 0.0006631016731262207, 0.0007556676864624023, 0.000848233699798584, 0.0009407997131347656, 0.0010333657264709473, 0.001125931739807129, 0.0012184977531433105, 0.0013110637664794922, 0.0014036297798156738, 0.0014961957931518555, 0.0015887618064880371, 0.0016813278198242188, 0.0017738938331604004, 0.001866459846496582, 0.0019590258598327637, 0.0020515918731689453, 0.002144157886505127, 0.0022367238998413086, 0.0023292899131774902, 0.002421855926513672, 0.0025144219398498535, 0.002606987953186035, 0.002699553966522217, 0.0027921199798583984, 0.00288468599319458, 0.0029772520065307617, 0.0030698180198669434, 0.003162384033203125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 5.0, 11.0, 11.0, 21.0, 26.0, 42.0, 60.0, 67.0, 87.0, 131.0, 175.0, 365.0, 904.0, 57946.0, 985549.0, 1819.0, 535.0, 248.0, 138.0, 109.0, 92.0, 50.0, 31.0, 30.0, 25.0, 23.0, 13.0, 9.0, 7.0, 10.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061279296875, -0.05943441390991211, -0.05758953094482422, -0.05574464797973633, -0.05389976501464844, -0.05205488204956055, -0.050209999084472656, -0.048365116119384766, -0.046520233154296875, -0.044675350189208984, -0.042830467224121094, -0.0409855842590332, -0.03914070129394531, -0.03729581832885742, -0.03545093536376953, -0.03360605239868164, -0.03176116943359375, -0.02991628646850586, -0.02807140350341797, -0.026226520538330078, -0.024381637573242188, -0.022536754608154297, -0.020691871643066406, -0.018846988677978516, -0.017002105712890625, -0.015157222747802734, -0.013312339782714844, -0.011467456817626953, -0.009622573852539062, -0.007777690887451172, -0.005932807922363281, -0.004087924957275391, -0.0022430419921875, -0.0003981590270996094, 0.0014467239379882812, 0.003291606903076172, 0.0051364898681640625, 0.006981372833251953, 0.008826255798339844, 0.010671138763427734, 0.012516021728515625, 0.014360904693603516, 0.016205787658691406, 0.018050670623779297, 0.019895553588867188, 0.021740436553955078, 0.02358531951904297, 0.02543020248413086, 0.02727508544921875, 0.02911996841430664, 0.03096485137939453, 0.03280973434448242, 0.03465461730957031, 0.0364995002746582, 0.038344383239746094, 0.040189266204833984, 0.042034149169921875, 0.043879032135009766, 0.045723915100097656, 0.04756879806518555, 0.04941368103027344, 0.05125856399536133, 0.05310344696044922, 0.05494832992553711, 0.056793212890625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 12.0, 167.0, 686.0, 147.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004613431170582771, -0.004314451478421688, -0.004015471786260605, -0.0037164923269301653, -0.003417512634769082, -0.003118532942607999, -0.0028195534832775593, -0.002520573791116476, -0.002221594098955393, -0.0019226144067943096, -0.0016236348310485482, -0.0013246552553027868, -0.0010256755631417036, -0.0007266958709806204, -0.000427716295234859, -0.0001287367194890976, 0.00017024297267198563, 0.00046922260662540793, 0.0007682022405788302, 0.0010671818163245916, 0.0013661615084856749, 0.001665141200646758, 0.0019641206599771976, 0.002263100352138281, 0.002562080044299364, 0.0028610597364604473, 0.0031600394286215305, 0.00345901888795197, 0.0037579985801130533, 0.004056978039443493, 0.004355957731604576, 0.004654937423765659, 0.004953916184604168, 0.005252895876765251, 0.005551875568926334, 0.005850855261087418, 0.006149834953248501, 0.006448814645409584, 0.00674779387190938, 0.007046773564070463, 0.007345753256231546, 0.00764473294839263, 0.007943712174892426, 0.008242691867053509, 0.008541671559214592, 0.008840651251375675, 0.009139630943536758, 0.009438610635697842, 0.009737590327858925, 0.010036570020020008, 0.010335549712181091, 0.010634529404342175, 0.010933509096503258, 0.011232488788664341, 0.011531468480825424, 0.011830447241663933, 0.01212942786514759, 0.012428407557308674, 0.012727387249469757, 0.01302636694163084, 0.013325346633791924, 0.013624326325953007, 0.01392330601811409, 0.014222284778952599, 0.014521264471113682]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 7.0, 8.0, 10.0, 15.0, 7.0, 10.0, 14.0, 12.0, 21.0, 25.0, 29.0, 31.0, 29.0, 35.0, 39.0, 30.0, 42.0, 23.0, 31.0, 33.0, 31.0, 42.0, 37.0, 38.0, 40.0, 35.0, 42.0, 31.0, 25.0, 30.0, 21.0, 20.0, 28.0, 15.0, 20.0, 9.0, 20.0, 11.0, 12.0, 7.0, 10.0, 5.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0011608600616455078, -0.0011260062456130981, -0.0010911524295806885, -0.0010562986135482788, -0.0010214447975158691, -0.0009865909814834595, -0.0009517371654510498, -0.0009168833494186401, -0.0008820295333862305, -0.0008471757173538208, -0.0008123219013214111, -0.0007774680852890015, -0.0007426142692565918, -0.0007077604532241821, -0.0006729066371917725, -0.0006380528211593628, -0.0006031990051269531, -0.0005683451890945435, -0.0005334913730621338, -0.0004986375570297241, -0.00046378374099731445, -0.0004289299249649048, -0.0003940761089324951, -0.00035922229290008545, -0.0003243684768676758, -0.0002895146608352661, -0.00025466084480285645, -0.00021980702877044678, -0.0001849532127380371, -0.00015009939670562744, -0.00011524558067321777, -8.03917646408081e-05, -4.553794860839844e-05, -1.068413257598877e-05, 2.41696834564209e-05, 5.9023499488830566e-05, 9.387731552124023e-05, 0.0001287311315536499, 0.00016358494758605957, 0.00019843876361846924, 0.0002332925796508789, 0.0002681463956832886, 0.00030300021171569824, 0.0003378540277481079, 0.0003727078437805176, 0.00040756165981292725, 0.0004424154758453369, 0.0004772692918777466, 0.0005121231079101562, 0.0005469769239425659, 0.0005818307399749756, 0.0006166845560073853, 0.0006515383720397949, 0.0006863921880722046, 0.0007212460041046143, 0.0007560998201370239, 0.0007909536361694336, 0.0008258074522018433, 0.0008606612682342529, 0.0008955150842666626, 0.0009303689002990723, 0.0009652227163314819, 0.0010000765323638916, 0.0010349303483963013, 0.001069784164428711]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 8.0, 7.0, 13.0, 15.0, 8.0, 14.0, 9.0, 21.0, 21.0, 19.0, 30.0, 30.0, 25.0, 30.0, 32.0, 48.0, 47.0, 35.0, 45.0, 47.0, 40.0, 30.0, 36.0, 35.0, 44.0, 27.0, 33.0, 30.0, 25.0, 22.0, 30.0, 27.0, 22.0, 15.0, 16.0, 6.0, 12.0, 9.0, 7.0, 8.0, 8.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.1640625, -9.865478515625, -9.56689453125, -9.268310546875, -8.9697265625, -8.671142578125, -8.37255859375, -8.073974609375, -7.775390625, -7.476806640625, -7.17822265625, -6.879638671875, -6.5810546875, -6.282470703125, -5.98388671875, -5.685302734375, -5.38671875, -5.088134765625, -4.78955078125, -4.490966796875, -4.1923828125, -3.893798828125, -3.59521484375, -3.296630859375, -2.998046875, -2.699462890625, -2.40087890625, -2.102294921875, -1.8037109375, -1.505126953125, -1.20654296875, -0.907958984375, -0.609375, -0.310791015625, -0.01220703125, 0.286376953125, 0.5849609375, 0.883544921875, 1.18212890625, 1.480712890625, 1.779296875, 2.077880859375, 2.37646484375, 2.675048828125, 2.9736328125, 3.272216796875, 3.57080078125, 3.869384765625, 4.16796875, 4.466552734375, 4.76513671875, 5.063720703125, 5.3623046875, 5.660888671875, 5.95947265625, 6.258056640625, 6.556640625, 6.855224609375, 7.15380859375, 7.452392578125, 7.7509765625, 8.049560546875, 8.34814453125, 8.646728515625, 8.9453125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 5.0, 7.0, 10.0, 15.0, 23.0, 23.0, 30.0, 34.0, 48.0, 68.0, 106.0, 132.0, 199.0, 270.0, 430.0, 658.0, 1180.0, 2152.0, 4188.0, 9657.0, 25321.0, 88108.0, 409050.0, 382279.0, 81939.0, 24013.0, 9096.0, 4161.0, 2203.0, 1079.0, 685.0, 391.0, 277.0, 226.0, 118.0, 92.0, 65.0, 55.0, 35.0, 38.0, 18.0, 16.0, 18.0, 10.0, 10.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.9609375, -12.5794677734375, -12.197998046875, -11.8165283203125, -11.43505859375, -11.0535888671875, -10.672119140625, -10.2906494140625, -9.9091796875, -9.5277099609375, -9.146240234375, -8.7647705078125, -8.38330078125, -8.0018310546875, -7.620361328125, -7.2388916015625, -6.857421875, -6.4759521484375, -6.094482421875, -5.7130126953125, -5.33154296875, -4.9500732421875, -4.568603515625, -4.1871337890625, -3.8056640625, -3.4241943359375, -3.042724609375, -2.6612548828125, -2.27978515625, -1.8983154296875, -1.516845703125, -1.1353759765625, -0.75390625, -0.3724365234375, 0.009033203125, 0.3905029296875, 0.77197265625, 1.1534423828125, 1.534912109375, 1.9163818359375, 2.2978515625, 2.6793212890625, 3.060791015625, 3.4422607421875, 3.82373046875, 4.2052001953125, 4.586669921875, 4.9681396484375, 5.349609375, 5.7310791015625, 6.112548828125, 6.4940185546875, 6.87548828125, 7.2569580078125, 7.638427734375, 8.0198974609375, 8.4013671875, 8.7828369140625, 9.164306640625, 9.5457763671875, 9.92724609375, 10.3087158203125, 10.690185546875, 11.0716552734375, 11.453125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 9.0, 7.0, 6.0, 9.0, 15.0, 19.0, 11.0, 20.0, 32.0, 28.0, 29.0, 36.0, 29.0, 32.0, 51.0, 57.0, 88.0, 168.0, 1522.0, 272.0, 127.0, 72.0, 55.0, 47.0, 44.0, 35.0, 27.0, 42.0, 38.0, 22.0, 18.0, 18.0, 3.0, 14.0, 7.0, 6.0, 5.0, 7.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.734375, -21.913818359375, -21.09326171875, -20.272705078125, -19.4521484375, -18.631591796875, -17.81103515625, -16.990478515625, -16.169921875, -15.349365234375, -14.52880859375, -13.708251953125, -12.8876953125, -12.067138671875, -11.24658203125, -10.426025390625, -9.60546875, -8.784912109375, -7.96435546875, -7.143798828125, -6.3232421875, -5.502685546875, -4.68212890625, -3.861572265625, -3.041015625, -2.220458984375, -1.39990234375, -0.579345703125, 0.2412109375, 1.061767578125, 1.88232421875, 2.702880859375, 3.5234375, 4.343994140625, 5.16455078125, 5.985107421875, 6.8056640625, 7.626220703125, 8.44677734375, 9.267333984375, 10.087890625, 10.908447265625, 11.72900390625, 12.549560546875, 13.3701171875, 14.190673828125, 15.01123046875, 15.831787109375, 16.65234375, 17.472900390625, 18.29345703125, 19.114013671875, 19.9345703125, 20.755126953125, 21.57568359375, 22.396240234375, 23.216796875, 24.037353515625, 24.85791015625, 25.678466796875, 26.4990234375, 27.319580078125, 28.14013671875, 28.960693359375, 29.78125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 10.0, 9.0, 11.0, 13.0, 26.0, 21.0, 22.0, 38.0, 34.0, 66.0, 91.0, 125.0, 197.0, 267.0, 410.0, 1126.0, 7007.0, 154615.0, 2928262.0, 47939.0, 3537.0, 724.0, 347.0, 211.0, 155.0, 119.0, 75.0, 51.0, 50.0, 27.0, 25.0, 27.0, 19.0, 12.0, 10.0, 3.0, 5.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.25, -31.07080078125, -29.8916015625, -28.71240234375, -27.533203125, -26.35400390625, -25.1748046875, -23.99560546875, -22.81640625, -21.63720703125, -20.4580078125, -19.27880859375, -18.099609375, -16.92041015625, -15.7412109375, -14.56201171875, -13.3828125, -12.20361328125, -11.0244140625, -9.84521484375, -8.666015625, -7.48681640625, -6.3076171875, -5.12841796875, -3.94921875, -2.77001953125, -1.5908203125, -0.41162109375, 0.767578125, 1.94677734375, 3.1259765625, 4.30517578125, 5.484375, 6.66357421875, 7.8427734375, 9.02197265625, 10.201171875, 11.38037109375, 12.5595703125, 13.73876953125, 14.91796875, 16.09716796875, 17.2763671875, 18.45556640625, 19.634765625, 20.81396484375, 21.9931640625, 23.17236328125, 24.3515625, 25.53076171875, 26.7099609375, 27.88916015625, 29.068359375, 30.24755859375, 31.4267578125, 32.60595703125, 33.78515625, 34.96435546875, 36.1435546875, 37.32275390625, 38.501953125, 39.68115234375, 40.8603515625, 42.03955078125, 43.21875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 27.0, 242.0, 563.0, 171.0, 15.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.89213180541992, -55.062469482421875, -51.232810974121094, -47.40315246582031, -43.573490142822266, -39.74382781982422, -35.91416931152344, -32.084510803222656, -28.25484848022461, -24.425188064575195, -20.59552764892578, -16.765867233276367, -12.936206817626953, -9.106546401977539, -5.276885986328125, -1.447225570678711, 2.382434844970703, 6.212095260620117, 10.041755676269531, 13.871416091918945, 17.70107650756836, 21.530736923217773, 25.360397338867188, 29.1900577545166, 33.019718170166016, 36.84938049316406, 40.679039001464844, 44.508697509765625, 48.33835983276367, 52.16802215576172, 55.9976806640625, 59.82733917236328, 63.65699768066406, 67.48665618896484, 71.31631469726562, 75.14598083496094, 78.97563934326172, 82.8052978515625, 86.63496398925781, 90.4646224975586, 94.29428100585938, 98.12393951416016, 101.95359802246094, 105.78326416015625, 109.61292266845703, 113.44258117675781, 117.27224731445312, 121.1019058227539, 124.93156433105469, 128.76123046875, 132.59088134765625, 136.42054748535156, 140.25021362304688, 144.07986450195312, 147.90953063964844, 151.7391815185547, 155.56884765625, 159.3985137939453, 163.22816467285156, 167.05783081054688, 170.88748168945312, 174.71714782714844, 178.54681396484375, 182.37646484375, 186.2061309814453]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 5.0, 7.0, 6.0, 2.0, 14.0, 18.0, 17.0, 17.0, 19.0, 27.0, 23.0, 20.0, 30.0, 29.0, 31.0, 37.0, 39.0, 38.0, 36.0, 31.0, 34.0, 45.0, 35.0, 31.0, 28.0, 31.0, 39.0, 27.0, 24.0, 27.0, 25.0, 23.0, 17.0, 19.0, 19.0, 19.0, 16.0, 18.0, 13.0, 10.0, 7.0, 16.0, 5.0, 6.0, 10.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-52.88605499267578, -51.26676559448242, -49.64747619628906, -48.0281867980957, -46.408897399902344, -44.78961181640625, -43.17032241821289, -41.55103302001953, -39.93174362182617, -38.31245422363281, -36.69316482543945, -35.073875427246094, -33.45458984375, -31.835298538208008, -30.21601104736328, -28.596721649169922, -26.977432250976562, -25.358142852783203, -23.738853454589844, -22.119565963745117, -20.500276565551758, -18.8809871673584, -17.261699676513672, -15.642410278320312, -14.023120880126953, -12.403831481933594, -10.78454303741455, -9.165254592895508, -7.545965194702148, -5.926675796508789, -4.307387351989746, -2.688098907470703, -1.0688133239746094, 0.5504755973815918, 2.169764518737793, 3.789053440093994, 5.408342361450195, 7.027631759643555, 8.646920204162598, 10.26620864868164, 11.885498046875, 13.50478744506836, 15.124075889587402, 16.743364334106445, 18.362653732299805, 19.981943130493164, 21.60123062133789, 23.22052001953125, 24.83980941772461, 26.45909881591797, 28.078388214111328, 29.697675704956055, 31.316965103149414, 32.936256408691406, 34.5555419921875, 36.17483139038086, 37.79412078857422, 39.41341018676758, 41.03269958496094, 42.6519889831543, 44.271278381347656, 45.89056396484375, 47.50985336303711, 49.12914276123047, 50.74843215942383]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 5.0, 8.0, 6.0, 7.0, 8.0, 10.0, 8.0, 13.0, 13.0, 18.0, 15.0, 23.0, 34.0, 26.0, 33.0, 38.0, 31.0, 42.0, 36.0, 43.0, 37.0, 47.0, 39.0, 32.0, 32.0, 33.0, 38.0, 34.0, 34.0, 28.0, 33.0, 25.0, 23.0, 31.0, 21.0, 12.0, 11.0, 20.0, 9.0, 7.0, 6.0, 7.0, 5.0, 6.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.21875, -8.92333984375, -8.6279296875, -8.33251953125, -8.037109375, -7.74169921875, -7.4462890625, -7.15087890625, -6.85546875, -6.56005859375, -6.2646484375, -5.96923828125, -5.673828125, -5.37841796875, -5.0830078125, -4.78759765625, -4.4921875, -4.19677734375, -3.9013671875, -3.60595703125, -3.310546875, -3.01513671875, -2.7197265625, -2.42431640625, -2.12890625, -1.83349609375, -1.5380859375, -1.24267578125, -0.947265625, -0.65185546875, -0.3564453125, -0.06103515625, 0.234375, 0.52978515625, 0.8251953125, 1.12060546875, 1.416015625, 1.71142578125, 2.0068359375, 2.30224609375, 2.59765625, 2.89306640625, 3.1884765625, 3.48388671875, 3.779296875, 4.07470703125, 4.3701171875, 4.66552734375, 4.9609375, 5.25634765625, 5.5517578125, 5.84716796875, 6.142578125, 6.43798828125, 6.7333984375, 7.02880859375, 7.32421875, 7.61962890625, 7.9150390625, 8.21044921875, 8.505859375, 8.80126953125, 9.0966796875, 9.39208984375, 9.6875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 10.0, 5.0, 4.0, 8.0, 7.0, 11.0, 18.0, 15.0, 17.0, 16.0, 26.0, 23.0, 36.0, 49.0, 62.0, 142.0, 271.0, 772.0, 2661.0, 12621.0, 161806.0, 2772066.0, 1187727.0, 46913.0, 6415.0, 1522.0, 447.0, 207.0, 104.0, 58.0, 50.0, 33.0, 33.0, 15.0, 23.0, 19.0, 12.0, 19.0, 7.0, 12.0, 10.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.390625, -26.580078125, -25.76953125, -24.958984375, -24.1484375, -23.337890625, -22.52734375, -21.716796875, -20.90625, -20.095703125, -19.28515625, -18.474609375, -17.6640625, -16.853515625, -16.04296875, -15.232421875, -14.421875, -13.611328125, -12.80078125, -11.990234375, -11.1796875, -10.369140625, -9.55859375, -8.748046875, -7.9375, -7.126953125, -6.31640625, -5.505859375, -4.6953125, -3.884765625, -3.07421875, -2.263671875, -1.453125, -0.642578125, 0.16796875, 0.978515625, 1.7890625, 2.599609375, 3.41015625, 4.220703125, 5.03125, 5.841796875, 6.65234375, 7.462890625, 8.2734375, 9.083984375, 9.89453125, 10.705078125, 11.515625, 12.326171875, 13.13671875, 13.947265625, 14.7578125, 15.568359375, 16.37890625, 17.189453125, 18.0, 18.810546875, 19.62109375, 20.431640625, 21.2421875, 22.052734375, 22.86328125, 23.673828125, 24.484375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 4.0, 12.0, 8.0, 16.0, 11.0, 25.0, 27.0, 47.0, 68.0, 78.0, 115.0, 159.0, 236.0, 322.0, 529.0, 554.0, 522.0, 404.0, 265.0, 171.0, 143.0, 88.0, 62.0, 56.0, 34.0, 25.0, 24.0, 18.0, 11.0, 7.0, 8.0, 4.0, 7.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-14.296875, -13.872802734375, -13.44873046875, -13.024658203125, -12.6005859375, -12.176513671875, -11.75244140625, -11.328369140625, -10.904296875, -10.480224609375, -10.05615234375, -9.632080078125, -9.2080078125, -8.783935546875, -8.35986328125, -7.935791015625, -7.51171875, -7.087646484375, -6.66357421875, -6.239501953125, -5.8154296875, -5.391357421875, -4.96728515625, -4.543212890625, -4.119140625, -3.695068359375, -3.27099609375, -2.846923828125, -2.4228515625, -1.998779296875, -1.57470703125, -1.150634765625, -0.7265625, -0.302490234375, 0.12158203125, 0.545654296875, 0.9697265625, 1.393798828125, 1.81787109375, 2.241943359375, 2.666015625, 3.090087890625, 3.51416015625, 3.938232421875, 4.3623046875, 4.786376953125, 5.21044921875, 5.634521484375, 6.05859375, 6.482666015625, 6.90673828125, 7.330810546875, 7.7548828125, 8.178955078125, 8.60302734375, 9.027099609375, 9.451171875, 9.875244140625, 10.29931640625, 10.723388671875, 11.1474609375, 11.571533203125, 11.99560546875, 12.419677734375, 12.84375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 9.0, 6.0, 13.0, 10.0, 32.0, 57.0, 106.0, 210.0, 441.0, 1204.0, 5235.0, 45441.0, 2291185.0, 1802618.0, 40753.0, 4884.0, 1215.0, 416.0, 194.0, 95.0, 49.0, 22.0, 23.0, 16.0, 12.0, 13.0, 9.0, 3.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.21875, -40.9384765625, -39.658203125, -38.3779296875, -37.09765625, -35.8173828125, -34.537109375, -33.2568359375, -31.9765625, -30.6962890625, -29.416015625, -28.1357421875, -26.85546875, -25.5751953125, -24.294921875, -23.0146484375, -21.734375, -20.4541015625, -19.173828125, -17.8935546875, -16.61328125, -15.3330078125, -14.052734375, -12.7724609375, -11.4921875, -10.2119140625, -8.931640625, -7.6513671875, -6.37109375, -5.0908203125, -3.810546875, -2.5302734375, -1.25, 0.0302734375, 1.310546875, 2.5908203125, 3.87109375, 5.1513671875, 6.431640625, 7.7119140625, 8.9921875, 10.2724609375, 11.552734375, 12.8330078125, 14.11328125, 15.3935546875, 16.673828125, 17.9541015625, 19.234375, 20.5146484375, 21.794921875, 23.0751953125, 24.35546875, 25.6357421875, 26.916015625, 28.1962890625, 29.4765625, 30.7568359375, 32.037109375, 33.3173828125, 34.59765625, 35.8779296875, 37.158203125, 38.4384765625, 39.71875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 19.0, 95.0, 304.0, 388.0, 159.0, 42.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-278.40380859375, -273.16400146484375, -267.9241943359375, -262.6844177246094, -257.4446105957031, -252.20480346679688, -246.96499633789062, -241.72520446777344, -236.4853973388672, -231.24559020996094, -226.00579833984375, -220.7659912109375, -215.5261993408203, -210.28639221191406, -205.04660034179688, -199.80679321289062, -194.56698608398438, -189.32717895507812, -184.08738708496094, -178.8475799560547, -173.6077880859375, -168.36798095703125, -163.128173828125, -157.8883819580078, -152.64859008789062, -147.40878295898438, -142.1689910888672, -136.92918395996094, -131.68939208984375, -126.4495849609375, -121.20978546142578, -115.96998596191406, -110.73018646240234, -105.49038696289062, -100.2505874633789, -95.01078796386719, -89.77098083496094, -84.53118133544922, -79.2913818359375, -74.05157470703125, -68.81178283691406, -63.571983337402344, -58.33218002319336, -53.09238052368164, -47.852577209472656, -42.61277770996094, -37.37297821044922, -32.133174896240234, -26.89337158203125, -21.6535701751709, -16.413768768310547, -11.173969268798828, -5.934167861938477, -0.694366455078125, 4.545433044433594, 9.785236358642578, 15.025035858154297, 20.26483726501465, 25.504638671875, 30.74443817138672, 35.98423767089844, 41.22404098510742, 46.46384048461914, 51.703643798828125, 56.943443298339844]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 6.0, 8.0, 7.0, 6.0, 9.0, 13.0, 8.0, 15.0, 20.0, 19.0, 15.0, 18.0, 21.0, 25.0, 21.0, 29.0, 33.0, 40.0, 35.0, 31.0, 26.0, 38.0, 36.0, 32.0, 40.0, 31.0, 46.0, 40.0, 31.0, 23.0, 29.0, 29.0, 34.0, 25.0, 21.0, 15.0, 24.0, 12.0, 15.0, 14.0, 11.0, 9.0, 10.0, 9.0, 2.0, 2.0, 8.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.8673210144043, -35.645599365234375, -34.42387771606445, -33.20215606689453, -31.98043441772461, -30.758712768554688, -29.536991119384766, -28.315269470214844, -27.093547821044922, -25.871826171875, -24.650104522705078, -23.428382873535156, -22.206661224365234, -20.984939575195312, -19.76321792602539, -18.54149627685547, -17.31977653503418, -16.098054885864258, -14.876333236694336, -13.654611587524414, -12.432889938354492, -11.21116828918457, -9.989447593688965, -8.767725944519043, -7.546004295349121, -6.324282646179199, -5.102560997009277, -3.8808398246765137, -2.659118175506592, -1.43739652633667, -0.21567535400390625, 1.0060462951660156, 2.2277679443359375, 3.4494895935058594, 4.671211242675781, 5.892932415008545, 7.114654064178467, 8.336376190185547, 9.558096885681152, 10.779818534851074, 12.001540184020996, 13.223261833190918, 14.44498348236084, 15.666704177856445, 16.888425827026367, 18.11014747619629, 19.33186912536621, 20.553590774536133, 21.775312423706055, 22.997034072875977, 24.2187557220459, 25.44047737121582, 26.662199020385742, 27.883920669555664, 29.105640411376953, 30.327362060546875, 31.549083709716797, 32.77080535888672, 33.99252700805664, 35.21424865722656, 36.435970306396484, 37.657691955566406, 38.87941360473633, 40.10113525390625, 41.32285690307617]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 3.0, 7.0, 8.0, 10.0, 10.0, 15.0, 21.0, 10.0, 19.0, 22.0, 21.0, 34.0, 31.0, 38.0, 27.0, 41.0, 33.0, 40.0, 49.0, 47.0, 40.0, 39.0, 42.0, 35.0, 36.0, 35.0, 43.0, 29.0, 29.0, 29.0, 30.0, 14.0, 16.0, 10.0, 20.0, 10.0, 14.0, 6.0, 8.0, 9.0, 6.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.25, -9.9326171875, -9.615234375, -9.2978515625, -8.98046875, -8.6630859375, -8.345703125, -8.0283203125, -7.7109375, -7.3935546875, -7.076171875, -6.7587890625, -6.44140625, -6.1240234375, -5.806640625, -5.4892578125, -5.171875, -4.8544921875, -4.537109375, -4.2197265625, -3.90234375, -3.5849609375, -3.267578125, -2.9501953125, -2.6328125, -2.3154296875, -1.998046875, -1.6806640625, -1.36328125, -1.0458984375, -0.728515625, -0.4111328125, -0.09375, 0.2236328125, 0.541015625, 0.8583984375, 1.17578125, 1.4931640625, 1.810546875, 2.1279296875, 2.4453125, 2.7626953125, 3.080078125, 3.3974609375, 3.71484375, 4.0322265625, 4.349609375, 4.6669921875, 4.984375, 5.3017578125, 5.619140625, 5.9365234375, 6.25390625, 6.5712890625, 6.888671875, 7.2060546875, 7.5234375, 7.8408203125, 8.158203125, 8.4755859375, 8.79296875, 9.1103515625, 9.427734375, 9.7451171875, 10.0625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 3.0, 9.0, 11.0, 12.0, 16.0, 23.0, 34.0, 50.0, 61.0, 105.0, 176.0, 199.0, 281.0, 467.0, 701.0, 926.0, 1411.0, 1952.0, 2891.0, 4186.0, 6000.0, 8768.0, 12773.0, 18248.0, 27001.0, 39549.0, 57436.0, 83756.0, 119165.0, 155514.0, 149468.0, 111248.0, 77031.0, 52897.0, 36181.0, 25031.0, 16971.0, 11867.0, 8233.0, 5523.0, 3782.0, 2564.0, 1911.0, 1286.0, 871.0, 623.0, 400.0, 303.0, 188.0, 138.0, 106.0, 78.0, 31.0, 41.0, 29.0, 11.0, 10.0, 13.0, 6.0, 3.0, 2.0], "bins": [-0.89892578125, -0.8715972900390625, -0.844268798828125, -0.8169403076171875, -0.78961181640625, -0.7622833251953125, -0.734954833984375, -0.7076263427734375, -0.6802978515625, -0.6529693603515625, -0.625640869140625, -0.5983123779296875, -0.57098388671875, -0.5436553955078125, -0.516326904296875, -0.4889984130859375, -0.461669921875, -0.4343414306640625, -0.407012939453125, -0.3796844482421875, -0.35235595703125, -0.3250274658203125, -0.297698974609375, -0.2703704833984375, -0.2430419921875, -0.2157135009765625, -0.188385009765625, -0.1610565185546875, -0.13372802734375, -0.1063995361328125, -0.079071044921875, -0.0517425537109375, -0.0244140625, 0.0029144287109375, 0.030242919921875, 0.0575714111328125, 0.08489990234375, 0.1122283935546875, 0.139556884765625, 0.1668853759765625, 0.1942138671875, 0.2215423583984375, 0.248870849609375, 0.2761993408203125, 0.30352783203125, 0.3308563232421875, 0.358184814453125, 0.3855133056640625, 0.412841796875, 0.4401702880859375, 0.467498779296875, 0.4948272705078125, 0.52215576171875, 0.5494842529296875, 0.576812744140625, 0.6041412353515625, 0.6314697265625, 0.6587982177734375, 0.686126708984375, 0.7134552001953125, 0.74078369140625, 0.7681121826171875, 0.795440673828125, 0.8227691650390625, 0.85009765625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 11.0, 7.0, 12.0, 12.0, 10.0, 15.0, 15.0, 14.0, 29.0, 24.0, 22.0, 27.0, 37.0, 29.0, 38.0, 35.0, 39.0, 39.0, 33.0, 1051.0, 36.0, 33.0, 44.0, 42.0, 29.0, 32.0, 38.0, 25.0, 32.0, 24.0, 24.0, 16.0, 25.0, 25.0, 18.0, 13.0, 15.0, 13.0, 16.0, 4.0, 8.0, 2.0, 7.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-6.6484375, -6.45831298828125, -6.2681884765625, -6.07806396484375, -5.887939453125, -5.69781494140625, -5.5076904296875, -5.31756591796875, -5.12744140625, -4.93731689453125, -4.7471923828125, -4.55706787109375, -4.366943359375, -4.17681884765625, -3.9866943359375, -3.79656982421875, -3.6064453125, -3.41632080078125, -3.2261962890625, -3.03607177734375, -2.845947265625, -2.65582275390625, -2.4656982421875, -2.27557373046875, -2.08544921875, -1.89532470703125, -1.7052001953125, -1.51507568359375, -1.324951171875, -1.13482666015625, -0.9447021484375, -0.75457763671875, -0.564453125, -0.37432861328125, -0.1842041015625, 0.00592041015625, 0.196044921875, 0.38616943359375, 0.5762939453125, 0.76641845703125, 0.95654296875, 1.14666748046875, 1.3367919921875, 1.52691650390625, 1.717041015625, 1.90716552734375, 2.0972900390625, 2.28741455078125, 2.4775390625, 2.66766357421875, 2.8577880859375, 3.04791259765625, 3.238037109375, 3.42816162109375, 3.6182861328125, 3.80841064453125, 3.99853515625, 4.18865966796875, 4.3787841796875, 4.56890869140625, 4.759033203125, 4.94915771484375, 5.1392822265625, 5.32940673828125, 5.51953125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 4.0, 11.0, 13.0, 22.0, 38.0, 53.0, 85.0, 104.0, 162.0, 259.0, 335.0, 544.0, 812.0, 1220.0, 1765.0, 2726.0, 4092.0, 6293.0, 9476.0, 14258.0, 21554.0, 32900.0, 50527.0, 78691.0, 120162.0, 168292.0, 1214800.0, 127016.0, 83645.0, 54081.0, 35030.0, 22756.0, 15182.0, 10179.0, 6805.0, 4475.0, 2915.0, 1954.0, 1283.0, 888.0, 569.0, 347.0, 265.0, 190.0, 103.0, 69.0, 55.0, 54.0, 27.0, 17.0, 13.0, 4.0, 5.0, 0.0, 4.0, 3.0], "bins": [-1.00390625, -0.9744415283203125, -0.944976806640625, -0.9155120849609375, -0.88604736328125, -0.8565826416015625, -0.827117919921875, -0.7976531982421875, -0.7681884765625, -0.7387237548828125, -0.709259033203125, -0.6797943115234375, -0.65032958984375, -0.6208648681640625, -0.591400146484375, -0.5619354248046875, -0.532470703125, -0.5030059814453125, -0.473541259765625, -0.4440765380859375, -0.41461181640625, -0.3851470947265625, -0.355682373046875, -0.3262176513671875, -0.2967529296875, -0.2672882080078125, -0.237823486328125, -0.2083587646484375, -0.17889404296875, -0.1494293212890625, -0.119964599609375, -0.0904998779296875, -0.06103515625, -0.0315704345703125, -0.002105712890625, 0.0273590087890625, 0.05682373046875, 0.0862884521484375, 0.115753173828125, 0.1452178955078125, 0.1746826171875, 0.2041473388671875, 0.233612060546875, 0.2630767822265625, 0.29254150390625, 0.3220062255859375, 0.351470947265625, 0.3809356689453125, 0.410400390625, 0.4398651123046875, 0.469329833984375, 0.4987945556640625, 0.52825927734375, 0.5577239990234375, 0.587188720703125, 0.6166534423828125, 0.6461181640625, 0.6755828857421875, 0.705047607421875, 0.7345123291015625, 0.76397705078125, 0.7934417724609375, 0.822906494140625, 0.8523712158203125, 0.8818359375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 9.0, 13.0, 7.0, 9.0, 12.0, 13.0, 20.0, 27.0, 25.0, 36.0, 36.0, 46.0, 53.0, 62.0, 43.0, 54.0, 63.0, 50.0, 44.0, 51.0, 36.0, 43.0, 33.0, 30.0, 33.0, 26.0, 19.0, 22.0, 13.0, 18.0, 11.0, 6.0, 7.0, 6.0, 7.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00223541259765625, -0.0021665990352630615, -0.002097785472869873, -0.0020289719104766846, -0.001960158348083496, -0.0018913447856903076, -0.0018225312232971191, -0.0017537176609039307, -0.0016849040985107422, -0.0016160905361175537, -0.0015472769737243652, -0.0014784634113311768, -0.0014096498489379883, -0.0013408362865447998, -0.0012720227241516113, -0.0012032091617584229, -0.0011343955993652344, -0.001065582036972046, -0.0009967684745788574, -0.0009279549121856689, -0.0008591413497924805, -0.000790327787399292, -0.0007215142250061035, -0.000652700662612915, -0.0005838871002197266, -0.0005150735378265381, -0.0004462599754333496, -0.00037744641304016113, -0.00030863285064697266, -0.00023981928825378418, -0.0001710057258605957, -0.00010219216346740723, -3.337860107421875e-05, 3.5434961318969727e-05, 0.0001042485237121582, 0.00017306208610534668, 0.00024187564849853516, 0.00031068921089172363, 0.0003795027732849121, 0.0004483163356781006, 0.0005171298980712891, 0.0005859434604644775, 0.000654757022857666, 0.0007235705852508545, 0.000792384147644043, 0.0008611977100372314, 0.0009300112724304199, 0.0009988248348236084, 0.0010676383972167969, 0.0011364519596099854, 0.0012052655220031738, 0.0012740790843963623, 0.0013428926467895508, 0.0014117062091827393, 0.0014805197715759277, 0.0015493333339691162, 0.0016181468963623047, 0.0016869604587554932, 0.0017557740211486816, 0.0018245875835418701, 0.0018934011459350586, 0.001962214708328247, 0.0020310282707214355, 0.002099841833114624, 0.0021686553955078125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 6.0, 3.0, 4.0, 12.0, 7.0, 15.0, 9.0, 20.0, 24.0, 29.0, 34.0, 52.0, 53.0, 69.0, 90.0, 116.0, 154.0, 289.0, 500.0, 1308.0, 247902.0, 794110.0, 2116.0, 575.0, 330.0, 190.0, 128.0, 100.0, 61.0, 43.0, 45.0, 37.0, 33.0, 23.0, 16.0, 8.0, 11.0, 13.0, 2.0, 4.0, 7.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03936767578125, -0.03796672821044922, -0.03656578063964844, -0.035164833068847656, -0.033763885498046875, -0.032362937927246094, -0.030961990356445312, -0.02956104278564453, -0.02816009521484375, -0.02675914764404297, -0.025358200073242188, -0.023957252502441406, -0.022556304931640625, -0.021155357360839844, -0.019754409790039062, -0.01835346221923828, -0.0169525146484375, -0.015551567077636719, -0.014150619506835938, -0.012749671936035156, -0.011348724365234375, -0.009947776794433594, -0.008546829223632812, -0.007145881652832031, -0.00574493408203125, -0.004343986511230469, -0.0029430389404296875, -0.0015420913696289062, -0.000141143798828125, 0.0012598037719726562, 0.0026607513427734375, 0.004061698913574219, 0.005462646484375, 0.006863594055175781, 0.008264541625976562, 0.009665489196777344, 0.011066436767578125, 0.012467384338378906, 0.013868331909179688, 0.015269279479980469, 0.01667022705078125, 0.01807117462158203, 0.019472122192382812, 0.020873069763183594, 0.022274017333984375, 0.023674964904785156, 0.025075912475585938, 0.02647686004638672, 0.0278778076171875, 0.02927875518798828, 0.030679702758789062, 0.032080650329589844, 0.033481597900390625, 0.034882545471191406, 0.03628349304199219, 0.03768444061279297, 0.03908538818359375, 0.04048633575439453, 0.04188728332519531, 0.043288230895996094, 0.044689178466796875, 0.046090126037597656, 0.04749107360839844, 0.04889202117919922, 0.05029296875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 12.0, 73.0, 244.0, 398.0, 213.0, 70.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007948392070829868, -0.007796796038746834, -0.007645199541002512, -0.0074936035089194775, -0.007342007476836443, -0.007190410979092121, -0.007038814947009087, -0.006887218914926052, -0.00673562241718173, -0.006584026385098696, -0.006432429887354374, -0.006280833855271339, -0.006129237823188305, -0.005977641325443983, -0.0058260452933609486, -0.005674448795616627, -0.005522852763533592, -0.005371256731450558, -0.005219660233706236, -0.005068064201623201, -0.004916468169540167, -0.004764871671795845, -0.0046132756397128105, -0.004461679607629776, -0.0043100835755467415, -0.004158487543463707, -0.004006891045719385, -0.0038552950136363506, -0.0037036987487226725, -0.0035521024838089943, -0.0034005064517259598, -0.0032489101868122816, -0.00309731368906796, -0.0029457174241542816, -0.002794121392071247, -0.002642525127157569, -0.0024909288622438908, -0.0023393328301608562, -0.002187736565247178, -0.0020361403003335, -0.0018845441518351436, -0.0017329480033367872, -0.001581351738423109, -0.0014297555899247527, -0.0012781594414263964, -0.0011265631765127182, -0.0009749670280143619, -0.0008233707631006837, -0.0006717746146023273, -0.0005201784078963101, -0.0003685822302941233, -0.0002169860526919365, -6.538984598591924e-05, 8.620636072009802e-05, 0.00023780250921845436, 0.00038939877413213253, 0.0005409949226304889, 0.0006925911293365061, 0.0008441873360425234, 0.0009957834845408797, 0.001147379633039236, 0.0012989758979529142, 0.0014505720464512706, 0.0016021683113649487, 0.001753764459863305]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 8.0, 9.0, 5.0, 10.0, 9.0, 11.0, 10.0, 13.0, 15.0, 16.0, 20.0, 25.0, 28.0, 25.0, 36.0, 24.0, 33.0, 35.0, 31.0, 29.0, 36.0, 36.0, 35.0, 42.0, 39.0, 38.0, 35.0, 41.0, 32.0, 28.0, 32.0, 25.0, 28.0, 8.0, 24.0, 24.0, 13.0, 16.0, 17.0, 12.0, 8.0, 8.0, 6.0, 4.0, 3.0, 4.0, 3.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0], "bins": [-0.0011650919914245605, -0.0011296728625893593, -0.001094253733754158, -0.0010588346049189568, -0.0010234154760837555, -0.0009879963472485542, -0.000952577218413353, -0.0009171580895781517, -0.0008817389607429504, -0.0008463198319077492, -0.0008109007030725479, -0.0007754815742373466, -0.0007400624454021454, -0.0007046433165669441, -0.0006692241877317429, -0.0006338050588965416, -0.0005983859300613403, -0.0005629668012261391, -0.0005275476723909378, -0.0004921285435557365, -0.0004567094147205353, -0.000421290285885334, -0.00038587115705013275, -0.0003504520282149315, -0.0003150328993797302, -0.00027961377054452896, -0.0002441946417093277, -0.00020877551287412643, -0.00017335638403892517, -0.0001379372552037239, -0.00010251812636852264, -6.709899753332138e-05, -3.167986869812012e-05, 3.7392601370811462e-06, 3.915838897228241e-05, 7.457751780748367e-05, 0.00010999664664268494, 0.0001454157754778862, 0.00018083490431308746, 0.00021625403314828873, 0.00025167316198349, 0.00028709229081869125, 0.0003225114196538925, 0.0003579305484890938, 0.00039334967732429504, 0.0004287688061594963, 0.00046418793499469757, 0.0004996070638298988, 0.0005350261926651001, 0.0005704453215003014, 0.0006058644503355026, 0.0006412835791707039, 0.0006767027080059052, 0.0007121218368411064, 0.0007475409656763077, 0.0007829600945115089, 0.0008183792233467102, 0.0008537983521819115, 0.0008892174810171127, 0.000924636609852314, 0.0009600557386875153, 0.0009954748675227165, 0.0010308939963579178, 0.001066313125193119, 0.0011017322540283203]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 3.0, 7.0, 8.0, 10.0, 10.0, 15.0, 21.0, 10.0, 19.0, 22.0, 21.0, 34.0, 31.0, 38.0, 27.0, 41.0, 33.0, 40.0, 49.0, 47.0, 39.0, 40.0, 42.0, 35.0, 36.0, 35.0, 43.0, 29.0, 29.0, 29.0, 30.0, 14.0, 16.0, 10.0, 20.0, 10.0, 14.0, 6.0, 8.0, 9.0, 6.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.25, -9.9326171875, -9.615234375, -9.2978515625, -8.98046875, -8.6630859375, -8.345703125, -8.0283203125, -7.7109375, -7.3935546875, -7.076171875, -6.7587890625, -6.44140625, -6.1240234375, -5.806640625, -5.4892578125, -5.171875, -4.8544921875, -4.537109375, -4.2197265625, -3.90234375, -3.5849609375, -3.267578125, -2.9501953125, -2.6328125, -2.3154296875, -1.998046875, -1.6806640625, -1.36328125, -1.0458984375, -0.728515625, -0.4111328125, -0.09375, 0.2236328125, 0.541015625, 0.8583984375, 1.17578125, 1.4931640625, 1.810546875, 2.1279296875, 2.4453125, 2.7626953125, 3.080078125, 3.3974609375, 3.71484375, 4.0322265625, 4.349609375, 4.6669921875, 4.984375, 5.3017578125, 5.619140625, 5.9365234375, 6.25390625, 6.5712890625, 6.888671875, 7.2060546875, 7.5234375, 7.8408203125, 8.158203125, 8.4755859375, 8.79296875, 9.1103515625, 9.427734375, 9.7451171875, 10.0625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 8.0, 7.0, 7.0, 19.0, 16.0, 30.0, 32.0, 36.0, 48.0, 86.0, 113.0, 147.0, 219.0, 311.0, 594.0, 921.0, 1552.0, 2814.0, 5329.0, 10755.0, 24459.0, 70017.0, 278500.0, 462484.0, 121293.0, 37536.0, 15078.0, 7274.0, 3707.0, 2021.0, 1134.0, 697.0, 425.0, 266.0, 158.0, 109.0, 107.0, 85.0, 43.0, 32.0, 18.0, 26.0, 12.0, 9.0, 5.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.3828125, -11.006103515625, -10.62939453125, -10.252685546875, -9.8759765625, -9.499267578125, -9.12255859375, -8.745849609375, -8.369140625, -7.992431640625, -7.61572265625, -7.239013671875, -6.8623046875, -6.485595703125, -6.10888671875, -5.732177734375, -5.35546875, -4.978759765625, -4.60205078125, -4.225341796875, -3.8486328125, -3.471923828125, -3.09521484375, -2.718505859375, -2.341796875, -1.965087890625, -1.58837890625, -1.211669921875, -0.8349609375, -0.458251953125, -0.08154296875, 0.295166015625, 0.671875, 1.048583984375, 1.42529296875, 1.802001953125, 2.1787109375, 2.555419921875, 2.93212890625, 3.308837890625, 3.685546875, 4.062255859375, 4.43896484375, 4.815673828125, 5.1923828125, 5.569091796875, 5.94580078125, 6.322509765625, 6.69921875, 7.075927734375, 7.45263671875, 7.829345703125, 8.2060546875, 8.582763671875, 8.95947265625, 9.336181640625, 9.712890625, 10.089599609375, 10.46630859375, 10.843017578125, 11.2197265625, 11.596435546875, 11.97314453125, 12.349853515625, 12.7265625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 7.0, 11.0, 11.0, 10.0, 9.0, 16.0, 23.0, 28.0, 33.0, 34.0, 40.0, 47.0, 58.0, 71.0, 115.0, 287.0, 1547.0, 166.0, 92.0, 57.0, 60.0, 43.0, 40.0, 28.0, 40.0, 23.0, 37.0, 22.0, 9.0, 14.0, 13.0, 15.0, 5.0, 7.0, 3.0, 8.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.6875, -26.80322265625, -25.9189453125, -25.03466796875, -24.150390625, -23.26611328125, -22.3818359375, -21.49755859375, -20.61328125, -19.72900390625, -18.8447265625, -17.96044921875, -17.076171875, -16.19189453125, -15.3076171875, -14.42333984375, -13.5390625, -12.65478515625, -11.7705078125, -10.88623046875, -10.001953125, -9.11767578125, -8.2333984375, -7.34912109375, -6.46484375, -5.58056640625, -4.6962890625, -3.81201171875, -2.927734375, -2.04345703125, -1.1591796875, -0.27490234375, 0.609375, 1.49365234375, 2.3779296875, 3.26220703125, 4.146484375, 5.03076171875, 5.9150390625, 6.79931640625, 7.68359375, 8.56787109375, 9.4521484375, 10.33642578125, 11.220703125, 12.10498046875, 12.9892578125, 13.87353515625, 14.7578125, 15.64208984375, 16.5263671875, 17.41064453125, 18.294921875, 19.17919921875, 20.0634765625, 20.94775390625, 21.83203125, 22.71630859375, 23.6005859375, 24.48486328125, 25.369140625, 26.25341796875, 27.1376953125, 28.02197265625, 28.90625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 9.0, 6.0, 9.0, 12.0, 20.0, 26.0, 24.0, 47.0, 71.0, 80.0, 127.0, 195.0, 343.0, 720.0, 4236.0, 189868.0, 2932446.0, 15029.0, 1274.0, 458.0, 254.0, 135.0, 82.0, 60.0, 48.0, 32.0, 25.0, 24.0, 14.0, 8.0, 5.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-58.75, -56.92626953125, -55.1025390625, -53.27880859375, -51.455078125, -49.63134765625, -47.8076171875, -45.98388671875, -44.16015625, -42.33642578125, -40.5126953125, -38.68896484375, -36.865234375, -35.04150390625, -33.2177734375, -31.39404296875, -29.5703125, -27.74658203125, -25.9228515625, -24.09912109375, -22.275390625, -20.45166015625, -18.6279296875, -16.80419921875, -14.98046875, -13.15673828125, -11.3330078125, -9.50927734375, -7.685546875, -5.86181640625, -4.0380859375, -2.21435546875, -0.390625, 1.43310546875, 3.2568359375, 5.08056640625, 6.904296875, 8.72802734375, 10.5517578125, 12.37548828125, 14.19921875, 16.02294921875, 17.8466796875, 19.67041015625, 21.494140625, 23.31787109375, 25.1416015625, 26.96533203125, 28.7890625, 30.61279296875, 32.4365234375, 34.26025390625, 36.083984375, 37.90771484375, 39.7314453125, 41.55517578125, 43.37890625, 45.20263671875, 47.0263671875, 48.85009765625, 50.673828125, 52.49755859375, 54.3212890625, 56.14501953125, 57.96875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 8.0, 119.0, 506.0, 325.0, 55.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.15635681152344, -54.87336730957031, -50.59038162231445, -46.307395935058594, -42.02440643310547, -37.741416931152344, -33.458431243896484, -29.175443649291992, -24.8924560546875, -20.609468460083008, -16.326480865478516, -12.043493270874023, -7.760505676269531, -3.477518081665039, 0.8054695129394531, 5.088457107543945, 9.371444702148438, 13.65443229675293, 17.937419891357422, 22.220407485961914, 26.503395080566406, 30.7863826751709, 35.06937026977539, 39.35235595703125, 43.635345458984375, 47.9183349609375, 52.20132064819336, 56.48430633544922, 60.767295837402344, 65.05028533935547, 69.33326721191406, 73.61625671386719, 77.89923095703125, 82.18222045898438, 86.4652099609375, 90.7481918334961, 95.03118133544922, 99.31417083740234, 103.59715270996094, 107.88014221191406, 112.16313171386719, 116.44612121582031, 120.72911071777344, 125.01209259033203, 129.29507446289062, 133.57806396484375, 137.86105346679688, 142.14404296875, 146.42703247070312, 150.71002197265625, 154.99301147460938, 159.2760009765625, 163.55899047851562, 167.8419647216797, 172.1249542236328, 176.40794372558594, 180.69093322753906, 184.9739227294922, 189.2569122314453, 193.53990173339844, 197.8228759765625, 202.10586547851562, 206.38885498046875, 210.67184448242188, 214.954833984375]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 8.0, 15.0, 9.0, 20.0, 12.0, 23.0, 23.0, 44.0, 32.0, 30.0, 40.0, 45.0, 47.0, 49.0, 47.0, 52.0, 41.0, 60.0, 47.0, 44.0, 43.0, 39.0, 37.0, 30.0, 23.0, 23.0, 24.0, 20.0, 11.0, 14.0, 18.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-72.99568939208984, -70.92285919189453, -68.85002899169922, -66.7771987915039, -64.7043685913086, -62.63153839111328, -60.55870819091797, -58.485877990722656, -56.413047790527344, -54.34021759033203, -52.26738739013672, -50.194557189941406, -48.121726989746094, -46.04889678955078, -43.97606658935547, -41.903236389160156, -39.830406188964844, -37.75757598876953, -35.68474578857422, -33.611915588378906, -31.539085388183594, -29.46625518798828, -27.39342498779297, -25.320594787597656, -23.247764587402344, -21.17493438720703, -19.10210418701172, -17.029273986816406, -14.956443786621094, -12.883613586425781, -10.810783386230469, -8.737953186035156, -6.6651153564453125, -4.59228515625, -2.5194549560546875, -0.446624755859375, 1.6262054443359375, 3.69903564453125, 5.7718658447265625, 7.844696044921875, 9.917526245117188, 11.9903564453125, 14.063186645507812, 16.136016845703125, 18.208847045898438, 20.28167724609375, 22.354507446289062, 24.427337646484375, 26.500167846679688, 28.572998046875, 30.645828247070312, 32.718658447265625, 34.79148864746094, 36.86431884765625, 38.93714904785156, 41.009979248046875, 43.08280944824219, 45.1556396484375, 47.22846984863281, 49.301300048828125, 51.37413024902344, 53.44696044921875, 55.51979064941406, 57.592620849609375, 59.66545104980469]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 11.0, 6.0, 6.0, 10.0, 16.0, 11.0, 15.0, 21.0, 19.0, 20.0, 33.0, 27.0, 34.0, 25.0, 41.0, 39.0, 55.0, 37.0, 43.0, 37.0, 49.0, 42.0, 40.0, 41.0, 40.0, 42.0, 24.0, 29.0, 27.0, 23.0, 25.0, 17.0, 17.0, 13.0, 16.0, 8.0, 11.0, 7.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.828125, -10.4949951171875, -10.161865234375, -9.8287353515625, -9.49560546875, -9.1624755859375, -8.829345703125, -8.4962158203125, -8.1630859375, -7.8299560546875, -7.496826171875, -7.1636962890625, -6.83056640625, -6.4974365234375, -6.164306640625, -5.8311767578125, -5.498046875, -5.1649169921875, -4.831787109375, -4.4986572265625, -4.16552734375, -3.8323974609375, -3.499267578125, -3.1661376953125, -2.8330078125, -2.4998779296875, -2.166748046875, -1.8336181640625, -1.50048828125, -1.1673583984375, -0.834228515625, -0.5010986328125, -0.16796875, 0.1651611328125, 0.498291015625, 0.8314208984375, 1.16455078125, 1.4976806640625, 1.830810546875, 2.1639404296875, 2.4970703125, 2.8302001953125, 3.163330078125, 3.4964599609375, 3.82958984375, 4.1627197265625, 4.495849609375, 4.8289794921875, 5.162109375, 5.4952392578125, 5.828369140625, 6.1614990234375, 6.49462890625, 6.8277587890625, 7.160888671875, 7.4940185546875, 7.8271484375, 8.1602783203125, 8.493408203125, 8.8265380859375, 9.15966796875, 9.4927978515625, 9.825927734375, 10.1590576171875, 10.4921875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 8.0, 9.0, 4.0, 3.0, 7.0, 12.0, 19.0, 21.0, 29.0, 24.0, 29.0, 46.0, 58.0, 75.0, 105.0, 116.0, 182.0, 228.0, 318.0, 332.0, 668.0, 140443.0, 4048918.0, 835.0, 393.0, 345.0, 248.0, 214.0, 152.0, 79.0, 86.0, 60.0, 51.0, 36.0, 20.0, 19.0, 25.0, 17.0, 14.0, 8.0, 13.0, 3.0, 4.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-231.75, -224.955078125, -218.16015625, -211.365234375, -204.5703125, -197.775390625, -190.98046875, -184.185546875, -177.390625, -170.595703125, -163.80078125, -157.005859375, -150.2109375, -143.416015625, -136.62109375, -129.826171875, -123.03125, -116.236328125, -109.44140625, -102.646484375, -95.8515625, -89.056640625, -82.26171875, -75.466796875, -68.671875, -61.876953125, -55.08203125, -48.287109375, -41.4921875, -34.697265625, -27.90234375, -21.107421875, -14.3125, -7.517578125, -0.72265625, 6.072265625, 12.8671875, 19.662109375, 26.45703125, 33.251953125, 40.046875, 46.841796875, 53.63671875, 60.431640625, 67.2265625, 74.021484375, 80.81640625, 87.611328125, 94.40625, 101.201171875, 107.99609375, 114.791015625, 121.5859375, 128.380859375, 135.17578125, 141.970703125, 148.765625, 155.560546875, 162.35546875, 169.150390625, 175.9453125, 182.740234375, 189.53515625, 196.330078125, 203.125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 9.0, 12.0, 12.0, 11.0, 13.0, 25.0, 25.0, 41.0, 36.0, 60.0, 79.0, 106.0, 165.0, 270.0, 420.0, 594.0, 638.0, 544.0, 305.0, 200.0, 152.0, 103.0, 67.0, 42.0, 40.0, 28.0, 22.0, 16.0, 10.0, 8.0, 6.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.296875, -14.790283203125, -14.28369140625, -13.777099609375, -13.2705078125, -12.763916015625, -12.25732421875, -11.750732421875, -11.244140625, -10.737548828125, -10.23095703125, -9.724365234375, -9.2177734375, -8.711181640625, -8.20458984375, -7.697998046875, -7.19140625, -6.684814453125, -6.17822265625, -5.671630859375, -5.1650390625, -4.658447265625, -4.15185546875, -3.645263671875, -3.138671875, -2.632080078125, -2.12548828125, -1.618896484375, -1.1123046875, -0.605712890625, -0.09912109375, 0.407470703125, 0.9140625, 1.420654296875, 1.92724609375, 2.433837890625, 2.9404296875, 3.447021484375, 3.95361328125, 4.460205078125, 4.966796875, 5.473388671875, 5.97998046875, 6.486572265625, 6.9931640625, 7.499755859375, 8.00634765625, 8.512939453125, 9.01953125, 9.526123046875, 10.03271484375, 10.539306640625, 11.0458984375, 11.552490234375, 12.05908203125, 12.565673828125, 13.072265625, 13.578857421875, 14.08544921875, 14.592041015625, 15.0986328125, 15.605224609375, 16.11181640625, 16.618408203125, 17.125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 2.0, 2.0, 4.0, 9.0, 7.0, 15.0, 18.0, 19.0, 18.0, 18.0, 28.0, 39.0, 45.0, 66.0, 64.0, 139.0, 725.0, 802513.0, 3388899.0, 1027.0, 168.0, 97.0, 54.0, 72.0, 42.0, 38.0, 35.0, 27.0, 21.0, 18.0, 18.0, 8.0, 5.0, 6.0, 5.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.9375, -116.7744140625, -112.611328125, -108.4482421875, -104.28515625, -100.1220703125, -95.958984375, -91.7958984375, -87.6328125, -83.4697265625, -79.306640625, -75.1435546875, -70.98046875, -66.8173828125, -62.654296875, -58.4912109375, -54.328125, -50.1650390625, -46.001953125, -41.8388671875, -37.67578125, -33.5126953125, -29.349609375, -25.1865234375, -21.0234375, -16.8603515625, -12.697265625, -8.5341796875, -4.37109375, -0.2080078125, 3.955078125, 8.1181640625, 12.28125, 16.4443359375, 20.607421875, 24.7705078125, 28.93359375, 33.0966796875, 37.259765625, 41.4228515625, 45.5859375, 49.7490234375, 53.912109375, 58.0751953125, 62.23828125, 66.4013671875, 70.564453125, 74.7275390625, 78.890625, 83.0537109375, 87.216796875, 91.3798828125, 95.54296875, 99.7060546875, 103.869140625, 108.0322265625, 112.1953125, 116.3583984375, 120.521484375, 124.6845703125, 128.84765625, 133.0107421875, 137.173828125, 141.3369140625, 145.5]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 11.0, 75.0, 508.0, 378.0, 42.0, 1.0, 1.0], "bins": [-468.31292724609375, -460.4886169433594, -452.664306640625, -444.8399658203125, -437.0156555175781, -429.19134521484375, -421.3670349121094, -413.542724609375, -405.7183837890625, -397.8940734863281, -390.06976318359375, -382.24542236328125, -374.4211120605469, -366.5968017578125, -358.7724914550781, -350.94818115234375, -343.12384033203125, -335.2995300292969, -327.4752197265625, -319.65087890625, -311.8265686035156, -304.00225830078125, -296.1779479980469, -288.3536376953125, -280.5293273925781, -272.70501708984375, -264.8807067871094, -257.0563659667969, -249.2320556640625, -241.40774536132812, -233.58343505859375, -225.7591094970703, -217.93478393554688, -210.1104736328125, -202.28614807128906, -194.4618377685547, -186.63751220703125, -178.81320190429688, -170.9888916015625, -163.16456604003906, -155.3402557373047, -147.5159454345703, -139.69161987304688, -131.8673095703125, -124.04298400878906, -116.21867370605469, -108.39435577392578, -100.57003784179688, -92.74571990966797, -84.92140197753906, -77.09708404541016, -69.27276611328125, -61.44845199584961, -53.6241340637207, -45.79981994628906, -37.975502014160156, -30.15118408203125, -22.326866149902344, -14.50255012512207, -6.678234100341797, 1.1460838317871094, 8.970401763916016, 16.794715881347656, 24.619033813476562, 32.44335174560547]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 10.0, 5.0, 9.0, 5.0, 5.0, 12.0, 10.0, 16.0, 21.0, 15.0, 12.0, 18.0, 23.0, 15.0, 24.0, 26.0, 36.0, 37.0, 43.0, 39.0, 35.0, 35.0, 41.0, 30.0, 39.0, 36.0, 31.0, 36.0, 30.0, 32.0, 23.0, 33.0, 34.0, 29.0, 28.0, 19.0, 17.0, 21.0, 10.0, 10.0, 6.0, 11.0, 8.0, 8.0, 3.0, 3.0, 6.0, 2.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-42.38567352294922, -40.97593307495117, -39.566192626953125, -38.15644836425781, -36.746707916259766, -35.33696746826172, -33.92722702026367, -32.517486572265625, -31.107744216918945, -29.6980037689209, -28.28826141357422, -26.878520965576172, -25.468780517578125, -24.059038162231445, -22.6492977142334, -21.23955535888672, -19.829814910888672, -18.420074462890625, -17.010332107543945, -15.600591659545898, -14.190850257873535, -12.781108856201172, -11.371368408203125, -9.961627006530762, -8.551885604858398, -7.142144203186035, -5.73240327835083, -4.322662353515625, -2.9129209518432617, -1.5031795501708984, -0.09343910217285156, 1.3163022994995117, 2.7260475158691406, 4.135788917541504, 5.545529842376709, 6.955270767211914, 8.365012168884277, 9.77475357055664, 11.184494018554688, 12.59423542022705, 14.003976821899414, 15.413718223571777, 16.82345962524414, 18.233200073242188, 19.642940521240234, 21.052682876586914, 22.46242332458496, 23.87216567993164, 25.281906127929688, 26.691646575927734, 28.101388931274414, 29.51112937927246, 30.92087173461914, 32.33061218261719, 33.740352630615234, 35.15009307861328, 36.559837341308594, 37.96957778930664, 39.37931823730469, 40.7890625, 42.19880294799805, 43.608543395996094, 45.01828384399414, 46.42802429199219, 47.837764739990234]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 5.0, 5.0, 6.0, 10.0, 12.0, 17.0, 15.0, 16.0, 19.0, 21.0, 24.0, 34.0, 25.0, 42.0, 39.0, 36.0, 38.0, 42.0, 47.0, 27.0, 39.0, 45.0, 46.0, 46.0, 45.0, 40.0, 32.0, 32.0, 28.0, 19.0, 27.0, 29.0, 20.0, 12.0, 9.0, 15.0, 10.0, 10.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.046875, -10.7147216796875, -10.382568359375, -10.0504150390625, -9.71826171875, -9.3861083984375, -9.053955078125, -8.7218017578125, -8.3896484375, -8.0574951171875, -7.725341796875, -7.3931884765625, -7.06103515625, -6.7288818359375, -6.396728515625, -6.0645751953125, -5.732421875, -5.4002685546875, -5.068115234375, -4.7359619140625, -4.40380859375, -4.0716552734375, -3.739501953125, -3.4073486328125, -3.0751953125, -2.7430419921875, -2.410888671875, -2.0787353515625, -1.74658203125, -1.4144287109375, -1.082275390625, -0.7501220703125, -0.41796875, -0.0858154296875, 0.246337890625, 0.5784912109375, 0.91064453125, 1.2427978515625, 1.574951171875, 1.9071044921875, 2.2392578125, 2.5714111328125, 2.903564453125, 3.2357177734375, 3.56787109375, 3.9000244140625, 4.232177734375, 4.5643310546875, 4.896484375, 5.2286376953125, 5.560791015625, 5.8929443359375, 6.22509765625, 6.5572509765625, 6.889404296875, 7.2215576171875, 7.5537109375, 7.8858642578125, 8.218017578125, 8.5501708984375, 8.88232421875, 9.2144775390625, 9.546630859375, 9.8787841796875, 10.2109375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 14.0, 24.0, 37.0, 49.0, 72.0, 101.0, 186.0, 276.0, 446.0, 683.0, 1131.0, 1712.0, 2588.0, 3993.0, 6534.0, 9926.0, 15844.0, 25360.0, 40791.0, 65622.0, 105525.0, 160710.0, 194339.0, 151317.0, 97960.0, 61174.0, 38125.0, 23619.0, 14774.0, 9268.0, 5929.0, 3695.0, 2423.0, 1560.0, 1005.0, 588.0, 418.0, 265.0, 178.0, 95.0, 66.0, 38.0, 41.0, 21.0, 15.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1259765625, -1.09228515625, -1.05859375, -1.02490234375, -0.9912109375, -0.95751953125, -0.923828125, -0.89013671875, -0.8564453125, -0.82275390625, -0.7890625, -0.75537109375, -0.7216796875, -0.68798828125, -0.654296875, -0.62060546875, -0.5869140625, -0.55322265625, -0.51953125, -0.48583984375, -0.4521484375, -0.41845703125, -0.384765625, -0.35107421875, -0.3173828125, -0.28369140625, -0.25, -0.21630859375, -0.1826171875, -0.14892578125, -0.115234375, -0.08154296875, -0.0478515625, -0.01416015625, 0.01953125, 0.05322265625, 0.0869140625, 0.12060546875, 0.154296875, 0.18798828125, 0.2216796875, 0.25537109375, 0.2890625, 0.32275390625, 0.3564453125, 0.39013671875, 0.423828125, 0.45751953125, 0.4912109375, 0.52490234375, 0.55859375, 0.59228515625, 0.6259765625, 0.65966796875, 0.693359375, 0.72705078125, 0.7607421875, 0.79443359375, 0.828125, 0.86181640625, 0.8955078125, 0.92919921875, 0.962890625, 0.99658203125, 1.0302734375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 4.0, 8.0, 8.0, 12.0, 12.0, 17.0, 18.0, 25.0, 16.0, 28.0, 24.0, 33.0, 31.0, 28.0, 45.0, 44.0, 32.0, 49.0, 40.0, 1058.0, 58.0, 44.0, 48.0, 46.0, 40.0, 33.0, 32.0, 25.0, 24.0, 15.0, 23.0, 25.0, 18.0, 15.0, 9.0, 11.0, 9.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-7.8046875, -7.5880126953125, -7.371337890625, -7.1546630859375, -6.93798828125, -6.7213134765625, -6.504638671875, -6.2879638671875, -6.0712890625, -5.8546142578125, -5.637939453125, -5.4212646484375, -5.20458984375, -4.9879150390625, -4.771240234375, -4.5545654296875, -4.337890625, -4.1212158203125, -3.904541015625, -3.6878662109375, -3.47119140625, -3.2545166015625, -3.037841796875, -2.8211669921875, -2.6044921875, -2.3878173828125, -2.171142578125, -1.9544677734375, -1.73779296875, -1.5211181640625, -1.304443359375, -1.0877685546875, -0.87109375, -0.6544189453125, -0.437744140625, -0.2210693359375, -0.00439453125, 0.2122802734375, 0.428955078125, 0.6456298828125, 0.8623046875, 1.0789794921875, 1.295654296875, 1.5123291015625, 1.72900390625, 1.9456787109375, 2.162353515625, 2.3790283203125, 2.595703125, 2.8123779296875, 3.029052734375, 3.2457275390625, 3.46240234375, 3.6790771484375, 3.895751953125, 4.1124267578125, 4.3291015625, 4.5457763671875, 4.762451171875, 4.9791259765625, 5.19580078125, 5.4124755859375, 5.629150390625, 5.8458251953125, 6.0625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 7.0, 3.0, 5.0, 4.0, 11.0, 18.0, 27.0, 39.0, 67.0, 84.0, 139.0, 202.0, 243.0, 381.0, 554.0, 796.0, 1206.0, 1700.0, 2490.0, 3704.0, 5372.0, 7733.0, 11498.0, 16733.0, 24830.0, 37412.0, 55396.0, 81638.0, 118778.0, 793652.0, 561276.0, 117859.0, 82129.0, 55298.0, 37238.0, 25055.0, 16822.0, 11733.0, 7842.0, 5284.0, 3704.0, 2511.0, 1787.0, 1186.0, 883.0, 615.0, 348.0, 256.0, 195.0, 128.0, 77.0, 55.0, 56.0, 28.0, 20.0, 22.0, 5.0, 7.0, 6.0, 2.0], "bins": [-0.87744140625, -0.8516311645507812, -0.8258209228515625, -0.8000106811523438, -0.774200439453125, -0.7483901977539062, -0.7225799560546875, -0.6967697143554688, -0.67095947265625, -0.6451492309570312, -0.6193389892578125, -0.5935287475585938, -0.567718505859375, -0.5419082641601562, -0.5160980224609375, -0.49028778076171875, -0.4644775390625, -0.43866729736328125, -0.4128570556640625, -0.38704681396484375, -0.361236572265625, -0.33542633056640625, -0.3096160888671875, -0.28380584716796875, -0.25799560546875, -0.23218536376953125, -0.2063751220703125, -0.18056488037109375, -0.154754638671875, -0.12894439697265625, -0.1031341552734375, -0.07732391357421875, -0.051513671875, -0.02570343017578125, 0.0001068115234375, 0.02591705322265625, 0.051727294921875, 0.07753753662109375, 0.1033477783203125, 0.12915802001953125, 0.15496826171875, 0.18077850341796875, 0.2065887451171875, 0.23239898681640625, 0.258209228515625, 0.28401947021484375, 0.3098297119140625, 0.33563995361328125, 0.3614501953125, 0.38726043701171875, 0.4130706787109375, 0.43888092041015625, 0.464691162109375, 0.49050140380859375, 0.5163116455078125, 0.5421218872070312, 0.56793212890625, 0.5937423706054688, 0.6195526123046875, 0.6453628540039062, 0.671173095703125, 0.6969833374023438, 0.7227935791015625, 0.7486038208007812, 0.7744140625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 9.0, 6.0, 12.0, 9.0, 13.0, 14.0, 16.0, 26.0, 26.0, 32.0, 36.0, 37.0, 57.0, 49.0, 57.0, 55.0, 66.0, 46.0, 63.0, 58.0, 47.0, 45.0, 35.0, 39.0, 30.0, 17.0, 18.0, 17.0, 9.0, 10.0, 6.0, 7.0, 6.0, 4.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024318695068359375, -0.002347797155380249, -0.0022637248039245605, -0.002179652452468872, -0.0020955801010131836, -0.002011507749557495, -0.0019274353981018066, -0.0018433630466461182, -0.0017592906951904297, -0.0016752183437347412, -0.0015911459922790527, -0.0015070736408233643, -0.0014230012893676758, -0.0013389289379119873, -0.0012548565864562988, -0.0011707842350006104, -0.0010867118835449219, -0.0010026395320892334, -0.0009185671806335449, -0.0008344948291778564, -0.000750422477722168, -0.0006663501262664795, -0.000582277774810791, -0.0004982054233551025, -0.00041413307189941406, -0.0003300607204437256, -0.0002459883689880371, -0.00016191601753234863, -7.784366607666016e-05, 6.22868537902832e-06, 9.03010368347168e-05, 0.00017437338829040527, 0.00025844573974609375, 0.0003425180912017822, 0.0004265904426574707, 0.0005106627941131592, 0.0005947351455688477, 0.0006788074970245361, 0.0007628798484802246, 0.0008469521999359131, 0.0009310245513916016, 0.00101509690284729, 0.0010991692543029785, 0.001183241605758667, 0.0012673139572143555, 0.001351386308670044, 0.0014354586601257324, 0.001519531011581421, 0.0016036033630371094, 0.0016876757144927979, 0.0017717480659484863, 0.0018558204174041748, 0.0019398927688598633, 0.0020239651203155518, 0.0021080374717712402, 0.0021921098232269287, 0.002276182174682617, 0.0023602545261383057, 0.002444326877593994, 0.0025283992290496826, 0.002612471580505371, 0.0026965439319610596, 0.002780616283416748, 0.0028646886348724365, 0.002948760986328125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 9.0, 4.0, 6.0, 13.0, 14.0, 11.0, 11.0, 16.0, 24.0, 29.0, 30.0, 37.0, 54.0, 79.0, 124.0, 144.0, 208.0, 334.0, 515.0, 1101.0, 70705.0, 970023.0, 2844.0, 771.0, 437.0, 250.0, 181.0, 134.0, 101.0, 82.0, 70.0, 41.0, 28.0, 26.0, 19.0, 15.0, 13.0, 5.0, 16.0, 8.0, 8.0, 2.0, 2.0, 3.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.051422119140625, -0.04996299743652344, -0.048503875732421875, -0.04704475402832031, -0.04558563232421875, -0.04412651062011719, -0.042667388916015625, -0.04120826721191406, -0.0397491455078125, -0.03829002380371094, -0.036830902099609375, -0.03537178039550781, -0.03391265869140625, -0.03245353698730469, -0.030994415283203125, -0.029535293579101562, -0.028076171875, -0.026617050170898438, -0.025157928466796875, -0.023698806762695312, -0.02223968505859375, -0.020780563354492188, -0.019321441650390625, -0.017862319946289062, -0.0164031982421875, -0.014944076538085938, -0.013484954833984375, -0.012025833129882812, -0.01056671142578125, -0.009107589721679688, -0.007648468017578125, -0.0061893463134765625, -0.004730224609375, -0.0032711029052734375, -0.001811981201171875, -0.0003528594970703125, 0.00110626220703125, 0.0025653839111328125, 0.004024505615234375, 0.0054836273193359375, 0.0069427490234375, 0.008401870727539062, 0.009860992431640625, 0.011320114135742188, 0.01277923583984375, 0.014238357543945312, 0.015697479248046875, 0.017156600952148438, 0.01861572265625, 0.020074844360351562, 0.021533966064453125, 0.022993087768554688, 0.02445220947265625, 0.025911331176757812, 0.027370452880859375, 0.028829574584960938, 0.0302886962890625, 0.03174781799316406, 0.033206939697265625, 0.03466606140136719, 0.03612518310546875, 0.03758430480957031, 0.039043426513671875, 0.04050254821777344, 0.041961669921875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 44.0, 239.0, 423.0, 245.0, 41.0, 13.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0036159211304038763, -0.003455694764852524, -0.0032954683993011713, -0.003135242033749819, -0.0029750156681984663, -0.002814789302647114, -0.0026545627042651176, -0.002494336571544409, -0.0023341099731624126, -0.00217388360761106, -0.0020136572420597076, -0.0018534308765083551, -0.0016932045109570026, -0.0015329781454056501, -0.0013727516634389758, -0.0012125252978876233, -0.0010522990487515926, -0.0008920726832002401, -0.0007318463176488876, -0.0005716198938898742, -0.0004113935283385217, -0.0002511671627871692, -9.09407390281558e-05, 6.92856265231967e-05, 0.0002295119920745492, 0.0003897383576259017, 0.0005499647231772542, 0.0007101911469362676, 0.0008704175124876201, 0.0010306439362466335, 0.001190870301797986, 0.0013510966673493385, 0.0015113232657313347, 0.0016715496312826872, 0.0018317759968340397, 0.001992002362385392, 0.0021522287279367447, 0.002312455093488097, 0.0024726814590394497, 0.002632908057421446, 0.0027931341901421547, 0.002953360555693507, 0.0031135869212448597, 0.003273813286796212, 0.0034340396523475647, 0.003594266017898917, 0.0037544923834502697, 0.003914718981832266, 0.004074945114552975, 0.004235171712934971, 0.00439539784565568, 0.004555624444037676, 0.004715850576758385, 0.004876077175140381, 0.00503630330786109, 0.005196529906243086, 0.005356756504625082, 0.005516983103007078, 0.005677209235727787, 0.005837435834109783, 0.005997661966830492, 0.006157888565212488, 0.006318114697933197, 0.006478341296315193, 0.006638567429035902]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 3.0, 7.0, 8.0, 8.0, 12.0, 11.0, 19.0, 17.0, 18.0, 28.0, 32.0, 20.0, 25.0, 24.0, 33.0, 28.0, 40.0, 40.0, 45.0, 35.0, 46.0, 41.0, 24.0, 46.0, 42.0, 29.0, 44.0, 33.0, 28.0, 39.0, 23.0, 23.0, 23.0, 28.0, 13.0, 12.0, 12.0, 11.0, 7.0, 2.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014730095863342285, -0.0014281775802373886, -0.0013833455741405487, -0.0013385135680437088, -0.001293681561946869, -0.001248849555850029, -0.001204017549753189, -0.0011591855436563492, -0.0011143535375595093, -0.0010695215314626694, -0.0010246895253658295, -0.0009798575192689896, -0.0009350255131721497, -0.0008901935070753098, -0.0008453615009784698, -0.0008005294948816299, -0.00075569748878479, -0.0007108654826879501, -0.0006660334765911102, -0.0006212014704942703, -0.0005763694643974304, -0.0005315374583005905, -0.0004867054522037506, -0.0004418734461069107, -0.0003970414400100708, -0.0003522094339132309, -0.000307377427816391, -0.0002625454217195511, -0.00021771341562271118, -0.00017288140952587128, -0.00012804940342903137, -8.321739733219147e-05, -3.838539123535156e-05, 6.446614861488342e-06, 5.127862095832825e-05, 9.611062705516815e-05, 0.00014094263315200806, 0.00018577463924884796, 0.00023060664534568787, 0.00027543865144252777, 0.0003202706575393677, 0.0003651026636362076, 0.0004099346697330475, 0.0004547666758298874, 0.0004995986819267273, 0.0005444306880235672, 0.0005892626941204071, 0.000634094700217247, 0.0006789267063140869, 0.0007237587124109268, 0.0007685907185077667, 0.0008134227246046066, 0.0008582547307014465, 0.0009030867367982864, 0.0009479187428951263, 0.0009927507489919662, 0.0010375827550888062, 0.001082414761185646, 0.001127246767282486, 0.0011720787733793259, 0.0012169107794761658, 0.0012617427855730057, 0.0013065747916698456, 0.0013514067977666855, 0.0013962388038635254]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 5.0, 5.0, 6.0, 10.0, 12.0, 17.0, 15.0, 16.0, 19.0, 21.0, 24.0, 34.0, 25.0, 42.0, 39.0, 36.0, 38.0, 42.0, 47.0, 27.0, 39.0, 45.0, 46.0, 46.0, 45.0, 40.0, 32.0, 32.0, 28.0, 19.0, 27.0, 29.0, 20.0, 12.0, 9.0, 15.0, 10.0, 10.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.046875, -10.7147216796875, -10.382568359375, -10.0504150390625, -9.71826171875, -9.3861083984375, -9.053955078125, -8.7218017578125, -8.3896484375, -8.0574951171875, -7.725341796875, -7.3931884765625, -7.06103515625, -6.7288818359375, -6.396728515625, -6.0645751953125, -5.732421875, -5.4002685546875, -5.068115234375, -4.7359619140625, -4.40380859375, -4.0716552734375, -3.739501953125, -3.4073486328125, -3.0751953125, -2.7430419921875, -2.410888671875, -2.0787353515625, -1.74658203125, -1.4144287109375, -1.082275390625, -0.7501220703125, -0.41796875, -0.0858154296875, 0.246337890625, 0.5784912109375, 0.91064453125, 1.2427978515625, 1.574951171875, 1.9071044921875, 2.2392578125, 2.5714111328125, 2.903564453125, 3.2357177734375, 3.56787109375, 3.9000244140625, 4.232177734375, 4.5643310546875, 4.896484375, 5.2286376953125, 5.560791015625, 5.8929443359375, 6.22509765625, 6.5572509765625, 6.889404296875, 7.2215576171875, 7.5537109375, 7.8858642578125, 8.218017578125, 8.5501708984375, 8.88232421875, 9.2144775390625, 9.546630859375, 9.8787841796875, 10.2109375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 8.0, 7.0, 10.0, 16.0, 26.0, 31.0, 52.0, 56.0, 112.0, 116.0, 170.0, 215.0, 317.0, 376.0, 501.0, 676.0, 874.0, 1237.0, 2010.0, 4060.0, 13779.0, 79469.0, 487388.0, 379450.0, 57082.0, 10627.0, 3560.0, 1797.0, 1145.0, 836.0, 627.0, 513.0, 342.0, 262.0, 222.0, 167.0, 111.0, 90.0, 69.0, 44.0, 27.0, 28.0, 10.0, 7.0, 13.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.09375, -16.55810546875, -16.0224609375, -15.48681640625, -14.951171875, -14.41552734375, -13.8798828125, -13.34423828125, -12.80859375, -12.27294921875, -11.7373046875, -11.20166015625, -10.666015625, -10.13037109375, -9.5947265625, -9.05908203125, -8.5234375, -7.98779296875, -7.4521484375, -6.91650390625, -6.380859375, -5.84521484375, -5.3095703125, -4.77392578125, -4.23828125, -3.70263671875, -3.1669921875, -2.63134765625, -2.095703125, -1.56005859375, -1.0244140625, -0.48876953125, 0.046875, 0.58251953125, 1.1181640625, 1.65380859375, 2.189453125, 2.72509765625, 3.2607421875, 3.79638671875, 4.33203125, 4.86767578125, 5.4033203125, 5.93896484375, 6.474609375, 7.01025390625, 7.5458984375, 8.08154296875, 8.6171875, 9.15283203125, 9.6884765625, 10.22412109375, 10.759765625, 11.29541015625, 11.8310546875, 12.36669921875, 12.90234375, 13.43798828125, 13.9736328125, 14.50927734375, 15.044921875, 15.58056640625, 16.1162109375, 16.65185546875, 17.1875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 4.0, 7.0, 13.0, 10.0, 13.0, 30.0, 25.0, 29.0, 39.0, 52.0, 54.0, 50.0, 96.0, 197.0, 1719.0, 227.0, 96.0, 78.0, 57.0, 44.0, 45.0, 29.0, 30.0, 28.0, 16.0, 12.0, 14.0, 9.0, 5.0, 2.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.96875, -34.9267578125, -33.884765625, -32.8427734375, -31.80078125, -30.7587890625, -29.716796875, -28.6748046875, -27.6328125, -26.5908203125, -25.548828125, -24.5068359375, -23.46484375, -22.4228515625, -21.380859375, -20.3388671875, -19.296875, -18.2548828125, -17.212890625, -16.1708984375, -15.12890625, -14.0869140625, -13.044921875, -12.0029296875, -10.9609375, -9.9189453125, -8.876953125, -7.8349609375, -6.79296875, -5.7509765625, -4.708984375, -3.6669921875, -2.625, -1.5830078125, -0.541015625, 0.5009765625, 1.54296875, 2.5849609375, 3.626953125, 4.6689453125, 5.7109375, 6.7529296875, 7.794921875, 8.8369140625, 9.87890625, 10.9208984375, 11.962890625, 13.0048828125, 14.046875, 15.0888671875, 16.130859375, 17.1728515625, 18.21484375, 19.2568359375, 20.298828125, 21.3408203125, 22.3828125, 23.4248046875, 24.466796875, 25.5087890625, 26.55078125, 27.5927734375, 28.634765625, 29.6767578125, 30.71875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 5.0, 8.0, 12.0, 6.0, 9.0, 17.0, 13.0, 17.0, 18.0, 33.0, 48.0, 41.0, 66.0, 127.0, 184.0, 335.0, 578.0, 1621.0, 269805.0, 2868959.0, 2124.0, 718.0, 325.0, 174.0, 130.0, 90.0, 58.0, 39.0, 35.0, 22.0, 17.0, 11.0, 9.0, 5.0, 7.0, 12.0, 5.0, 7.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-77.0625, -74.501953125, -71.94140625, -69.380859375, -66.8203125, -64.259765625, -61.69921875, -59.138671875, -56.578125, -54.017578125, -51.45703125, -48.896484375, -46.3359375, -43.775390625, -41.21484375, -38.654296875, -36.09375, -33.533203125, -30.97265625, -28.412109375, -25.8515625, -23.291015625, -20.73046875, -18.169921875, -15.609375, -13.048828125, -10.48828125, -7.927734375, -5.3671875, -2.806640625, -0.24609375, 2.314453125, 4.875, 7.435546875, 9.99609375, 12.556640625, 15.1171875, 17.677734375, 20.23828125, 22.798828125, 25.359375, 27.919921875, 30.48046875, 33.041015625, 35.6015625, 38.162109375, 40.72265625, 43.283203125, 45.84375, 48.404296875, 50.96484375, 53.525390625, 56.0859375, 58.646484375, 61.20703125, 63.767578125, 66.328125, 68.888671875, 71.44921875, 74.009765625, 76.5703125, 79.130859375, 81.69140625, 84.251953125, 86.8125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 191.0, 796.0, 26.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-317.7523193359375, -307.25811767578125, -296.763916015625, -286.2696838378906, -275.7754821777344, -265.2812805175781, -254.78707885742188, -244.29287719726562, -233.7986602783203, -223.30445861816406, -212.81024169921875, -202.3160400390625, -191.82183837890625, -181.32762145996094, -170.8334197998047, -160.33920288085938, -149.84500122070312, -139.35079956054688, -128.85658264160156, -118.36238098144531, -107.86817169189453, -97.37396240234375, -86.8797607421875, -76.38555145263672, -65.89134216308594, -55.397132873535156, -44.90292739868164, -34.408721923828125, -23.914512634277344, -13.420303344726562, -2.926097869873047, 7.568107604980469, 18.062286376953125, 28.556493759155273, 39.05070114135742, 49.54490661621094, 60.03911590576172, 70.5333251953125, 81.02752685546875, 91.52173614501953, 102.01594543457031, 112.5101547241211, 123.00436401367188, 133.49856567382812, 143.99276733398438, 154.4869842529297, 164.98118591308594, 175.47540283203125, 185.9696044921875, 196.46380615234375, 206.95802307128906, 217.4522247314453, 227.94644165039062, 238.44064331054688, 248.93484497070312, 259.4290466308594, 269.92327880859375, 280.41748046875, 290.91168212890625, 301.4059143066406, 311.9001159667969, 322.3943176269531, 332.8885192871094, 343.3827209472656, 353.8769226074219]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 9.0, 6.0, 8.0, 6.0, 10.0, 11.0, 13.0, 15.0, 16.0, 32.0, 21.0, 29.0, 33.0, 26.0, 44.0, 48.0, 42.0, 59.0, 50.0, 40.0, 43.0, 57.0, 45.0, 38.0, 37.0, 56.0, 36.0, 25.0, 25.0, 25.0, 24.0, 12.0, 15.0, 9.0, 6.0, 6.0, 14.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-71.51577758789062, -68.93000030517578, -66.3442153930664, -63.7584342956543, -61.17265319824219, -58.586875915527344, -56.001094818115234, -53.415313720703125, -50.829532623291016, -48.243751525878906, -45.6579704284668, -43.07218933105469, -40.486412048339844, -37.90062713623047, -35.314849853515625, -32.729068756103516, -30.143287658691406, -27.557506561279297, -24.971725463867188, -22.38594627380371, -19.8001651763916, -17.214384078979492, -14.6286039352417, -12.042823791503906, -9.457042694091797, -6.871262073516846, -4.2854814529418945, -1.6997008323669434, 0.8860797882080078, 3.471860885620117, 6.05764102935791, 8.643421173095703, 11.229209899902344, 13.814990997314453, 16.400772094726562, 18.98655128479004, 21.57233238220215, 24.158113479614258, 26.743892669677734, 29.329673767089844, 31.915454864501953, 34.50123596191406, 37.08701705932617, 39.67279815673828, 42.258575439453125, 44.8443603515625, 47.430137634277344, 50.01591873168945, 52.60169982910156, 55.18748092651367, 57.77326202392578, 60.35904312133789, 62.94482421875, 65.53060150146484, 68.11638641357422, 70.70216369628906, 73.28794860839844, 75.87372589111328, 78.45951080322266, 81.0452880859375, 83.63107299804688, 86.21685028076172, 88.8026351928711, 91.38841247558594, 93.97418975830078]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 5.0, 2.0, 6.0, 12.0, 6.0, 12.0, 12.0, 15.0, 20.0, 21.0, 26.0, 29.0, 31.0, 41.0, 38.0, 37.0, 47.0, 39.0, 43.0, 48.0, 49.0, 43.0, 33.0, 56.0, 36.0, 49.0, 37.0, 28.0, 24.0, 23.0, 22.0, 24.0, 15.0, 16.0, 16.0, 11.0, 12.0, 6.0, 9.0, 6.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.4296875, -12.06640625, -11.703125, -11.33984375, -10.9765625, -10.61328125, -10.25, -9.88671875, -9.5234375, -9.16015625, -8.796875, -8.43359375, -8.0703125, -7.70703125, -7.34375, -6.98046875, -6.6171875, -6.25390625, -5.890625, -5.52734375, -5.1640625, -4.80078125, -4.4375, -4.07421875, -3.7109375, -3.34765625, -2.984375, -2.62109375, -2.2578125, -1.89453125, -1.53125, -1.16796875, -0.8046875, -0.44140625, -0.078125, 0.28515625, 0.6484375, 1.01171875, 1.375, 1.73828125, 2.1015625, 2.46484375, 2.828125, 3.19140625, 3.5546875, 3.91796875, 4.28125, 4.64453125, 5.0078125, 5.37109375, 5.734375, 6.09765625, 6.4609375, 6.82421875, 7.1875, 7.55078125, 7.9140625, 8.27734375, 8.640625, 9.00390625, 9.3671875, 9.73046875, 10.09375, 10.45703125, 10.8203125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 7.0, 10.0, 3.0, 11.0, 14.0, 9.0, 23.0, 25.0, 30.0, 39.0, 41.0, 57.0, 78.0, 87.0, 124.0, 182.0, 278.0, 479.0, 937.0, 2219.0, 7767.0, 55076.0, 1104577.0, 2750701.0, 246945.0, 17519.0, 3781.0, 1375.0, 649.0, 372.0, 224.0, 165.0, 119.0, 78.0, 55.0, 45.0, 40.0, 37.0, 19.0, 22.0, 17.0, 9.0, 12.0, 7.0, 4.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.90625, -23.0888671875, -22.271484375, -21.4541015625, -20.63671875, -19.8193359375, -19.001953125, -18.1845703125, -17.3671875, -16.5498046875, -15.732421875, -14.9150390625, -14.09765625, -13.2802734375, -12.462890625, -11.6455078125, -10.828125, -10.0107421875, -9.193359375, -8.3759765625, -7.55859375, -6.7412109375, -5.923828125, -5.1064453125, -4.2890625, -3.4716796875, -2.654296875, -1.8369140625, -1.01953125, -0.2021484375, 0.615234375, 1.4326171875, 2.25, 3.0673828125, 3.884765625, 4.7021484375, 5.51953125, 6.3369140625, 7.154296875, 7.9716796875, 8.7890625, 9.6064453125, 10.423828125, 11.2412109375, 12.05859375, 12.8759765625, 13.693359375, 14.5107421875, 15.328125, 16.1455078125, 16.962890625, 17.7802734375, 18.59765625, 19.4150390625, 20.232421875, 21.0498046875, 21.8671875, 22.6845703125, 23.501953125, 24.3193359375, 25.13671875, 25.9541015625, 26.771484375, 27.5888671875, 28.40625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 6.0, 8.0, 10.0, 17.0, 18.0, 46.0, 62.0, 89.0, 178.0, 243.0, 487.0, 923.0, 882.0, 444.0, 241.0, 149.0, 87.0, 63.0, 55.0, 28.0, 15.0, 10.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.6875, -40.717041015625, -39.74658203125, -38.776123046875, -37.8056640625, -36.835205078125, -35.86474609375, -34.894287109375, -33.923828125, -32.953369140625, -31.98291015625, -31.012451171875, -30.0419921875, -29.071533203125, -28.10107421875, -27.130615234375, -26.16015625, -25.189697265625, -24.21923828125, -23.248779296875, -22.2783203125, -21.307861328125, -20.33740234375, -19.366943359375, -18.396484375, -17.426025390625, -16.45556640625, -15.485107421875, -14.5146484375, -13.544189453125, -12.57373046875, -11.603271484375, -10.6328125, -9.662353515625, -8.69189453125, -7.721435546875, -6.7509765625, -5.780517578125, -4.81005859375, -3.839599609375, -2.869140625, -1.898681640625, -0.92822265625, 0.042236328125, 1.0126953125, 1.983154296875, 2.95361328125, 3.924072265625, 4.89453125, 5.864990234375, 6.83544921875, 7.805908203125, 8.7763671875, 9.746826171875, 10.71728515625, 11.687744140625, 12.658203125, 13.628662109375, 14.59912109375, 15.569580078125, 16.5400390625, 17.510498046875, 18.48095703125, 19.451416015625, 20.421875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 12.0, 5.0, 11.0, 23.0, 30.0, 48.0, 101.0, 174.0, 351.0, 885.0, 3939.0, 225386.0, 3939164.0, 21386.0, 1689.0, 532.0, 230.0, 131.0, 66.0, 49.0, 28.0, 12.0, 9.0, 3.0, 10.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.6875, -73.4130859375, -71.138671875, -68.8642578125, -66.58984375, -64.3154296875, -62.041015625, -59.7666015625, -57.4921875, -55.2177734375, -52.943359375, -50.6689453125, -48.39453125, -46.1201171875, -43.845703125, -41.5712890625, -39.296875, -37.0224609375, -34.748046875, -32.4736328125, -30.19921875, -27.9248046875, -25.650390625, -23.3759765625, -21.1015625, -18.8271484375, -16.552734375, -14.2783203125, -12.00390625, -9.7294921875, -7.455078125, -5.1806640625, -2.90625, -0.6318359375, 1.642578125, 3.9169921875, 6.19140625, 8.4658203125, 10.740234375, 13.0146484375, 15.2890625, 17.5634765625, 19.837890625, 22.1123046875, 24.38671875, 26.6611328125, 28.935546875, 31.2099609375, 33.484375, 35.7587890625, 38.033203125, 40.3076171875, 42.58203125, 44.8564453125, 47.130859375, 49.4052734375, 51.6796875, 53.9541015625, 56.228515625, 58.5029296875, 60.77734375, 63.0517578125, 65.326171875, 67.6005859375, 69.875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 130.0, 886.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1407.5731201171875, -1375.745361328125, -1343.9176025390625, -1312.08984375, -1280.261962890625, -1248.4342041015625, -1216.6064453125, -1184.7786865234375, -1152.950927734375, -1121.1231689453125, -1089.29541015625, -1057.4676513671875, -1025.6397705078125, -993.81201171875, -961.9842529296875, -930.156494140625, -898.3287353515625, -866.5009765625, -834.6731567382812, -802.8453979492188, -771.0176391601562, -739.1898193359375, -707.362060546875, -675.5343017578125, -643.7064819335938, -611.8787231445312, -580.0509033203125, -548.22314453125, -516.3953857421875, -484.5675964355469, -452.73980712890625, -420.91204833984375, -389.08428955078125, -357.2565002441406, -325.4287414550781, -293.6009521484375, -261.773193359375, -229.94540405273438, -198.1176300048828, -166.28985595703125, -134.4620819091797, -102.63430786132812, -70.80653381347656, -38.97875213623047, -7.150978088378906, 24.676803588867188, 56.50457763671875, 88.33235168457031, 120.16012573242188, 151.98789978027344, 183.815673828125, 215.64346313476562, 247.47122192382812, 279.29901123046875, 311.12677001953125, 342.9545593261719, 374.7823486328125, 406.6101379394531, 438.4378967285156, 470.26568603515625, 502.09344482421875, 533.9212646484375, 565.7490234375, 597.5767822265625, 629.404541015625]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 10.0, 5.0, 16.0, 21.0, 23.0, 26.0, 34.0, 44.0, 41.0, 50.0, 40.0, 52.0, 56.0, 48.0, 54.0, 50.0, 37.0, 54.0, 56.0, 34.0, 30.0, 36.0, 31.0, 20.0, 21.0, 21.0, 17.0, 14.0, 13.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.45903778076172, -61.92961883544922, -59.40019989013672, -56.87078094482422, -54.34136199951172, -51.81194305419922, -49.282527923583984, -46.753108978271484, -44.223690032958984, -41.694271087646484, -39.164852142333984, -36.635433197021484, -34.10601806640625, -31.576597213745117, -29.04718017578125, -26.51776123046875, -23.98834228515625, -21.45892333984375, -18.92950439453125, -16.400087356567383, -13.870668411254883, -11.341249465942383, -8.8118314743042, -6.282413482666016, -3.7529945373535156, -1.2235760688781738, 1.305842399597168, 3.8352608680725098, 6.364679336547852, 8.894098281860352, 11.423516273498535, 13.952934265136719, 16.482345581054688, 19.011764526367188, 21.541183471679688, 24.070600509643555, 26.600019454956055, 29.129438400268555, 31.658855438232422, 34.18827438354492, 36.71769332885742, 39.24711227416992, 41.77653121948242, 44.30595016479492, 46.835365295410156, 49.364784240722656, 51.894203186035156, 54.423622131347656, 56.953041076660156, 59.482460021972656, 62.011878967285156, 64.54129791259766, 67.07071685791016, 69.60013580322266, 72.12955474853516, 74.65896606445312, 77.18838500976562, 79.71780395507812, 82.24722290039062, 84.77664184570312, 87.30606079101562, 89.83547973632812, 92.36489868164062, 94.89431762695312, 97.42373657226562]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 8.0, 7.0, 8.0, 13.0, 14.0, 8.0, 20.0, 21.0, 29.0, 23.0, 19.0, 35.0, 26.0, 26.0, 37.0, 41.0, 31.0, 36.0, 40.0, 37.0, 53.0, 29.0, 37.0, 22.0, 43.0, 51.0, 35.0, 28.0, 24.0, 31.0, 22.0, 22.0, 14.0, 19.0, 14.0, 12.0, 12.0, 10.0, 5.0, 8.0, 8.0, 7.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.1015625, -7.8494873046875, -7.597412109375, -7.3453369140625, -7.09326171875, -6.8411865234375, -6.589111328125, -6.3370361328125, -6.0849609375, -5.8328857421875, -5.580810546875, -5.3287353515625, -5.07666015625, -4.8245849609375, -4.572509765625, -4.3204345703125, -4.068359375, -3.8162841796875, -3.564208984375, -3.3121337890625, -3.06005859375, -2.8079833984375, -2.555908203125, -2.3038330078125, -2.0517578125, -1.7996826171875, -1.547607421875, -1.2955322265625, -1.04345703125, -0.7913818359375, -0.539306640625, -0.2872314453125, -0.03515625, 0.2169189453125, 0.468994140625, 0.7210693359375, 0.97314453125, 1.2252197265625, 1.477294921875, 1.7293701171875, 1.9814453125, 2.2335205078125, 2.485595703125, 2.7376708984375, 2.98974609375, 3.2418212890625, 3.493896484375, 3.7459716796875, 3.998046875, 4.2501220703125, 4.502197265625, 4.7542724609375, 5.00634765625, 5.2584228515625, 5.510498046875, 5.7625732421875, 6.0146484375, 6.2667236328125, 6.518798828125, 6.7708740234375, 7.02294921875, 7.2750244140625, 7.527099609375, 7.7791748046875, 8.03125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 8.0, 18.0, 14.0, 28.0, 36.0, 57.0, 81.0, 110.0, 162.0, 217.0, 301.0, 468.0, 640.0, 986.0, 1352.0, 2149.0, 3161.0, 4833.0, 7190.0, 10609.0, 16567.0, 25413.0, 38660.0, 59676.0, 91622.0, 135037.0, 173462.0, 155028.0, 110186.0, 72763.0, 47621.0, 30755.0, 19879.0, 13169.0, 8763.0, 5776.0, 3774.0, 2486.0, 1722.0, 1184.0, 789.0, 570.0, 380.0, 263.0, 200.0, 131.0, 84.0, 59.0, 36.0, 24.0, 17.0, 9.0, 14.0, 7.0, 7.0, 4.0, 2.0], "bins": [-0.818359375, -0.794097900390625, -0.76983642578125, -0.745574951171875, -0.7213134765625, -0.697052001953125, -0.67279052734375, -0.648529052734375, -0.624267578125, -0.600006103515625, -0.57574462890625, -0.551483154296875, -0.5272216796875, -0.502960205078125, -0.47869873046875, -0.454437255859375, -0.43017578125, -0.405914306640625, -0.38165283203125, -0.357391357421875, -0.3331298828125, -0.308868408203125, -0.28460693359375, -0.260345458984375, -0.236083984375, -0.211822509765625, -0.18756103515625, -0.163299560546875, -0.1390380859375, -0.114776611328125, -0.09051513671875, -0.066253662109375, -0.0419921875, -0.017730712890625, 0.00653076171875, 0.030792236328125, 0.0550537109375, 0.079315185546875, 0.10357666015625, 0.127838134765625, 0.152099609375, 0.176361083984375, 0.20062255859375, 0.224884033203125, 0.2491455078125, 0.273406982421875, 0.29766845703125, 0.321929931640625, 0.34619140625, 0.370452880859375, 0.39471435546875, 0.418975830078125, 0.4432373046875, 0.467498779296875, 0.49176025390625, 0.516021728515625, 0.540283203125, 0.564544677734375, 0.58880615234375, 0.613067626953125, 0.6373291015625, 0.661590576171875, 0.68585205078125, 0.710113525390625, 0.734375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 9.0, 1.0, 0.0, 8.0, 11.0, 11.0, 9.0, 12.0, 10.0, 26.0, 18.0, 20.0, 28.0, 30.0, 31.0, 31.0, 27.0, 35.0, 30.0, 30.0, 29.0, 30.0, 1057.0, 39.0, 43.0, 43.0, 44.0, 30.0, 32.0, 32.0, 35.0, 34.0, 30.0, 22.0, 25.0, 20.0, 18.0, 17.0, 21.0, 10.0, 7.0, 5.0, 11.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.21484375, -5.05181884765625, -4.8887939453125, -4.72576904296875, -4.562744140625, -4.39971923828125, -4.2366943359375, -4.07366943359375, -3.91064453125, -3.74761962890625, -3.5845947265625, -3.42156982421875, -3.258544921875, -3.09552001953125, -2.9324951171875, -2.76947021484375, -2.6064453125, -2.44342041015625, -2.2803955078125, -2.11737060546875, -1.954345703125, -1.79132080078125, -1.6282958984375, -1.46527099609375, -1.30224609375, -1.13922119140625, -0.9761962890625, -0.81317138671875, -0.650146484375, -0.48712158203125, -0.3240966796875, -0.16107177734375, 0.001953125, 0.16497802734375, 0.3280029296875, 0.49102783203125, 0.654052734375, 0.81707763671875, 0.9801025390625, 1.14312744140625, 1.30615234375, 1.46917724609375, 1.6322021484375, 1.79522705078125, 1.958251953125, 2.12127685546875, 2.2843017578125, 2.44732666015625, 2.6103515625, 2.77337646484375, 2.9364013671875, 3.09942626953125, 3.262451171875, 3.42547607421875, 3.5885009765625, 3.75152587890625, 3.91455078125, 4.07757568359375, 4.2406005859375, 4.40362548828125, 4.566650390625, 4.72967529296875, 4.8927001953125, 5.05572509765625, 5.21875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 8.0, 4.0, 12.0, 13.0, 20.0, 28.0, 42.0, 59.0, 96.0, 112.0, 167.0, 234.0, 397.0, 475.0, 679.0, 974.0, 1435.0, 2118.0, 2926.0, 4151.0, 6210.0, 8786.0, 12692.0, 18476.0, 26746.0, 39132.0, 57123.0, 84035.0, 119397.0, 1189044.0, 155511.0, 113364.0, 79113.0, 54465.0, 36954.0, 25405.0, 17475.0, 12071.0, 8379.0, 5742.0, 4026.0, 2808.0, 1959.0, 1250.0, 869.0, 664.0, 479.0, 295.0, 225.0, 146.0, 105.0, 87.0, 50.0, 35.0, 28.0, 14.0, 11.0, 8.0, 5.0, 7.0, 3.0, 3.0], "bins": [-0.67138671875, -0.6503524780273438, -0.6293182373046875, -0.6082839965820312, -0.587249755859375, -0.5662155151367188, -0.5451812744140625, -0.5241470336914062, -0.50311279296875, -0.48207855224609375, -0.4610443115234375, -0.44001007080078125, -0.418975830078125, -0.39794158935546875, -0.3769073486328125, -0.35587310791015625, -0.3348388671875, -0.31380462646484375, -0.2927703857421875, -0.27173614501953125, -0.250701904296875, -0.22966766357421875, -0.2086334228515625, -0.18759918212890625, -0.16656494140625, -0.14553070068359375, -0.1244964599609375, -0.10346221923828125, -0.082427978515625, -0.06139373779296875, -0.0403594970703125, -0.01932525634765625, 0.001708984375, 0.02274322509765625, 0.0437774658203125, 0.06481170654296875, 0.085845947265625, 0.10688018798828125, 0.1279144287109375, 0.14894866943359375, 0.16998291015625, 0.19101715087890625, 0.2120513916015625, 0.23308563232421875, 0.254119873046875, 0.27515411376953125, 0.2961883544921875, 0.31722259521484375, 0.3382568359375, 0.35929107666015625, 0.3803253173828125, 0.40135955810546875, 0.422393798828125, 0.44342803955078125, 0.4644622802734375, 0.48549652099609375, 0.50653076171875, 0.5275650024414062, 0.5485992431640625, 0.5696334838867188, 0.590667724609375, 0.6117019653320312, 0.6327362060546875, 0.6537704467773438, 0.6748046875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 4.0, 6.0, 8.0, 12.0, 4.0, 13.0, 17.0, 17.0, 30.0, 29.0, 43.0, 38.0, 39.0, 59.0, 53.0, 59.0, 60.0, 68.0, 67.0, 54.0, 46.0, 38.0, 39.0, 28.0, 36.0, 25.0, 23.0, 16.0, 9.0, 15.0, 10.0, 7.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.002590179443359375, -0.0025174319744110107, -0.0024446845054626465, -0.0023719370365142822, -0.002299189567565918, -0.0022264420986175537, -0.0021536946296691895, -0.002080947160720825, -0.002008199691772461, -0.0019354522228240967, -0.0018627047538757324, -0.0017899572849273682, -0.001717209815979004, -0.0016444623470306396, -0.0015717148780822754, -0.0014989674091339111, -0.0014262199401855469, -0.0013534724712371826, -0.0012807250022888184, -0.001207977533340454, -0.0011352300643920898, -0.0010624825954437256, -0.0009897351264953613, -0.0009169876575469971, -0.0008442401885986328, -0.0007714927196502686, -0.0006987452507019043, -0.00062599778175354, -0.0005532503128051758, -0.0004805028438568115, -0.00040775537490844727, -0.000335007905960083, -0.00026226043701171875, -0.0001895129680633545, -0.00011676549911499023, -4.4018030166625977e-05, 2.872943878173828e-05, 0.00010147690773010254, 0.0001742243766784668, 0.00024697184562683105, 0.0003197193145751953, 0.00039246678352355957, 0.00046521425247192383, 0.0005379617214202881, 0.0006107091903686523, 0.0006834566593170166, 0.0007562041282653809, 0.0008289515972137451, 0.0009016990661621094, 0.0009744465351104736, 0.0010471940040588379, 0.0011199414730072021, 0.0011926889419555664, 0.0012654364109039307, 0.001338183879852295, 0.0014109313488006592, 0.0014836788177490234, 0.0015564262866973877, 0.001629173755645752, 0.0017019212245941162, 0.0017746686935424805, 0.0018474161624908447, 0.001920163631439209, 0.0019929111003875732, 0.0020656585693359375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 8.0, 4.0, 7.0, 6.0, 11.0, 11.0, 16.0, 28.0, 29.0, 47.0, 56.0, 63.0, 83.0, 123.0, 132.0, 215.0, 355.0, 584.0, 1328.0, 255359.0, 786442.0, 1758.0, 651.0, 371.0, 210.0, 178.0, 130.0, 80.0, 61.0, 38.0, 29.0, 32.0, 10.0, 21.0, 14.0, 12.0, 6.0, 15.0, 7.0, 3.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.036834716796875, -0.035523414611816406, -0.03421211242675781, -0.03290081024169922, -0.031589508056640625, -0.03027820587158203, -0.028966903686523438, -0.027655601501464844, -0.02634429931640625, -0.025032997131347656, -0.023721694946289062, -0.02241039276123047, -0.021099090576171875, -0.01978778839111328, -0.018476486206054688, -0.017165184020996094, -0.0158538818359375, -0.014542579650878906, -0.013231277465820312, -0.011919975280761719, -0.010608673095703125, -0.009297370910644531, -0.007986068725585938, -0.006674766540527344, -0.00536346435546875, -0.004052162170410156, -0.0027408599853515625, -0.0014295578002929688, -0.000118255615234375, 0.0011930465698242188, 0.0025043487548828125, 0.0038156509399414062, 0.005126953125, 0.006438255310058594, 0.0077495574951171875, 0.009060859680175781, 0.010372161865234375, 0.011683464050292969, 0.012994766235351562, 0.014306068420410156, 0.01561737060546875, 0.016928672790527344, 0.018239974975585938, 0.01955127716064453, 0.020862579345703125, 0.02217388153076172, 0.023485183715820312, 0.024796485900878906, 0.0261077880859375, 0.027419090270996094, 0.028730392456054688, 0.03004169464111328, 0.031352996826171875, 0.03266429901123047, 0.03397560119628906, 0.035286903381347656, 0.03659820556640625, 0.037909507751464844, 0.03922080993652344, 0.04053211212158203, 0.041843414306640625, 0.04315471649169922, 0.04446601867675781, 0.045777320861816406, 0.047088623046875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 15.0, 246.0, 626.0, 118.0, 8.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01261530164629221, -0.012387450784444809, -0.012159600853919983, -0.011931749992072582, -0.011703899130225182, -0.011476049199700356, -0.011248198337852955, -0.011020347476005554, -0.010792496614158154, -0.010564645752310753, -0.010336795821785927, -0.010108944959938526, -0.009881094098091125, -0.0096532441675663, -0.009425393305718899, -0.009197542443871498, -0.008969692513346672, -0.008741841651499271, -0.008513991720974445, -0.008286140859127045, -0.008058289997279644, -0.007830439135432243, -0.007602589204907417, -0.007374738343060017, -0.007146887481212616, -0.006919037085026503, -0.006691186223179102, -0.006463335826992989, -0.006235484965145588, -0.0060076345689594746, -0.005779784172773361, -0.0055519333109259605, -0.005324082914739847, -0.005096232518553734, -0.004868381656706333, -0.00464053126052022, -0.004412680398672819, -0.004184830002486706, -0.003956979140639305, -0.0037291287444531918, -0.0035012783482670784, -0.0032734277192503214, -0.0030455770902335644, -0.002817726694047451, -0.002589876065030694, -0.002362025436013937, -0.00213417480699718, -0.0019063242943957448, -0.001678473548963666, -0.001450622919946909, -0.0012227724073454738, -0.0009949217783287168, -0.0007670712075196207, -0.0005392206367105246, -0.00031137000769376755, -8.351949509233236e-05, 0.00014433113392442465, 0.00037218170473352075, 0.0006000322755426168, 0.0008278829045593739, 0.0010557335335761309, 0.001283584046177566, 0.001511434675194323, 0.0017392851877957582, 0.0019671358168125153]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 3.0, 2.0, 5.0, 11.0, 7.0, 8.0, 13.0, 17.0, 21.0, 21.0, 23.0, 25.0, 22.0, 36.0, 36.0, 40.0, 34.0, 39.0, 38.0, 33.0, 45.0, 41.0, 46.0, 45.0, 42.0, 44.0, 30.0, 36.0, 33.0, 27.0, 28.0, 26.0, 22.0, 19.0, 14.0, 15.0, 10.0, 11.0, 9.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0012742280960083008, -0.0012356508523225784, -0.001197073608636856, -0.0011584963649511337, -0.0011199191212654114, -0.001081341877579689, -0.0010427646338939667, -0.0010041873902082443, -0.000965610146522522, -0.0009270329028367996, -0.0008884556591510773, -0.0008498784154653549, -0.0008113011717796326, -0.0007727239280939102, -0.0007341466844081879, -0.0006955694407224655, -0.0006569921970367432, -0.0006184149533510208, -0.0005798377096652985, -0.0005412604659795761, -0.0005026832222938538, -0.0004641059786081314, -0.00042552873492240906, -0.0003869514912366867, -0.00034837424755096436, -0.000309797003865242, -0.00027121976017951965, -0.0002326425164937973, -0.00019406527280807495, -0.0001554880291223526, -0.00011691078543663025, -7.83335417509079e-05, -3.975629806518555e-05, -1.1790543794631958e-06, 3.7398189306259155e-05, 7.59754329919815e-05, 0.00011455267667770386, 0.0001531299203634262, 0.00019170716404914856, 0.0002302844077348709, 0.00026886165142059326, 0.0003074388951063156, 0.00034601613879203796, 0.0003845933824777603, 0.00042317062616348267, 0.000461747869849205, 0.0005003251135349274, 0.0005389023572206497, 0.0005774796009063721, 0.0006160568445920944, 0.0006546340882778168, 0.0006932113319635391, 0.0007317885756492615, 0.0007703658193349838, 0.0008089430630207062, 0.0008475203067064285, 0.0008860975503921509, 0.0009246747940778732, 0.0009632520377635956, 0.001001829281449318, 0.0010404065251350403, 0.0010789837688207626, 0.001117561012506485, 0.0011561382561922073, 0.0011947154998779297]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 8.0, 7.0, 8.0, 13.0, 14.0, 8.0, 20.0, 21.0, 29.0, 23.0, 19.0, 35.0, 26.0, 26.0, 37.0, 41.0, 31.0, 36.0, 40.0, 37.0, 53.0, 29.0, 36.0, 23.0, 43.0, 51.0, 35.0, 28.0, 24.0, 31.0, 22.0, 22.0, 14.0, 19.0, 14.0, 12.0, 12.0, 10.0, 5.0, 8.0, 8.0, 7.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.1015625, -7.8494873046875, -7.597412109375, -7.3453369140625, -7.09326171875, -6.8411865234375, -6.589111328125, -6.3370361328125, -6.0849609375, -5.8328857421875, -5.580810546875, -5.3287353515625, -5.07666015625, -4.8245849609375, -4.572509765625, -4.3204345703125, -4.068359375, -3.8162841796875, -3.564208984375, -3.3121337890625, -3.06005859375, -2.8079833984375, -2.555908203125, -2.3038330078125, -2.0517578125, -1.7996826171875, -1.547607421875, -1.2955322265625, -1.04345703125, -0.7913818359375, -0.539306640625, -0.2872314453125, -0.03515625, 0.2169189453125, 0.468994140625, 0.7210693359375, 0.97314453125, 1.2252197265625, 1.477294921875, 1.7293701171875, 1.9814453125, 2.2335205078125, 2.485595703125, 2.7376708984375, 2.98974609375, 3.2418212890625, 3.493896484375, 3.7459716796875, 3.998046875, 4.2501220703125, 4.502197265625, 4.7542724609375, 5.00634765625, 5.2584228515625, 5.510498046875, 5.7625732421875, 6.0146484375, 6.2667236328125, 6.518798828125, 6.7708740234375, 7.02294921875, 7.2750244140625, 7.527099609375, 7.7791748046875, 8.03125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 6.0, 8.0, 10.0, 17.0, 18.0, 27.0, 32.0, 50.0, 84.0, 91.0, 140.0, 201.0, 265.0, 346.0, 512.0, 712.0, 1061.0, 1612.0, 2553.0, 4966.0, 16510.0, 126824.0, 717611.0, 143669.0, 18169.0, 5270.0, 2538.0, 1529.0, 1079.0, 782.0, 541.0, 379.0, 267.0, 178.0, 121.0, 107.0, 77.0, 47.0, 42.0, 35.0, 21.0, 12.0, 6.0, 8.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-21.75, -21.081298828125, -20.41259765625, -19.743896484375, -19.0751953125, -18.406494140625, -17.73779296875, -17.069091796875, -16.400390625, -15.731689453125, -15.06298828125, -14.394287109375, -13.7255859375, -13.056884765625, -12.38818359375, -11.719482421875, -11.05078125, -10.382080078125, -9.71337890625, -9.044677734375, -8.3759765625, -7.707275390625, -7.03857421875, -6.369873046875, -5.701171875, -5.032470703125, -4.36376953125, -3.695068359375, -3.0263671875, -2.357666015625, -1.68896484375, -1.020263671875, -0.3515625, 0.317138671875, 0.98583984375, 1.654541015625, 2.3232421875, 2.991943359375, 3.66064453125, 4.329345703125, 4.998046875, 5.666748046875, 6.33544921875, 7.004150390625, 7.6728515625, 8.341552734375, 9.01025390625, 9.678955078125, 10.34765625, 11.016357421875, 11.68505859375, 12.353759765625, 13.0224609375, 13.691162109375, 14.35986328125, 15.028564453125, 15.697265625, 16.365966796875, 17.03466796875, 17.703369140625, 18.3720703125, 19.040771484375, 19.70947265625, 20.378173828125, 21.046875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 9.0, 7.0, 8.0, 8.0, 10.0, 10.0, 21.0, 26.0, 19.0, 27.0, 30.0, 33.0, 49.0, 54.0, 67.0, 81.0, 208.0, 1658.0, 219.0, 86.0, 70.0, 65.0, 37.0, 29.0, 32.0, 28.0, 23.0, 19.0, 15.0, 17.0, 13.0, 18.0, 8.0, 7.0, 9.0, 3.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0], "bins": [-28.03125, -27.26220703125, -26.4931640625, -25.72412109375, -24.955078125, -24.18603515625, -23.4169921875, -22.64794921875, -21.87890625, -21.10986328125, -20.3408203125, -19.57177734375, -18.802734375, -18.03369140625, -17.2646484375, -16.49560546875, -15.7265625, -14.95751953125, -14.1884765625, -13.41943359375, -12.650390625, -11.88134765625, -11.1123046875, -10.34326171875, -9.57421875, -8.80517578125, -8.0361328125, -7.26708984375, -6.498046875, -5.72900390625, -4.9599609375, -4.19091796875, -3.421875, -2.65283203125, -1.8837890625, -1.11474609375, -0.345703125, 0.42333984375, 1.1923828125, 1.96142578125, 2.73046875, 3.49951171875, 4.2685546875, 5.03759765625, 5.806640625, 6.57568359375, 7.3447265625, 8.11376953125, 8.8828125, 9.65185546875, 10.4208984375, 11.18994140625, 11.958984375, 12.72802734375, 13.4970703125, 14.26611328125, 15.03515625, 15.80419921875, 16.5732421875, 17.34228515625, 18.111328125, 18.88037109375, 19.6494140625, 20.41845703125, 21.1875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 9.0, 7.0, 9.0, 6.0, 11.0, 13.0, 19.0, 23.0, 25.0, 37.0, 39.0, 64.0, 76.0, 89.0, 121.0, 178.0, 253.0, 515.0, 1151.0, 9549.0, 3119913.0, 11023.0, 1150.0, 472.0, 273.0, 187.0, 107.0, 98.0, 53.0, 58.0, 40.0, 20.0, 29.0, 19.0, 20.0, 8.0, 10.0, 5.0, 11.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.4375, -62.392578125, -60.34765625, -58.302734375, -56.2578125, -54.212890625, -52.16796875, -50.123046875, -48.078125, -46.033203125, -43.98828125, -41.943359375, -39.8984375, -37.853515625, -35.80859375, -33.763671875, -31.71875, -29.673828125, -27.62890625, -25.583984375, -23.5390625, -21.494140625, -19.44921875, -17.404296875, -15.359375, -13.314453125, -11.26953125, -9.224609375, -7.1796875, -5.134765625, -3.08984375, -1.044921875, 1.0, 3.044921875, 5.08984375, 7.134765625, 9.1796875, 11.224609375, 13.26953125, 15.314453125, 17.359375, 19.404296875, 21.44921875, 23.494140625, 25.5390625, 27.583984375, 29.62890625, 31.673828125, 33.71875, 35.763671875, 37.80859375, 39.853515625, 41.8984375, 43.943359375, 45.98828125, 48.033203125, 50.078125, 52.123046875, 54.16796875, 56.212890625, 58.2578125, 60.302734375, 62.34765625, 64.392578125, 66.4375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 89.0, 765.0, 154.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-438.9984130859375, -429.56573486328125, -420.133056640625, -410.7004089355469, -401.2677307128906, -391.8350524902344, -382.40240478515625, -372.9697265625, -363.53704833984375, -354.1043701171875, -344.67169189453125, -335.2390441894531, -325.8063659667969, -316.3736877441406, -306.9410400390625, -297.50836181640625, -288.07568359375, -278.64300537109375, -269.2103271484375, -259.7776794433594, -250.34500122070312, -240.91232299804688, -231.4796600341797, -222.0469970703125, -212.61431884765625, -203.181640625, -193.7489776611328, -184.31631469726562, -174.88363647460938, -165.45095825195312, -156.01829528808594, -146.58563232421875, -137.1529541015625, -127.72028350830078, -118.28761291503906, -108.85494232177734, -99.42227172851562, -89.9896011352539, -80.55693054199219, -71.12425994873047, -61.69158935546875, -52.25891876220703, -42.82624816894531, -33.393577575683594, -23.960906982421875, -14.528236389160156, -5.0955657958984375, 4.337104797363281, 13.769775390625, 23.20244598388672, 32.63511657714844, 42.067787170410156, 51.500457763671875, 60.933128356933594, 70.36579895019531, 79.79846954345703, 89.23114013671875, 98.66381072998047, 108.09648132324219, 117.5291519165039, 126.96182250976562, 136.39450073242188, 145.82716369628906, 155.25982666015625, 164.6925048828125]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 7.0, 9.0, 6.0, 10.0, 12.0, 9.0, 10.0, 21.0, 14.0, 17.0, 23.0, 30.0, 24.0, 24.0, 36.0, 29.0, 29.0, 39.0, 27.0, 32.0, 40.0, 38.0, 39.0, 50.0, 41.0, 29.0, 34.0, 28.0, 35.0, 31.0, 22.0, 27.0, 20.0, 20.0, 26.0, 20.0, 19.0, 14.0, 10.0, 10.0, 8.0, 6.0, 3.0, 4.0, 3.0, 6.0, 5.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-61.25132369995117, -59.25470733642578, -57.25809097290039, -55.261474609375, -53.264854431152344, -51.26824188232422, -49.27162170410156, -47.27500534057617, -45.27838897705078, -43.28177261352539, -41.28515625, -39.28853988647461, -37.29192352294922, -35.29530334472656, -33.29868698120117, -31.30207061767578, -29.30545425415039, -27.308837890625, -25.31222152709961, -23.315603256225586, -21.318986892700195, -19.322370529174805, -17.32575225830078, -15.32913589477539, -13.33251953125, -11.33590316772461, -9.339285850524902, -7.3426690101623535, -5.346052169799805, -3.349435806274414, -1.352818489074707, 0.643798828125, 2.6404190063476562, 4.637035846710205, 6.633652687072754, 8.630270004272461, 10.626886367797852, 12.623502731323242, 14.62012004852295, 16.616737365722656, 18.613353729248047, 20.609970092773438, 22.606586456298828, 24.60320472717285, 26.599821090698242, 28.596437454223633, 30.593055725097656, 32.58967208862305, 34.58628845214844, 36.58290481567383, 38.57952117919922, 40.57613754272461, 42.57275390625, 44.569374084472656, 46.56599044799805, 48.56260681152344, 50.55922317504883, 52.55583953857422, 54.55245590209961, 56.549072265625, 58.545692443847656, 60.54230499267578, 62.53892517089844, 64.53553771972656, 66.53215789794922]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 5.0, 13.0, 14.0, 10.0, 8.0, 7.0, 21.0, 23.0, 29.0, 27.0, 30.0, 26.0, 32.0, 32.0, 39.0, 62.0, 40.0, 38.0, 35.0, 44.0, 54.0, 35.0, 43.0, 49.0, 35.0, 41.0, 34.0, 26.0, 31.0, 18.0, 13.0, 10.0, 15.0, 12.0, 11.0, 7.0, 7.0, 2.0, 7.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.2109375, -9.9075927734375, -9.604248046875, -9.3009033203125, -8.99755859375, -8.6942138671875, -8.390869140625, -8.0875244140625, -7.7841796875, -7.4808349609375, -7.177490234375, -6.8741455078125, -6.57080078125, -6.2674560546875, -5.964111328125, -5.6607666015625, -5.357421875, -5.0540771484375, -4.750732421875, -4.4473876953125, -4.14404296875, -3.8406982421875, -3.537353515625, -3.2340087890625, -2.9306640625, -2.6273193359375, -2.323974609375, -2.0206298828125, -1.71728515625, -1.4139404296875, -1.110595703125, -0.8072509765625, -0.50390625, -0.2005615234375, 0.102783203125, 0.4061279296875, 0.70947265625, 1.0128173828125, 1.316162109375, 1.6195068359375, 1.9228515625, 2.2261962890625, 2.529541015625, 2.8328857421875, 3.13623046875, 3.4395751953125, 3.742919921875, 4.0462646484375, 4.349609375, 4.6529541015625, 4.956298828125, 5.2596435546875, 5.56298828125, 5.8663330078125, 6.169677734375, 6.4730224609375, 6.7763671875, 7.0797119140625, 7.383056640625, 7.6864013671875, 7.98974609375, 8.2930908203125, 8.596435546875, 8.8997802734375, 9.203125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 9.0, 6.0, 11.0, 16.0, 11.0, 8.0, 28.0, 22.0, 39.0, 48.0, 64.0, 102.0, 148.0, 220.0, 315.0, 559.0, 986.0, 1911.0, 3950.0, 10019.0, 40162.0, 329618.0, 2078585.0, 1492276.0, 193680.0, 26505.0, 7806.0, 3223.0, 1638.0, 856.0, 528.0, 306.0, 192.0, 122.0, 88.0, 63.0, 50.0, 26.0, 22.0, 17.0, 7.0, 7.0, 10.0, 9.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-16.625, -16.103515625, -15.58203125, -15.060546875, -14.5390625, -14.017578125, -13.49609375, -12.974609375, -12.453125, -11.931640625, -11.41015625, -10.888671875, -10.3671875, -9.845703125, -9.32421875, -8.802734375, -8.28125, -7.759765625, -7.23828125, -6.716796875, -6.1953125, -5.673828125, -5.15234375, -4.630859375, -4.109375, -3.587890625, -3.06640625, -2.544921875, -2.0234375, -1.501953125, -0.98046875, -0.458984375, 0.0625, 0.583984375, 1.10546875, 1.626953125, 2.1484375, 2.669921875, 3.19140625, 3.712890625, 4.234375, 4.755859375, 5.27734375, 5.798828125, 6.3203125, 6.841796875, 7.36328125, 7.884765625, 8.40625, 8.927734375, 9.44921875, 9.970703125, 10.4921875, 11.013671875, 11.53515625, 12.056640625, 12.578125, 13.099609375, 13.62109375, 14.142578125, 14.6640625, 15.185546875, 15.70703125, 16.228515625, 16.75]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 30.0, 314.0, 2596.0, 1060.0, 73.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.625, -126.7578125, -122.890625, -119.0234375, -115.15625, -111.2890625, -107.421875, -103.5546875, -99.6875, -95.8203125, -91.953125, -88.0859375, -84.21875, -80.3515625, -76.484375, -72.6171875, -68.75, -64.8828125, -61.015625, -57.1484375, -53.28125, -49.4140625, -45.546875, -41.6796875, -37.8125, -33.9453125, -30.078125, -26.2109375, -22.34375, -18.4765625, -14.609375, -10.7421875, -6.875, -3.0078125, 0.859375, 4.7265625, 8.59375, 12.4609375, 16.328125, 20.1953125, 24.0625, 27.9296875, 31.796875, 35.6640625, 39.53125, 43.3984375, 47.265625, 51.1328125, 55.0, 58.8671875, 62.734375, 66.6015625, 70.46875, 74.3359375, 78.203125, 82.0703125, 85.9375, 89.8046875, 93.671875, 97.5390625, 101.40625, 105.2734375, 109.140625, 113.0078125, 116.875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 25.0, 72.0, 326.0, 1879.0, 4183204.0, 7894.0, 696.0, 134.0, 28.0, 13.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-183.125, -176.958984375, -170.79296875, -164.626953125, -158.4609375, -152.294921875, -146.12890625, -139.962890625, -133.796875, -127.630859375, -121.46484375, -115.298828125, -109.1328125, -102.966796875, -96.80078125, -90.634765625, -84.46875, -78.302734375, -72.13671875, -65.970703125, -59.8046875, -53.638671875, -47.47265625, -41.306640625, -35.140625, -28.974609375, -22.80859375, -16.642578125, -10.4765625, -4.310546875, 1.85546875, 8.021484375, 14.1875, 20.353515625, 26.51953125, 32.685546875, 38.8515625, 45.017578125, 51.18359375, 57.349609375, 63.515625, 69.681640625, 75.84765625, 82.013671875, 88.1796875, 94.345703125, 100.51171875, 106.677734375, 112.84375, 119.009765625, 125.17578125, 131.341796875, 137.5078125, 143.673828125, 149.83984375, 156.005859375, 162.171875, 168.337890625, 174.50390625, 180.669921875, 186.8359375, 193.001953125, 199.16796875, 205.333984375, 211.5]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 94.0, 841.0, 77.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-853.7344970703125, -837.7763061523438, -821.818115234375, -805.85986328125, -789.9016723632812, -773.9434814453125, -757.9852905273438, -742.027099609375, -726.06884765625, -710.1106567382812, -694.1524658203125, -678.1942138671875, -662.2360229492188, -646.27783203125, -630.3196411132812, -614.3614501953125, -598.4032592773438, -582.445068359375, -566.4868774414062, -550.5286254882812, -534.5704345703125, -518.6122436523438, -502.654052734375, -486.6958312988281, -470.73760986328125, -454.7794189453125, -438.8211975097656, -422.8630065917969, -406.90478515625, -390.94659423828125, -374.9884033203125, -359.0301818847656, -343.0719909667969, -327.1138000488281, -311.15557861328125, -295.1973876953125, -279.2391662597656, -263.2809753417969, -247.32276916503906, -231.36456298828125, -215.4063720703125, -199.4481658935547, -183.48995971679688, -167.53176879882812, -151.5735626220703, -135.6153564453125, -119.65715026855469, -103.6989517211914, -87.74073791503906, -71.78253173828125, -55.82433319091797, -39.866127014160156, -23.90792465209961, -7.9497222900390625, 8.00848388671875, 23.96668243408203, 39.924888610839844, 55.88309097290039, 71.84129333496094, 87.79949951171875, 103.75770568847656, 119.71590423583984, 135.67410278320312, 151.63230895996094, 167.59051513671875]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 8.0, 6.0, 9.0, 12.0, 14.0, 9.0, 19.0, 24.0, 21.0, 14.0, 35.0, 44.0, 39.0, 38.0, 31.0, 42.0, 40.0, 47.0, 50.0, 36.0, 28.0, 29.0, 53.0, 43.0, 28.0, 44.0, 39.0, 29.0, 33.0, 31.0, 18.0, 11.0, 11.0, 12.0, 11.0, 8.0, 8.0, 1.0, 7.0, 3.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-88.91316223144531, -86.46882629394531, -84.02449798583984, -81.58016204833984, -79.13583374023438, -76.69149780273438, -74.2471694946289, -71.8028335571289, -69.35850524902344, -66.91416931152344, -64.46984100341797, -62.025508880615234, -59.5811767578125, -57.136844635009766, -54.69251251220703, -52.24817657470703, -49.8038444519043, -47.35951232910156, -44.91518020629883, -42.470848083496094, -40.02651596069336, -37.582183837890625, -35.137847900390625, -32.693519592285156, -30.24918556213379, -27.804853439331055, -25.36052131652832, -22.916187286376953, -20.47185516357422, -18.027523040771484, -15.58319091796875, -13.138858795166016, -10.694526672363281, -8.250194549560547, -5.805861949920654, -3.3615293502807617, -0.9171972274780273, 1.527134895324707, 3.971467971801758, 6.415800094604492, 8.860132217407227, 11.304464340209961, 13.748796463012695, 16.193130493164062, 18.637462615966797, 21.08179473876953, 23.526126861572266, 25.970458984375, 28.414791107177734, 30.85912322998047, 33.3034553527832, 35.74778747558594, 38.19211959838867, 40.636451721191406, 43.080787658691406, 45.525115966796875, 47.969451904296875, 50.41378402709961, 52.858116149902344, 55.30244827270508, 57.74678039550781, 60.19111251831055, 62.63544464111328, 65.07978057861328, 67.52410888671875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 9.0, 7.0, 8.0, 8.0, 12.0, 19.0, 22.0, 15.0, 29.0, 28.0, 38.0, 33.0, 44.0, 36.0, 36.0, 35.0, 48.0, 42.0, 48.0, 37.0, 43.0, 49.0, 45.0, 37.0, 23.0, 28.0, 31.0, 31.0, 25.0, 20.0, 18.0, 19.0, 10.0, 20.0, 9.0, 10.0, 7.0, 3.0, 0.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.4296875, -8.169189453125, -7.90869140625, -7.648193359375, -7.3876953125, -7.127197265625, -6.86669921875, -6.606201171875, -6.345703125, -6.085205078125, -5.82470703125, -5.564208984375, -5.3037109375, -5.043212890625, -4.78271484375, -4.522216796875, -4.26171875, -4.001220703125, -3.74072265625, -3.480224609375, -3.2197265625, -2.959228515625, -2.69873046875, -2.438232421875, -2.177734375, -1.917236328125, -1.65673828125, -1.396240234375, -1.1357421875, -0.875244140625, -0.61474609375, -0.354248046875, -0.09375, 0.166748046875, 0.42724609375, 0.687744140625, 0.9482421875, 1.208740234375, 1.46923828125, 1.729736328125, 1.990234375, 2.250732421875, 2.51123046875, 2.771728515625, 3.0322265625, 3.292724609375, 3.55322265625, 3.813720703125, 4.07421875, 4.334716796875, 4.59521484375, 4.855712890625, 5.1162109375, 5.376708984375, 5.63720703125, 5.897705078125, 6.158203125, 6.418701171875, 6.67919921875, 6.939697265625, 7.2001953125, 7.460693359375, 7.72119140625, 7.981689453125, 8.2421875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 5.0, 9.0, 16.0, 21.0, 43.0, 49.0, 80.0, 122.0, 192.0, 288.0, 422.0, 661.0, 966.0, 1442.0, 2129.0, 3395.0, 4836.0, 7372.0, 11006.0, 16524.0, 24816.0, 37773.0, 57723.0, 87374.0, 127806.0, 173026.0, 158664.0, 111138.0, 74892.0, 49948.0, 32355.0, 21379.0, 14094.0, 9220.0, 6279.0, 4201.0, 2740.0, 1842.0, 1216.0, 869.0, 552.0, 333.0, 277.0, 159.0, 120.0, 74.0, 48.0, 32.0, 13.0, 6.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.70263671875, -0.6805496215820312, -0.6584625244140625, -0.6363754272460938, -0.614288330078125, -0.5922012329101562, -0.5701141357421875, -0.5480270385742188, -0.52593994140625, -0.5038528442382812, -0.4817657470703125, -0.45967864990234375, -0.437591552734375, -0.41550445556640625, -0.3934173583984375, -0.37133026123046875, -0.3492431640625, -0.32715606689453125, -0.3050689697265625, -0.28298187255859375, -0.260894775390625, -0.23880767822265625, -0.2167205810546875, -0.19463348388671875, -0.17254638671875, -0.15045928955078125, -0.1283721923828125, -0.10628509521484375, -0.084197998046875, -0.06211090087890625, -0.0400238037109375, -0.01793670654296875, 0.004150390625, 0.02623748779296875, 0.0483245849609375, 0.07041168212890625, 0.092498779296875, 0.11458587646484375, 0.1366729736328125, 0.15876007080078125, 0.18084716796875, 0.20293426513671875, 0.2250213623046875, 0.24710845947265625, 0.269195556640625, 0.29128265380859375, 0.3133697509765625, 0.33545684814453125, 0.3575439453125, 0.37963104248046875, 0.4017181396484375, 0.42380523681640625, 0.445892333984375, 0.46797943115234375, 0.4900665283203125, 0.5121536254882812, 0.53424072265625, 0.5563278198242188, 0.5784149169921875, 0.6005020141601562, 0.622589111328125, 0.6446762084960938, 0.6667633056640625, 0.6888504028320312, 0.7109375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 8.0, 6.0, 9.0, 6.0, 12.0, 10.0, 14.0, 14.0, 12.0, 18.0, 16.0, 18.0, 23.0, 37.0, 25.0, 38.0, 30.0, 28.0, 25.0, 33.0, 35.0, 34.0, 38.0, 1067.0, 29.0, 37.0, 37.0, 41.0, 28.0, 30.0, 26.0, 30.0, 30.0, 21.0, 18.0, 16.0, 17.0, 22.0, 11.0, 11.0, 19.0, 12.0, 8.0, 8.0, 2.0, 2.0, 4.0, 5.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.38671875, -4.25323486328125, -4.1197509765625, -3.98626708984375, -3.852783203125, -3.71929931640625, -3.5858154296875, -3.45233154296875, -3.31884765625, -3.18536376953125, -3.0518798828125, -2.91839599609375, -2.784912109375, -2.65142822265625, -2.5179443359375, -2.38446044921875, -2.2509765625, -2.11749267578125, -1.9840087890625, -1.85052490234375, -1.717041015625, -1.58355712890625, -1.4500732421875, -1.31658935546875, -1.18310546875, -1.04962158203125, -0.9161376953125, -0.78265380859375, -0.649169921875, -0.51568603515625, -0.3822021484375, -0.24871826171875, -0.115234375, 0.01824951171875, 0.1517333984375, 0.28521728515625, 0.418701171875, 0.55218505859375, 0.6856689453125, 0.81915283203125, 0.95263671875, 1.08612060546875, 1.2196044921875, 1.35308837890625, 1.486572265625, 1.62005615234375, 1.7535400390625, 1.88702392578125, 2.0205078125, 2.15399169921875, 2.2874755859375, 2.42095947265625, 2.554443359375, 2.68792724609375, 2.8214111328125, 2.95489501953125, 3.08837890625, 3.22186279296875, 3.3553466796875, 3.48883056640625, 3.622314453125, 3.75579833984375, 3.8892822265625, 4.02276611328125, 4.15625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 15.0, 17.0, 36.0, 52.0, 64.0, 110.0, 119.0, 202.0, 270.0, 458.0, 733.0, 1028.0, 1594.0, 2387.0, 3579.0, 5240.0, 8186.0, 12568.0, 19150.0, 29185.0, 44487.0, 68895.0, 104940.0, 151173.0, 1223777.0, 141389.0, 95934.0, 62395.0, 40582.0, 26345.0, 17651.0, 11686.0, 7631.0, 5058.0, 3403.0, 2248.0, 1535.0, 1046.0, 656.0, 433.0, 304.0, 186.0, 131.0, 90.0, 56.0, 41.0, 28.0, 18.0, 11.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.60986328125, -0.5897979736328125, -0.569732666015625, -0.5496673583984375, -0.52960205078125, -0.5095367431640625, -0.489471435546875, -0.4694061279296875, -0.4493408203125, -0.4292755126953125, -0.409210205078125, -0.3891448974609375, -0.36907958984375, -0.3490142822265625, -0.328948974609375, -0.3088836669921875, -0.288818359375, -0.2687530517578125, -0.248687744140625, -0.2286224365234375, -0.20855712890625, -0.1884918212890625, -0.168426513671875, -0.1483612060546875, -0.1282958984375, -0.1082305908203125, -0.088165283203125, -0.0680999755859375, -0.04803466796875, -0.0279693603515625, -0.007904052734375, 0.0121612548828125, 0.0322265625, 0.0522918701171875, 0.072357177734375, 0.0924224853515625, 0.11248779296875, 0.1325531005859375, 0.152618408203125, 0.1726837158203125, 0.1927490234375, 0.2128143310546875, 0.232879638671875, 0.2529449462890625, 0.27301025390625, 0.2930755615234375, 0.313140869140625, 0.3332061767578125, 0.353271484375, 0.3733367919921875, 0.393402099609375, 0.4134674072265625, 0.43353271484375, 0.4535980224609375, 0.473663330078125, 0.4937286376953125, 0.5137939453125, 0.5338592529296875, 0.553924560546875, 0.5739898681640625, 0.59405517578125, 0.6141204833984375, 0.634185791015625, 0.6542510986328125, 0.67431640625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 8.0, 1.0, 5.0, 6.0, 3.0, 9.0, 4.0, 11.0, 13.0, 17.0, 17.0, 17.0, 25.0, 28.0, 40.0, 38.0, 42.0, 46.0, 47.0, 55.0, 52.0, 57.0, 53.0, 49.0, 49.0, 48.0, 47.0, 40.0, 38.0, 24.0, 20.0, 21.0, 11.0, 10.0, 16.0, 12.0, 6.0, 5.0, 4.0, 1.0, 4.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-0.002719879150390625, -0.0026488155126571655, -0.002577751874923706, -0.0025066882371902466, -0.002435624599456787, -0.0023645609617233276, -0.002293497323989868, -0.0022224336862564087, -0.0021513700485229492, -0.0020803064107894897, -0.0020092427730560303, -0.0019381791353225708, -0.0018671154975891113, -0.0017960518598556519, -0.0017249882221221924, -0.001653924584388733, -0.0015828609466552734, -0.001511797308921814, -0.0014407336711883545, -0.001369670033454895, -0.0012986063957214355, -0.001227542757987976, -0.0011564791202545166, -0.0010854154825210571, -0.0010143518447875977, -0.0009432882070541382, -0.0008722245693206787, -0.0008011609315872192, -0.0007300972938537598, -0.0006590336561203003, -0.0005879700183868408, -0.0005169063806533813, -0.0004458427429199219, -0.0003747791051864624, -0.00030371546745300293, -0.00023265182971954346, -0.00016158819198608398, -9.052455425262451e-05, -1.946091651916504e-05, 5.1602721214294434e-05, 0.0001226663589477539, 0.00019372999668121338, 0.00026479363441467285, 0.0003358572721481323, 0.0004069209098815918, 0.00047798454761505127, 0.0005490481853485107, 0.0006201118230819702, 0.0006911754608154297, 0.0007622390985488892, 0.0008333027362823486, 0.0009043663740158081, 0.0009754300117492676, 0.001046493649482727, 0.0011175572872161865, 0.001188620924949646, 0.0012596845626831055, 0.001330748200416565, 0.0014018118381500244, 0.0014728754758834839, 0.0015439391136169434, 0.0016150027513504028, 0.0016860663890838623, 0.0017571300268173218, 0.0018281936645507812]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 8.0, 3.0, 4.0, 11.0, 12.0, 12.0, 29.0, 25.0, 30.0, 38.0, 66.0, 82.0, 107.0, 163.0, 174.0, 279.0, 486.0, 811.0, 3194.0, 1032623.0, 7883.0, 860.0, 496.0, 311.0, 200.0, 150.0, 100.0, 100.0, 74.0, 52.0, 38.0, 25.0, 22.0, 15.0, 10.0, 14.0, 12.0, 9.0, 2.0, 5.0, 2.0, 6.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.03594970703125, -0.03464651107788086, -0.03334331512451172, -0.03204011917114258, -0.030736923217773438, -0.029433727264404297, -0.028130531311035156, -0.026827335357666016, -0.025524139404296875, -0.024220943450927734, -0.022917747497558594, -0.021614551544189453, -0.020311355590820312, -0.019008159637451172, -0.01770496368408203, -0.01640176773071289, -0.01509857177734375, -0.01379537582397461, -0.012492179870605469, -0.011188983917236328, -0.009885787963867188, -0.008582592010498047, -0.007279396057128906, -0.005976200103759766, -0.004673004150390625, -0.0033698081970214844, -0.0020666122436523438, -0.0007634162902832031, 0.0005397796630859375, 0.0018429756164550781, 0.0031461715698242188, 0.004449367523193359, 0.0057525634765625, 0.007055759429931641, 0.008358955383300781, 0.009662151336669922, 0.010965347290039062, 0.012268543243408203, 0.013571739196777344, 0.014874935150146484, 0.016178131103515625, 0.017481327056884766, 0.018784523010253906, 0.020087718963623047, 0.021390914916992188, 0.022694110870361328, 0.02399730682373047, 0.02530050277709961, 0.02660369873046875, 0.02790689468383789, 0.02921009063720703, 0.030513286590576172, 0.03181648254394531, 0.03311967849731445, 0.034422874450683594, 0.035726070404052734, 0.037029266357421875, 0.038332462310791016, 0.039635658264160156, 0.0409388542175293, 0.04224205017089844, 0.04354524612426758, 0.04484844207763672, 0.04615163803100586, 0.047454833984375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 81.0, 889.0, 45.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020622045267373323, -0.0017411672743037343, -0.0014201300218701363, -0.0010990926530212164, -0.0007780554005876184, -0.0004570181481540203, -0.00013598077930510044, 0.00018505635671317577, 0.0005060937255620956, 0.0008271309779956937, 0.0011481682304292917, 0.0014692055992782116, 0.0017902428517118096, 0.0021112801041454077, 0.0024323174729943275, 0.0027533546090126038, 0.0030743919778615236, 0.0033954293467104435, 0.0037164664827287197, 0.004037504084408283, 0.0043585412204265594, 0.004679578356444836, 0.005000615492463112, 0.005321652628481388, 0.005642690230160952, 0.005963727366179228, 0.006284764967858791, 0.0066058021038770676, 0.006926839239895344, 0.00724787637591362, 0.0075689139775931835, 0.007889950647950172, 0.008210987783968449, 0.008532024919986725, 0.008853062056005001, 0.009174099192023277, 0.009495137259364128, 0.009816174395382404, 0.01013721153140068, 0.010458248667418957, 0.010779285803437233, 0.01110032293945551, 0.011421360075473785, 0.011742398142814636, 0.012063435278832912, 0.012384472414851189, 0.012705509550869465, 0.013026546686887741, 0.013347584754228592, 0.013668621890246868, 0.013989659026265144, 0.014310697093605995, 0.014631734229624271, 0.014952771365642548, 0.015273808501660824, 0.0155948456376791, 0.0159158818423748, 0.016236919909715652, 0.016557956114411354, 0.016878994181752205, 0.017200030386447906, 0.017521068453788757, 0.017842106521129608, 0.01816314272582531, 0.01848418079316616]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 3.0, 7.0, 11.0, 7.0, 12.0, 10.0, 12.0, 19.0, 16.0, 24.0, 15.0, 24.0, 32.0, 40.0, 24.0, 45.0, 38.0, 45.0, 31.0, 26.0, 56.0, 34.0, 41.0, 28.0, 32.0, 27.0, 37.0, 33.0, 36.0, 23.0, 24.0, 23.0, 26.0, 21.0, 20.0, 13.0, 16.0, 11.0, 12.0, 12.0, 6.0, 12.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0012066364288330078, -0.001170528121292591, -0.0011344198137521744, -0.0010983115062117577, -0.001062203198671341, -0.0010260948911309242, -0.0009899865835905075, -0.0009538782760500908, -0.0009177699685096741, -0.0008816616609692574, -0.0008455533534288406, -0.0008094450458884239, -0.0007733367383480072, -0.0007372284308075905, -0.0007011201232671738, -0.000665011815726757, -0.0006289035081863403, -0.0005927952006459236, -0.0005566868931055069, -0.0005205785855650902, -0.00048447027802467346, -0.00044836197048425674, -0.00041225366294384, -0.0003761453554034233, -0.0003400370478630066, -0.0003039287403225899, -0.00026782043278217316, -0.00023171212524175644, -0.00019560381770133972, -0.000159495510160923, -0.0001233872026205063, -8.727889508008957e-05, -5.117058753967285e-05, -1.5062279999256134e-05, 2.1046027541160583e-05, 5.71543350815773e-05, 9.326264262199402e-05, 0.00012937095016241074, 0.00016547925770282745, 0.00020158756524324417, 0.0002376958727836609, 0.0002738041803240776, 0.0003099124878644943, 0.00034602079540491104, 0.00038212910294532776, 0.0004182374104857445, 0.0004543457180261612, 0.0004904540255665779, 0.0005265623331069946, 0.0005626706406474113, 0.0005987789481878281, 0.0006348872557282448, 0.0006709955632686615, 0.0007071038708090782, 0.0007432121783494949, 0.0007793204858899117, 0.0008154287934303284, 0.0008515371009707451, 0.0008876454085111618, 0.0009237537160515785, 0.0009598620235919952, 0.000995970331132412, 0.0010320786386728287, 0.0010681869462132454, 0.0011042952537536621]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 9.0, 7.0, 8.0, 8.0, 12.0, 19.0, 22.0, 15.0, 29.0, 28.0, 38.0, 33.0, 44.0, 37.0, 35.0, 35.0, 48.0, 42.0, 48.0, 37.0, 43.0, 49.0, 45.0, 37.0, 23.0, 28.0, 31.0, 31.0, 25.0, 20.0, 18.0, 19.0, 10.0, 20.0, 9.0, 10.0, 7.0, 3.0, 0.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.4296875, -8.169189453125, -7.90869140625, -7.648193359375, -7.3876953125, -7.127197265625, -6.86669921875, -6.606201171875, -6.345703125, -6.085205078125, -5.82470703125, -5.564208984375, -5.3037109375, -5.043212890625, -4.78271484375, -4.522216796875, -4.26171875, -4.001220703125, -3.74072265625, -3.480224609375, -3.2197265625, -2.959228515625, -2.69873046875, -2.438232421875, -2.177734375, -1.917236328125, -1.65673828125, -1.396240234375, -1.1357421875, -0.875244140625, -0.61474609375, -0.354248046875, -0.09375, 0.166748046875, 0.42724609375, 0.687744140625, 0.9482421875, 1.208740234375, 1.46923828125, 1.729736328125, 1.990234375, 2.250732421875, 2.51123046875, 2.771728515625, 3.0322265625, 3.292724609375, 3.55322265625, 3.813720703125, 4.07421875, 4.334716796875, 4.59521484375, 4.855712890625, 5.1162109375, 5.376708984375, 5.63720703125, 5.897705078125, 6.158203125, 6.418701171875, 6.67919921875, 6.939697265625, 7.2001953125, 7.460693359375, 7.72119140625, 7.981689453125, 8.2421875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 7.0, 7.0, 12.0, 13.0, 24.0, 19.0, 28.0, 35.0, 55.0, 74.0, 90.0, 164.0, 211.0, 320.0, 535.0, 794.0, 1431.0, 3030.0, 7530.0, 23921.0, 108713.0, 601404.0, 236200.0, 42862.0, 12022.0, 4277.0, 1844.0, 1053.0, 618.0, 388.0, 244.0, 181.0, 117.0, 90.0, 67.0, 49.0, 27.0, 32.0, 20.0, 12.0, 5.0, 8.0, 11.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-14.5, -14.042724609375, -13.58544921875, -13.128173828125, -12.6708984375, -12.213623046875, -11.75634765625, -11.299072265625, -10.841796875, -10.384521484375, -9.92724609375, -9.469970703125, -9.0126953125, -8.555419921875, -8.09814453125, -7.640869140625, -7.18359375, -6.726318359375, -6.26904296875, -5.811767578125, -5.3544921875, -4.897216796875, -4.43994140625, -3.982666015625, -3.525390625, -3.068115234375, -2.61083984375, -2.153564453125, -1.6962890625, -1.239013671875, -0.78173828125, -0.324462890625, 0.1328125, 0.590087890625, 1.04736328125, 1.504638671875, 1.9619140625, 2.419189453125, 2.87646484375, 3.333740234375, 3.791015625, 4.248291015625, 4.70556640625, 5.162841796875, 5.6201171875, 6.077392578125, 6.53466796875, 6.991943359375, 7.44921875, 7.906494140625, 8.36376953125, 8.821044921875, 9.2783203125, 9.735595703125, 10.19287109375, 10.650146484375, 11.107421875, 11.564697265625, 12.02197265625, 12.479248046875, 12.9365234375, 13.393798828125, 13.85107421875, 14.308349609375, 14.765625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 2.0, 11.0, 9.0, 8.0, 16.0, 29.0, 29.0, 46.0, 42.0, 50.0, 47.0, 85.0, 137.0, 1705.0, 370.0, 112.0, 85.0, 45.0, 58.0, 37.0, 31.0, 27.0, 22.0, 13.0, 11.0, 8.0, 2.0, 4.0, 0.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.0625, -33.92578125, -32.7890625, -31.65234375, -30.515625, -29.37890625, -28.2421875, -27.10546875, -25.96875, -24.83203125, -23.6953125, -22.55859375, -21.421875, -20.28515625, -19.1484375, -18.01171875, -16.875, -15.73828125, -14.6015625, -13.46484375, -12.328125, -11.19140625, -10.0546875, -8.91796875, -7.78125, -6.64453125, -5.5078125, -4.37109375, -3.234375, -2.09765625, -0.9609375, 0.17578125, 1.3125, 2.44921875, 3.5859375, 4.72265625, 5.859375, 6.99609375, 8.1328125, 9.26953125, 10.40625, 11.54296875, 12.6796875, 13.81640625, 14.953125, 16.08984375, 17.2265625, 18.36328125, 19.5, 20.63671875, 21.7734375, 22.91015625, 24.046875, 25.18359375, 26.3203125, 27.45703125, 28.59375, 29.73046875, 30.8671875, 32.00390625, 33.140625, 34.27734375, 35.4140625, 36.55078125, 37.6875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 6.0, 7.0, 8.0, 12.0, 20.0, 18.0, 38.0, 43.0, 93.0, 134.0, 367.0, 950.0, 28854.0, 3112633.0, 1487.0, 527.0, 210.0, 92.0, 43.0, 50.0, 42.0, 24.0, 16.0, 11.0, 8.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-111.1875, -107.8369140625, -104.486328125, -101.1357421875, -97.78515625, -94.4345703125, -91.083984375, -87.7333984375, -84.3828125, -81.0322265625, -77.681640625, -74.3310546875, -70.98046875, -67.6298828125, -64.279296875, -60.9287109375, -57.578125, -54.2275390625, -50.876953125, -47.5263671875, -44.17578125, -40.8251953125, -37.474609375, -34.1240234375, -30.7734375, -27.4228515625, -24.072265625, -20.7216796875, -17.37109375, -14.0205078125, -10.669921875, -7.3193359375, -3.96875, -0.6181640625, 2.732421875, 6.0830078125, 9.43359375, 12.7841796875, 16.134765625, 19.4853515625, 22.8359375, 26.1865234375, 29.537109375, 32.8876953125, 36.23828125, 39.5888671875, 42.939453125, 46.2900390625, 49.640625, 52.9912109375, 56.341796875, 59.6923828125, 63.04296875, 66.3935546875, 69.744140625, 73.0947265625, 76.4453125, 79.7958984375, 83.146484375, 86.4970703125, 89.84765625, 93.1982421875, 96.548828125, 99.8994140625, 103.25]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 18.0, 756.0, 239.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-483.0972595214844, -474.2822265625, -465.4671936035156, -456.6521911621094, -447.837158203125, -439.0221252441406, -430.20709228515625, -421.3920593261719, -412.5770263671875, -403.7619934082031, -394.94696044921875, -386.1319580078125, -377.3169250488281, -368.50189208984375, -359.6868591308594, -350.871826171875, -342.05682373046875, -333.2417907714844, -324.4267578125, -315.61175537109375, -306.7967224121094, -297.981689453125, -289.1666564941406, -280.35162353515625, -271.53662109375, -262.7215881347656, -253.9065704345703, -245.09153747558594, -236.27651977539062, -227.46148681640625, -218.64645385742188, -209.8314208984375, -201.01638793945312, -192.20135498046875, -183.38633728027344, -174.57130432128906, -165.75628662109375, -156.94125366210938, -148.126220703125, -139.31118774414062, -130.49618530273438, -121.68115997314453, -112.86613464355469, -104.05110168457031, -95.23607635498047, -86.42105102539062, -77.60601806640625, -68.7909927368164, -59.97595977783203, -51.16093444824219, -42.34590530395508, -33.53087615966797, -24.715850830078125, -15.900825500488281, -7.085796356201172, 1.7292327880859375, 10.544258117675781, 19.359285354614258, 28.174312591552734, 36.989341735839844, 45.80436706542969, 54.61939239501953, 63.43442153930664, 72.24945068359375, 81.0644760131836]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 1.0, 4.0, 8.0, 7.0, 9.0, 12.0, 10.0, 14.0, 17.0, 15.0, 15.0, 19.0, 31.0, 19.0, 35.0, 35.0, 38.0, 30.0, 43.0, 49.0, 43.0, 46.0, 31.0, 37.0, 32.0, 42.0, 33.0, 35.0, 37.0, 23.0, 34.0, 27.0, 21.0, 23.0, 22.0, 24.0, 10.0, 11.0, 9.0, 11.0, 10.0, 6.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.83848190307617, -58.899139404296875, -56.95979690551758, -55.02045440673828, -53.08111572265625, -51.14176940917969, -49.202430725097656, -47.26308822631836, -45.32374572753906, -43.384403228759766, -41.44506072998047, -39.50571823120117, -37.566375732421875, -35.627037048339844, -33.68769454956055, -31.74835205078125, -29.809009552001953, -27.869667053222656, -25.93032455444336, -23.990983963012695, -22.0516414642334, -20.1122989654541, -18.172958374023438, -16.23361587524414, -14.294273376464844, -12.354930877685547, -10.415589332580566, -8.476247787475586, -6.536905288696289, -4.597562789916992, -2.6582212448120117, -0.7188796997070312, 1.2204666137695312, 3.15980863571167, 5.099150657653809, 7.038492679595947, 8.977834701538086, 10.917177200317383, 12.856518745422363, 14.795860290527344, 16.73520278930664, 18.674545288085938, 20.613887786865234, 22.5532283782959, 24.492570877075195, 26.431913375854492, 28.371253967285156, 30.310596466064453, 32.24993896484375, 34.18928146362305, 36.128623962402344, 38.06796646118164, 40.00730895996094, 41.94664764404297, 43.885990142822266, 45.82533264160156, 47.76467514038086, 49.704017639160156, 51.64336013793945, 53.58270263671875, 55.52204132080078, 57.461387634277344, 59.400726318359375, 61.34006881713867, 63.27941131591797]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 7.0, 7.0, 5.0, 5.0, 7.0, 14.0, 18.0, 19.0, 21.0, 17.0, 29.0, 23.0, 32.0, 50.0, 39.0, 48.0, 48.0, 38.0, 52.0, 44.0, 53.0, 51.0, 35.0, 46.0, 33.0, 44.0, 27.0, 34.0, 36.0, 25.0, 18.0, 20.0, 15.0, 7.0, 10.0, 9.0, 8.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.6640625, -11.3145751953125, -10.965087890625, -10.6156005859375, -10.26611328125, -9.9166259765625, -9.567138671875, -9.2176513671875, -8.8681640625, -8.5186767578125, -8.169189453125, -7.8197021484375, -7.47021484375, -7.1207275390625, -6.771240234375, -6.4217529296875, -6.072265625, -5.7227783203125, -5.373291015625, -5.0238037109375, -4.67431640625, -4.3248291015625, -3.975341796875, -3.6258544921875, -3.2763671875, -2.9268798828125, -2.577392578125, -2.2279052734375, -1.87841796875, -1.5289306640625, -1.179443359375, -0.8299560546875, -0.48046875, -0.1309814453125, 0.218505859375, 0.5679931640625, 0.91748046875, 1.2669677734375, 1.616455078125, 1.9659423828125, 2.3154296875, 2.6649169921875, 3.014404296875, 3.3638916015625, 3.71337890625, 4.0628662109375, 4.412353515625, 4.7618408203125, 5.111328125, 5.4608154296875, 5.810302734375, 6.1597900390625, 6.50927734375, 6.8587646484375, 7.208251953125, 7.5577392578125, 7.9072265625, 8.2567138671875, 8.606201171875, 8.9556884765625, 9.30517578125, 9.6546630859375, 10.004150390625, 10.3536376953125, 10.703125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 7.0, 9.0, 10.0, 28.0, 20.0, 20.0, 37.0, 34.0, 52.0, 48.0, 72.0, 100.0, 114.0, 154.0, 206.0, 283.0, 373.0, 617.0, 1130.0, 3327.0, 67060.0, 3844926.0, 266719.0, 5177.0, 1320.0, 687.0, 440.0, 324.0, 222.0, 194.0, 115.0, 92.0, 70.0, 60.0, 58.0, 34.0, 34.0, 25.0, 27.0, 14.0, 14.0, 12.0, 4.0, 9.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.28125, -56.494140625, -54.70703125, -52.919921875, -51.1328125, -49.345703125, -47.55859375, -45.771484375, -43.984375, -42.197265625, -40.41015625, -38.623046875, -36.8359375, -35.048828125, -33.26171875, -31.474609375, -29.6875, -27.900390625, -26.11328125, -24.326171875, -22.5390625, -20.751953125, -18.96484375, -17.177734375, -15.390625, -13.603515625, -11.81640625, -10.029296875, -8.2421875, -6.455078125, -4.66796875, -2.880859375, -1.09375, 0.693359375, 2.48046875, 4.267578125, 6.0546875, 7.841796875, 9.62890625, 11.416015625, 13.203125, 14.990234375, 16.77734375, 18.564453125, 20.3515625, 22.138671875, 23.92578125, 25.712890625, 27.5, 29.287109375, 31.07421875, 32.861328125, 34.6484375, 36.435546875, 38.22265625, 40.009765625, 41.796875, 43.583984375, 45.37109375, 47.158203125, 48.9453125, 50.732421875, 52.51953125, 54.306640625, 56.09375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 2.0, 5.0, 9.0, 15.0, 20.0, 33.0, 67.0, 147.0, 266.0, 523.0, 820.0, 887.0, 595.0, 281.0, 160.0, 102.0, 52.0, 40.0, 24.0, 13.0, 7.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.71875, -26.8798828125, -26.041015625, -25.2021484375, -24.36328125, -23.5244140625, -22.685546875, -21.8466796875, -21.0078125, -20.1689453125, -19.330078125, -18.4912109375, -17.65234375, -16.8134765625, -15.974609375, -15.1357421875, -14.296875, -13.4580078125, -12.619140625, -11.7802734375, -10.94140625, -10.1025390625, -9.263671875, -8.4248046875, -7.5859375, -6.7470703125, -5.908203125, -5.0693359375, -4.23046875, -3.3916015625, -2.552734375, -1.7138671875, -0.875, -0.0361328125, 0.802734375, 1.6416015625, 2.48046875, 3.3193359375, 4.158203125, 4.9970703125, 5.8359375, 6.6748046875, 7.513671875, 8.3525390625, 9.19140625, 10.0302734375, 10.869140625, 11.7080078125, 12.546875, 13.3857421875, 14.224609375, 15.0634765625, 15.90234375, 16.7412109375, 17.580078125, 18.4189453125, 19.2578125, 20.0966796875, 20.935546875, 21.7744140625, 22.61328125, 23.4521484375, 24.291015625, 25.1298828125, 25.96875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 9.0, 11.0, 25.0, 38.0, 102.0, 231.0, 653.0, 2471.0, 16406.0, 380100.0, 3662862.0, 120721.0, 8287.0, 1578.0, 470.0, 172.0, 69.0, 32.0, 26.0, 12.0, 8.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.9375, -36.893798828125, -35.85009765625, -34.806396484375, -33.7626953125, -32.718994140625, -31.67529296875, -30.631591796875, -29.587890625, -28.544189453125, -27.50048828125, -26.456787109375, -25.4130859375, -24.369384765625, -23.32568359375, -22.281982421875, -21.23828125, -20.194580078125, -19.15087890625, -18.107177734375, -17.0634765625, -16.019775390625, -14.97607421875, -13.932373046875, -12.888671875, -11.844970703125, -10.80126953125, -9.757568359375, -8.7138671875, -7.670166015625, -6.62646484375, -5.582763671875, -4.5390625, -3.495361328125, -2.45166015625, -1.407958984375, -0.3642578125, 0.679443359375, 1.72314453125, 2.766845703125, 3.810546875, 4.854248046875, 5.89794921875, 6.941650390625, 7.9853515625, 9.029052734375, 10.07275390625, 11.116455078125, 12.16015625, 13.203857421875, 14.24755859375, 15.291259765625, 16.3349609375, 17.378662109375, 18.42236328125, 19.466064453125, 20.509765625, 21.553466796875, 22.59716796875, 23.640869140625, 24.6845703125, 25.728271484375, 26.77197265625, 27.815673828125, 28.859375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 10.0, 24.0, 27.0, 38.0, 74.0, 108.0, 129.0, 123.0, 131.0, 102.0, 79.0, 61.0, 40.0, 26.0, 11.0, 10.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.29710388183594, -169.97903442382812, -165.66094970703125, -161.34288024902344, -157.02481079101562, -152.70672607421875, -148.38865661621094, -144.07057189941406, -139.75250244140625, -135.43443298339844, -131.11634826660156, -126.79827880859375, -122.4802017211914, -118.16212463378906, -113.84405517578125, -109.5259780883789, -105.20790100097656, -100.88982391357422, -96.57174682617188, -92.25367736816406, -87.93560028076172, -83.61752319335938, -79.29945373535156, -74.98137664794922, -70.66329956054688, -66.34522247314453, -62.02714920043945, -57.709075927734375, -53.39099884033203, -49.07292175292969, -44.75484848022461, -40.43677520751953, -36.11871337890625, -31.80063819885254, -27.482563018798828, -23.164487838745117, -18.846412658691406, -14.528337478637695, -10.210262298583984, -5.892187118530273, -1.5741119384765625, 2.7439632415771484, 7.062038421630859, 11.38011360168457, 15.698188781738281, 20.016263961791992, 24.334339141845703, 28.652414321899414, 32.970489501953125, 37.28856658935547, 41.60663986206055, 45.924713134765625, 50.24279022216797, 54.56086730957031, 58.87894058227539, 63.19701385498047, 67.51509094238281, 71.83316802978516, 76.1512451171875, 80.46931457519531, 84.78739166259766, 89.10546875, 93.42353820800781, 97.74161529541016, 102.0596923828125]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 6.0, 7.0, 13.0, 8.0, 18.0, 18.0, 19.0, 25.0, 31.0, 35.0, 36.0, 31.0, 39.0, 57.0, 56.0, 50.0, 61.0, 45.0, 53.0, 44.0, 42.0, 37.0, 36.0, 39.0, 30.0, 23.0, 29.0, 21.0, 19.0, 14.0, 19.0, 7.0, 12.0, 6.0, 7.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-74.80683898925781, -72.54548645019531, -70.28413391113281, -68.02278137207031, -65.76142883300781, -63.50007629394531, -61.23871994018555, -58.97736740112305, -56.71601486206055, -54.45466232299805, -52.19330978393555, -49.93195724487305, -47.67060089111328, -45.40924835205078, -43.14789581298828, -40.88654327392578, -38.62519073486328, -36.36383819580078, -34.10248565673828, -31.84113121032715, -29.57977867126465, -27.31842613220215, -25.057071685791016, -22.795719146728516, -20.534366607666016, -18.273014068603516, -16.011661529541016, -13.750307083129883, -11.488954544067383, -9.227602005004883, -6.966248512268066, -4.70489501953125, -2.4435501098632812, -0.18219709396362305, 2.079155921936035, 4.340508937835693, 6.601861953735352, 8.863214492797852, 11.124567985534668, 13.385921478271484, 15.647274017333984, 17.908626556396484, 20.169979095458984, 22.431333541870117, 24.692686080932617, 26.954038619995117, 29.21539306640625, 31.47674560546875, 33.73809814453125, 35.99945068359375, 38.26080322265625, 40.52215576171875, 42.78350830078125, 45.04486083984375, 47.306217193603516, 49.567569732666016, 51.828922271728516, 54.090274810791016, 56.351627349853516, 58.612979888916016, 60.87433624267578, 63.13568878173828, 65.39704132080078, 67.65839385986328, 69.91974639892578]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 8.0, 9.0, 10.0, 10.0, 17.0, 18.0, 18.0, 21.0, 26.0, 46.0, 34.0, 47.0, 51.0, 49.0, 55.0, 59.0, 47.0, 62.0, 53.0, 52.0, 34.0, 53.0, 21.0, 37.0, 29.0, 27.0, 29.0, 19.0, 17.0, 10.0, 12.0, 7.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-126.875, -122.966796875, -119.05859375, -115.150390625, -111.2421875, -107.333984375, -103.42578125, -99.517578125, -95.609375, -91.701171875, -87.79296875, -83.884765625, -79.9765625, -76.068359375, -72.16015625, -68.251953125, -64.34375, -60.435546875, -56.52734375, -52.619140625, -48.7109375, -44.802734375, -40.89453125, -36.986328125, -33.078125, -29.169921875, -25.26171875, -21.353515625, -17.4453125, -13.537109375, -9.62890625, -5.720703125, -1.8125, 2.095703125, 6.00390625, 9.912109375, 13.8203125, 17.728515625, 21.63671875, 25.544921875, 29.453125, 33.361328125, 37.26953125, 41.177734375, 45.0859375, 48.994140625, 52.90234375, 56.810546875, 60.71875, 64.626953125, 68.53515625, 72.443359375, 76.3515625, 80.259765625, 84.16796875, 88.076171875, 91.984375, 95.892578125, 99.80078125, 103.708984375, 107.6171875, 111.525390625, 115.43359375, 119.341796875, 123.25]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 10.0, 7.0, 21.0, 38.0, 58.0, 69.0, 149.0, 183.0, 271.0, 379.0, 611.0, 917.0, 1319.0, 2019.0, 3091.0, 4726.0, 7395.0, 11245.0, 17728.0, 26999.0, 41763.0, 66671.0, 104668.0, 160860.0, 193050.0, 145006.0, 93651.0, 59446.0, 37439.0, 24235.0, 15438.0, 10108.0, 6618.0, 4143.0, 2795.0, 1751.0, 1203.0, 794.0, 539.0, 386.0, 231.0, 167.0, 125.0, 66.0, 52.0, 36.0, 36.0, 11.0, 13.0, 6.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.6875, -9.3685302734375, -9.049560546875, -8.7305908203125, -8.41162109375, -8.0926513671875, -7.773681640625, -7.4547119140625, -7.1357421875, -6.8167724609375, -6.497802734375, -6.1788330078125, -5.85986328125, -5.5408935546875, -5.221923828125, -4.9029541015625, -4.583984375, -4.2650146484375, -3.946044921875, -3.6270751953125, -3.30810546875, -2.9891357421875, -2.670166015625, -2.3511962890625, -2.0322265625, -1.7132568359375, -1.394287109375, -1.0753173828125, -0.75634765625, -0.4373779296875, -0.118408203125, 0.2005615234375, 0.51953125, 0.8385009765625, 1.157470703125, 1.4764404296875, 1.79541015625, 2.1143798828125, 2.433349609375, 2.7523193359375, 3.0712890625, 3.3902587890625, 3.709228515625, 4.0281982421875, 4.34716796875, 4.6661376953125, 4.985107421875, 5.3040771484375, 5.623046875, 5.9420166015625, 6.260986328125, 6.5799560546875, 6.89892578125, 7.2178955078125, 7.536865234375, 7.8558349609375, 8.1748046875, 8.4937744140625, 8.812744140625, 9.1317138671875, 9.45068359375, 9.7696533203125, 10.088623046875, 10.4075927734375, 10.7265625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 8.0, 4.0, 8.0, 5.0, 8.0, 8.0, 12.0, 7.0, 15.0, 15.0, 22.0, 19.0, 16.0, 22.0, 38.0, 28.0, 31.0, 30.0, 31.0, 43.0, 38.0, 36.0, 42.0, 1061.0, 47.0, 40.0, 37.0, 31.0, 38.0, 25.0, 30.0, 34.0, 33.0, 19.0, 22.0, 20.0, 23.0, 16.0, 9.0, 14.0, 9.0, 8.0, 9.0, 7.0, 7.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-60.0625, -58.19970703125, -56.3369140625, -54.47412109375, -52.611328125, -50.74853515625, -48.8857421875, -47.02294921875, -45.16015625, -43.29736328125, -41.4345703125, -39.57177734375, -37.708984375, -35.84619140625, -33.9833984375, -32.12060546875, -30.2578125, -28.39501953125, -26.5322265625, -24.66943359375, -22.806640625, -20.94384765625, -19.0810546875, -17.21826171875, -15.35546875, -13.49267578125, -11.6298828125, -9.76708984375, -7.904296875, -6.04150390625, -4.1787109375, -2.31591796875, -0.453125, 1.40966796875, 3.2724609375, 5.13525390625, 6.998046875, 8.86083984375, 10.7236328125, 12.58642578125, 14.44921875, 16.31201171875, 18.1748046875, 20.03759765625, 21.900390625, 23.76318359375, 25.6259765625, 27.48876953125, 29.3515625, 31.21435546875, 33.0771484375, 34.93994140625, 36.802734375, 38.66552734375, 40.5283203125, 42.39111328125, 44.25390625, 46.11669921875, 47.9794921875, 49.84228515625, 51.705078125, 53.56787109375, 55.4306640625, 57.29345703125, 59.15625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 8.0, 7.0, 11.0, 13.0, 24.0, 35.0, 50.0, 59.0, 102.0, 150.0, 235.0, 311.0, 430.0, 628.0, 883.0, 1343.0, 1885.0, 2754.0, 3993.0, 5916.0, 8571.0, 12544.0, 18560.0, 27155.0, 40723.0, 60713.0, 91109.0, 131956.0, 1213670.0, 148750.0, 105523.0, 71545.0, 47591.0, 31521.0, 21458.0, 14627.0, 10030.0, 6905.0, 4797.0, 3378.0, 2232.0, 1523.0, 1058.0, 708.0, 480.0, 371.0, 246.0, 183.0, 110.0, 88.0, 56.0, 36.0, 31.0, 15.0, 15.0, 9.0, 7.0, 5.0, 3.0, 1.0, 3.0], "bins": [-8.140625, -7.8837890625, -7.626953125, -7.3701171875, -7.11328125, -6.8564453125, -6.599609375, -6.3427734375, -6.0859375, -5.8291015625, -5.572265625, -5.3154296875, -5.05859375, -4.8017578125, -4.544921875, -4.2880859375, -4.03125, -3.7744140625, -3.517578125, -3.2607421875, -3.00390625, -2.7470703125, -2.490234375, -2.2333984375, -1.9765625, -1.7197265625, -1.462890625, -1.2060546875, -0.94921875, -0.6923828125, -0.435546875, -0.1787109375, 0.078125, 0.3349609375, 0.591796875, 0.8486328125, 1.10546875, 1.3623046875, 1.619140625, 1.8759765625, 2.1328125, 2.3896484375, 2.646484375, 2.9033203125, 3.16015625, 3.4169921875, 3.673828125, 3.9306640625, 4.1875, 4.4443359375, 4.701171875, 4.9580078125, 5.21484375, 5.4716796875, 5.728515625, 5.9853515625, 6.2421875, 6.4990234375, 6.755859375, 7.0126953125, 7.26953125, 7.5263671875, 7.783203125, 8.0400390625, 8.296875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 9.0, 8.0, 6.0, 12.0, 14.0, 13.0, 28.0, 34.0, 44.0, 47.0, 61.0, 62.0, 73.0, 77.0, 76.0, 77.0, 54.0, 54.0, 52.0, 39.0, 33.0, 35.0, 25.0, 22.0, 15.0, 13.0, 7.0, 6.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042388916015625, -0.040728092193603516, -0.03906726837158203, -0.03740644454956055, -0.03574562072753906, -0.03408479690551758, -0.032423973083496094, -0.03076314926147461, -0.029102325439453125, -0.02744150161743164, -0.025780677795410156, -0.024119853973388672, -0.022459030151367188, -0.020798206329345703, -0.01913738250732422, -0.017476558685302734, -0.01581573486328125, -0.014154911041259766, -0.012494087219238281, -0.010833263397216797, -0.009172439575195312, -0.007511615753173828, -0.005850791931152344, -0.004189968109130859, -0.002529144287109375, -0.0008683204650878906, 0.0007925033569335938, 0.002453327178955078, 0.0041141510009765625, 0.005774974822998047, 0.007435798645019531, 0.009096622467041016, 0.0107574462890625, 0.012418270111083984, 0.014079093933105469, 0.015739917755126953, 0.017400741577148438, 0.019061565399169922, 0.020722389221191406, 0.02238321304321289, 0.024044036865234375, 0.02570486068725586, 0.027365684509277344, 0.029026508331298828, 0.030687332153320312, 0.0323481559753418, 0.03400897979736328, 0.035669803619384766, 0.03733062744140625, 0.038991451263427734, 0.04065227508544922, 0.0423130989074707, 0.04397392272949219, 0.04563474655151367, 0.047295570373535156, 0.04895639419555664, 0.050617218017578125, 0.05227804183959961, 0.053938865661621094, 0.05559968948364258, 0.05726051330566406, 0.05892133712768555, 0.06058216094970703, 0.062242984771728516, 0.06390380859375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 4.0, 3.0, 4.0, 10.0, 14.0, 18.0, 23.0, 40.0, 48.0, 95.0, 153.0, 246.0, 387.0, 671.0, 1393.0, 3549.0, 11526.0, 47955.0, 307353.0, 555888.0, 90481.0, 19094.0, 5412.0, 1988.0, 912.0, 461.0, 276.0, 174.0, 108.0, 81.0, 54.0, 33.0, 38.0, 14.0, 16.0, 6.0, 11.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3837890625, -0.3731842041015625, -0.362579345703125, -0.3519744873046875, -0.34136962890625, -0.3307647705078125, -0.320159912109375, -0.3095550537109375, -0.2989501953125, -0.2883453369140625, -0.277740478515625, -0.2671356201171875, -0.25653076171875, -0.2459259033203125, -0.235321044921875, -0.2247161865234375, -0.214111328125, -0.2035064697265625, -0.192901611328125, -0.1822967529296875, -0.17169189453125, -0.1610870361328125, -0.150482177734375, -0.1398773193359375, -0.1292724609375, -0.1186676025390625, -0.108062744140625, -0.0974578857421875, -0.08685302734375, -0.0762481689453125, -0.065643310546875, -0.0550384521484375, -0.04443359375, -0.0338287353515625, -0.023223876953125, -0.0126190185546875, -0.00201416015625, 0.0085906982421875, 0.019195556640625, 0.0298004150390625, 0.0404052734375, 0.0510101318359375, 0.061614990234375, 0.0722198486328125, 0.08282470703125, 0.0934295654296875, 0.104034423828125, 0.1146392822265625, 0.125244140625, 0.1358489990234375, 0.146453857421875, 0.1570587158203125, 0.16766357421875, 0.1782684326171875, 0.188873291015625, 0.1994781494140625, 0.2100830078125, 0.2206878662109375, 0.231292724609375, 0.2418975830078125, 0.25250244140625, 0.2631072998046875, 0.273712158203125, 0.2843170166015625, 0.294921875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 7.0, 17.0, 18.0, 30.0, 54.0, 77.0, 116.0, 144.0, 192.0, 141.0, 88.0, 48.0, 27.0, 17.0, 9.0, 7.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09823210537433624, -0.09611334651708603, -0.09399458020925522, -0.091875821352005, -0.08975706249475479, -0.08763830363750458, -0.08551953732967377, -0.08340077847242355, -0.08128201961517334, -0.07916326075792313, -0.07704449445009232, -0.0749257355928421, -0.07280697673559189, -0.07068821787834167, -0.06856945157051086, -0.06645069271326065, -0.06433192640542984, -0.06221316382288933, -0.060094404965639114, -0.0579756423830986, -0.05585688352584839, -0.05373812094330788, -0.051619358360767365, -0.04950059950351715, -0.04738183692097664, -0.04526307433843613, -0.04314431548118591, -0.0410255528986454, -0.03890679031610489, -0.036788031458854675, -0.03466926887631416, -0.03255050629377365, -0.030431754887104034, -0.02831299416720867, -0.02619423344731331, -0.024075470864772797, -0.021956710144877434, -0.01983794942498207, -0.01771918684244156, -0.015600426122546196, -0.013481665402650833, -0.01136290468275547, -0.009244143031537533, -0.007125381845980883, -0.0050066206604242325, -0.0028878599405288696, -0.0007690982893109322, 0.0013496633619070053, 0.003468424081802368, 0.005587185267359018, 0.0077059464529156685, 0.009824708104133606, 0.011943468824028969, 0.014062229543924332, 0.016180992126464844, 0.018299752846360207, 0.02041851356625557, 0.022537274286150932, 0.024656035006046295, 0.026774797588586807, 0.02889355830848217, 0.031012319028377533, 0.033131081610918045, 0.03524984419345856, 0.03736860305070877]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 9.0, 6.0, 11.0, 9.0, 19.0, 18.0, 26.0, 27.0, 26.0, 33.0, 26.0, 22.0, 39.0, 41.0, 46.0, 49.0, 64.0, 51.0, 34.0, 40.0, 41.0, 45.0, 41.0, 40.0, 28.0, 30.0, 28.0, 26.0, 16.0, 25.0, 13.0, 16.0, 9.0, 8.0, 6.0, 10.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.028933942317962646, -0.02809436060488224, -0.027254778891801834, -0.026415197178721428, -0.02557561546564102, -0.024736033752560616, -0.02389645203948021, -0.023056870326399803, -0.022217288613319397, -0.02137770690023899, -0.020538125187158585, -0.01969854347407818, -0.018858961760997772, -0.018019380047917366, -0.01717979833483696, -0.016340216621756554, -0.015500634908676147, -0.014661053195595741, -0.013821471482515335, -0.012981889769434929, -0.012142308056354523, -0.011302726343274117, -0.01046314463019371, -0.009623562917113304, -0.008783981204032898, -0.007944399490952492, -0.007104817777872086, -0.006265236064791679, -0.005425654351711273, -0.004586072638630867, -0.003746490925550461, -0.0029069092124700546, -0.0020673274993896484, -0.0012277457863092422, -0.00038816407322883606, 0.00045141763985157013, 0.0012909993529319763, 0.0021305810660123825, 0.0029701627790927887, 0.003809744492173195, 0.004649326205253601, 0.005488907918334007, 0.0063284896314144135, 0.00716807134449482, 0.008007653057575226, 0.008847234770655632, 0.009686816483736038, 0.010526398196816444, 0.01136597990989685, 0.012205561622977257, 0.013045143336057663, 0.01388472504913807, 0.014724306762218475, 0.015563888475298882, 0.016403470188379288, 0.017243051901459694, 0.0180826336145401, 0.018922215327620506, 0.019761797040700912, 0.02060137875378132, 0.021440960466861725, 0.02228054217994213, 0.023120123893022537, 0.023959705606102943, 0.02479928731918335]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 8.0, 9.0, 10.0, 10.0, 17.0, 18.0, 19.0, 20.0, 26.0, 46.0, 34.0, 47.0, 51.0, 48.0, 56.0, 60.0, 46.0, 62.0, 53.0, 53.0, 33.0, 54.0, 21.0, 37.0, 27.0, 28.0, 28.0, 20.0, 16.0, 11.0, 12.0, 7.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-126.8125, -122.9052734375, -118.998046875, -115.0908203125, -111.18359375, -107.2763671875, -103.369140625, -99.4619140625, -95.5546875, -91.6474609375, -87.740234375, -83.8330078125, -79.92578125, -76.0185546875, -72.111328125, -68.2041015625, -64.296875, -60.3896484375, -56.482421875, -52.5751953125, -48.66796875, -44.7607421875, -40.853515625, -36.9462890625, -33.0390625, -29.1318359375, -25.224609375, -21.3173828125, -17.41015625, -13.5029296875, -9.595703125, -5.6884765625, -1.78125, 2.1259765625, 6.033203125, 9.9404296875, 13.84765625, 17.7548828125, 21.662109375, 25.5693359375, 29.4765625, 33.3837890625, 37.291015625, 41.1982421875, 45.10546875, 49.0126953125, 52.919921875, 56.8271484375, 60.734375, 64.6416015625, 68.548828125, 72.4560546875, 76.36328125, 80.2705078125, 84.177734375, 88.0849609375, 91.9921875, 95.8994140625, 99.806640625, 103.7138671875, 107.62109375, 111.5283203125, 115.435546875, 119.3427734375, 123.25]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 7.0, 13.0, 12.0, 9.0, 23.0, 40.0, 42.0, 58.0, 67.0, 128.0, 221.0, 349.0, 763.0, 1419.0, 2979.0, 7135.0, 23205.0, 125319.0, 660567.0, 180826.0, 29975.0, 8418.0, 3420.0, 1607.0, 845.0, 406.0, 225.0, 143.0, 89.0, 66.0, 47.0, 38.0, 23.0, 15.0, 20.0, 9.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-30.78125, -29.836669921875, -28.89208984375, -27.947509765625, -27.0029296875, -26.058349609375, -25.11376953125, -24.169189453125, -23.224609375, -22.280029296875, -21.33544921875, -20.390869140625, -19.4462890625, -18.501708984375, -17.55712890625, -16.612548828125, -15.66796875, -14.723388671875, -13.77880859375, -12.834228515625, -11.8896484375, -10.945068359375, -10.00048828125, -9.055908203125, -8.111328125, -7.166748046875, -6.22216796875, -5.277587890625, -4.3330078125, -3.388427734375, -2.44384765625, -1.499267578125, -0.5546875, 0.389892578125, 1.33447265625, 2.279052734375, 3.2236328125, 4.168212890625, 5.11279296875, 6.057373046875, 7.001953125, 7.946533203125, 8.89111328125, 9.835693359375, 10.7802734375, 11.724853515625, 12.66943359375, 13.614013671875, 14.55859375, 15.503173828125, 16.44775390625, 17.392333984375, 18.3369140625, 19.281494140625, 20.22607421875, 21.170654296875, 22.115234375, 23.059814453125, 24.00439453125, 24.948974609375, 25.8935546875, 26.838134765625, 27.78271484375, 28.727294921875, 29.671875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 11.0, 9.0, 19.0, 12.0, 28.0, 27.0, 41.0, 58.0, 61.0, 77.0, 91.0, 2122.0, 96.0, 94.0, 73.0, 55.0, 54.0, 31.0, 20.0, 21.0, 14.0, 10.0, 9.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-265.0, -256.896484375, -248.79296875, -240.689453125, -232.5859375, -224.482421875, -216.37890625, -208.275390625, -200.171875, -192.068359375, -183.96484375, -175.861328125, -167.7578125, -159.654296875, -151.55078125, -143.447265625, -135.34375, -127.240234375, -119.13671875, -111.033203125, -102.9296875, -94.826171875, -86.72265625, -78.619140625, -70.515625, -62.412109375, -54.30859375, -46.205078125, -38.1015625, -29.998046875, -21.89453125, -13.791015625, -5.6875, 2.416015625, 10.51953125, 18.623046875, 26.7265625, 34.830078125, 42.93359375, 51.037109375, 59.140625, 67.244140625, 75.34765625, 83.451171875, 91.5546875, 99.658203125, 107.76171875, 115.865234375, 123.96875, 132.072265625, 140.17578125, 148.279296875, 156.3828125, 164.486328125, 172.58984375, 180.693359375, 188.796875, 196.900390625, 205.00390625, 213.107421875, 221.2109375, 229.314453125, 237.41796875, 245.521484375, 253.625]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 16.0, 8.0, 19.0, 32.0, 53.0, 72.0, 94.0, 149.0, 237.0, 482.0, 996.0, 2534.0, 15024.0, 1884402.0, 1222027.0, 14934.0, 2406.0, 999.0, 492.0, 265.0, 150.0, 95.0, 62.0, 45.0, 26.0, 29.0, 12.0, 10.0, 6.0, 7.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.1875, -50.50390625, -48.8203125, -47.13671875, -45.453125, -43.76953125, -42.0859375, -40.40234375, -38.71875, -37.03515625, -35.3515625, -33.66796875, -31.984375, -30.30078125, -28.6171875, -26.93359375, -25.25, -23.56640625, -21.8828125, -20.19921875, -18.515625, -16.83203125, -15.1484375, -13.46484375, -11.78125, -10.09765625, -8.4140625, -6.73046875, -5.046875, -3.36328125, -1.6796875, 0.00390625, 1.6875, 3.37109375, 5.0546875, 6.73828125, 8.421875, 10.10546875, 11.7890625, 13.47265625, 15.15625, 16.83984375, 18.5234375, 20.20703125, 21.890625, 23.57421875, 25.2578125, 26.94140625, 28.625, 30.30859375, 31.9921875, 33.67578125, 35.359375, 37.04296875, 38.7265625, 40.41015625, 42.09375, 43.77734375, 45.4609375, 47.14453125, 48.828125, 50.51171875, 52.1953125, 53.87890625, 55.5625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 5.0, 12.0, 9.0, 39.0, 64.0, 101.0, 176.0, 213.0, 150.0, 93.0, 50.0, 30.0, 16.0, 8.0, 5.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-203.7586212158203, -195.46322631835938, -187.16783142089844, -178.8724365234375, -170.57705688476562, -162.2816619873047, -153.98626708984375, -145.6908721923828, -137.39547729492188, -129.10008239746094, -120.80469512939453, -112.5093002319336, -104.21391296386719, -95.91851806640625, -87.62312316894531, -79.32772827148438, -71.0323486328125, -62.73695755004883, -54.441566467285156, -46.14617156982422, -37.85078048706055, -29.555389404296875, -21.259994506835938, -12.964603424072266, -4.669212341308594, 3.6261796951293945, 11.921571731567383, 20.216964721679688, 28.51235580444336, 36.80774688720703, 45.10314178466797, 53.39853286743164, 61.69390869140625, 69.98930358886719, 78.2846908569336, 86.58008575439453, 94.87547302246094, 103.17086791992188, 111.46626281738281, 119.76165771484375, 128.05703735351562, 136.35243225097656, 144.6478271484375, 152.94320678710938, 161.2386016845703, 169.53399658203125, 177.8293914794922, 186.12478637695312, 194.42018127441406, 202.715576171875, 211.01097106933594, 219.30636596679688, 227.60174560546875, 235.8971405029297, 244.19253540039062, 252.48793029785156, 260.7833251953125, 269.0787048339844, 277.3741149902344, 285.66949462890625, 293.96490478515625, 302.2602844238281, 310.5556640625, 318.85107421875, 327.1464538574219]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 5.0, 15.0, 6.0, 11.0, 16.0, 22.0, 17.0, 21.0, 21.0, 25.0, 44.0, 38.0, 49.0, 45.0, 53.0, 57.0, 56.0, 52.0, 51.0, 51.0, 54.0, 38.0, 29.0, 33.0, 30.0, 23.0, 24.0, 25.0, 22.0, 18.0, 12.0, 10.0, 5.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-224.77078247070312, -217.8157196044922, -210.8606414794922, -203.90557861328125, -196.9505157470703, -189.99545288085938, -183.04037475585938, -176.08531188964844, -169.1302490234375, -162.17518615722656, -155.22010803222656, -148.26504516601562, -141.3099822998047, -134.35491943359375, -127.39984130859375, -120.44477844238281, -113.48970794677734, -106.53463745117188, -99.57957458496094, -92.62450408935547, -85.66944122314453, -78.71437072753906, -71.75930786132812, -64.80423736572266, -57.84917068481445, -50.89410400390625, -43.93903732299805, -36.983970642089844, -30.028902053833008, -23.073833465576172, -16.11876678466797, -9.163700103759766, -2.2086334228515625, 4.746433734893799, 11.70150089263916, 18.65656852722168, 25.611635208129883, 32.56670379638672, 39.52177047729492, 46.476837158203125, 53.43190383911133, 60.38697052001953, 67.342041015625, 74.29710388183594, 81.2521743774414, 88.20724487304688, 95.16230773925781, 102.11737060546875, 109.07244110107422, 116.02751159667969, 122.98257446289062, 129.93763732910156, 136.89271545410156, 143.8477783203125, 150.80284118652344, 157.75790405273438, 164.71298217773438, 171.6680450439453, 178.6231231689453, 185.57818603515625, 192.5332489013672, 199.48831176757812, 206.44338989257812, 213.39845275878906, 220.353515625]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 3.0, 6.0, 7.0, 8.0, 7.0, 13.0, 30.0, 28.0, 32.0, 52.0, 51.0, 84.0, 103.0, 150.0, 208.0, 283.0, 370.0, 547.0, 724.0, 1178.0, 1041073.0, 1057.0, 663.0, 487.0, 367.0, 263.0, 204.0, 143.0, 110.0, 73.0, 57.0, 43.0, 32.0, 23.0, 22.0, 17.0, 7.0, 11.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-76.27511596679688, -74.05817413330078, -71.84123229980469, -69.62429809570312, -67.40735626220703, -65.19041442871094, -62.973472595214844, -60.756534576416016, -58.53959655761719, -56.322654724121094, -54.105716705322266, -51.88877487182617, -49.671836853027344, -47.45489501953125, -45.237953186035156, -43.02101516723633, -40.804073333740234, -38.58713150024414, -36.37019348144531, -34.15325164794922, -31.93631362915039, -29.719371795654297, -27.502431869506836, -25.285491943359375, -23.068552017211914, -20.851612091064453, -18.634672164916992, -16.41773223876953, -14.200791358947754, -11.983851432800293, -9.766910552978516, -7.549970626831055, -5.333030700683594, -3.1160905361175537, -0.8991503715515137, 1.3177900314331055, 3.5347299575805664, 5.751669883728027, 7.968610763549805, 10.185550689697266, 12.402490615844727, 14.619430541992188, 16.83637046813965, 19.05331039428711, 21.270252227783203, 23.48719024658203, 25.704132080078125, 27.921072006225586, 30.138011932373047, 32.35495376586914, 34.57189178466797, 36.78883361816406, 39.00577163696289, 41.222713470458984, 43.43965148925781, 45.656593322753906, 47.87353515625, 50.090476989746094, 52.30741500854492, 54.524356842041016, 56.741294860839844, 58.95823669433594, 61.17517852783203, 63.39211654663086, 65.60905456542969]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 5.0, 11.0, 4.0, 7.0, 10.0, 17.0, 42.0, 179.0, 51462528.0, 212.0, 56.0, 20.0, 16.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5792.0, -5464.25, -5136.5, -4808.75, -4481.0, -4153.25, -3825.5, -3497.75, -3170.0, -2842.25, -2514.5, -2186.75, -1859.0, -1531.25, -1203.5, -875.75, -548.0, -220.25, 107.5, 435.25, 763.0, 1090.75, 1418.5, 1746.25, 2074.0, 2401.75, 2729.5, 3057.25, 3385.0, 3712.75, 4040.5, 4368.25, 4696.0, 5023.75, 5351.5, 5679.25, 6007.0, 6334.75, 6662.5, 6990.25, 7318.0, 7645.75, 7973.5, 8301.25, 8629.0, 8956.75, 9284.5, 9612.25, 9940.0, 10267.75, 10595.5, 10923.25, 11251.0, 11578.75, 11906.5, 12234.25, 12562.0, 12889.75, 13217.5, 13545.25, 13873.0, 14200.75, 14528.5, 14856.25, 15184.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 14.0, 18.0, 34.0, 38.0, 76.0, 104.0, 187.0, 238.0, 394.0, 660.0, 1083.0, 1727.0, 2582.0, 3994.0, 6474.0, 10270.0, 16543.0, 26888.0, 43998.0, 72823.0, 119715.0, 200089.0, 332026.0, 614399.0, 3642290.0, 477057.0, 284341.0, 170052.0, 102127.0, 61681.0, 37655.0, 23054.0, 14339.0, 8933.0, 5710.0, 3575.0, 2297.0, 1464.0, 898.0, 606.0, 397.0, 239.0, 124.0, 96.0, 57.0, 19.0, 26.0, 20.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.41015625, -4.26947021484375, -4.1287841796875, -3.98809814453125, -3.847412109375, -3.70672607421875, -3.5660400390625, -3.42535400390625, -3.28466796875, -3.14398193359375, -3.0032958984375, -2.86260986328125, -2.721923828125, -2.58123779296875, -2.4405517578125, -2.29986572265625, -2.1591796875, -2.01849365234375, -1.8778076171875, -1.73712158203125, -1.596435546875, -1.45574951171875, -1.3150634765625, -1.17437744140625, -1.03369140625, -0.89300537109375, -0.7523193359375, -0.61163330078125, -0.470947265625, -0.33026123046875, -0.1895751953125, -0.04888916015625, 0.091796875, 0.23248291015625, 0.3731689453125, 0.51385498046875, 0.654541015625, 0.79522705078125, 0.9359130859375, 1.07659912109375, 1.21728515625, 1.35797119140625, 1.4986572265625, 1.63934326171875, 1.780029296875, 1.92071533203125, 2.0614013671875, 2.20208740234375, 2.3427734375, 2.48345947265625, 2.6241455078125, 2.76483154296875, 2.905517578125, 3.04620361328125, 3.1868896484375, 3.32757568359375, 3.46826171875, 3.60894775390625, 3.7496337890625, 3.89031982421875, 4.031005859375, 4.17169189453125, 4.3123779296875, 4.45306396484375, 4.59375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 3.0, 5.0, 5.0, 10.0, 16.0, 15.0, 15.0, 25.0, 16.0, 21.0, 27.0, 28.0, 40.0, 33.0, 48.0, 44.0, 38.0, 78.0, 831.0, 256.0, 60.0, 49.0, 44.0, 48.0, 40.0, 39.0, 43.0, 26.0, 20.0, 20.0, 20.0, 15.0, 12.0, 12.0, 8.0, 3.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.515625, -25.729736328125, -24.94384765625, -24.157958984375, -23.3720703125, -22.586181640625, -21.80029296875, -21.014404296875, -20.228515625, -19.442626953125, -18.65673828125, -17.870849609375, -17.0849609375, -16.299072265625, -15.51318359375, -14.727294921875, -13.94140625, -13.155517578125, -12.36962890625, -11.583740234375, -10.7978515625, -10.011962890625, -9.22607421875, -8.440185546875, -7.654296875, -6.868408203125, -6.08251953125, -5.296630859375, -4.5107421875, -3.724853515625, -2.93896484375, -2.153076171875, -1.3671875, -0.581298828125, 0.20458984375, 0.990478515625, 1.7763671875, 2.562255859375, 3.34814453125, 4.134033203125, 4.919921875, 5.705810546875, 6.49169921875, 7.277587890625, 8.0634765625, 8.849365234375, 9.63525390625, 10.421142578125, 11.20703125, 11.992919921875, 12.77880859375, 13.564697265625, 14.3505859375, 15.136474609375, 15.92236328125, 16.708251953125, 17.494140625, 18.280029296875, 19.06591796875, 19.851806640625, 20.6376953125, 21.423583984375, 22.20947265625, 22.995361328125, 23.78125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 4.0, 8.0, 3.0, 5.0, 18.0, 13.0, 28.0, 31.0, 45.0, 82.0, 87.0, 131.0, 193.0, 316.0, 425.0, 708.0, 1022.0, 1450.0, 2189.0, 3213.0, 5040.0, 7462.0, 11388.0, 18251.0, 28116.0, 46194.0, 78729.0, 136246.0, 243592.0, 453856.0, 3446334.0, 965527.0, 360276.0, 196850.0, 111321.0, 64769.0, 38874.0, 24179.0, 15150.0, 9954.0, 6449.0, 4322.0, 2732.0, 1912.0, 1243.0, 796.0, 620.0, 395.0, 295.0, 195.0, 138.0, 88.0, 57.0, 31.0, 35.0, 22.0, 14.0, 9.0, 5.0, 9.0, 5.0, 2.0, 1.0], "bins": [-5.9296875, -5.74334716796875, -5.5570068359375, -5.37066650390625, -5.184326171875, -4.99798583984375, -4.8116455078125, -4.62530517578125, -4.43896484375, -4.25262451171875, -4.0662841796875, -3.87994384765625, -3.693603515625, -3.50726318359375, -3.3209228515625, -3.13458251953125, -2.9482421875, -2.76190185546875, -2.5755615234375, -2.38922119140625, -2.202880859375, -2.01654052734375, -1.8302001953125, -1.64385986328125, -1.45751953125, -1.27117919921875, -1.0848388671875, -0.89849853515625, -0.712158203125, -0.52581787109375, -0.3394775390625, -0.15313720703125, 0.033203125, 0.21954345703125, 0.4058837890625, 0.59222412109375, 0.778564453125, 0.96490478515625, 1.1512451171875, 1.33758544921875, 1.52392578125, 1.71026611328125, 1.8966064453125, 2.08294677734375, 2.269287109375, 2.45562744140625, 2.6419677734375, 2.82830810546875, 3.0146484375, 3.20098876953125, 3.3873291015625, 3.57366943359375, 3.760009765625, 3.94635009765625, 4.1326904296875, 4.31903076171875, 4.50537109375, 4.69171142578125, 4.8780517578125, 5.06439208984375, 5.250732421875, 5.43707275390625, 5.6234130859375, 5.80975341796875, 5.99609375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 3.0, 8.0, 6.0, 5.0, 9.0, 5.0, 7.0, 9.0, 15.0, 10.0, 13.0, 26.0, 21.0, 27.0, 33.0, 43.0, 32.0, 34.0, 36.0, 34.0, 46.0, 104.0, 566.0, 435.0, 75.0, 40.0, 34.0, 42.0, 38.0, 34.0, 26.0, 30.0, 24.0, 25.0, 17.0, 17.0, 11.0, 16.0, 18.0, 10.0, 8.0, 10.0, 7.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.796875, -13.3358154296875, -12.874755859375, -12.4136962890625, -11.95263671875, -11.4915771484375, -11.030517578125, -10.5694580078125, -10.1083984375, -9.6473388671875, -9.186279296875, -8.7252197265625, -8.26416015625, -7.8031005859375, -7.342041015625, -6.8809814453125, -6.419921875, -5.9588623046875, -5.497802734375, -5.0367431640625, -4.57568359375, -4.1146240234375, -3.653564453125, -3.1925048828125, -2.7314453125, -2.2703857421875, -1.809326171875, -1.3482666015625, -0.88720703125, -0.4261474609375, 0.034912109375, 0.4959716796875, 0.95703125, 1.4180908203125, 1.879150390625, 2.3402099609375, 2.80126953125, 3.2623291015625, 3.723388671875, 4.1844482421875, 4.6455078125, 5.1065673828125, 5.567626953125, 6.0286865234375, 6.48974609375, 6.9508056640625, 7.411865234375, 7.8729248046875, 8.333984375, 8.7950439453125, 9.256103515625, 9.7171630859375, 10.17822265625, 10.6392822265625, 11.100341796875, 11.5614013671875, 12.0224609375, 12.4835205078125, 12.944580078125, 13.4056396484375, 13.86669921875, 14.3277587890625, 14.788818359375, 15.2498779296875, 15.7109375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [5.0, 3.0, 1.0, 6.0, 9.0, 18.0, 10.0, 4.0, 8.0, 15.0, 16.0, 23.0, 39.0, 60.0, 65.0, 85.0, 132.0, 151.0, 227.0, 283.0, 359.0, 529.0, 801.0, 1235.0, 1754.0, 2907.0, 5534.0, 11208.0, 29192.0, 105828.0, 5916921.0, 148591.0, 36150.0, 13464.0, 6155.0, 3342.0, 1956.0, 1292.0, 823.0, 619.0, 424.0, 299.0, 174.0, 167.0, 135.0, 111.0, 101.0, 61.0, 45.0, 25.0, 20.0, 19.0, 12.0, 5.0, 5.0, 7.0, 6.0, 11.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-25.328125, -24.500244140625, -23.67236328125, -22.844482421875, -22.0166015625, -21.188720703125, -20.36083984375, -19.532958984375, -18.705078125, -17.877197265625, -17.04931640625, -16.221435546875, -15.3935546875, -14.565673828125, -13.73779296875, -12.909912109375, -12.08203125, -11.254150390625, -10.42626953125, -9.598388671875, -8.7705078125, -7.942626953125, -7.11474609375, -6.286865234375, -5.458984375, -4.631103515625, -3.80322265625, -2.975341796875, -2.1474609375, -1.319580078125, -0.49169921875, 0.336181640625, 1.1640625, 1.991943359375, 2.81982421875, 3.647705078125, 4.4755859375, 5.303466796875, 6.13134765625, 6.959228515625, 7.787109375, 8.614990234375, 9.44287109375, 10.270751953125, 11.0986328125, 11.926513671875, 12.75439453125, 13.582275390625, 14.41015625, 15.238037109375, 16.06591796875, 16.893798828125, 17.7216796875, 18.549560546875, 19.37744140625, 20.205322265625, 21.033203125, 21.861083984375, 22.68896484375, 23.516845703125, 24.3447265625, 25.172607421875, 26.00048828125, 26.828369140625, 27.65625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 7.0, 1.0, 4.0, 1.0, 4.0, 12.0, 6.0, 10.0, 13.0, 21.0, 18.0, 26.0, 15.0, 24.0, 23.0, 35.0, 32.0, 27.0, 37.0, 44.0, 61.0, 114.0, 376.0, 535.0, 137.0, 74.0, 50.0, 25.0, 59.0, 30.0, 28.0, 31.0, 15.0, 16.0, 19.0, 20.0, 16.0, 13.0, 14.0, 7.0, 9.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.0546875, -10.6875, -10.3203125, -9.953125, -9.5859375, -9.21875, -8.8515625, -8.484375, -8.1171875, -7.75, -7.3828125, -7.015625, -6.6484375, -6.28125, -5.9140625, -5.546875, -5.1796875, -4.8125, -4.4453125, -4.078125, -3.7109375, -3.34375, -2.9765625, -2.609375, -2.2421875, -1.875, -1.5078125, -1.140625, -0.7734375, -0.40625, -0.0390625, 0.328125, 0.6953125, 1.0625, 1.4296875, 1.796875, 2.1640625, 2.53125, 2.8984375, 3.265625, 3.6328125, 4.0, 4.3671875, 4.734375, 5.1015625, 5.46875, 5.8359375, 6.203125, 6.5703125, 6.9375, 7.3046875, 7.671875, 8.0390625, 8.40625, 8.7734375, 9.140625, 9.5078125, 9.875, 10.2421875, 10.609375, 10.9765625, 11.34375, 11.7109375, 12.078125, 12.4453125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 5.0, 14.0, 28.0, 49.0, 128.0, 282.0, 276.0, 116.0, 59.0, 22.0, 14.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.411460876464844, -47.76238250732422, -46.113304138183594, -44.4642219543457, -42.81514358520508, -41.16606521606445, -39.51698303222656, -37.86790466308594, -36.21882629394531, -34.56974792480469, -32.92066955566406, -31.271587371826172, -29.622509002685547, -27.973430633544922, -26.324350357055664, -24.675270080566406, -23.02619171142578, -21.377113342285156, -19.7280330657959, -18.07895278930664, -16.429874420166016, -14.780795097351074, -13.131715774536133, -11.482636451721191, -9.83355712890625, -8.184477806091309, -6.535398483276367, -4.886319160461426, -3.2372398376464844, -1.588160514831543, 0.06091880798339844, 1.7099981307983398, 3.3590736389160156, 5.008152961730957, 6.657232284545898, 8.30631160736084, 9.955390930175781, 11.604470252990723, 13.253549575805664, 14.902628898620605, 16.551708221435547, 18.200786590576172, 19.84986686706543, 21.498947143554688, 23.148025512695312, 24.797103881835938, 26.446184158325195, 28.095264434814453, 29.744342803955078, 31.393421173095703, 33.042503356933594, 34.69158172607422, 36.340660095214844, 37.98973846435547, 39.638816833496094, 41.287899017333984, 42.93697738647461, 44.586055755615234, 46.235137939453125, 47.88421630859375, 49.533294677734375, 51.182373046875, 52.831451416015625, 54.480533599853516, 56.12961196899414]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 12.0, 16.0, 32.0, 30.0, 42.0, 63.0, 54.0, 62.0, 69.0, 74.0, 84.0, 77.0, 82.0, 66.0, 61.0, 38.0, 44.0, 38.0, 18.0, 15.0, 13.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.989278793334961, -14.990968704223633, -13.992659568786621, -12.99435043334961, -11.996040344238281, -10.997730255126953, -9.999421119689941, -9.00111198425293, -8.002801895141602, -7.004492282867432, -6.006182670593262, -5.007873058319092, -4.009563446044922, -3.011253833770752, -2.012944221496582, -1.014634609222412, -0.016324996948242188, 0.9819846153259277, 1.9802942276000977, 2.9786038398742676, 3.9769134521484375, 4.975223064422607, 5.973532676696777, 6.971842288970947, 7.970151901245117, 8.968461990356445, 9.966771125793457, 10.965080261230469, 11.963390350341797, 12.961700439453125, 13.960009574890137, 14.958318710327148, 15.956626892089844, 16.954936981201172, 17.9532470703125, 18.951555252075195, 19.949865341186523, 20.94817543029785, 21.946483612060547, 22.944793701171875, 23.943103790283203, 24.94141387939453, 25.93972396850586, 26.938032150268555, 27.936342239379883, 28.93465232849121, 29.932960510253906, 30.931270599365234, 31.929580688476562, 32.92789077758789, 33.92620086669922, 34.92451095581055, 35.922821044921875, 36.92112731933594, 37.919437408447266, 38.917747497558594, 39.91605758666992, 40.91436767578125, 41.91267776489258, 42.910987854003906, 43.90929412841797, 44.9076042175293, 45.905914306640625, 46.90422439575195, 47.90253448486328]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 5.0, 6.0, 5.0, 10.0, 27.0, 56.0, 61.0, 127.0, 200.0, 355.0, 664.0, 1288.0, 2536.0, 5388.0, 11918.0, 32329.0, 155470.0, 3870715.0, 71432.0, 22558.0, 9364.0, 4290.0, 2155.0, 1161.0, 683.0, 403.0, 265.0, 192.0, 132.0, 88.0, 61.0, 63.0, 40.0, 37.0, 32.0, 22.0, 17.0, 16.0, 16.0, 15.0, 20.0, 16.0, 8.0, 6.0, 8.0, 4.0, 4.0, 4.0, 2.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.49560546875, -0.47118377685546875, -0.4467620849609375, -0.42234039306640625, -0.397918701171875, -0.37349700927734375, -0.3490753173828125, -0.32465362548828125, -0.30023193359375, -0.27581024169921875, -0.2513885498046875, -0.22696685791015625, -0.202545166015625, -0.17812347412109375, -0.1537017822265625, -0.12928009033203125, -0.1048583984375, -0.08043670654296875, -0.0560150146484375, -0.03159332275390625, -0.007171630859375, 0.01725006103515625, 0.0416717529296875, 0.06609344482421875, 0.09051513671875, 0.11493682861328125, 0.1393585205078125, 0.16378021240234375, 0.188201904296875, 0.21262359619140625, 0.2370452880859375, 0.26146697998046875, 0.285888671875, 0.31031036376953125, 0.3347320556640625, 0.35915374755859375, 0.383575439453125, 0.40799713134765625, 0.4324188232421875, 0.45684051513671875, 0.48126220703125, 0.5056838989257812, 0.5301055908203125, 0.5545272827148438, 0.578948974609375, 0.6033706665039062, 0.6277923583984375, 0.6522140502929688, 0.6766357421875, 0.7010574340820312, 0.7254791259765625, 0.7499008178710938, 0.774322509765625, 0.7987442016601562, 0.8231658935546875, 0.8475875854492188, 0.87200927734375, 0.8964309692382812, 0.9208526611328125, 0.9452743530273438, 0.969696044921875, 0.9941177368164062, 1.0185394287109375, 1.0429611206054688, 1.0673828125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 11.0, 8.0, 11.0, 9.0, 25.0, 58.0, 734.0, 58.0, 18.0, 13.0, 11.0, 18.0, 4.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057952880859375, -0.05446672439575195, -0.050980567932128906, -0.04749441146850586, -0.04400825500488281, -0.040522098541259766, -0.03703594207763672, -0.03354978561401367, -0.030063629150390625, -0.026577472686767578, -0.02309131622314453, -0.019605159759521484, -0.016119003295898438, -0.01263284683227539, -0.009146690368652344, -0.005660533905029297, -0.00217437744140625, 0.0013117790222167969, 0.004797935485839844, 0.00828409194946289, 0.011770248413085938, 0.015256404876708984, 0.01874256134033203, 0.022228717803955078, 0.025714874267578125, 0.029201030731201172, 0.03268718719482422, 0.036173343658447266, 0.03965950012207031, 0.04314565658569336, 0.046631813049316406, 0.05011796951293945, 0.0536041259765625, 0.05709028244018555, 0.060576438903808594, 0.06406259536743164, 0.06754875183105469, 0.07103490829467773, 0.07452106475830078, 0.07800722122192383, 0.08149337768554688, 0.08497953414916992, 0.08846569061279297, 0.09195184707641602, 0.09543800354003906, 0.09892416000366211, 0.10241031646728516, 0.1058964729309082, 0.10938262939453125, 0.1128687858581543, 0.11635494232177734, 0.11984109878540039, 0.12332725524902344, 0.12681341171264648, 0.13029956817626953, 0.13378572463989258, 0.13727188110351562, 0.14075803756713867, 0.14424419403076172, 0.14773035049438477, 0.1512165069580078, 0.15470266342163086, 0.1581888198852539, 0.16167497634887695, 0.1651611328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 9.0, 6.0, 12.0, 21.0, 40.0, 42.0, 98.0, 146.0, 254.0, 537.0, 1106.0, 2629.0, 7229.0, 24145.0, 112387.0, 955797.0, 2842386.0, 198382.0, 34972.0, 8856.0, 2894.0, 1166.0, 504.0, 278.0, 143.0, 75.0, 46.0, 40.0, 33.0, 8.0, 11.0, 8.0, 3.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6806640625, -0.6588211059570312, -0.6369781494140625, -0.6151351928710938, -0.593292236328125, -0.5714492797851562, -0.5496063232421875, -0.5277633666992188, -0.50592041015625, -0.48407745361328125, -0.4622344970703125, -0.44039154052734375, -0.418548583984375, -0.39670562744140625, -0.3748626708984375, -0.35301971435546875, -0.3311767578125, -0.30933380126953125, -0.2874908447265625, -0.26564788818359375, -0.243804931640625, -0.22196197509765625, -0.2001190185546875, -0.17827606201171875, -0.15643310546875, -0.13459014892578125, -0.1127471923828125, -0.09090423583984375, -0.069061279296875, -0.04721832275390625, -0.0253753662109375, -0.00353240966796875, 0.018310546875, 0.04015350341796875, 0.0619964599609375, 0.08383941650390625, 0.105682373046875, 0.12752532958984375, 0.1493682861328125, 0.17121124267578125, 0.19305419921875, 0.21489715576171875, 0.2367401123046875, 0.25858306884765625, 0.280426025390625, 0.30226898193359375, 0.3241119384765625, 0.34595489501953125, 0.3677978515625, 0.38964080810546875, 0.4114837646484375, 0.43332672119140625, 0.455169677734375, 0.47701263427734375, 0.4988555908203125, 0.5206985473632812, 0.54254150390625, 0.5643844604492188, 0.5862274169921875, 0.6080703735351562, 0.629913330078125, 0.6517562866210938, 0.6735992431640625, 0.6954421997070312, 0.71728515625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 3.0, 7.0, 16.0, 11.0, 21.0, 31.0, 29.0, 44.0, 54.0, 71.0, 85.0, 112.0, 142.0, 206.0, 251.0, 391.0, 1004.0, 512.0, 313.0, 207.0, 125.0, 129.0, 82.0, 56.0, 51.0, 33.0, 23.0, 17.0, 13.0, 9.0, 3.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.192626953125, -0.1878833770751953, -0.18313980102539062, -0.17839622497558594, -0.17365264892578125, -0.16890907287597656, -0.16416549682617188, -0.1594219207763672, -0.1546783447265625, -0.1499347686767578, -0.14519119262695312, -0.14044761657714844, -0.13570404052734375, -0.13096046447753906, -0.12621688842773438, -0.12147331237792969, -0.116729736328125, -0.11198616027832031, -0.10724258422851562, -0.10249900817871094, -0.09775543212890625, -0.09301185607910156, -0.08826828002929688, -0.08352470397949219, -0.0787811279296875, -0.07403755187988281, -0.06929397583007812, -0.06455039978027344, -0.05980682373046875, -0.05506324768066406, -0.050319671630859375, -0.04557609558105469, -0.04083251953125, -0.03608894348144531, -0.031345367431640625, -0.026601791381835938, -0.02185821533203125, -0.017114639282226562, -0.012371063232421875, -0.0076274871826171875, -0.0028839111328125, 0.0018596649169921875, 0.006603240966796875, 0.011346817016601562, 0.01609039306640625, 0.020833969116210938, 0.025577545166015625, 0.030321121215820312, 0.035064697265625, 0.03980827331542969, 0.044551849365234375, 0.04929542541503906, 0.05403900146484375, 0.05878257751464844, 0.06352615356445312, 0.06826972961425781, 0.0730133056640625, 0.07775688171386719, 0.08250045776367188, 0.08724403381347656, 0.09198760986328125, 0.09673118591308594, 0.10147476196289062, 0.10621833801269531, 0.1109619140625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 11.0, 13.0, 24.0, 38.0, 67.0, 97.0, 200.0, 243.0, 156.0, 68.0, 45.0, 17.0, 8.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.7365546226501465, -3.6595194339752197, -3.582484006881714, -3.505448818206787, -3.4284133911132812, -3.3513782024383545, -3.2743427753448486, -3.197307586669922, -3.120272159576416, -3.0432369709014893, -2.9662015438079834, -2.8891663551330566, -2.812130928039551, -2.735095739364624, -2.658060312271118, -2.5810251235961914, -2.5039896965026855, -2.426954507827759, -2.349919080734253, -2.272883892059326, -2.1958484649658203, -2.1188132762908936, -2.0417778491973877, -1.964742660522461, -1.8877074718475342, -1.8106721639633179, -1.7336368560791016, -1.6566015481948853, -1.579566240310669, -1.5025309324264526, -1.4254956245422363, -1.3484604358673096, -1.2714248895645142, -1.1943895816802979, -1.1173542737960815, -1.0403189659118652, -0.9632836580276489, -0.8862483501434326, -0.8092131018638611, -0.7321777939796448, -0.6551424860954285, -0.5781071782112122, -0.5010718703269958, -0.42403659224510193, -0.3470012843608856, -0.2699659764766693, -0.1929306983947754, -0.11589539051055908, -0.03886008262634277, 0.03817521780729294, 0.11521051824092865, 0.19224581122398376, 0.2692811191082001, 0.3463164269924164, 0.4233517050743103, 0.5003870129585266, 0.5774223208427429, 0.6544576287269592, 0.7314929366111755, 0.8085281848907471, 0.8855634927749634, 0.9625988006591797, 1.039634108543396, 1.1166694164276123, 1.1937047243118286]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 13.0, 9.0, 14.0, 19.0, 39.0, 43.0, 55.0, 51.0, 71.0, 85.0, 88.0, 69.0, 80.0, 80.0, 72.0, 47.0, 45.0, 34.0, 22.0, 22.0, 14.0, 8.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8079376220703125, -1.7587577104568481, -1.7095777988433838, -1.660398006439209, -1.6112180948257446, -1.5620381832122803, -1.512858271598816, -1.4636783599853516, -1.4144984483718872, -1.3653185367584229, -1.3161386251449585, -1.2669587135314941, -1.2177789211273193, -1.168599009513855, -1.1194190979003906, -1.0702391862869263, -1.021059274673462, -0.9718793630599976, -0.922699511051178, -0.8735195994377136, -0.8243396878242493, -0.7751598358154297, -0.7259799242019653, -0.676800012588501, -0.6276202201843262, -0.5784403085708618, -0.5292604565620422, -0.4800805449485779, -0.4309006333351135, -0.38172075152397156, -0.3325408697128296, -0.28336095809936523, -0.23418104648590088, -0.18500114977359772, -0.13582125306129456, -0.08664137125015259, -0.037461474537849426, 0.011718422174453735, 0.0608983039855957, 0.11007821559906006, 0.15925809741020203, 0.2084379941225052, 0.25761789083480835, 0.3067977726459503, 0.3559776544570923, 0.40515756607055664, 0.4543374478816986, 0.5035173892974854, 0.5526972413063049, 0.6018771529197693, 0.6510570049285889, 0.7002369165420532, 0.7494168281555176, 0.7985967397689819, 0.8477765917778015, 0.8969565033912659, 0.9461363554000854, 0.9953162670135498, 1.0444961786270142, 1.0936760902404785, 1.1428558826446533, 1.1920357942581177, 1.241215705871582, 1.2903956174850464, 1.3395755290985107]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 17.0, 12.0, 31.0, 46.0, 85.0, 96.0, 173.0, 249.0, 417.0, 755.0, 1289.0, 2641.0, 5777.0, 15019.0, 62720.0, 697735.0, 216842.0, 27186.0, 9322.0, 3790.0, 1845.0, 998.0, 592.0, 332.0, 202.0, 115.0, 71.0, 64.0, 29.0, 26.0, 20.0, 11.0, 16.0, 7.0, 6.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.465576171875, -0.4504356384277344, -0.43529510498046875, -0.4201545715332031, -0.4050140380859375, -0.3898735046386719, -0.37473297119140625, -0.3595924377441406, -0.344451904296875, -0.3293113708496094, -0.31417083740234375, -0.2990303039550781, -0.2838897705078125, -0.2687492370605469, -0.25360870361328125, -0.23846817016601562, -0.22332763671875, -0.20818710327148438, -0.19304656982421875, -0.17790603637695312, -0.1627655029296875, -0.14762496948242188, -0.13248443603515625, -0.11734390258789062, -0.102203369140625, -0.08706283569335938, -0.07192230224609375, -0.056781768798828125, -0.0416412353515625, -0.026500701904296875, -0.01136016845703125, 0.003780364990234375, 0.0189208984375, 0.034061431884765625, 0.04920196533203125, 0.06434249877929688, 0.0794830322265625, 0.09462356567382812, 0.10976409912109375, 0.12490463256835938, 0.140045166015625, 0.15518569946289062, 0.17032623291015625, 0.18546676635742188, 0.2006072998046875, 0.21574783325195312, 0.23088836669921875, 0.24602890014648438, 0.26116943359375, 0.2763099670410156, 0.29145050048828125, 0.3065910339355469, 0.3217315673828125, 0.3368721008300781, 0.35201263427734375, 0.3671531677246094, 0.382293701171875, 0.3974342346191406, 0.41257476806640625, 0.4277153015136719, 0.4428558349609375, 0.4579963684082031, 0.47313690185546875, 0.4882774353027344, 0.50341796875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 6.0, 7.0, 10.0, 18.0, 30.0, 51.0, 90.0, 142.0, 189.0, 151.0, 124.0, 67.0, 23.0, 20.0, 8.0, 7.0, 7.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06683349609375, -0.06450939178466797, -0.06218528747558594, -0.059861183166503906, -0.057537078857421875, -0.055212974548339844, -0.05288887023925781, -0.05056476593017578, -0.04824066162109375, -0.04591655731201172, -0.04359245300292969, -0.041268348693847656, -0.038944244384765625, -0.036620140075683594, -0.03429603576660156, -0.03197193145751953, -0.0296478271484375, -0.02732372283935547, -0.024999618530273438, -0.022675514221191406, -0.020351409912109375, -0.018027305603027344, -0.015703201293945312, -0.013379096984863281, -0.01105499267578125, -0.008730888366699219, -0.0064067840576171875, -0.004082679748535156, -0.001758575439453125, 0.0005655288696289062, 0.0028896331787109375, 0.005213737487792969, 0.007537841796875, 0.009861946105957031, 0.012186050415039062, 0.014510154724121094, 0.016834259033203125, 0.019158363342285156, 0.021482467651367188, 0.02380657196044922, 0.02613067626953125, 0.02845478057861328, 0.030778884887695312, 0.033102989196777344, 0.035427093505859375, 0.037751197814941406, 0.04007530212402344, 0.04239940643310547, 0.0447235107421875, 0.04704761505126953, 0.04937171936035156, 0.051695823669433594, 0.054019927978515625, 0.056344032287597656, 0.05866813659667969, 0.06099224090576172, 0.06331634521484375, 0.06564044952392578, 0.06796455383300781, 0.07028865814208984, 0.07261276245117188, 0.0749368667602539, 0.07726097106933594, 0.07958507537841797, 0.0819091796875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 3.0, 2.0, 6.0, 8.0, 10.0, 12.0, 11.0, 14.0, 25.0, 50.0, 64.0, 122.0, 220.0, 434.0, 1114.0, 2859.0, 9667.0, 44090.0, 286709.0, 590497.0, 88277.0, 16940.0, 4609.0, 1519.0, 619.0, 278.0, 143.0, 84.0, 57.0, 21.0, 24.0, 21.0, 11.0, 11.0, 3.0, 8.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.80126953125, -0.7763824462890625, -0.751495361328125, -0.7266082763671875, -0.70172119140625, -0.6768341064453125, -0.651947021484375, -0.6270599365234375, -0.6021728515625, -0.5772857666015625, -0.552398681640625, -0.5275115966796875, -0.50262451171875, -0.4777374267578125, -0.452850341796875, -0.4279632568359375, -0.403076171875, -0.3781890869140625, -0.353302001953125, -0.3284149169921875, -0.30352783203125, -0.2786407470703125, -0.253753662109375, -0.2288665771484375, -0.2039794921875, -0.1790924072265625, -0.154205322265625, -0.1293182373046875, -0.10443115234375, -0.0795440673828125, -0.054656982421875, -0.0297698974609375, -0.0048828125, 0.0200042724609375, 0.044891357421875, 0.0697784423828125, 0.09466552734375, 0.1195526123046875, 0.144439697265625, 0.1693267822265625, 0.1942138671875, 0.2191009521484375, 0.243988037109375, 0.2688751220703125, 0.29376220703125, 0.3186492919921875, 0.343536376953125, 0.3684234619140625, 0.393310546875, 0.4181976318359375, 0.443084716796875, 0.4679718017578125, 0.49285888671875, 0.5177459716796875, 0.542633056640625, 0.5675201416015625, 0.5924072265625, 0.6172943115234375, 0.642181396484375, 0.6670684814453125, 0.69195556640625, 0.7168426513671875, 0.741729736328125, 0.7666168212890625, 0.79150390625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 5.0, 8.0, 9.0, 12.0, 9.0, 18.0, 33.0, 22.0, 20.0, 37.0, 36.0, 31.0, 37.0, 23.0, 39.0, 40.0, 57.0, 42.0, 53.0, 51.0, 39.0, 38.0, 42.0, 35.0, 33.0, 29.0, 30.0, 20.0, 17.0, 25.0, 28.0, 15.0, 19.0, 8.0, 7.0, 8.0, 3.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.366455078125, -0.355438232421875, -0.34442138671875, -0.333404541015625, -0.3223876953125, -0.311370849609375, -0.30035400390625, -0.289337158203125, -0.2783203125, -0.267303466796875, -0.25628662109375, -0.245269775390625, -0.2342529296875, -0.223236083984375, -0.21221923828125, -0.201202392578125, -0.190185546875, -0.179168701171875, -0.16815185546875, -0.157135009765625, -0.1461181640625, -0.135101318359375, -0.12408447265625, -0.113067626953125, -0.10205078125, -0.091033935546875, -0.08001708984375, -0.069000244140625, -0.0579833984375, -0.046966552734375, -0.03594970703125, -0.024932861328125, -0.013916015625, -0.002899169921875, 0.00811767578125, 0.019134521484375, 0.0301513671875, 0.041168212890625, 0.05218505859375, 0.063201904296875, 0.07421875, 0.085235595703125, 0.09625244140625, 0.107269287109375, 0.1182861328125, 0.129302978515625, 0.14031982421875, 0.151336669921875, 0.162353515625, 0.173370361328125, 0.18438720703125, 0.195404052734375, 0.2064208984375, 0.217437744140625, 0.22845458984375, 0.239471435546875, 0.25048828125, 0.261505126953125, 0.27252197265625, 0.283538818359375, 0.2945556640625, 0.305572509765625, 0.31658935546875, 0.327606201171875, 0.338623046875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 3.0, 1.0, 4.0, 9.0, 20.0, 8.0, 19.0, 53.0, 71.0, 130.0, 204.0, 431.0, 1088.0, 3206.0, 18601.0, 851552.0, 161070.0, 8530.0, 2012.0, 768.0, 329.0, 166.0, 102.0, 48.0, 44.0, 25.0, 19.0, 12.0, 8.0, 5.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8984375, -0.8622283935546875, -0.826019287109375, -0.7898101806640625, -0.75360107421875, -0.7173919677734375, -0.681182861328125, -0.6449737548828125, -0.6087646484375, -0.5725555419921875, -0.536346435546875, -0.5001373291015625, -0.46392822265625, -0.4277191162109375, -0.391510009765625, -0.3553009033203125, -0.319091796875, -0.2828826904296875, -0.246673583984375, -0.2104644775390625, -0.17425537109375, -0.1380462646484375, -0.101837158203125, -0.0656280517578125, -0.0294189453125, 0.0067901611328125, 0.042999267578125, 0.0792083740234375, 0.11541748046875, 0.1516265869140625, 0.187835693359375, 0.2240447998046875, 0.26025390625, 0.2964630126953125, 0.332672119140625, 0.3688812255859375, 0.40509033203125, 0.4412994384765625, 0.477508544921875, 0.5137176513671875, 0.5499267578125, 0.5861358642578125, 0.622344970703125, 0.6585540771484375, 0.69476318359375, 0.7309722900390625, 0.767181396484375, 0.8033905029296875, 0.839599609375, 0.8758087158203125, 0.912017822265625, 0.9482269287109375, 0.98443603515625, 1.0206451416015625, 1.056854248046875, 1.0930633544921875, 1.1292724609375, 1.1654815673828125, 1.201690673828125, 1.2378997802734375, 1.27410888671875, 1.3103179931640625, 1.346527099609375, 1.3827362060546875, 1.4189453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 7.0, 3.0, 10.0, 16.0, 32.0, 25.0, 73.0, 108.0, 152.0, 168.0, 134.0, 84.0, 60.0, 42.0, 30.0, 12.0, 10.0, 9.0, 6.0, 7.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.737211227416992e-05, -3.600679337978363e-05, -3.464147448539734e-05, -3.327615559101105e-05, -3.1910836696624756e-05, -3.0545517802238464e-05, -2.9180198907852173e-05, -2.781488001346588e-05, -2.644956111907959e-05, -2.50842422246933e-05, -2.3718923330307007e-05, -2.2353604435920715e-05, -2.0988285541534424e-05, -1.9622966647148132e-05, -1.825764775276184e-05, -1.689232885837555e-05, -1.5527009963989258e-05, -1.4161691069602966e-05, -1.2796372175216675e-05, -1.1431053280830383e-05, -1.0065734386444092e-05, -8.7004154920578e-06, -7.335096597671509e-06, -5.969777703285217e-06, -4.604458808898926e-06, -3.2391399145126343e-06, -1.8738210201263428e-06, -5.085021257400513e-07, 8.568167686462402e-07, 2.2221356630325317e-06, 3.5874545574188232e-06, 4.952773451805115e-06, 6.318092346191406e-06, 7.683411240577698e-06, 9.04873013496399e-06, 1.041404902935028e-05, 1.1779367923736572e-05, 1.3144686818122864e-05, 1.4510005712509155e-05, 1.5875324606895447e-05, 1.7240643501281738e-05, 1.860596239566803e-05, 1.997128129005432e-05, 2.1336600184440613e-05, 2.2701919078826904e-05, 2.4067237973213196e-05, 2.5432556867599487e-05, 2.679787576198578e-05, 2.816319465637207e-05, 2.9528513550758362e-05, 3.089383244514465e-05, 3.2259151339530945e-05, 3.3624470233917236e-05, 3.498978912830353e-05, 3.635510802268982e-05, 3.772042691707611e-05, 3.90857458114624e-05, 4.0451064705848694e-05, 4.1816383600234985e-05, 4.318170249462128e-05, 4.454702138900757e-05, 4.591234028339386e-05, 4.727765917778015e-05, 4.864297807216644e-05, 5.0008296966552734e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 9.0, 13.0, 12.0, 32.0, 30.0, 38.0, 61.0, 96.0, 130.0, 196.0, 310.0, 552.0, 909.0, 1662.0, 3390.0, 7313.0, 19101.0, 62990.0, 325968.0, 491881.0, 90813.0, 24829.0, 9343.0, 4073.0, 2024.0, 1098.0, 584.0, 381.0, 219.0, 147.0, 108.0, 65.0, 45.0, 23.0, 30.0, 22.0, 7.0, 5.0, 10.0, 8.0, 5.0, 2.0, 0.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.376953125, -0.3652191162109375, -0.353485107421875, -0.3417510986328125, -0.33001708984375, -0.3182830810546875, -0.306549072265625, -0.2948150634765625, -0.2830810546875, -0.2713470458984375, -0.259613037109375, -0.2478790283203125, -0.23614501953125, -0.2244110107421875, -0.212677001953125, -0.2009429931640625, -0.189208984375, -0.1774749755859375, -0.165740966796875, -0.1540069580078125, -0.14227294921875, -0.1305389404296875, -0.118804931640625, -0.1070709228515625, -0.0953369140625, -0.0836029052734375, -0.071868896484375, -0.0601348876953125, -0.04840087890625, -0.0366668701171875, -0.024932861328125, -0.0131988525390625, -0.00146484375, 0.0102691650390625, 0.022003173828125, 0.0337371826171875, 0.04547119140625, 0.0572052001953125, 0.068939208984375, 0.0806732177734375, 0.0924072265625, 0.1041412353515625, 0.115875244140625, 0.1276092529296875, 0.13934326171875, 0.1510772705078125, 0.162811279296875, 0.1745452880859375, 0.186279296875, 0.1980133056640625, 0.209747314453125, 0.2214813232421875, 0.23321533203125, 0.2449493408203125, 0.256683349609375, 0.2684173583984375, 0.2801513671875, 0.2918853759765625, 0.303619384765625, 0.3153533935546875, 0.32708740234375, 0.3388214111328125, 0.350555419921875, 0.3622894287109375, 0.3740234375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 11.0, 6.0, 15.0, 12.0, 12.0, 23.0, 18.0, 28.0, 51.0, 55.0, 46.0, 54.0, 74.0, 77.0, 69.0, 77.0, 60.0, 66.0, 49.0, 38.0, 32.0, 24.0, 21.0, 14.0, 12.0, 7.0, 4.0, 5.0, 6.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.28271484375, -0.2748699188232422, -0.2670249938964844, -0.25918006896972656, -0.25133514404296875, -0.24349021911621094, -0.23564529418945312, -0.2278003692626953, -0.2199554443359375, -0.2121105194091797, -0.20426559448242188, -0.19642066955566406, -0.18857574462890625, -0.18073081970214844, -0.17288589477539062, -0.1650409698486328, -0.157196044921875, -0.1493511199951172, -0.14150619506835938, -0.13366127014160156, -0.12581634521484375, -0.11797142028808594, -0.11012649536132812, -0.10228157043457031, -0.0944366455078125, -0.08659172058105469, -0.07874679565429688, -0.07090187072753906, -0.06305694580078125, -0.05521202087402344, -0.047367095947265625, -0.03952217102050781, -0.03167724609375, -0.023832321166992188, -0.015987396240234375, -0.008142471313476562, -0.00029754638671875, 0.0075473785400390625, 0.015392303466796875, 0.023237228393554688, 0.0310821533203125, 0.03892707824707031, 0.046772003173828125, 0.05461692810058594, 0.06246185302734375, 0.07030677795410156, 0.07815170288085938, 0.08599662780761719, 0.093841552734375, 0.10168647766113281, 0.10953140258789062, 0.11737632751464844, 0.12522125244140625, 0.13306617736816406, 0.14091110229492188, 0.1487560272216797, 0.1566009521484375, 0.1644458770751953, 0.17229080200195312, 0.18013572692871094, 0.18798065185546875, 0.19582557678222656, 0.20367050170898438, 0.2115154266357422, 0.2193603515625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 5.0, 9.0, 20.0, 72.0, 169.0, 465.0, 187.0, 53.0, 14.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484010696411133, -8.1088228225708, -7.733633995056152, -7.35844612121582, -6.983257293701172, -6.60806941986084, -6.23288106918335, -5.857692718505859, -5.482504367828369, -5.107316017150879, -4.732127666473389, -4.356939315795898, -3.9817512035369873, -3.606562852859497, -3.231374740600586, -2.8561863899230957, -2.4809980392456055, -2.1058096885681152, -1.7306214570999146, -1.3554332256317139, -0.9802448749542236, -0.6050565242767334, -0.22986841201782227, 0.14531993865966797, 0.5205082893371582, 0.8956965804100037, 1.2708848714828491, 1.6460731029510498, 2.02126145362854, 2.3964498043060303, 2.7716379165649414, 3.1468262672424316, 3.5220136642456055, 3.8972020149230957, 4.272390365600586, 4.647578239440918, 5.022767066955566, 5.397954940795898, 5.773143291473389, 6.148331642150879, 6.523519992828369, 6.898708343505859, 7.27389669418335, 7.64908504486084, 8.024272918701172, 8.39946174621582, 8.774649620056152, 9.149837493896484, 9.525026321411133, 9.900214195251465, 10.275403022766113, 10.650590896606445, 11.025779724121094, 11.400967597961426, 11.776155471801758, 12.151344299316406, 12.526533126831055, 12.901721000671387, 13.276909828186035, 13.652097702026367, 14.027286529541016, 14.402474403381348, 14.77766227722168, 15.152851104736328, 15.52803897857666]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 0.0, 4.0, 4.0, 6.0, 11.0, 9.0, 20.0, 26.0, 33.0, 63.0, 88.0, 89.0, 109.0, 125.0, 108.0, 78.0, 63.0, 48.0, 27.0, 18.0, 10.0, 13.0, 15.0, 3.0, 2.0, 4.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.000021934509277, -5.819125175476074, -5.638228416442871, -5.45733118057251, -5.276434421539307, -5.0955376625061035, -4.9146409034729, -4.733743667602539, -4.552846908569336, -4.371950149536133, -4.19105339050293, -4.010156154632568, -3.8292593955993652, -3.648362636566162, -3.467465877532959, -3.2865688800811768, -3.1056721210479736, -2.9247753620147705, -2.7438783645629883, -2.562981605529785, -2.382084608078003, -2.2011878490448, -2.0202908515930176, -1.8393940925598145, -1.6584972143173218, -1.477600336074829, -1.2967034578323364, -1.1158065795898438, -0.9349097609519958, -0.7540128827095032, -0.5731160640716553, -0.3922191858291626, -0.21132230758666992, -0.03042544424533844, 0.15047141909599304, 0.33136826753616333, 0.512265145778656, 0.6931620240211487, 0.8740588426589966, 1.0549557209014893, 1.235852599143982, 1.4167494773864746, 1.5976463556289673, 1.77854323387146, 1.959439992904663, 2.1403369903564453, 2.3212337493896484, 2.5021305084228516, 2.683027505874634, 2.863924264907837, 3.044821262359619, 3.2257180213928223, 3.4066150188446045, 3.5875117778778076, 3.76840877532959, 3.949305534362793, 4.130202293395996, 4.311099052429199, 4.491995811462402, 4.672893047332764, 4.853789806365967, 5.03468656539917, 5.215583324432373, 5.396480560302734, 5.5773773193359375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 11.0, 19.0, 27.0, 51.0, 240.0, 2693.0, 4133989.0, 55573.0, 1230.0, 249.0, 91.0, 37.0, 25.0, 7.0, 10.0, 4.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.56640625, -4.34686279296875, -4.1273193359375, -3.90777587890625, -3.688232421875, -3.46868896484375, -3.2491455078125, -3.02960205078125, -2.81005859375, -2.59051513671875, -2.3709716796875, -2.15142822265625, -1.931884765625, -1.71234130859375, -1.4927978515625, -1.27325439453125, -1.0537109375, -0.83416748046875, -0.6146240234375, -0.39508056640625, -0.175537109375, 0.04400634765625, 0.2635498046875, 0.48309326171875, 0.70263671875, 0.92218017578125, 1.1417236328125, 1.36126708984375, 1.580810546875, 1.80035400390625, 2.0198974609375, 2.23944091796875, 2.458984375, 2.67852783203125, 2.8980712890625, 3.11761474609375, 3.337158203125, 3.55670166015625, 3.7762451171875, 3.99578857421875, 4.21533203125, 4.43487548828125, 4.6544189453125, 4.87396240234375, 5.093505859375, 5.31304931640625, 5.5325927734375, 5.75213623046875, 5.9716796875, 6.19122314453125, 6.4107666015625, 6.63031005859375, 6.849853515625, 7.06939697265625, 7.2889404296875, 7.50848388671875, 7.72802734375, 7.94757080078125, 8.1671142578125, 8.38665771484375, 8.606201171875, 8.82574462890625, 9.0452880859375, 9.26483154296875, 9.484375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 7.0, 2.0, 11.0, 14.0, 23.0, 29.0, 60.0, 93.0, 154.0, 160.0, 130.0, 123.0, 65.0, 37.0, 28.0, 17.0, 13.0, 8.0, 6.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061004638671875, -0.058324337005615234, -0.05564403533935547, -0.0529637336730957, -0.05028343200683594, -0.04760313034057617, -0.044922828674316406, -0.04224252700805664, -0.039562225341796875, -0.03688192367553711, -0.034201622009277344, -0.03152132034301758, -0.028841018676757812, -0.026160717010498047, -0.02348041534423828, -0.020800113677978516, -0.01811981201171875, -0.015439510345458984, -0.012759208679199219, -0.010078907012939453, -0.0073986053466796875, -0.004718303680419922, -0.0020380020141601562, 0.0006422996520996094, 0.003322601318359375, 0.006002902984619141, 0.008683204650878906, 0.011363506317138672, 0.014043807983398438, 0.016724109649658203, 0.01940441131591797, 0.022084712982177734, 0.0247650146484375, 0.027445316314697266, 0.03012561798095703, 0.0328059196472168, 0.03548622131347656, 0.03816652297973633, 0.040846824645996094, 0.04352712631225586, 0.046207427978515625, 0.04888772964477539, 0.051568031311035156, 0.05424833297729492, 0.05692863464355469, 0.05960893630981445, 0.06228923797607422, 0.06496953964233398, 0.06764984130859375, 0.07033014297485352, 0.07301044464111328, 0.07569074630737305, 0.07837104797363281, 0.08105134963989258, 0.08373165130615234, 0.08641195297241211, 0.08909225463867188, 0.09177255630493164, 0.0944528579711914, 0.09713315963745117, 0.09981346130371094, 0.1024937629699707, 0.10517406463623047, 0.10785436630249023, 0.11053466796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 10.0, 35.0, 53.0, 104.0, 219.0, 632.0, 1955.0, 7427.0, 45589.0, 3610800.0, 494640.0, 25924.0, 5011.0, 1326.0, 351.0, 121.0, 42.0, 18.0, 9.0, 2.0, 3.0, 0.0, 2.0], "bins": [-2.94140625, -2.8835830688476562, -2.8257598876953125, -2.7679367065429688, -2.710113525390625, -2.6522903442382812, -2.5944671630859375, -2.5366439819335938, -2.47882080078125, -2.4209976196289062, -2.3631744384765625, -2.3053512573242188, -2.247528076171875, -2.1897048950195312, -2.1318817138671875, -2.0740585327148438, -2.0162353515625, -1.9584121704101562, -1.9005889892578125, -1.8427658081054688, -1.784942626953125, -1.7271194458007812, -1.6692962646484375, -1.6114730834960938, -1.55364990234375, -1.4958267211914062, -1.4380035400390625, -1.3801803588867188, -1.322357177734375, -1.2645339965820312, -1.2067108154296875, -1.1488876342773438, -1.091064453125, -1.0332412719726562, -0.9754180908203125, -0.9175949096679688, -0.859771728515625, -0.8019485473632812, -0.7441253662109375, -0.6863021850585938, -0.62847900390625, -0.5706558227539062, -0.5128326416015625, -0.45500946044921875, -0.397186279296875, -0.33936309814453125, -0.2815399169921875, -0.22371673583984375, -0.1658935546875, -0.10807037353515625, -0.0502471923828125, 0.00757598876953125, 0.065399169921875, 0.12322235107421875, 0.1810455322265625, 0.23886871337890625, 0.29669189453125, 0.35451507568359375, 0.4123382568359375, 0.47016143798828125, 0.527984619140625, 0.5858078002929688, 0.6436309814453125, 0.7014541625976562, 0.75927734375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 3.0, 2.0, 2.0, 9.0, 6.0, 5.0, 6.0, 6.0, 21.0, 20.0, 16.0, 24.0, 60.0, 45.0, 78.0, 90.0, 224.0, 717.0, 1716.0, 397.0, 187.0, 118.0, 73.0, 56.0, 39.0, 31.0, 27.0, 18.0, 16.0, 11.0, 9.0, 5.0, 3.0, 6.0, 4.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.11376953125, -0.11025714874267578, -0.10674476623535156, -0.10323238372802734, -0.09972000122070312, -0.0962076187133789, -0.09269523620605469, -0.08918285369873047, -0.08567047119140625, -0.08215808868408203, -0.07864570617675781, -0.0751333236694336, -0.07162094116210938, -0.06810855865478516, -0.06459617614746094, -0.06108379364013672, -0.0575714111328125, -0.05405902862548828, -0.05054664611816406, -0.047034263610839844, -0.043521881103515625, -0.040009498596191406, -0.03649711608886719, -0.03298473358154297, -0.02947235107421875, -0.02595996856689453, -0.022447586059570312, -0.018935203552246094, -0.015422821044921875, -0.011910438537597656, -0.008398056030273438, -0.004885673522949219, -0.001373291015625, 0.0021390914916992188, 0.0056514739990234375, 0.009163856506347656, 0.012676239013671875, 0.016188621520996094, 0.019701004028320312, 0.02321338653564453, 0.02672576904296875, 0.03023815155029297, 0.03375053405761719, 0.037262916564941406, 0.040775299072265625, 0.044287681579589844, 0.04780006408691406, 0.05131244659423828, 0.0548248291015625, 0.05833721160888672, 0.06184959411621094, 0.06536197662353516, 0.06887435913085938, 0.0723867416381836, 0.07589912414550781, 0.07941150665283203, 0.08292388916015625, 0.08643627166748047, 0.08994865417480469, 0.0934610366821289, 0.09697341918945312, 0.10048580169677734, 0.10399818420410156, 0.10751056671142578, 0.11102294921875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 33.0, 630.0, 317.0, 16.0, 10.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.746166229248047, -13.481243133544922, -13.216320991516113, -12.951397895812988, -12.686474800109863, -12.421552658081055, -12.15662956237793, -11.891706466674805, -11.62678337097168, -11.361860275268555, -11.096938133239746, -10.832015037536621, -10.567091941833496, -10.302169799804688, -10.037246704101562, -9.772323608398438, -9.507401466369629, -9.242478370666504, -8.977556228637695, -8.71263313293457, -8.447710037231445, -8.18278694152832, -7.917864799499512, -7.652941703796387, -7.38801908493042, -7.123096466064453, -6.858173370361328, -6.593250751495361, -6.3283281326293945, -6.0634050369262695, -5.798482418060303, -5.533559799194336, -5.268637657165527, -5.0037150382995605, -4.7387919425964355, -4.473869323730469, -4.208946228027344, -3.944023609161377, -3.67910099029541, -3.4141781330108643, -3.1492552757263184, -2.8843324184417725, -2.6194095611572266, -2.3544869422912598, -2.089564085006714, -1.824641227722168, -1.5597184896469116, -1.2947957515716553, -1.0298728942871094, -0.7649500966072083, -0.5000272989273071, -0.235104501247406, 0.029818296432495117, 0.294741153717041, 0.5596638917922974, 0.8245866298675537, 1.0895094871520996, 1.3544323444366455, 1.6193550825119019, 1.8842778205871582, 2.149200677871704, 2.41412353515625, 2.679046154022217, 2.9439690113067627, 3.2088918685913086]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 6.0, 10.0, 19.0, 20.0, 35.0, 44.0, 60.0, 74.0, 97.0, 106.0, 98.0, 117.0, 85.0, 65.0, 44.0, 41.0, 29.0, 13.0, 16.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2728838920593262, -1.2391839027404785, -1.2054839134216309, -1.1717839241027832, -1.138084053993225, -1.1043840646743774, -1.0706840753555298, -1.0369840860366821, -1.0032840967178345, -0.9695841073989868, -0.9358841776847839, -0.9021841883659363, -0.8684841990470886, -0.8347842693328857, -0.8010842800140381, -0.7673842906951904, -0.7336843609809875, -0.6999843716621399, -0.666284441947937, -0.6325844526290894, -0.5988844633102417, -0.565184473991394, -0.5314845442771912, -0.4977845549583435, -0.46408459544181824, -0.43038463592529297, -0.3966846466064453, -0.36298468708992004, -0.3292847275733948, -0.2955847382545471, -0.26188477873802185, -0.2281848043203354, -0.19448482990264893, -0.16078485548496246, -0.127084881067276, -0.09338492155075073, -0.05968494713306427, -0.025984972715377808, 0.007714986801147461, 0.04141496121883392, 0.07511493563652039, 0.10881491005420685, 0.1425148844718933, 0.17621484398841858, 0.20991481840610504, 0.2436147928237915, 0.2773147523403168, 0.31101471185684204, 0.3447147011756897, 0.37841466069221497, 0.4121146500110626, 0.4458146095275879, 0.47951459884643555, 0.5132145881652832, 0.5469145178794861, 0.5806145071983337, 0.6143144369125366, 0.6480144262313843, 0.6817143559455872, 0.7154143452644348, 0.7491143345832825, 0.7828142642974854, 0.816514253616333, 0.8502142429351807, 0.8839142322540283]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 3.0, 15.0, 18.0, 25.0, 47.0, 89.0, 131.0, 287.0, 598.0, 1239.0, 2488.0, 5914.0, 16150.0, 53206.0, 248258.0, 546885.0, 123893.0, 31211.0, 10412.0, 4141.0, 1774.0, 827.0, 416.0, 228.0, 128.0, 80.0, 38.0, 20.0, 7.0, 14.0, 6.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.56005859375, -0.5421600341796875, -0.524261474609375, -0.5063629150390625, -0.48846435546875, -0.4705657958984375, -0.452667236328125, -0.4347686767578125, -0.4168701171875, -0.3989715576171875, -0.381072998046875, -0.3631744384765625, -0.34527587890625, -0.3273773193359375, -0.309478759765625, -0.2915802001953125, -0.273681640625, -0.2557830810546875, -0.237884521484375, -0.2199859619140625, -0.20208740234375, -0.1841888427734375, -0.166290283203125, -0.1483917236328125, -0.1304931640625, -0.1125946044921875, -0.094696044921875, -0.0767974853515625, -0.05889892578125, -0.0410003662109375, -0.023101806640625, -0.0052032470703125, 0.0126953125, 0.0305938720703125, 0.048492431640625, 0.0663909912109375, 0.08428955078125, 0.1021881103515625, 0.120086669921875, 0.1379852294921875, 0.1558837890625, 0.1737823486328125, 0.191680908203125, 0.2095794677734375, 0.22747802734375, 0.2453765869140625, 0.263275146484375, 0.2811737060546875, 0.299072265625, 0.3169708251953125, 0.334869384765625, 0.3527679443359375, 0.37066650390625, 0.3885650634765625, 0.406463623046875, 0.4243621826171875, 0.4422607421875, 0.4601593017578125, 0.478057861328125, 0.4959564208984375, 0.51385498046875, 0.5317535400390625, 0.549652099609375, 0.5675506591796875, 0.58544921875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 6.0, 8.0, 9.0, 14.0, 16.0, 14.0, 23.0, 35.0, 44.0, 53.0, 53.0, 61.0, 65.0, 82.0, 75.0, 65.0, 64.0, 47.0, 56.0, 39.0, 29.0, 27.0, 22.0, 15.0, 12.0, 15.0, 9.0, 6.0, 5.0, 4.0, 6.0, 1.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038665771484375, -0.03734254837036133, -0.036019325256347656, -0.034696102142333984, -0.03337287902832031, -0.03204965591430664, -0.03072643280029297, -0.029403209686279297, -0.028079986572265625, -0.026756763458251953, -0.02543354034423828, -0.02411031723022461, -0.022787094116210938, -0.021463871002197266, -0.020140647888183594, -0.018817424774169922, -0.01749420166015625, -0.016170978546142578, -0.014847755432128906, -0.013524532318115234, -0.012201309204101562, -0.01087808609008789, -0.009554862976074219, -0.008231639862060547, -0.006908416748046875, -0.005585193634033203, -0.004261970520019531, -0.0029387474060058594, -0.0016155242919921875, -0.0002923011779785156, 0.0010309219360351562, 0.002354145050048828, 0.0036773681640625, 0.005000591278076172, 0.006323814392089844, 0.007647037506103516, 0.008970260620117188, 0.01029348373413086, 0.011616706848144531, 0.012939929962158203, 0.014263153076171875, 0.015586376190185547, 0.01690959930419922, 0.01823282241821289, 0.019556045532226562, 0.020879268646240234, 0.022202491760253906, 0.023525714874267578, 0.02484893798828125, 0.026172161102294922, 0.027495384216308594, 0.028818607330322266, 0.030141830444335938, 0.03146505355834961, 0.03278827667236328, 0.03411149978637695, 0.035434722900390625, 0.0367579460144043, 0.03808116912841797, 0.03940439224243164, 0.04072761535644531, 0.042050838470458984, 0.043374061584472656, 0.04469728469848633, 0.0460205078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 4.0, 7.0, 5.0, 5.0, 3.0, 10.0, 20.0, 44.0, 173.0, 634.0, 3169.0, 19115.0, 167904.0, 692905.0, 143799.0, 16944.0, 2956.0, 586.0, 148.0, 50.0, 20.0, 9.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.93408203125, -0.909149169921875, -0.88421630859375, -0.859283447265625, -0.8343505859375, -0.809417724609375, -0.78448486328125, -0.759552001953125, -0.734619140625, -0.709686279296875, -0.68475341796875, -0.659820556640625, -0.6348876953125, -0.609954833984375, -0.58502197265625, -0.560089111328125, -0.53515625, -0.510223388671875, -0.48529052734375, -0.460357666015625, -0.4354248046875, -0.410491943359375, -0.38555908203125, -0.360626220703125, -0.335693359375, -0.310760498046875, -0.28582763671875, -0.260894775390625, -0.2359619140625, -0.211029052734375, -0.18609619140625, -0.161163330078125, -0.13623046875, -0.111297607421875, -0.08636474609375, -0.061431884765625, -0.0364990234375, -0.011566162109375, 0.01336669921875, 0.038299560546875, 0.063232421875, 0.088165283203125, 0.11309814453125, 0.138031005859375, 0.1629638671875, 0.187896728515625, 0.21282958984375, 0.237762451171875, 0.2626953125, 0.287628173828125, 0.31256103515625, 0.337493896484375, 0.3624267578125, 0.387359619140625, 0.41229248046875, 0.437225341796875, 0.462158203125, 0.487091064453125, 0.51202392578125, 0.536956787109375, 0.5618896484375, 0.586822509765625, 0.61175537109375, 0.636688232421875, 0.66162109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 3.0, 0.0, 0.0, 5.0, 6.0, 2.0, 7.0, 7.0, 12.0, 5.0, 16.0, 19.0, 25.0, 18.0, 25.0, 24.0, 35.0, 27.0, 35.0, 35.0, 28.0, 41.0, 28.0, 49.0, 42.0, 42.0, 36.0, 34.0, 43.0, 29.0, 32.0, 35.0, 34.0, 27.0, 24.0, 32.0, 29.0, 19.0, 19.0, 14.0, 11.0, 7.0, 7.0, 7.0, 6.0, 7.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 2.0], "bins": [-0.1907958984375, -0.185150146484375, -0.17950439453125, -0.173858642578125, -0.168212890625, -0.162567138671875, -0.15692138671875, -0.151275634765625, -0.1456298828125, -0.139984130859375, -0.13433837890625, -0.128692626953125, -0.123046875, -0.117401123046875, -0.11175537109375, -0.106109619140625, -0.1004638671875, -0.094818115234375, -0.08917236328125, -0.083526611328125, -0.077880859375, -0.072235107421875, -0.06658935546875, -0.060943603515625, -0.0552978515625, -0.049652099609375, -0.04400634765625, -0.038360595703125, -0.03271484375, -0.027069091796875, -0.02142333984375, -0.015777587890625, -0.0101318359375, -0.004486083984375, 0.00115966796875, 0.006805419921875, 0.012451171875, 0.018096923828125, 0.02374267578125, 0.029388427734375, 0.0350341796875, 0.040679931640625, 0.04632568359375, 0.051971435546875, 0.0576171875, 0.063262939453125, 0.06890869140625, 0.074554443359375, 0.0802001953125, 0.085845947265625, 0.09149169921875, 0.097137451171875, 0.102783203125, 0.108428955078125, 0.11407470703125, 0.119720458984375, 0.1253662109375, 0.131011962890625, 0.13665771484375, 0.142303466796875, 0.14794921875, 0.153594970703125, 0.15924072265625, 0.164886474609375, 0.1705322265625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 10.0, 11.0, 27.0, 62.0, 500.0, 70221.0, 976545.0, 979.0, 114.0, 28.0, 16.0, 6.0, 5.0, 6.0, 5.0, 1.0, 0.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.59765625, -6.43316650390625, -6.2686767578125, -6.10418701171875, -5.939697265625, -5.77520751953125, -5.6107177734375, -5.44622802734375, -5.28173828125, -5.11724853515625, -4.9527587890625, -4.78826904296875, -4.623779296875, -4.45928955078125, -4.2947998046875, -4.13031005859375, -3.9658203125, -3.80133056640625, -3.6368408203125, -3.47235107421875, -3.307861328125, -3.14337158203125, -2.9788818359375, -2.81439208984375, -2.64990234375, -2.48541259765625, -2.3209228515625, -2.15643310546875, -1.991943359375, -1.82745361328125, -1.6629638671875, -1.49847412109375, -1.333984375, -1.16949462890625, -1.0050048828125, -0.84051513671875, -0.676025390625, -0.51153564453125, -0.3470458984375, -0.18255615234375, -0.01806640625, 0.14642333984375, 0.3109130859375, 0.47540283203125, 0.639892578125, 0.80438232421875, 0.9688720703125, 1.13336181640625, 1.2978515625, 1.46234130859375, 1.6268310546875, 1.79132080078125, 1.955810546875, 2.12030029296875, 2.2847900390625, 2.44927978515625, 2.61376953125, 2.77825927734375, 2.9427490234375, 3.10723876953125, 3.271728515625, 3.43621826171875, 3.6007080078125, 3.76519775390625, 3.9296875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 9.0, 18.0, 14.0, 33.0, 40.0, 44.0, 84.0, 116.0, 93.0, 128.0, 115.0, 76.0, 50.0, 39.0, 32.0, 21.0, 20.0, 10.0, 12.0, 7.0, 4.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.060434341430664e-05, -4.916265606880188e-05, -4.772096872329712e-05, -4.627928137779236e-05, -4.48375940322876e-05, -4.339590668678284e-05, -4.1954219341278076e-05, -4.0512531995773315e-05, -3.9070844650268555e-05, -3.7629157304763794e-05, -3.618746995925903e-05, -3.474578261375427e-05, -3.330409526824951e-05, -3.186240792274475e-05, -3.042072057723999e-05, -2.897903323173523e-05, -2.753734588623047e-05, -2.6095658540725708e-05, -2.4653971195220947e-05, -2.3212283849716187e-05, -2.1770596504211426e-05, -2.0328909158706665e-05, -1.8887221813201904e-05, -1.7445534467697144e-05, -1.6003847122192383e-05, -1.4562159776687622e-05, -1.3120472431182861e-05, -1.16787850856781e-05, -1.023709774017334e-05, -8.795410394668579e-06, -7.353723049163818e-06, -5.912035703659058e-06, -4.470348358154297e-06, -3.028661012649536e-06, -1.5869736671447754e-06, -1.4528632164001465e-07, 1.296401023864746e-06, 2.738088369369507e-06, 4.179775714874268e-06, 5.621463060379028e-06, 7.063150405883789e-06, 8.50483775138855e-06, 9.94652509689331e-06, 1.1388212442398071e-05, 1.2829899787902832e-05, 1.4271587133407593e-05, 1.5713274478912354e-05, 1.7154961824417114e-05, 1.8596649169921875e-05, 2.0038336515426636e-05, 2.1480023860931396e-05, 2.2921711206436157e-05, 2.4363398551940918e-05, 2.580508589744568e-05, 2.724677324295044e-05, 2.86884605884552e-05, 3.013014793395996e-05, 3.157183527946472e-05, 3.301352262496948e-05, 3.445520997047424e-05, 3.5896897315979004e-05, 3.7338584661483765e-05, 3.8780272006988525e-05, 4.0221959352493286e-05, 4.166364669799805e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 10.0, 9.0, 13.0, 20.0, 14.0, 43.0, 60.0, 102.0, 130.0, 203.0, 339.0, 546.0, 994.0, 2032.0, 4503.0, 14337.0, 146152.0, 812651.0, 50655.0, 8930.0, 3299.0, 1557.0, 731.0, 429.0, 255.0, 156.0, 120.0, 73.0, 54.0, 34.0, 34.0, 25.0, 15.0, 11.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0078125, -0.9792861938476562, -0.9507598876953125, -0.9222335815429688, -0.893707275390625, -0.8651809692382812, -0.8366546630859375, -0.8081283569335938, -0.77960205078125, -0.7510757446289062, -0.7225494384765625, -0.6940231323242188, -0.665496826171875, -0.6369705200195312, -0.6084442138671875, -0.5799179077148438, -0.5513916015625, -0.5228652954101562, -0.4943389892578125, -0.46581268310546875, -0.437286376953125, -0.40876007080078125, -0.3802337646484375, -0.35170745849609375, -0.32318115234375, -0.29465484619140625, -0.2661285400390625, -0.23760223388671875, -0.209075927734375, -0.18054962158203125, -0.1520233154296875, -0.12349700927734375, -0.094970703125, -0.06644439697265625, -0.0379180908203125, -0.00939178466796875, 0.019134521484375, 0.04766082763671875, 0.0761871337890625, 0.10471343994140625, 0.13323974609375, 0.16176605224609375, 0.1902923583984375, 0.21881866455078125, 0.247344970703125, 0.27587127685546875, 0.3043975830078125, 0.33292388916015625, 0.3614501953125, 0.38997650146484375, 0.4185028076171875, 0.44702911376953125, 0.475555419921875, 0.5040817260742188, 0.5326080322265625, 0.5611343383789062, 0.58966064453125, 0.6181869506835938, 0.6467132568359375, 0.6752395629882812, 0.703765869140625, 0.7322921752929688, 0.7608184814453125, 0.7893447875976562, 0.81787109375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 11.0, 6.0, 28.0, 28.0, 77.0, 94.0, 136.0, 158.0, 162.0, 132.0, 77.0, 36.0, 23.0, 11.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.317626953125, -0.3042411804199219, -0.29085540771484375, -0.2774696350097656, -0.2640838623046875, -0.2506980895996094, -0.23731231689453125, -0.22392654418945312, -0.210540771484375, -0.19715499877929688, -0.18376922607421875, -0.17038345336914062, -0.1569976806640625, -0.14361190795898438, -0.13022613525390625, -0.11684036254882812, -0.10345458984375, -0.09006881713867188, -0.07668304443359375, -0.06329727172851562, -0.0499114990234375, -0.036525726318359375, -0.02313995361328125, -0.009754180908203125, 0.003631591796875, 0.017017364501953125, 0.03040313720703125, 0.043788909912109375, 0.0571746826171875, 0.07056045532226562, 0.08394622802734375, 0.09733200073242188, 0.1107177734375, 0.12410354614257812, 0.13748931884765625, 0.15087509155273438, 0.1642608642578125, 0.17764663696289062, 0.19103240966796875, 0.20441818237304688, 0.217803955078125, 0.23118972778320312, 0.24457550048828125, 0.2579612731933594, 0.2713470458984375, 0.2847328186035156, 0.29811859130859375, 0.3115043640136719, 0.32489013671875, 0.3382759094238281, 0.35166168212890625, 0.3650474548339844, 0.3784332275390625, 0.3918190002441406, 0.40520477294921875, 0.4185905456542969, 0.431976318359375, 0.4453620910644531, 0.45874786376953125, 0.4721336364746094, 0.4855194091796875, 0.4989051818847656, 0.5122909545898438, 0.5256767272949219, 0.5390625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 17.0, 33.0, 64.0, 170.0, 277.0, 217.0, 93.0, 51.0, 31.0, 12.0, 15.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.351346254348755, -3.1964821815490723, -3.0416183471679688, -2.886754274368286, -2.7318902015686035, -2.5770263671875, -2.4221622943878174, -2.2672982215881348, -2.1124343872070312, -1.9575704336166382, -1.8027064800262451, -1.6478424072265625, -1.4929784536361694, -1.3381145000457764, -1.1832504272460938, -1.0283864736557007, -0.8735225200653076, -0.7186585664749146, -0.5637945532798767, -0.40893056988716125, -0.2540665864944458, -0.09920263290405273, 0.05566138029098511, 0.21052539348602295, 0.365389347076416, 0.5202533006668091, 0.6751173138618469, 0.8299813270568848, 0.9848452806472778, 1.139709234237671, 1.2945733070373535, 1.4494372606277466, 1.6043014526367188, 1.7591654062271118, 1.9140293598175049, 2.0688934326171875, 2.223757266998291, 2.3786213397979736, 2.5334854125976562, 2.6883492469787598, 2.8432133197784424, 2.998077392578125, 3.1529412269592285, 3.307805299758911, 3.4626693725585938, 3.6175332069396973, 3.77239727973938, 3.9272613525390625, 4.082125186920166, 4.2369890213012695, 4.391853332519531, 4.546717166900635, 4.701581001281738, 4.8564453125, 5.0113091468811035, 5.166172981262207, 5.321037292480469, 5.475901126861572, 5.630765438079834, 5.7856292724609375, 5.940493106842041, 6.0953569412231445, 6.250221252441406, 6.40508508682251, 6.559948921203613]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 7.0, 11.0, 10.0, 16.0, 23.0, 24.0, 32.0, 29.0, 41.0, 54.0, 59.0, 68.0, 65.0, 77.0, 77.0, 59.0, 64.0, 58.0, 44.0, 35.0, 32.0, 21.0, 19.0, 17.0, 11.0, 12.0, 7.0, 9.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.070004463195801, -2.0014545917510986, -1.9329047203063965, -1.8643549680709839, -1.7958050966262817, -1.7272552251815796, -1.658705472946167, -1.5901556015014648, -1.5216057300567627, -1.4530558586120605, -1.3845059871673584, -1.3159562349319458, -1.2474063634872437, -1.1788564920425415, -1.110306739807129, -1.0417568683624268, -0.9732069969177246, -0.9046571254730225, -0.8361073136329651, -0.7675575017929077, -0.6990076303482056, -0.6304577589035034, -0.561907947063446, -0.4933581054210663, -0.4248082637786865, -0.35625842213630676, -0.287708580493927, -0.21915873885154724, -0.15060889720916748, -0.08205905556678772, -0.013509213924407959, 0.0550406277179718, 0.12359046936035156, 0.19214031100273132, 0.2606901526451111, 0.32923999428749084, 0.3977898359298706, 0.46633967757225037, 0.5348895192146301, 0.6034393310546875, 0.6719892024993896, 0.7405390739440918, 0.8090888857841492, 0.8776386976242065, 0.9461885690689087, 1.0147384405136108, 1.0832881927490234, 1.1518380641937256, 1.2203879356384277, 1.2889378070831299, 1.357487678527832, 1.4260374307632446, 1.4945873022079468, 1.563137173652649, 1.6316869258880615, 1.7002367973327637, 1.7687866687774658, 1.837336540222168, 1.9058864116668701, 1.9744361639022827, 2.0429859161376953, 2.1115357875823975, 2.1800856590270996, 2.2486355304718018, 2.317185401916504]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 10.0, 9.0, 8.0, 3.0, 15.0, 9.0, 4.0, 11.0, 57.0, 79.0, 139.0, 434.0, 1618.0, 9281.0, 214418.0, 3946473.0, 18526.0, 2284.0, 535.0, 168.0, 76.0, 34.0, 24.0, 14.0, 3.0, 12.0, 8.0, 6.0, 2.0, 6.0, 6.0, 2.0, 4.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.447265625, -3.346343994140625, -3.24542236328125, -3.144500732421875, -3.0435791015625, -2.942657470703125, -2.84173583984375, -2.740814208984375, -2.639892578125, -2.538970947265625, -2.43804931640625, -2.337127685546875, -2.2362060546875, -2.135284423828125, -2.03436279296875, -1.933441162109375, -1.83251953125, -1.731597900390625, -1.63067626953125, -1.529754638671875, -1.4288330078125, -1.327911376953125, -1.22698974609375, -1.126068115234375, -1.025146484375, -0.924224853515625, -0.82330322265625, -0.722381591796875, -0.6214599609375, -0.520538330078125, -0.41961669921875, -0.318695068359375, -0.2177734375, -0.116851806640625, -0.01593017578125, 0.084991455078125, 0.1859130859375, 0.286834716796875, 0.38775634765625, 0.488677978515625, 0.589599609375, 0.690521240234375, 0.79144287109375, 0.892364501953125, 0.9932861328125, 1.094207763671875, 1.19512939453125, 1.296051025390625, 1.39697265625, 1.497894287109375, 1.59881591796875, 1.699737548828125, 1.8006591796875, 1.901580810546875, 2.00250244140625, 2.103424072265625, 2.204345703125, 2.305267333984375, 2.40618896484375, 2.507110595703125, 2.6080322265625, 2.708953857421875, 2.80987548828125, 2.910797119140625, 3.01171875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 6.0, 3.0, 13.0, 11.0, 14.0, 23.0, 25.0, 34.0, 42.0, 50.0, 73.0, 80.0, 80.0, 97.0, 76.0, 84.0, 71.0, 54.0, 45.0, 29.0, 27.0, 18.0, 11.0, 14.0, 3.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05865478515625, -0.056993961334228516, -0.05533313751220703, -0.05367231369018555, -0.05201148986816406, -0.05035066604614258, -0.048689842224121094, -0.04702901840209961, -0.045368194580078125, -0.04370737075805664, -0.042046546936035156, -0.04038572311401367, -0.03872489929199219, -0.0370640754699707, -0.03540325164794922, -0.033742427825927734, -0.03208160400390625, -0.030420780181884766, -0.02875995635986328, -0.027099132537841797, -0.025438308715820312, -0.023777484893798828, -0.022116661071777344, -0.02045583724975586, -0.018795013427734375, -0.01713418960571289, -0.015473365783691406, -0.013812541961669922, -0.012151718139648438, -0.010490894317626953, -0.008830070495605469, -0.007169246673583984, -0.0055084228515625, -0.0038475990295410156, -0.0021867752075195312, -0.0005259513854980469, 0.0011348724365234375, 0.002795696258544922, 0.004456520080566406, 0.006117343902587891, 0.007778167724609375, 0.00943899154663086, 0.011099815368652344, 0.012760639190673828, 0.014421463012695312, 0.016082286834716797, 0.01774311065673828, 0.019403934478759766, 0.02106475830078125, 0.022725582122802734, 0.02438640594482422, 0.026047229766845703, 0.027708053588867188, 0.029368877410888672, 0.031029701232910156, 0.03269052505493164, 0.034351348876953125, 0.03601217269897461, 0.037672996520996094, 0.03933382034301758, 0.04099464416503906, 0.04265546798706055, 0.04431629180908203, 0.045977115631103516, 0.047637939453125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 7.0, 17.0, 58.0, 263.0, 2142.0, 134685.0, 4048625.0, 7797.0, 538.0, 103.0, 28.0, 13.0, 5.0, 8.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3681640625, -1.2195892333984375, -1.071014404296875, -0.9224395751953125, -0.77386474609375, -0.6252899169921875, -0.476715087890625, -0.3281402587890625, -0.1795654296875, -0.0309906005859375, 0.117584228515625, 0.2661590576171875, 0.41473388671875, 0.5633087158203125, 0.711883544921875, 0.8604583740234375, 1.009033203125, 1.1576080322265625, 1.306182861328125, 1.4547576904296875, 1.60333251953125, 1.7519073486328125, 1.900482177734375, 2.0490570068359375, 2.1976318359375, 2.3462066650390625, 2.494781494140625, 2.6433563232421875, 2.79193115234375, 2.9405059814453125, 3.089080810546875, 3.2376556396484375, 3.38623046875, 3.5348052978515625, 3.683380126953125, 3.8319549560546875, 3.98052978515625, 4.1291046142578125, 4.277679443359375, 4.4262542724609375, 4.5748291015625, 4.7234039306640625, 4.871978759765625, 5.0205535888671875, 5.16912841796875, 5.3177032470703125, 5.466278076171875, 5.6148529052734375, 5.763427734375, 5.9120025634765625, 6.060577392578125, 6.2091522216796875, 6.35772705078125, 6.5063018798828125, 6.654876708984375, 6.8034515380859375, 6.9520263671875, 7.1006011962890625, 7.249176025390625, 7.3977508544921875, 7.54632568359375, 7.6949005126953125, 7.843475341796875, 7.9920501708984375, 8.140625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 2.0, 4.0, 6.0, 2.0, 8.0, 9.0, 20.0, 27.0, 26.0, 34.0, 53.0, 79.0, 150.0, 312.0, 1914.0, 796.0, 256.0, 125.0, 86.0, 43.0, 37.0, 20.0, 19.0, 10.0, 14.0, 8.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18359375, -0.17831993103027344, -0.17304611206054688, -0.1677722930908203, -0.16249847412109375, -0.1572246551513672, -0.15195083618164062, -0.14667701721191406, -0.1414031982421875, -0.13612937927246094, -0.13085556030273438, -0.1255817413330078, -0.12030792236328125, -0.11503410339355469, -0.10976028442382812, -0.10448646545410156, -0.099212646484375, -0.09393882751464844, -0.08866500854492188, -0.08339118957519531, -0.07811737060546875, -0.07284355163574219, -0.06756973266601562, -0.06229591369628906, -0.0570220947265625, -0.05174827575683594, -0.046474456787109375, -0.04120063781738281, -0.03592681884765625, -0.030652999877929688, -0.025379180908203125, -0.020105361938476562, -0.01483154296875, -0.009557723999023438, -0.004283905029296875, 0.0009899139404296875, 0.00626373291015625, 0.011537551879882812, 0.016811370849609375, 0.022085189819335938, 0.0273590087890625, 0.03263282775878906, 0.037906646728515625, 0.04318046569824219, 0.04845428466796875, 0.05372810363769531, 0.059001922607421875, 0.06427574157714844, 0.069549560546875, 0.07482337951660156, 0.08009719848632812, 0.08537101745605469, 0.09064483642578125, 0.09591865539550781, 0.10119247436523438, 0.10646629333496094, 0.1117401123046875, 0.11701393127441406, 0.12228775024414062, 0.1275615692138672, 0.13283538818359375, 0.1381092071533203, 0.14338302612304688, 0.14865684509277344, 0.1539306640625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [10.0, 143.0, 839.0, 24.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7362297773361206, -0.4180448353290558, -0.09985989332199097, 0.21832501888275146, 0.5365099906921387, 0.8546949625015259, 1.1728798151016235, 1.4910649061203003, 1.809249758720398, 2.127434730529785, 2.445619583129883, 2.7638044357299805, 3.0819895267486572, 3.400174617767334, 3.7183594703674316, 4.036544322967529, 4.354729175567627, 4.672914028167725, 4.991098880767822, 5.309284210205078, 5.627469062805176, 5.945653915405273, 6.263838768005371, 6.582023620605469, 6.900208950042725, 7.218393802642822, 7.53657865524292, 7.854763984680176, 8.172948837280273, 8.491133689880371, 8.809318542480469, 9.127503395080566, 9.44568920135498, 9.763874053955078, 10.082058906555176, 10.400243759155273, 10.718428611755371, 11.036613464355469, 11.354799270629883, 11.67298412322998, 11.991168975830078, 12.309353828430176, 12.627538681030273, 12.945723533630371, 13.263908386230469, 13.582094192504883, 13.900278091430664, 14.218463897705078, 14.53664779663086, 14.854832649230957, 15.173017501831055, 15.491202354431152, 15.80938720703125, 16.127573013305664, 16.445756912231445, 16.76394271850586, 17.082128524780273, 17.400314331054688, 17.71849822998047, 18.036684036254883, 18.354867935180664, 18.673053741455078, 18.99123764038086, 19.309423446655273, 19.627607345581055]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 6.0, 4.0, 15.0, 17.0, 25.0, 51.0, 46.0, 67.0, 81.0, 74.0, 93.0, 84.0, 99.0, 65.0, 83.0, 57.0, 45.0, 26.0, 17.0, 21.0, 15.0, 7.0, 4.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9549301266670227, -0.9193679690361023, -0.8838058114051819, -0.8482436537742615, -0.8126814961433411, -0.7771193385124207, -0.7415571212768555, -0.7059949636459351, -0.6704328060150146, -0.6348706483840942, -0.5993084907531738, -0.5637463331222534, -0.528184175491333, -0.4926220178604126, -0.4570598304271698, -0.4214976727962494, -0.38593554496765137, -0.35037338733673096, -0.31481122970581055, -0.27924907207489014, -0.24368689954280853, -0.20812474191188812, -0.17256256937980652, -0.1370004117488861, -0.1014382541179657, -0.06587609648704529, -0.03031393140554428, 0.005248233675956726, 0.040810391306877136, 0.07637254893779755, 0.11193472146987915, 0.14749687910079956, 0.18305909633636475, 0.21862125396728516, 0.25418341159820557, 0.289745569229126, 0.3253077268600464, 0.3608698844909668, 0.3964320719242096, 0.43199422955513, 0.4675563871860504, 0.5031185746192932, 0.5386807322502136, 0.574242889881134, 0.6098050475120544, 0.6453672051429749, 0.6809293627738953, 0.7164915204048157, 0.7520536780357361, 0.7876158356666565, 0.8231779932975769, 0.8587401509284973, 0.8943023085594177, 0.9298644661903381, 0.9654266834259033, 1.0009888410568237, 1.0365509986877441, 1.0721131563186646, 1.107675313949585, 1.1432374715805054, 1.1787996292114258, 1.2143617868423462, 1.2499239444732666, 1.285486102104187, 1.3210482597351074]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 5.0, 3.0, 3.0, 7.0, 8.0, 6.0, 15.0, 14.0, 12.0, 27.0, 32.0, 21.0, 23.0, 23.0, 38.0, 31.0, 46.0, 60.0, 200.0, 2559.0, 70114.0, 906364.0, 65943.0, 2451.0, 182.0, 68.0, 40.0, 46.0, 37.0, 28.0, 24.0, 18.0, 17.0, 24.0, 14.0, 10.0, 9.0, 5.0, 4.0, 4.0, 4.0, 5.0, 6.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.6787109375, -1.6236572265625, -1.568603515625, -1.5135498046875, -1.45849609375, -1.4034423828125, -1.348388671875, -1.2933349609375, -1.23828125, -1.1832275390625, -1.128173828125, -1.0731201171875, -1.01806640625, -0.9630126953125, -0.907958984375, -0.8529052734375, -0.7978515625, -0.7427978515625, -0.687744140625, -0.6326904296875, -0.57763671875, -0.5225830078125, -0.467529296875, -0.4124755859375, -0.357421875, -0.3023681640625, -0.247314453125, -0.1922607421875, -0.13720703125, -0.0821533203125, -0.027099609375, 0.0279541015625, 0.0830078125, 0.1380615234375, 0.193115234375, 0.2481689453125, 0.30322265625, 0.3582763671875, 0.413330078125, 0.4683837890625, 0.5234375, 0.5784912109375, 0.633544921875, 0.6885986328125, 0.74365234375, 0.7987060546875, 0.853759765625, 0.9088134765625, 0.9638671875, 1.0189208984375, 1.073974609375, 1.1290283203125, 1.18408203125, 1.2391357421875, 1.294189453125, 1.3492431640625, 1.404296875, 1.4593505859375, 1.514404296875, 1.5694580078125, 1.62451171875, 1.6795654296875, 1.734619140625, 1.7896728515625, 1.8447265625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [6.0, 6.0, 16.0, 38.0, 90.0, 144.0, 175.0, 195.0, 148.0, 98.0, 56.0, 31.0, 14.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036102294921875, -0.031128406524658203, -0.026154518127441406, -0.02118062973022461, -0.016206741333007812, -0.011232852935791016, -0.006258964538574219, -0.0012850761413574219, 0.003688812255859375, 0.008662700653076172, 0.013636589050292969, 0.018610477447509766, 0.023584365844726562, 0.02855825424194336, 0.033532142639160156, 0.03850603103637695, 0.04347991943359375, 0.04845380783081055, 0.053427696228027344, 0.05840158462524414, 0.06337547302246094, 0.06834936141967773, 0.07332324981689453, 0.07829713821411133, 0.08327102661132812, 0.08824491500854492, 0.09321880340576172, 0.09819269180297852, 0.10316658020019531, 0.10814046859741211, 0.1131143569946289, 0.1180882453918457, 0.1230621337890625, 0.1280360221862793, 0.1330099105834961, 0.1379837989807129, 0.1429576873779297, 0.14793157577514648, 0.15290546417236328, 0.15787935256958008, 0.16285324096679688, 0.16782712936401367, 0.17280101776123047, 0.17777490615844727, 0.18274879455566406, 0.18772268295288086, 0.19269657135009766, 0.19767045974731445, 0.20264434814453125, 0.20761823654174805, 0.21259212493896484, 0.21756601333618164, 0.22253990173339844, 0.22751379013061523, 0.23248767852783203, 0.23746156692504883, 0.24243545532226562, 0.24740934371948242, 0.2523832321166992, 0.257357120513916, 0.2623310089111328, 0.2673048973083496, 0.2722787857055664, 0.2772526741027832, 0.2822265625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 8.0, 10.0, 9.0, 10.0, 31.0, 32.0, 59.0, 96.0, 151.0, 284.0, 549.0, 1101.0, 2580.0, 6719.0, 20069.0, 69083.0, 244283.0, 430962.0, 194016.0, 53062.0, 15922.0, 5415.0, 2100.0, 856.0, 485.0, 253.0, 135.0, 91.0, 48.0, 44.0, 26.0, 10.0, 4.0, 16.0, 6.0, 9.0, 5.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.67041015625, -0.6514739990234375, -0.632537841796875, -0.6136016845703125, -0.59466552734375, -0.5757293701171875, -0.556793212890625, -0.5378570556640625, -0.5189208984375, -0.4999847412109375, -0.481048583984375, -0.4621124267578125, -0.44317626953125, -0.4242401123046875, -0.405303955078125, -0.3863677978515625, -0.367431640625, -0.3484954833984375, -0.329559326171875, -0.3106231689453125, -0.29168701171875, -0.2727508544921875, -0.253814697265625, -0.2348785400390625, -0.2159423828125, -0.1970062255859375, -0.178070068359375, -0.1591339111328125, -0.14019775390625, -0.1212615966796875, -0.102325439453125, -0.0833892822265625, -0.064453125, -0.0455169677734375, -0.026580810546875, -0.0076446533203125, 0.01129150390625, 0.0302276611328125, 0.049163818359375, 0.0680999755859375, 0.0870361328125, 0.1059722900390625, 0.124908447265625, 0.1438446044921875, 0.16278076171875, 0.1817169189453125, 0.200653076171875, 0.2195892333984375, 0.238525390625, 0.2574615478515625, 0.276397705078125, 0.2953338623046875, 0.31427001953125, 0.3332061767578125, 0.352142333984375, 0.3710784912109375, 0.3900146484375, 0.4089508056640625, 0.427886962890625, 0.4468231201171875, 0.46575927734375, 0.4846954345703125, 0.503631591796875, 0.5225677490234375, 0.54150390625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 8.0, 7.0, 3.0, 10.0, 11.0, 4.0, 27.0, 13.0, 29.0, 33.0, 23.0, 27.0, 36.0, 37.0, 52.0, 49.0, 38.0, 38.0, 37.0, 44.0, 47.0, 45.0, 40.0, 50.0, 42.0, 30.0, 29.0, 28.0, 27.0, 26.0, 17.0, 16.0, 17.0, 11.0, 10.0, 9.0, 11.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.29443359375, -0.2853851318359375, -0.276336669921875, -0.2672882080078125, -0.25823974609375, -0.2491912841796875, -0.240142822265625, -0.2310943603515625, -0.2220458984375, -0.2129974365234375, -0.203948974609375, -0.1949005126953125, -0.18585205078125, -0.1768035888671875, -0.167755126953125, -0.1587066650390625, -0.149658203125, -0.1406097412109375, -0.131561279296875, -0.1225128173828125, -0.11346435546875, -0.1044158935546875, -0.095367431640625, -0.0863189697265625, -0.0772705078125, -0.0682220458984375, -0.059173583984375, -0.0501251220703125, -0.04107666015625, -0.0320281982421875, -0.022979736328125, -0.0139312744140625, -0.0048828125, 0.0041656494140625, 0.013214111328125, 0.0222625732421875, 0.03131103515625, 0.0403594970703125, 0.049407958984375, 0.0584564208984375, 0.0675048828125, 0.0765533447265625, 0.085601806640625, 0.0946502685546875, 0.10369873046875, 0.1127471923828125, 0.121795654296875, 0.1308441162109375, 0.139892578125, 0.1489410400390625, 0.157989501953125, 0.1670379638671875, 0.17608642578125, 0.1851348876953125, 0.194183349609375, 0.2032318115234375, 0.2122802734375, 0.2213287353515625, 0.230377197265625, 0.2394256591796875, 0.24847412109375, 0.2575225830078125, 0.266571044921875, 0.2756195068359375, 0.28466796875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 1.0, 5.0, 1.0, 1.0, 5.0, 9.0, 3.0, 7.0, 7.0, 8.0, 14.0, 14.0, 29.0, 41.0, 83.0, 136.0, 422.0, 1361.0, 5403.0, 40668.0, 731063.0, 250081.0, 14959.0, 2860.0, 761.0, 286.0, 122.0, 58.0, 36.0, 21.0, 16.0, 11.0, 11.0, 11.0, 7.0, 7.0, 6.0, 4.0, 3.0, 2.0, 7.0, 4.0, 1.0, 0.0, 0.0, 3.0, 3.0], "bins": [-1.4541015625, -1.415618896484375, -1.37713623046875, -1.338653564453125, -1.3001708984375, -1.261688232421875, -1.22320556640625, -1.184722900390625, -1.146240234375, -1.107757568359375, -1.06927490234375, -1.030792236328125, -0.9923095703125, -0.953826904296875, -0.91534423828125, -0.876861572265625, -0.83837890625, -0.799896240234375, -0.76141357421875, -0.722930908203125, -0.6844482421875, -0.645965576171875, -0.60748291015625, -0.569000244140625, -0.530517578125, -0.492034912109375, -0.45355224609375, -0.415069580078125, -0.3765869140625, -0.338104248046875, -0.29962158203125, -0.261138916015625, -0.22265625, -0.184173583984375, -0.14569091796875, -0.107208251953125, -0.0687255859375, -0.030242919921875, 0.00823974609375, 0.046722412109375, 0.085205078125, 0.123687744140625, 0.16217041015625, 0.200653076171875, 0.2391357421875, 0.277618408203125, 0.31610107421875, 0.354583740234375, 0.39306640625, 0.431549072265625, 0.47003173828125, 0.508514404296875, 0.5469970703125, 0.585479736328125, 0.62396240234375, 0.662445068359375, 0.700927734375, 0.739410400390625, 0.77789306640625, 0.816375732421875, 0.8548583984375, 0.893341064453125, 0.93182373046875, 0.970306396484375, 1.0087890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 2.0, 5.0, 8.0, 9.0, 17.0, 32.0, 33.0, 62.0, 90.0, 146.0, 193.0, 146.0, 100.0, 48.0, 44.0, 21.0, 16.0, 8.0, 9.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011050701141357422, -0.00010711792856454849, -0.00010372884571552277, -0.00010033976286649704, -9.695068001747131e-05, -9.356159716844559e-05, -9.017251431941986e-05, -8.678343147039413e-05, -8.339434862136841e-05, -8.000526577234268e-05, -7.661618292331696e-05, -7.322710007429123e-05, -6.98380172252655e-05, -6.644893437623978e-05, -6.305985152721405e-05, -5.9670768678188324e-05, -5.62816858291626e-05, -5.289260298013687e-05, -4.9503520131111145e-05, -4.611443728208542e-05, -4.272535443305969e-05, -3.9336271584033966e-05, -3.594718873500824e-05, -3.2558105885982513e-05, -2.9169023036956787e-05, -2.577994018793106e-05, -2.2390857338905334e-05, -1.9001774489879608e-05, -1.5612691640853882e-05, -1.2223608791828156e-05, -8.83452594280243e-06, -5.445443093776703e-06, -2.0563602447509766e-06, 1.3327226042747498e-06, 4.721805453300476e-06, 8.110888302326202e-06, 1.1499971151351929e-05, 1.4889054000377655e-05, 1.827813684940338e-05, 2.1667219698429108e-05, 2.5056302547454834e-05, 2.844538539648056e-05, 3.183446824550629e-05, 3.522355109453201e-05, 3.861263394355774e-05, 4.2001716792583466e-05, 4.539079964160919e-05, 4.877988249063492e-05, 5.2168965339660645e-05, 5.555804818868637e-05, 5.89471310377121e-05, 6.233621388673782e-05, 6.572529673576355e-05, 6.911437958478928e-05, 7.2503462433815e-05, 7.589254528284073e-05, 7.928162813186646e-05, 8.267071098089218e-05, 8.605979382991791e-05, 8.944887667894363e-05, 9.283795952796936e-05, 9.622704237699509e-05, 9.961612522602081e-05, 0.00010300520807504654, 0.00010639429092407227]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 8.0, 7.0, 10.0, 15.0, 27.0, 34.0, 60.0, 138.0, 332.0, 1114.0, 4604.0, 29496.0, 672168.0, 319719.0, 16519.0, 3011.0, 784.0, 265.0, 106.0, 39.0, 22.0, 18.0, 12.0, 9.0, 2.0, 7.0, 7.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.78125, -1.736572265625, -1.69189453125, -1.647216796875, -1.6025390625, -1.557861328125, -1.51318359375, -1.468505859375, -1.423828125, -1.379150390625, -1.33447265625, -1.289794921875, -1.2451171875, -1.200439453125, -1.15576171875, -1.111083984375, -1.06640625, -1.021728515625, -0.97705078125, -0.932373046875, -0.8876953125, -0.843017578125, -0.79833984375, -0.753662109375, -0.708984375, -0.664306640625, -0.61962890625, -0.574951171875, -0.5302734375, -0.485595703125, -0.44091796875, -0.396240234375, -0.3515625, -0.306884765625, -0.26220703125, -0.217529296875, -0.1728515625, -0.128173828125, -0.08349609375, -0.038818359375, 0.005859375, 0.050537109375, 0.09521484375, 0.139892578125, 0.1845703125, 0.229248046875, 0.27392578125, 0.318603515625, 0.36328125, 0.407958984375, 0.45263671875, 0.497314453125, 0.5419921875, 0.586669921875, 0.63134765625, 0.676025390625, 0.720703125, 0.765380859375, 0.81005859375, 0.854736328125, 0.8994140625, 0.944091796875, 0.98876953125, 1.033447265625, 1.078125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 5.0, 13.0, 15.0, 22.0, 28.0, 40.0, 60.0, 93.0, 118.0, 120.0, 122.0, 100.0, 86.0, 53.0, 28.0, 25.0, 10.0, 12.0, 6.0, 8.0, 3.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.572265625, -0.5578651428222656, -0.5434646606445312, -0.5290641784667969, -0.5146636962890625, -0.5002632141113281, -0.48586273193359375, -0.4714622497558594, -0.457061767578125, -0.4426612854003906, -0.42826080322265625, -0.4138603210449219, -0.3994598388671875, -0.3850593566894531, -0.37065887451171875, -0.3562583923339844, -0.34185791015625, -0.3274574279785156, -0.31305694580078125, -0.2986564636230469, -0.2842559814453125, -0.2698554992675781, -0.25545501708984375, -0.24105453491210938, -0.226654052734375, -0.21225357055664062, -0.19785308837890625, -0.18345260620117188, -0.1690521240234375, -0.15465164184570312, -0.14025115966796875, -0.12585067749023438, -0.1114501953125, -0.09704971313476562, -0.08264923095703125, -0.06824874877929688, -0.0538482666015625, -0.039447784423828125, -0.02504730224609375, -0.010646820068359375, 0.003753662109375, 0.018154144287109375, 0.03255462646484375, 0.046955108642578125, 0.0613555908203125, 0.07575607299804688, 0.09015655517578125, 0.10455703735351562, 0.11895751953125, 0.13335800170898438, 0.14775848388671875, 0.16215896606445312, 0.1765594482421875, 0.19095993041992188, 0.20536041259765625, 0.21976089477539062, 0.234161376953125, 0.24856185913085938, 0.26296234130859375, 0.2773628234863281, 0.2917633056640625, 0.3061637878417969, 0.32056427001953125, 0.3349647521972656, 0.349365234375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 206.0, 802.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.642921447753906, -5.819841384887695, -3.9967615604400635, -2.1736817359924316, -0.3506016731262207, 1.472477912902832, 3.295557975769043, 5.118638038635254, 6.941718101501465, 8.764798164367676, 10.587878227233887, 12.410957336425781, 14.234037399291992, 16.057117462158203, 17.880197525024414, 19.703277587890625, 21.526357650756836, 23.349437713623047, 25.172517776489258, 26.99559783935547, 28.81867790222168, 30.64175796508789, 32.46483612060547, 34.28791809082031, 36.11099624633789, 37.93407440185547, 39.75715637207031, 41.58023452758789, 43.403316497802734, 45.22639465332031, 47.049476623535156, 48.872554779052734, 50.69563674926758, 52.518714904785156, 54.341796875, 56.16487503051758, 57.98795700073242, 59.81103515625, 61.634117126464844, 63.45719528198242, 65.2802734375, 67.10335540771484, 68.92642974853516, 70.74951171875, 72.57259368896484, 74.39567565917969, 76.21875, 78.04183197021484, 79.86491394042969, 81.68799591064453, 83.51107025146484, 85.33415222167969, 87.15723419189453, 88.98031616210938, 90.80339050292969, 92.62647247314453, 94.44955444335938, 96.27263641357422, 98.09571075439453, 99.91879272460938, 101.74187469482422, 103.56495666503906, 105.38803100585938, 107.21111297607422, 109.03419494628906]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 8.0, 4.0, 11.0, 11.0, 22.0, 31.0, 23.0, 28.0, 36.0, 42.0, 44.0, 61.0, 58.0, 46.0, 68.0, 61.0, 46.0, 48.0, 56.0, 46.0, 40.0, 40.0, 30.0, 36.0, 26.0, 19.0, 17.0, 15.0, 12.0, 6.0, 4.0, 4.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.215603828430176, -2.1301000118255615, -2.0445964336395264, -1.959092617034912, -1.8735888004302979, -1.7880851030349731, -1.7025814056396484, -1.6170775890350342, -1.5315738916397095, -1.4460701942443848, -1.3605663776397705, -1.2750626802444458, -1.189558982849121, -1.1040551662445068, -1.0185514688491821, -0.9330477118492126, -0.8475439548492432, -0.7620401978492737, -0.6765364408493042, -0.5910327434539795, -0.50552898645401, -0.4200252294540405, -0.3345215320587158, -0.24901777505874634, -0.16351401805877686, -0.07801027595996857, 0.007493466138839722, 0.09299719333648682, 0.1785009503364563, 0.2640047073364258, 0.3495084047317505, 0.43501216173171997, 0.5205159187316895, 0.6060196757316589, 0.6915234327316284, 0.7770271301269531, 0.8625308871269226, 0.9480346441268921, 1.0335383415222168, 1.119042158126831, 1.2045458555221558, 1.2900495529174805, 1.3755533695220947, 1.4610570669174194, 1.5465607643127441, 1.6320645809173584, 1.717568278312683, 1.8030719757080078, 1.888575792312622, 1.9740794897079468, 2.0595831871032715, 2.1450870037078857, 2.2305908203125, 2.316094398498535, 2.4015982151031494, 2.4871020317077637, 2.572605609893799, 2.658109426498413, 2.7436130046844482, 2.8291168212890625, 2.9146206378936768, 3.000124454498291, 3.085628032684326, 3.1711318492889404, 3.2566356658935547]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 2.0, 12.0, 21.0, 54.0, 84.0, 122.0, 355.0, 16236.0, 4168088.0, 8264.0, 518.0, 230.0, 127.0, 75.0, 48.0, 24.0, 11.0, 11.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7890625, -2.564697265625, -2.34033203125, -2.115966796875, -1.8916015625, -1.667236328125, -1.44287109375, -1.218505859375, -0.994140625, -0.769775390625, -0.54541015625, -0.321044921875, -0.0966796875, 0.127685546875, 0.35205078125, 0.576416015625, 0.80078125, 1.025146484375, 1.24951171875, 1.473876953125, 1.6982421875, 1.922607421875, 2.14697265625, 2.371337890625, 2.595703125, 2.820068359375, 3.04443359375, 3.268798828125, 3.4931640625, 3.717529296875, 3.94189453125, 4.166259765625, 4.390625, 4.614990234375, 4.83935546875, 5.063720703125, 5.2880859375, 5.512451171875, 5.73681640625, 5.961181640625, 6.185546875, 6.409912109375, 6.63427734375, 6.858642578125, 7.0830078125, 7.307373046875, 7.53173828125, 7.756103515625, 7.98046875, 8.204833984375, 8.42919921875, 8.653564453125, 8.8779296875, 9.102294921875, 9.32666015625, 9.551025390625, 9.775390625, 9.999755859375, 10.22412109375, 10.448486328125, 10.6728515625, 10.897216796875, 11.12158203125, 11.345947265625, 11.5703125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 6.0, 13.0, 23.0, 57.0, 77.0, 134.0, 164.0, 160.0, 138.0, 106.0, 64.0, 40.0, 22.0, 7.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04876708984375, -0.042901039123535156, -0.03703498840332031, -0.03116893768310547, -0.025302886962890625, -0.01943683624267578, -0.013570785522460938, -0.007704734802246094, -0.00183868408203125, 0.004027366638183594, 0.009893417358398438, 0.01575946807861328, 0.021625518798828125, 0.02749156951904297, 0.03335762023925781, 0.039223670959472656, 0.0450897216796875, 0.050955772399902344, 0.05682182312011719, 0.06268787384033203, 0.06855392456054688, 0.07441997528076172, 0.08028602600097656, 0.0861520767211914, 0.09201812744140625, 0.0978841781616211, 0.10375022888183594, 0.10961627960205078, 0.11548233032226562, 0.12134838104248047, 0.1272144317626953, 0.13308048248291016, 0.138946533203125, 0.14481258392333984, 0.1506786346435547, 0.15654468536376953, 0.16241073608398438, 0.16827678680419922, 0.17414283752441406, 0.1800088882446289, 0.18587493896484375, 0.1917409896850586, 0.19760704040527344, 0.20347309112548828, 0.20933914184570312, 0.21520519256591797, 0.2210712432861328, 0.22693729400634766, 0.2328033447265625, 0.23866939544677734, 0.2445354461669922, 0.25040149688720703, 0.2562675476074219, 0.2621335983276367, 0.26799964904785156, 0.2738656997680664, 0.27973175048828125, 0.2855978012084961, 0.29146385192871094, 0.2973299026489258, 0.3031959533691406, 0.30906200408935547, 0.3149280548095703, 0.32079410552978516, 0.32666015625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 9.0, 9.0, 12.0, 32.0, 50.0, 99.0, 175.0, 320.0, 1257.0, 4173055.0, 18217.0, 430.0, 202.0, 152.0, 111.0, 58.0, 41.0, 29.0, 16.0, 11.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0859375, -4.6868896484375, -4.287841796875, -3.8887939453125, -3.48974609375, -3.0906982421875, -2.691650390625, -2.2926025390625, -1.8935546875, -1.4945068359375, -1.095458984375, -0.6964111328125, -0.29736328125, 0.1016845703125, 0.500732421875, 0.8997802734375, 1.298828125, 1.6978759765625, 2.096923828125, 2.4959716796875, 2.89501953125, 3.2940673828125, 3.693115234375, 4.0921630859375, 4.4912109375, 4.8902587890625, 5.289306640625, 5.6883544921875, 6.08740234375, 6.4864501953125, 6.885498046875, 7.2845458984375, 7.68359375, 8.0826416015625, 8.481689453125, 8.8807373046875, 9.27978515625, 9.6788330078125, 10.077880859375, 10.4769287109375, 10.8759765625, 11.2750244140625, 11.674072265625, 12.0731201171875, 12.47216796875, 12.8712158203125, 13.270263671875, 13.6693115234375, 14.068359375, 14.4674072265625, 14.866455078125, 15.2655029296875, 15.66455078125, 16.0635986328125, 16.462646484375, 16.8616943359375, 17.2607421875, 17.6597900390625, 18.058837890625, 18.4578857421875, 18.85693359375, 19.2559814453125, 19.655029296875, 20.0540771484375, 20.453125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 16.0, 86.0, 613.0, 3264.0, 95.0, 12.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88134765625, -0.8355331420898438, -0.7897186279296875, -0.7439041137695312, -0.698089599609375, -0.6522750854492188, -0.6064605712890625, -0.5606460571289062, -0.51483154296875, -0.46901702880859375, -0.4232025146484375, -0.37738800048828125, -0.331573486328125, -0.28575897216796875, -0.2399444580078125, -0.19412994384765625, -0.1483154296875, -0.10250091552734375, -0.0566864013671875, -0.01087188720703125, 0.034942626953125, 0.08075714111328125, 0.1265716552734375, 0.17238616943359375, 0.21820068359375, 0.26401519775390625, 0.3098297119140625, 0.35564422607421875, 0.401458740234375, 0.44727325439453125, 0.4930877685546875, 0.5389022827148438, 0.584716796875, 0.6305313110351562, 0.6763458251953125, 0.7221603393554688, 0.767974853515625, 0.8137893676757812, 0.8596038818359375, 0.9054183959960938, 0.95123291015625, 0.9970474243164062, 1.0428619384765625, 1.0886764526367188, 1.134490966796875, 1.1803054809570312, 1.2261199951171875, 1.2719345092773438, 1.3177490234375, 1.3635635375976562, 1.4093780517578125, 1.4551925659179688, 1.501007080078125, 1.5468215942382812, 1.5926361083984375, 1.6384506225585938, 1.68426513671875, 1.7300796508789062, 1.7758941650390625, 1.8217086791992188, 1.867523193359375, 1.9133377075195312, 1.9591522216796875, 2.0049667358398438, 2.05078125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 10.0, 53.0, 454.0, 394.0, 75.0, 17.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1566619873046875, -4.728206634521484, -4.299750804901123, -3.87129545211792, -3.4428398609161377, -3.0143842697143555, -2.5859289169311523, -2.15747332572937, -1.729017734527588, -1.3005621433258057, -0.872106671333313, -0.4436511993408203, -0.015195608139038086, 0.41325998306274414, 0.8417153358459473, 1.2701709270477295, 1.6986265182495117, 2.127082109451294, 2.555537700653076, 2.9839930534362793, 3.4124486446380615, 3.8409042358398438, 4.269359588623047, 4.69781494140625, 5.126270771026611, 5.5547261238098145, 5.983181953430176, 6.411637306213379, 6.840092658996582, 7.268548488616943, 7.6970038414001465, 8.125459671020508, 8.553915023803711, 8.982370376586914, 9.410825729370117, 9.83928108215332, 10.26773738861084, 10.696192741394043, 11.124648094177246, 11.55310344696045, 11.981559753417969, 12.410015106201172, 12.838470458984375, 13.266925811767578, 13.695382118225098, 14.1238374710083, 14.552292823791504, 14.980748176574707, 15.40920352935791, 15.837658882141113, 16.266115188598633, 16.694570541381836, 17.12302589416504, 17.551481246948242, 17.979936599731445, 18.40839195251465, 18.83684730529785, 19.265302658081055, 19.693758010864258, 20.12221336364746, 20.550668716430664, 20.9791259765625, 21.407581329345703, 21.836036682128906, 22.26449203491211]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 17.0, 31.0, 54.0, 76.0, 104.0, 150.0, 150.0, 119.0, 117.0, 67.0, 45.0, 37.0, 14.0, 4.0, 6.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.733723163604736, -5.552923202514648, -5.372123718261719, -5.191324234008789, -5.010524272918701, -4.829724311828613, -4.648924827575684, -4.468125343322754, -4.287325382232666, -4.106525421142578, -3.9257259368896484, -3.7449262142181396, -3.564126491546631, -3.383326768875122, -3.2025270462036133, -3.0217273235321045, -2.8409276008605957, -2.660127878189087, -2.479328155517578, -2.2985284328460693, -2.1177287101745605, -1.9369289875030518, -1.756129264831543, -1.5753295421600342, -1.3945298194885254, -1.2137300968170166, -1.0329303741455078, -0.852130651473999, -0.6713309288024902, -0.49053120613098145, -0.30973148345947266, -0.12893176078796387, 0.051868438720703125, 0.23266816139221191, 0.4134678840637207, 0.5942676067352295, 0.7750673294067383, 0.9558670520782471, 1.1366667747497559, 1.3174664974212646, 1.4982662200927734, 1.6790659427642822, 1.859865665435791, 2.0406653881073, 2.2214651107788086, 2.4022648334503174, 2.583064556121826, 2.763864278793335, 2.9446640014648438, 3.1254637241363525, 3.3062634468078613, 3.48706316947937, 3.667862892150879, 3.8486626148223877, 4.0294623374938965, 4.210262298583984, 4.391061782836914, 4.571861267089844, 4.752661228179932, 4.9334611892700195, 5.114260673522949, 5.295060157775879, 5.475860118865967, 5.656660079956055, 5.837459564208984]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 5.0, 4.0, 2.0, 5.0, 3.0, 13.0, 26.0, 18.0, 27.0, 41.0, 57.0, 79.0, 116.0, 197.0, 386.0, 818.0, 2184.0, 8592.0, 75422.0, 749416.0, 189783.0, 15808.0, 3251.0, 1076.0, 458.0, 244.0, 145.0, 111.0, 57.0, 38.0, 40.0, 29.0, 20.0, 25.0, 14.0, 7.0, 6.0, 4.0, 1.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-2.60546875, -2.528076171875, -2.45068359375, -2.373291015625, -2.2958984375, -2.218505859375, -2.14111328125, -2.063720703125, -1.986328125, -1.908935546875, -1.83154296875, -1.754150390625, -1.6767578125, -1.599365234375, -1.52197265625, -1.444580078125, -1.3671875, -1.289794921875, -1.21240234375, -1.135009765625, -1.0576171875, -0.980224609375, -0.90283203125, -0.825439453125, -0.748046875, -0.670654296875, -0.59326171875, -0.515869140625, -0.4384765625, -0.361083984375, -0.28369140625, -0.206298828125, -0.12890625, -0.051513671875, 0.02587890625, 0.103271484375, 0.1806640625, 0.258056640625, 0.33544921875, 0.412841796875, 0.490234375, 0.567626953125, 0.64501953125, 0.722412109375, 0.7998046875, 0.877197265625, 0.95458984375, 1.031982421875, 1.109375, 1.186767578125, 1.26416015625, 1.341552734375, 1.4189453125, 1.496337890625, 1.57373046875, 1.651123046875, 1.728515625, 1.805908203125, 1.88330078125, 1.960693359375, 2.0380859375, 2.115478515625, 2.19287109375, 2.270263671875, 2.34765625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 14.0, 34.0, 60.0, 72.0, 127.0, 157.0, 179.0, 136.0, 90.0, 52.0, 41.0, 17.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2230224609375, -0.21198081970214844, -0.20093917846679688, -0.1898975372314453, -0.17885589599609375, -0.1678142547607422, -0.15677261352539062, -0.14573097229003906, -0.1346893310546875, -0.12364768981933594, -0.11260604858398438, -0.10156440734863281, -0.09052276611328125, -0.07948112487792969, -0.06843948364257812, -0.05739784240722656, -0.046356201171875, -0.03531455993652344, -0.024272918701171875, -0.013231277465820312, -0.00218963623046875, 0.008852005004882812, 0.019893646240234375, 0.030935287475585938, 0.0419769287109375, 0.05301856994628906, 0.06406021118164062, 0.07510185241699219, 0.08614349365234375, 0.09718513488769531, 0.10822677612304688, 0.11926841735839844, 0.13031005859375, 0.14135169982910156, 0.15239334106445312, 0.1634349822998047, 0.17447662353515625, 0.1855182647705078, 0.19655990600585938, 0.20760154724121094, 0.2186431884765625, 0.22968482971191406, 0.24072647094726562, 0.2517681121826172, 0.26280975341796875, 0.2738513946533203, 0.2848930358886719, 0.29593467712402344, 0.306976318359375, 0.31801795959472656, 0.3290596008300781, 0.3401012420654297, 0.35114288330078125, 0.3621845245361328, 0.3732261657714844, 0.38426780700683594, 0.3953094482421875, 0.40635108947753906, 0.4173927307128906, 0.4284343719482422, 0.43947601318359375, 0.4505176544189453, 0.4615592956542969, 0.47260093688964844, 0.483642578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 11.0, 18.0, 8.0, 23.0, 8.0, 23.0, 45.0, 79.0, 159.0, 336.0, 990.0, 3980.0, 26204.0, 310471.0, 633757.0, 62013.0, 7783.0, 1668.0, 506.0, 198.0, 105.0, 42.0, 29.0, 24.0, 10.0, 14.0, 10.0, 8.0, 5.0, 10.0, 3.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.8984375, -1.8429107666015625, -1.787384033203125, -1.7318572998046875, -1.67633056640625, -1.6208038330078125, -1.565277099609375, -1.5097503662109375, -1.4542236328125, -1.3986968994140625, -1.343170166015625, -1.2876434326171875, -1.23211669921875, -1.1765899658203125, -1.121063232421875, -1.0655364990234375, -1.010009765625, -0.9544830322265625, -0.898956298828125, -0.8434295654296875, -0.78790283203125, -0.7323760986328125, -0.676849365234375, -0.6213226318359375, -0.5657958984375, -0.5102691650390625, -0.454742431640625, -0.3992156982421875, -0.34368896484375, -0.2881622314453125, -0.232635498046875, -0.1771087646484375, -0.12158203125, -0.0660552978515625, -0.010528564453125, 0.0449981689453125, 0.10052490234375, 0.1560516357421875, 0.211578369140625, 0.2671051025390625, 0.3226318359375, 0.3781585693359375, 0.433685302734375, 0.4892120361328125, 0.54473876953125, 0.6002655029296875, 0.655792236328125, 0.7113189697265625, 0.766845703125, 0.8223724365234375, 0.877899169921875, 0.9334259033203125, 0.98895263671875, 1.0444793701171875, 1.100006103515625, 1.1555328369140625, 1.2110595703125, 1.2665863037109375, 1.322113037109375, 1.3776397705078125, 1.43316650390625, 1.4886932373046875, 1.544219970703125, 1.5997467041015625, 1.6552734375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 2.0, 11.0, 13.0, 16.0, 16.0, 21.0, 24.0, 18.0, 26.0, 31.0, 45.0, 41.0, 49.0, 59.0, 51.0, 47.0, 62.0, 56.0, 50.0, 42.0, 46.0, 40.0, 45.0, 38.0, 41.0, 25.0, 16.0, 16.0, 13.0, 7.0, 6.0, 7.0, 4.0, 7.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59130859375, -0.5711288452148438, -0.5509490966796875, -0.5307693481445312, -0.510589599609375, -0.49040985107421875, -0.4702301025390625, -0.45005035400390625, -0.42987060546875, -0.40969085693359375, -0.3895111083984375, -0.36933135986328125, -0.349151611328125, -0.32897186279296875, -0.3087921142578125, -0.28861236572265625, -0.2684326171875, -0.24825286865234375, -0.2280731201171875, -0.20789337158203125, -0.187713623046875, -0.16753387451171875, -0.1473541259765625, -0.12717437744140625, -0.10699462890625, -0.08681488037109375, -0.0666351318359375, -0.04645538330078125, -0.026275634765625, -0.00609588623046875, 0.0140838623046875, 0.03426361083984375, 0.054443359375, 0.07462310791015625, 0.0948028564453125, 0.11498260498046875, 0.135162353515625, 0.15534210205078125, 0.1755218505859375, 0.19570159912109375, 0.21588134765625, 0.23606109619140625, 0.2562408447265625, 0.27642059326171875, 0.296600341796875, 0.31678009033203125, 0.3369598388671875, 0.35713958740234375, 0.3773193359375, 0.39749908447265625, 0.4176788330078125, 0.43785858154296875, 0.458038330078125, 0.47821807861328125, 0.4983978271484375, 0.5185775756835938, 0.53875732421875, 0.5589370727539062, 0.5791168212890625, 0.5992965698242188, 0.619476318359375, 0.6396560668945312, 0.6598358154296875, 0.6800155639648438, 0.7001953125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 1.0, 4.0, 12.0, 12.0, 24.0, 22.0, 40.0, 63.0, 97.0, 195.0, 324.0, 663.0, 1691.0, 4866.0, 22759.0, 243885.0, 703924.0, 56090.0, 9288.0, 2542.0, 1012.0, 469.0, 238.0, 121.0, 81.0, 41.0, 38.0, 11.0, 14.0, 11.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8837890625, -0.8487548828125, -0.813720703125, -0.7786865234375, -0.74365234375, -0.7086181640625, -0.673583984375, -0.6385498046875, -0.603515625, -0.5684814453125, -0.533447265625, -0.4984130859375, -0.46337890625, -0.4283447265625, -0.393310546875, -0.3582763671875, -0.3232421875, -0.2882080078125, -0.253173828125, -0.2181396484375, -0.18310546875, -0.1480712890625, -0.113037109375, -0.0780029296875, -0.04296875, -0.0079345703125, 0.027099609375, 0.0621337890625, 0.09716796875, 0.1322021484375, 0.167236328125, 0.2022705078125, 0.2373046875, 0.2723388671875, 0.307373046875, 0.3424072265625, 0.37744140625, 0.4124755859375, 0.447509765625, 0.4825439453125, 0.517578125, 0.5526123046875, 0.587646484375, 0.6226806640625, 0.65771484375, 0.6927490234375, 0.727783203125, 0.7628173828125, 0.7978515625, 0.8328857421875, 0.867919921875, 0.9029541015625, 0.93798828125, 0.9730224609375, 1.008056640625, 1.0430908203125, 1.078125, 1.1131591796875, 1.148193359375, 1.1832275390625, 1.21826171875, 1.2532958984375, 1.288330078125, 1.3233642578125, 1.3583984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 3.0, 10.0, 15.0, 11.0, 12.0, 18.0, 21.0, 35.0, 49.0, 57.0, 79.0, 97.0, 112.0, 99.0, 88.0, 64.0, 45.0, 34.0, 28.0, 28.0, 23.0, 15.0, 12.0, 8.0, 3.0, 10.0, 5.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.821487426757812e-05, -8.568447083234787e-05, -8.315406739711761e-05, -8.062366396188736e-05, -7.80932605266571e-05, -7.556285709142685e-05, -7.30324536561966e-05, -7.050205022096634e-05, -6.797164678573608e-05, -6.544124335050583e-05, -6.291083991527557e-05, -6.038043648004532e-05, -5.7850033044815063e-05, -5.531962960958481e-05, -5.278922617435455e-05, -5.02588227391243e-05, -4.772841930389404e-05, -4.519801586866379e-05, -4.266761243343353e-05, -4.013720899820328e-05, -3.760680556297302e-05, -3.507640212774277e-05, -3.254599869251251e-05, -3.0015595257282257e-05, -2.7485191822052002e-05, -2.4954788386821747e-05, -2.2424384951591492e-05, -1.9893981516361237e-05, -1.736357808113098e-05, -1.4833174645900726e-05, -1.2302771210670471e-05, -9.772367775440216e-06, -7.241964340209961e-06, -4.711560904979706e-06, -2.1811574697494507e-06, 3.4924596548080444e-07, 2.8796494007110596e-06, 5.410052835941315e-06, 7.94045627117157e-06, 1.0470859706401825e-05, 1.300126314163208e-05, 1.5531666576862335e-05, 1.806207001209259e-05, 2.0592473447322845e-05, 2.31228768825531e-05, 2.5653280317783356e-05, 2.818368375301361e-05, 3.0714087188243866e-05, 3.324449062347412e-05, 3.5774894058704376e-05, 3.830529749393463e-05, 4.0835700929164886e-05, 4.336610436439514e-05, 4.58965077996254e-05, 4.842691123485565e-05, 5.095731467008591e-05, 5.348771810531616e-05, 5.601812154054642e-05, 5.854852497577667e-05, 6.107892841100693e-05, 6.360933184623718e-05, 6.613973528146744e-05, 6.867013871669769e-05, 7.120054215192795e-05, 7.37309455871582e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 12.0, 11.0, 39.0, 55.0, 78.0, 149.0, 315.0, 672.0, 1757.0, 5605.0, 24293.0, 239671.0, 689483.0, 70054.0, 11267.0, 3022.0, 1078.0, 479.0, 212.0, 123.0, 54.0, 41.0, 25.0, 16.0, 16.0, 5.0, 5.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78759765625, -0.7551345825195312, -0.7226715087890625, -0.6902084350585938, -0.657745361328125, -0.6252822875976562, -0.5928192138671875, -0.5603561401367188, -0.52789306640625, -0.49542999267578125, -0.4629669189453125, -0.43050384521484375, -0.398040771484375, -0.36557769775390625, -0.3331146240234375, -0.30065155029296875, -0.2681884765625, -0.23572540283203125, -0.2032623291015625, -0.17079925537109375, -0.138336181640625, -0.10587310791015625, -0.0734100341796875, -0.04094696044921875, -0.00848388671875, 0.02397918701171875, 0.0564422607421875, 0.08890533447265625, 0.121368408203125, 0.15383148193359375, 0.1862945556640625, 0.21875762939453125, 0.251220703125, 0.28368377685546875, 0.3161468505859375, 0.34860992431640625, 0.381072998046875, 0.41353607177734375, 0.4459991455078125, 0.47846221923828125, 0.51092529296875, 0.5433883666992188, 0.5758514404296875, 0.6083145141601562, 0.640777587890625, 0.6732406616210938, 0.7057037353515625, 0.7381668090820312, 0.7706298828125, 0.8030929565429688, 0.8355560302734375, 0.8680191040039062, 0.900482177734375, 0.9329452514648438, 0.9654083251953125, 0.9978713989257812, 1.03033447265625, 1.0627975463867188, 1.0952606201171875, 1.1277236938476562, 1.160186767578125, 1.1926498413085938, 1.2251129150390625, 1.2575759887695312, 1.2900390625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 9.0, 5.0, 7.0, 10.0, 19.0, 19.0, 33.0, 37.0, 51.0, 82.0, 111.0, 120.0, 119.0, 105.0, 78.0, 51.0, 48.0, 31.0, 19.0, 14.0, 8.0, 5.0, 2.0, 8.0, 4.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.43115234375, -0.41509246826171875, -0.3990325927734375, -0.38297271728515625, -0.366912841796875, -0.35085296630859375, -0.3347930908203125, -0.31873321533203125, -0.30267333984375, -0.28661346435546875, -0.2705535888671875, -0.25449371337890625, -0.238433837890625, -0.22237396240234375, -0.2063140869140625, -0.19025421142578125, -0.1741943359375, -0.15813446044921875, -0.1420745849609375, -0.12601470947265625, -0.109954833984375, -0.09389495849609375, -0.0778350830078125, -0.06177520751953125, -0.04571533203125, -0.02965545654296875, -0.0135955810546875, 0.00246429443359375, 0.018524169921875, 0.03458404541015625, 0.0506439208984375, 0.06670379638671875, 0.082763671875, 0.09882354736328125, 0.1148834228515625, 0.13094329833984375, 0.147003173828125, 0.16306304931640625, 0.1791229248046875, 0.19518280029296875, 0.21124267578125, 0.22730255126953125, 0.2433624267578125, 0.25942230224609375, 0.275482177734375, 0.29154205322265625, 0.3076019287109375, 0.32366180419921875, 0.3397216796875, 0.35578155517578125, 0.3718414306640625, 0.38790130615234375, 0.403961181640625, 0.42002105712890625, 0.4360809326171875, 0.45214080810546875, 0.46820068359375, 0.48426055908203125, 0.5003204345703125, 0.5163803100585938, 0.532440185546875, 0.5485000610351562, 0.5645599365234375, 0.5806198120117188, 0.5966796875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 23.0, 45.0, 152.0, 323.0, 328.0, 94.0, 22.0, 10.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.024442672729492, -12.559853553771973, -12.095263481140137, -11.630674362182617, -11.166084289550781, -10.701495170593262, -10.236906051635742, -9.772315979003906, -9.307726860046387, -8.843137741088867, -8.378547668457031, -7.913958549499512, -7.449368953704834, -6.984779357910156, -6.5201897621154785, -6.055600166320801, -5.591010570526123, -5.126420974731445, -4.661831378936768, -4.19724178314209, -3.7326526641845703, -3.2680630683898926, -2.803473472595215, -2.338884115219116, -1.8742945194244385, -1.4097050428390503, -0.9451155066490173, -0.4805259704589844, -0.01593649387359619, 0.448652982711792, 0.9132425785064697, 1.3778319358825684, 1.842421531677246, 2.307011127471924, 2.7716004848480225, 3.2361900806427, 3.700779438018799, 4.165369033813477, 4.629958629608154, 5.094548225402832, 5.559137344360352, 6.023726940155029, 6.488316535949707, 6.952905654907227, 7.417495250701904, 7.882084846496582, 8.346673965454102, 8.811264038085938, 9.275854110717773, 9.740443229675293, 10.205033302307129, 10.669622421264648, 11.134212493896484, 11.598801612854004, 12.063390731811523, 12.52798080444336, 12.992569923400879, 13.457159042358398, 13.921749114990234, 14.386338233947754, 14.85092830657959, 15.31551742553711, 15.780107498168945, 16.24469566345215, 16.709285736083984]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 6.0, 8.0, 9.0, 10.0, 18.0, 22.0, 20.0, 21.0, 31.0, 39.0, 43.0, 36.0, 58.0, 58.0, 59.0, 82.0, 34.0, 64.0, 58.0, 41.0, 45.0, 38.0, 39.0, 30.0, 30.0, 22.0, 15.0, 16.0, 12.0, 8.0, 7.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.738967418670654, -5.582995414733887, -5.427023887634277, -5.27105188369751, -5.115079879760742, -4.959107875823975, -4.803136348724365, -4.647164344787598, -4.49119234085083, -4.3352203369140625, -4.179248809814453, -4.0232768058776855, -3.867304801940918, -3.7113330364227295, -3.555361270904541, -3.3993892669677734, -3.243417501449585, -3.0874457359313965, -2.931473731994629, -2.7755019664764404, -2.619529962539673, -2.4635581970214844, -2.307586193084717, -2.1516144275665283, -1.9956425428390503, -1.8396706581115723, -1.6836987733840942, -1.5277268886566162, -1.3717551231384277, -1.2157831192016602, -1.0598113536834717, -0.9038394689559937, -0.7478675842285156, -0.5918956995010376, -0.43592384457588196, -0.2799519896507263, -0.12398010492324829, 0.031991779804229736, 0.187963604927063, 0.343935489654541, 0.49990737438201904, 0.6558792591094971, 0.8118511438369751, 0.9678229689598083, 1.1237947940826416, 1.2797667980194092, 1.4357385635375977, 1.5917104482650757, 1.7476823329925537, 1.9036542177200317, 2.0596261024475098, 2.2155978679656982, 2.371569871902466, 2.5275416374206543, 2.683513641357422, 2.8394854068756104, 2.995457172393799, 3.1514289379119873, 3.307400941848755, 3.4633727073669434, 3.619344711303711, 3.7753164768218994, 3.931288242340088, 4.0872602462768555, 4.243232250213623]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 10.0, 12.0, 13.0, 14.0, 29.0, 51.0, 63.0, 200.0, 511.0, 1939.0, 11098.0, 131150.0, 3936007.0, 99706.0, 9707.0, 2181.0, 659.0, 313.0, 167.0, 118.0, 80.0, 58.0, 48.0, 28.0, 22.0, 16.0, 14.0, 14.0, 8.0, 6.0, 8.0, 5.0, 4.0, 3.0, 2.0, 5.0, 7.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.912109375, -2.813262939453125, -2.71441650390625, -2.615570068359375, -2.5167236328125, -2.417877197265625, -2.31903076171875, -2.220184326171875, -2.121337890625, -2.022491455078125, -1.92364501953125, -1.824798583984375, -1.7259521484375, -1.627105712890625, -1.52825927734375, -1.429412841796875, -1.33056640625, -1.231719970703125, -1.13287353515625, -1.034027099609375, -0.9351806640625, -0.836334228515625, -0.73748779296875, -0.638641357421875, -0.539794921875, -0.440948486328125, -0.34210205078125, -0.243255615234375, -0.1444091796875, -0.045562744140625, 0.05328369140625, 0.152130126953125, 0.2509765625, 0.349822998046875, 0.44866943359375, 0.547515869140625, 0.6463623046875, 0.745208740234375, 0.84405517578125, 0.942901611328125, 1.041748046875, 1.140594482421875, 1.23944091796875, 1.338287353515625, 1.4371337890625, 1.535980224609375, 1.63482666015625, 1.733673095703125, 1.83251953125, 1.931365966796875, 2.03021240234375, 2.129058837890625, 2.2279052734375, 2.326751708984375, 2.42559814453125, 2.524444580078125, 2.623291015625, 2.722137451171875, 2.82098388671875, 2.919830322265625, 3.0186767578125, 3.117523193359375, 3.21636962890625, 3.315216064453125, 3.4140625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 11.0, 15.0, 24.0, 47.0, 72.0, 91.0, 151.0, 147.0, 133.0, 116.0, 86.0, 47.0, 33.0, 19.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17626953125, -0.16504669189453125, -0.1538238525390625, -0.14260101318359375, -0.131378173828125, -0.12015533447265625, -0.1089324951171875, -0.09770965576171875, -0.08648681640625, -0.07526397705078125, -0.0640411376953125, -0.05281829833984375, -0.041595458984375, -0.03037261962890625, -0.0191497802734375, -0.00792694091796875, 0.0032958984375, 0.01451873779296875, 0.0257415771484375, 0.03696441650390625, 0.048187255859375, 0.05941009521484375, 0.0706329345703125, 0.08185577392578125, 0.09307861328125, 0.10430145263671875, 0.1155242919921875, 0.12674713134765625, 0.137969970703125, 0.14919281005859375, 0.1604156494140625, 0.17163848876953125, 0.182861328125, 0.19408416748046875, 0.2053070068359375, 0.21652984619140625, 0.227752685546875, 0.23897552490234375, 0.2501983642578125, 0.26142120361328125, 0.27264404296875, 0.28386688232421875, 0.2950897216796875, 0.30631256103515625, 0.317535400390625, 0.32875823974609375, 0.3399810791015625, 0.35120391845703125, 0.3624267578125, 0.37364959716796875, 0.3848724365234375, 0.39609527587890625, 0.407318115234375, 0.41854095458984375, 0.4297637939453125, 0.44098663330078125, 0.45220947265625, 0.46343231201171875, 0.4746551513671875, 0.48587799072265625, 0.497100830078125, 0.5083236694335938, 0.5195465087890625, 0.5307693481445312, 0.5419921875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 27.0, 83.0, 266.0, 1973.0, 4183373.0, 7582.0, 637.0, 203.0, 83.0, 30.0, 13.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.71484375, -5.22393798828125, -4.7330322265625, -4.24212646484375, -3.751220703125, -3.26031494140625, -2.7694091796875, -2.27850341796875, -1.78759765625, -1.29669189453125, -0.8057861328125, -0.31488037109375, 0.176025390625, 0.66693115234375, 1.1578369140625, 1.64874267578125, 2.1396484375, 2.63055419921875, 3.1214599609375, 3.61236572265625, 4.103271484375, 4.59417724609375, 5.0850830078125, 5.57598876953125, 6.06689453125, 6.55780029296875, 7.0487060546875, 7.53961181640625, 8.030517578125, 8.52142333984375, 9.0123291015625, 9.50323486328125, 9.994140625, 10.48504638671875, 10.9759521484375, 11.46685791015625, 11.957763671875, 12.44866943359375, 12.9395751953125, 13.43048095703125, 13.92138671875, 14.41229248046875, 14.9031982421875, 15.39410400390625, 15.885009765625, 16.37591552734375, 16.8668212890625, 17.35772705078125, 17.8486328125, 18.33953857421875, 18.8304443359375, 19.32135009765625, 19.812255859375, 20.30316162109375, 20.7940673828125, 21.28497314453125, 21.77587890625, 22.26678466796875, 22.7576904296875, 23.24859619140625, 23.739501953125, 24.23040771484375, 24.7213134765625, 25.21221923828125, 25.703125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 8.0, 18.0, 40.0, 144.0, 1001.0, 2593.0, 196.0, 51.0, 20.0, 9.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3701171875, -0.3294219970703125, -0.288726806640625, -0.2480316162109375, -0.20733642578125, -0.1666412353515625, -0.125946044921875, -0.0852508544921875, -0.0445556640625, -0.0038604736328125, 0.036834716796875, 0.0775299072265625, 0.11822509765625, 0.1589202880859375, 0.199615478515625, 0.2403106689453125, 0.281005859375, 0.3217010498046875, 0.362396240234375, 0.4030914306640625, 0.44378662109375, 0.4844818115234375, 0.525177001953125, 0.5658721923828125, 0.6065673828125, 0.6472625732421875, 0.687957763671875, 0.7286529541015625, 0.76934814453125, 0.8100433349609375, 0.850738525390625, 0.8914337158203125, 0.93212890625, 0.9728240966796875, 1.013519287109375, 1.0542144775390625, 1.09490966796875, 1.1356048583984375, 1.176300048828125, 1.2169952392578125, 1.2576904296875, 1.2983856201171875, 1.339080810546875, 1.3797760009765625, 1.42047119140625, 1.4611663818359375, 1.501861572265625, 1.5425567626953125, 1.583251953125, 1.6239471435546875, 1.664642333984375, 1.7053375244140625, 1.74603271484375, 1.7867279052734375, 1.827423095703125, 1.8681182861328125, 1.9088134765625, 1.9495086669921875, 1.990203857421875, 2.0308990478515625, 2.07159423828125, 2.1122894287109375, 2.152984619140625, 2.1936798095703125, 2.234375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 11.0, 86.0, 735.0, 155.0, 22.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.332279205322266, -23.731731414794922, -23.13118553161621, -22.530637741088867, -21.930091857910156, -21.329544067382812, -20.72899627685547, -20.128448486328125, -19.527902603149414, -18.92735481262207, -18.32680892944336, -17.726261138916016, -17.125713348388672, -16.52516746520996, -15.924619674682617, -15.32407283782959, -14.723526000976562, -14.122979164123535, -13.522432327270508, -12.921884536743164, -12.321337699890137, -11.72079086303711, -11.120243072509766, -10.519696235656738, -9.919149398803711, -9.318602561950684, -8.718055725097656, -8.117507934570312, -7.516961097717285, -6.916414260864258, -6.315866947174072, -5.715319633483887, -5.114770889282227, -4.514224052429199, -3.9136767387390137, -3.3131296634674072, -2.712582588195801, -2.1120355129241943, -1.511488437652588, -0.9109411239624023, -0.310394287109375, 0.29015278816223145, 0.8906998634338379, 1.4912469387054443, 2.091794013977051, 2.6923410892486572, 3.2928881645202637, 3.893435478210449, 4.493982315063477, 5.094529151916504, 5.6950764656066895, 6.295623779296875, 6.896170616149902, 7.49671745300293, 8.097265243530273, 8.6978120803833, 9.298358917236328, 9.898905754089355, 10.499452590942383, 11.100000381469727, 11.700547218322754, 12.301094055175781, 12.901641845703125, 13.502188682556152, 14.10273551940918]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 15.0, 31.0, 53.0, 50.0, 71.0, 95.0, 99.0, 99.0, 115.0, 105.0, 77.0, 61.0, 55.0, 27.0, 18.0, 10.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.00167989730835, -4.837448596954346, -4.673216819763184, -4.50898551940918, -4.344754219055176, -4.180522918701172, -4.016291618347168, -3.852059841156006, -3.687828540802002, -3.523597240447998, -3.359365701675415, -3.195134162902832, -3.030902862548828, -2.866671562194824, -2.702440023422241, -2.538208484649658, -2.3739771842956543, -2.2097458839416504, -2.0455143451690674, -1.881282925605774, -1.7170515060424805, -1.552820086479187, -1.3885886669158936, -1.2243572473526, -1.0601258277893066, -0.8958944082260132, -0.7316629886627197, -0.5674315690994263, -0.4032001495361328, -0.23896872997283936, -0.0747373104095459, 0.08949410915374756, 0.2537250518798828, 0.41795647144317627, 0.5821878910064697, 0.7464193105697632, 0.9106507301330566, 1.07488214969635, 1.2391135692596436, 1.403344988822937, 1.5675764083862305, 1.731807827949524, 1.8960392475128174, 2.0602707862854004, 2.2245020866394043, 2.388733386993408, 2.552964925765991, 2.717196464538574, 2.881427764892578, 3.045659065246582, 3.209890604019165, 3.374122142791748, 3.538353443145752, 3.702584743499756, 3.866816282272339, 4.031047821044922, 4.195279121398926, 4.35951042175293, 4.523741722106934, 4.687973499298096, 4.8522047996521, 5.0164361000061035, 5.180667877197266, 5.3448991775512695, 5.509130477905273]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 9.0, 8.0, 6.0, 15.0, 17.0, 18.0, 43.0, 48.0, 56.0, 65.0, 97.0, 141.0, 183.0, 297.0, 524.0, 1000.0, 2419.0, 7225.0, 29141.0, 173827.0, 634736.0, 159537.0, 27498.0, 6891.0, 2279.0, 994.0, 503.0, 309.0, 183.0, 127.0, 99.0, 69.0, 43.0, 43.0, 18.0, 18.0, 15.0, 17.0, 9.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.16015625, -2.097503662109375, -2.03485107421875, -1.972198486328125, -1.9095458984375, -1.846893310546875, -1.78424072265625, -1.721588134765625, -1.658935546875, -1.596282958984375, -1.53363037109375, -1.470977783203125, -1.4083251953125, -1.345672607421875, -1.28302001953125, -1.220367431640625, -1.15771484375, -1.095062255859375, -1.03240966796875, -0.969757080078125, -0.9071044921875, -0.844451904296875, -0.78179931640625, -0.719146728515625, -0.656494140625, -0.593841552734375, -0.53118896484375, -0.468536376953125, -0.4058837890625, -0.343231201171875, -0.28057861328125, -0.217926025390625, -0.1552734375, -0.092620849609375, -0.02996826171875, 0.032684326171875, 0.0953369140625, 0.157989501953125, 0.22064208984375, 0.283294677734375, 0.345947265625, 0.408599853515625, 0.47125244140625, 0.533905029296875, 0.5965576171875, 0.659210205078125, 0.72186279296875, 0.784515380859375, 0.84716796875, 0.909820556640625, 0.97247314453125, 1.035125732421875, 1.0977783203125, 1.160430908203125, 1.22308349609375, 1.285736083984375, 1.348388671875, 1.411041259765625, 1.47369384765625, 1.536346435546875, 1.5989990234375, 1.661651611328125, 1.72430419921875, 1.786956787109375, 1.849609375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 9.0, 21.0, 32.0, 45.0, 55.0, 88.0, 84.0, 89.0, 118.0, 96.0, 93.0, 82.0, 63.0, 43.0, 28.0, 22.0, 10.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33447265625, -0.32141876220703125, -0.3083648681640625, -0.29531097412109375, -0.282257080078125, -0.26920318603515625, -0.2561492919921875, -0.24309539794921875, -0.23004150390625, -0.21698760986328125, -0.2039337158203125, -0.19087982177734375, -0.177825927734375, -0.16477203369140625, -0.1517181396484375, -0.13866424560546875, -0.1256103515625, -0.11255645751953125, -0.0995025634765625, -0.08644866943359375, -0.073394775390625, -0.06034088134765625, -0.0472869873046875, -0.03423309326171875, -0.02117919921875, -0.00812530517578125, 0.0049285888671875, 0.01798248291015625, 0.031036376953125, 0.04409027099609375, 0.0571441650390625, 0.07019805908203125, 0.083251953125, 0.09630584716796875, 0.1093597412109375, 0.12241363525390625, 0.135467529296875, 0.14852142333984375, 0.1615753173828125, 0.17462921142578125, 0.18768310546875, 0.20073699951171875, 0.2137908935546875, 0.22684478759765625, 0.239898681640625, 0.25295257568359375, 0.2660064697265625, 0.27906036376953125, 0.2921142578125, 0.30516815185546875, 0.3182220458984375, 0.33127593994140625, 0.344329833984375, 0.35738372802734375, 0.3704376220703125, 0.38349151611328125, 0.39654541015625, 0.40959930419921875, 0.4226531982421875, 0.43570709228515625, 0.448760986328125, 0.46181488037109375, 0.4748687744140625, 0.48792266845703125, 0.5009765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 8.0, 5.0, 15.0, 23.0, 28.0, 57.0, 90.0, 154.0, 391.0, 1044.0, 3329.0, 14706.0, 119519.0, 727403.0, 157939.0, 17883.0, 3913.0, 1155.0, 430.0, 196.0, 103.0, 50.0, 35.0, 22.0, 16.0, 8.0, 14.0, 2.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03515625, -1.9726409912109375, -1.910125732421875, -1.8476104736328125, -1.78509521484375, -1.7225799560546875, -1.660064697265625, -1.5975494384765625, -1.5350341796875, -1.4725189208984375, -1.410003662109375, -1.3474884033203125, -1.28497314453125, -1.2224578857421875, -1.159942626953125, -1.0974273681640625, -1.034912109375, -0.9723968505859375, -0.909881591796875, -0.8473663330078125, -0.78485107421875, -0.7223358154296875, -0.659820556640625, -0.5973052978515625, -0.5347900390625, -0.4722747802734375, -0.409759521484375, -0.3472442626953125, -0.28472900390625, -0.2222137451171875, -0.159698486328125, -0.0971832275390625, -0.03466796875, 0.0278472900390625, 0.090362548828125, 0.1528778076171875, 0.21539306640625, 0.2779083251953125, 0.340423583984375, 0.4029388427734375, 0.4654541015625, 0.5279693603515625, 0.590484619140625, 0.6529998779296875, 0.71551513671875, 0.7780303955078125, 0.840545654296875, 0.9030609130859375, 0.965576171875, 1.0280914306640625, 1.090606689453125, 1.1531219482421875, 1.21563720703125, 1.2781524658203125, 1.340667724609375, 1.4031829833984375, 1.4656982421875, 1.5282135009765625, 1.590728759765625, 1.6532440185546875, 1.71575927734375, 1.7782745361328125, 1.840789794921875, 1.9033050537109375, 1.9658203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 9.0, 9.0, 16.0, 22.0, 19.0, 26.0, 38.0, 40.0, 50.0, 60.0, 58.0, 64.0, 53.0, 68.0, 64.0, 60.0, 56.0, 64.0, 35.0, 40.0, 27.0, 27.0, 24.0, 9.0, 17.0, 5.0, 7.0, 4.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.123046875, -1.0867462158203125, -1.050445556640625, -1.0141448974609375, -0.97784423828125, -0.9415435791015625, -0.905242919921875, -0.8689422607421875, -0.8326416015625, -0.7963409423828125, -0.760040283203125, -0.7237396240234375, -0.68743896484375, -0.6511383056640625, -0.614837646484375, -0.5785369873046875, -0.542236328125, -0.5059356689453125, -0.469635009765625, -0.4333343505859375, -0.39703369140625, -0.3607330322265625, -0.324432373046875, -0.2881317138671875, -0.2518310546875, -0.2155303955078125, -0.179229736328125, -0.1429290771484375, -0.10662841796875, -0.0703277587890625, -0.034027099609375, 0.0022735595703125, 0.03857421875, 0.0748748779296875, 0.111175537109375, 0.1474761962890625, 0.18377685546875, 0.2200775146484375, 0.256378173828125, 0.2926788330078125, 0.3289794921875, 0.3652801513671875, 0.401580810546875, 0.4378814697265625, 0.47418212890625, 0.5104827880859375, 0.546783447265625, 0.5830841064453125, 0.619384765625, 0.6556854248046875, 0.691986083984375, 0.7282867431640625, 0.76458740234375, 0.8008880615234375, 0.837188720703125, 0.8734893798828125, 0.9097900390625, 0.9460906982421875, 0.982391357421875, 1.0186920166015625, 1.05499267578125, 1.0912933349609375, 1.127593994140625, 1.1638946533203125, 1.2001953125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 10.0, 16.0, 26.0, 26.0, 47.0, 119.0, 270.0, 712.0, 2849.0, 16103.0, 358638.0, 641017.0, 23550.0, 3671.0, 889.0, 308.0, 132.0, 59.0, 29.0, 19.0, 15.0, 6.0, 10.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98876953125, -0.9459457397460938, -0.9031219482421875, -0.8602981567382812, -0.817474365234375, -0.7746505737304688, -0.7318267822265625, -0.6890029907226562, -0.64617919921875, -0.6033554077148438, -0.5605316162109375, -0.5177078247070312, -0.474884033203125, -0.43206024169921875, -0.3892364501953125, -0.34641265869140625, -0.3035888671875, -0.26076507568359375, -0.2179412841796875, -0.17511749267578125, -0.132293701171875, -0.08946990966796875, -0.0466461181640625, -0.00382232666015625, 0.03900146484375, 0.08182525634765625, 0.1246490478515625, 0.16747283935546875, 0.210296630859375, 0.25312042236328125, 0.2959442138671875, 0.33876800537109375, 0.381591796875, 0.42441558837890625, 0.4672393798828125, 0.5100631713867188, 0.552886962890625, 0.5957107543945312, 0.6385345458984375, 0.6813583374023438, 0.72418212890625, 0.7670059204101562, 0.8098297119140625, 0.8526535034179688, 0.895477294921875, 0.9383010864257812, 0.9811248779296875, 1.0239486694335938, 1.0667724609375, 1.1095962524414062, 1.1524200439453125, 1.1952438354492188, 1.238067626953125, 1.2808914184570312, 1.3237152099609375, 1.3665390014648438, 1.40936279296875, 1.4521865844726562, 1.4950103759765625, 1.5378341674804688, 1.580657958984375, 1.6234817504882812, 1.6663055419921875, 1.7091293334960938, 1.751953125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 4.0, 2.0, 4.0, 6.0, 5.0, 2.0, 10.0, 5.0, 12.0, 21.0, 23.0, 30.0, 41.0, 67.0, 78.0, 97.0, 88.0, 86.0, 100.0, 74.0, 68.0, 49.0, 30.0, 28.0, 23.0, 12.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.539987564086914e-05, -7.288530468940735e-05, -7.037073373794556e-05, -6.785616278648376e-05, -6.534159183502197e-05, -6.282702088356018e-05, -6.031244993209839e-05, -5.77978789806366e-05, -5.5283308029174805e-05, -5.276873707771301e-05, -5.025416612625122e-05, -4.773959517478943e-05, -4.522502422332764e-05, -4.2710453271865845e-05, -4.019588232040405e-05, -3.768131136894226e-05, -3.516674041748047e-05, -3.265216946601868e-05, -3.0137598514556885e-05, -2.7623027563095093e-05, -2.51084566116333e-05, -2.259388566017151e-05, -2.0079314708709717e-05, -1.7564743757247925e-05, -1.5050172805786133e-05, -1.253560185432434e-05, -1.0021030902862549e-05, -7.506459951400757e-06, -4.991888999938965e-06, -2.477318048477173e-06, 3.725290298461914e-08, 2.551823854446411e-06, 5.066394805908203e-06, 7.580965757369995e-06, 1.0095536708831787e-05, 1.2610107660293579e-05, 1.5124678611755371e-05, 1.7639249563217163e-05, 2.0153820514678955e-05, 2.2668391466140747e-05, 2.518296241760254e-05, 2.769753336906433e-05, 3.0212104320526123e-05, 3.2726675271987915e-05, 3.524124622344971e-05, 3.77558171749115e-05, 4.027038812637329e-05, 4.278495907783508e-05, 4.5299530029296875e-05, 4.781410098075867e-05, 5.032867193222046e-05, 5.284324288368225e-05, 5.535781383514404e-05, 5.7872384786605835e-05, 6.038695573806763e-05, 6.290152668952942e-05, 6.541609764099121e-05, 6.7930668592453e-05, 7.04452395439148e-05, 7.295981049537659e-05, 7.547438144683838e-05, 7.798895239830017e-05, 8.050352334976196e-05, 8.301809430122375e-05, 8.553266525268555e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 8.0, 12.0, 11.0, 24.0, 26.0, 48.0, 65.0, 125.0, 196.0, 331.0, 620.0, 1367.0, 3114.0, 8710.0, 33315.0, 321219.0, 599447.0, 59333.0, 12808.0, 4217.0, 1744.0, 782.0, 383.0, 237.0, 121.0, 96.0, 52.0, 26.0, 33.0, 18.0, 18.0, 7.0, 9.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.673828125, -0.6480712890625, -0.622314453125, -0.5965576171875, -0.57080078125, -0.5450439453125, -0.519287109375, -0.4935302734375, -0.4677734375, -0.4420166015625, -0.416259765625, -0.3905029296875, -0.36474609375, -0.3389892578125, -0.313232421875, -0.2874755859375, -0.26171875, -0.2359619140625, -0.210205078125, -0.1844482421875, -0.15869140625, -0.1329345703125, -0.107177734375, -0.0814208984375, -0.0556640625, -0.0299072265625, -0.004150390625, 0.0216064453125, 0.04736328125, 0.0731201171875, 0.098876953125, 0.1246337890625, 0.150390625, 0.1761474609375, 0.201904296875, 0.2276611328125, 0.25341796875, 0.2791748046875, 0.304931640625, 0.3306884765625, 0.3564453125, 0.3822021484375, 0.407958984375, 0.4337158203125, 0.45947265625, 0.4852294921875, 0.510986328125, 0.5367431640625, 0.5625, 0.5882568359375, 0.614013671875, 0.6397705078125, 0.66552734375, 0.6912841796875, 0.717041015625, 0.7427978515625, 0.7685546875, 0.7943115234375, 0.820068359375, 0.8458251953125, 0.87158203125, 0.8973388671875, 0.923095703125, 0.9488525390625, 0.974609375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 1.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 7.0, 12.0, 21.0, 18.0, 29.0, 42.0, 64.0, 79.0, 90.0, 93.0, 110.0, 94.0, 77.0, 68.0, 49.0, 39.0, 19.0, 20.0, 18.0, 12.0, 4.0, 6.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.355224609375, -0.3392066955566406, -0.32318878173828125, -0.3071708679199219, -0.2911529541015625, -0.2751350402832031, -0.25911712646484375, -0.24309921264648438, -0.227081298828125, -0.21106338500976562, -0.19504547119140625, -0.17902755737304688, -0.1630096435546875, -0.14699172973632812, -0.13097381591796875, -0.11495590209960938, -0.09893798828125, -0.08292007446289062, -0.06690216064453125, -0.050884246826171875, -0.0348663330078125, -0.018848419189453125, -0.00283050537109375, 0.013187408447265625, 0.029205322265625, 0.045223236083984375, 0.06124114990234375, 0.07725906372070312, 0.0932769775390625, 0.10929489135742188, 0.12531280517578125, 0.14133071899414062, 0.1573486328125, 0.17336654663085938, 0.18938446044921875, 0.20540237426757812, 0.2214202880859375, 0.23743820190429688, 0.25345611572265625, 0.2694740295410156, 0.285491943359375, 0.3015098571777344, 0.31752777099609375, 0.3335456848144531, 0.3495635986328125, 0.3655815124511719, 0.38159942626953125, 0.3976173400878906, 0.41363525390625, 0.4296531677246094, 0.44567108154296875, 0.4616889953613281, 0.4777069091796875, 0.4937248229980469, 0.5097427368164062, 0.5257606506347656, 0.541778564453125, 0.5577964782714844, 0.5738143920898438, 0.5898323059082031, 0.6058502197265625, 0.6218681335449219, 0.6378860473632812, 0.6539039611816406, 0.669921875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 26.0, 46.0, 159.0, 268.0, 284.0, 116.0, 50.0, 22.0, 10.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.436612606048584, -7.024399280548096, -6.612185478210449, -6.199972152709961, -5.787758827209473, -5.375545501708984, -4.963331699371338, -4.55111837387085, -4.138904571533203, -3.7266910076141357, -3.3144776821136475, -2.90226411819458, -2.490050792694092, -2.0778372287750244, -1.665623664855957, -1.2534103393554688, -0.8411970138549805, -0.42898353934288025, -0.01677006483078003, 0.3954434394836426, 0.8076568841934204, 1.2198703289031982, 1.6320838928222656, 2.044297218322754, 2.4565107822418213, 2.8687243461608887, 3.280937671661377, 3.6931512355804443, 4.105364799499512, 4.517578125, 4.929791450500488, 5.342004776000977, 5.754218101501465, 6.166431427001953, 6.5786452293396, 6.990858554840088, 7.403071880340576, 7.815285682678223, 8.227499008178711, 8.6397123336792, 9.051925659179688, 9.464138984680176, 9.876352310180664, 10.288566589355469, 10.700779914855957, 11.112993240356445, 11.525206565856934, 11.937419891357422, 12.349634170532227, 12.761847496032715, 13.174060821533203, 13.586275100708008, 13.998488426208496, 14.410701751708984, 14.822915077209473, 15.235128402709961, 15.64734172821045, 16.059555053710938, 16.471769332885742, 16.883981704711914, 17.29619598388672, 17.70840835571289, 18.120622634887695, 18.5328369140625, 18.945049285888672]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 4.0, 10.0, 9.0, 9.0, 17.0, 18.0, 24.0, 24.0, 33.0, 27.0, 40.0, 42.0, 50.0, 55.0, 53.0, 46.0, 44.0, 62.0, 51.0, 50.0, 58.0, 39.0, 29.0, 41.0, 26.0, 22.0, 32.0, 13.0, 10.0, 13.0, 13.0, 8.0, 9.0, 1.0, 8.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.575725555419922, -5.390859603881836, -5.205993175506592, -5.021126747131348, -4.836260795593262, -4.651394844055176, -4.466528415679932, -4.2816619873046875, -4.096796035766602, -3.9119298458099365, -3.7270636558532715, -3.5421974658966064, -3.3573312759399414, -3.1724650859832764, -2.9875988960266113, -2.8027327060699463, -2.6178665161132812, -2.433000326156616, -2.248134136199951, -2.063267946243286, -1.878401756286621, -1.693535566329956, -1.508669376373291, -1.323803186416626, -1.138936996459961, -0.9540708065032959, -0.7692046165466309, -0.5843384265899658, -0.3994722366333008, -0.21460604667663574, -0.029739856719970703, 0.15512633323669434, 0.3399925231933594, 0.5248587131500244, 0.7097249031066895, 0.8945910930633545, 1.0794572830200195, 1.2643234729766846, 1.4491896629333496, 1.6340558528900146, 1.8189220428466797, 2.0037882328033447, 2.1886544227600098, 2.373520612716675, 2.55838680267334, 2.743252992630005, 2.92811918258667, 3.112985372543335, 3.2978515625, 3.482717752456665, 3.66758394241333, 3.852450132369995, 4.03731632232666, 4.222182273864746, 4.40704870223999, 4.591915130615234, 4.77678108215332, 4.961647033691406, 5.14651346206665, 5.3313798904418945, 5.5162458419799805, 5.701111793518066, 5.8859782218933105, 6.070844650268555, 6.255710601806641]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 1.0, 7.0, 7.0, 11.0, 21.0, 22.0, 51.0, 75.0, 133.0, 279.0, 629.0, 1663.0, 6608.0, 49879.0, 3829284.0, 281969.0, 17265.0, 3820.0, 1234.0, 582.0, 263.0, 172.0, 101.0, 70.0, 32.0, 28.0, 20.0, 17.0, 8.0, 10.0, 3.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.23828125, -2.14788818359375, -2.0574951171875, -1.96710205078125, -1.876708984375, -1.78631591796875, -1.6959228515625, -1.60552978515625, -1.51513671875, -1.42474365234375, -1.3343505859375, -1.24395751953125, -1.153564453125, -1.06317138671875, -0.9727783203125, -0.88238525390625, -0.7919921875, -0.70159912109375, -0.6112060546875, -0.52081298828125, -0.430419921875, -0.34002685546875, -0.2496337890625, -0.15924072265625, -0.06884765625, 0.02154541015625, 0.1119384765625, 0.20233154296875, 0.292724609375, 0.38311767578125, 0.4735107421875, 0.56390380859375, 0.654296875, 0.74468994140625, 0.8350830078125, 0.92547607421875, 1.015869140625, 1.10626220703125, 1.1966552734375, 1.28704833984375, 1.37744140625, 1.46783447265625, 1.5582275390625, 1.64862060546875, 1.739013671875, 1.82940673828125, 1.9197998046875, 2.01019287109375, 2.1005859375, 2.19097900390625, 2.2813720703125, 2.37176513671875, 2.462158203125, 2.55255126953125, 2.6429443359375, 2.73333740234375, 2.82373046875, 2.91412353515625, 3.0045166015625, 3.09490966796875, 3.185302734375, 3.27569580078125, 3.3660888671875, 3.45648193359375, 3.546875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 11.0, 22.0, 27.0, 48.0, 58.0, 83.0, 59.0, 75.0, 91.0, 86.0, 69.0, 97.0, 60.0, 60.0, 45.0, 34.0, 16.0, 18.0, 8.0, 10.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26318359375, -0.2513275146484375, -0.239471435546875, -0.2276153564453125, -0.21575927734375, -0.2039031982421875, -0.192047119140625, -0.1801910400390625, -0.1683349609375, -0.1564788818359375, -0.144622802734375, -0.1327667236328125, -0.12091064453125, -0.1090545654296875, -0.097198486328125, -0.0853424072265625, -0.073486328125, -0.0616302490234375, -0.049774169921875, -0.0379180908203125, -0.02606201171875, -0.0142059326171875, -0.002349853515625, 0.0095062255859375, 0.0213623046875, 0.0332183837890625, 0.045074462890625, 0.0569305419921875, 0.06878662109375, 0.0806427001953125, 0.092498779296875, 0.1043548583984375, 0.1162109375, 0.1280670166015625, 0.139923095703125, 0.1517791748046875, 0.16363525390625, 0.1754913330078125, 0.187347412109375, 0.1992034912109375, 0.2110595703125, 0.2229156494140625, 0.234771728515625, 0.2466278076171875, 0.25848388671875, 0.2703399658203125, 0.282196044921875, 0.2940521240234375, 0.305908203125, 0.3177642822265625, 0.329620361328125, 0.3414764404296875, 0.35333251953125, 0.3651885986328125, 0.377044677734375, 0.3889007568359375, 0.4007568359375, 0.4126129150390625, 0.424468994140625, 0.4363250732421875, 0.44818115234375, 0.4600372314453125, 0.471893310546875, 0.4837493896484375, 0.49560546875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 9.0, 36.0, 83.0, 179.0, 475.0, 6755.0, 4180495.0, 5601.0, 406.0, 144.0, 64.0, 26.0, 11.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1796875, -10.8646240234375, -10.549560546875, -10.2344970703125, -9.91943359375, -9.6043701171875, -9.289306640625, -8.9742431640625, -8.6591796875, -8.3441162109375, -8.029052734375, -7.7139892578125, -7.39892578125, -7.0838623046875, -6.768798828125, -6.4537353515625, -6.138671875, -5.8236083984375, -5.508544921875, -5.1934814453125, -4.87841796875, -4.5633544921875, -4.248291015625, -3.9332275390625, -3.6181640625, -3.3031005859375, -2.988037109375, -2.6729736328125, -2.35791015625, -2.0428466796875, -1.727783203125, -1.4127197265625, -1.09765625, -0.7825927734375, -0.467529296875, -0.1524658203125, 0.16259765625, 0.4776611328125, 0.792724609375, 1.1077880859375, 1.4228515625, 1.7379150390625, 2.052978515625, 2.3680419921875, 2.68310546875, 2.9981689453125, 3.313232421875, 3.6282958984375, 3.943359375, 4.2584228515625, 4.573486328125, 4.8885498046875, 5.20361328125, 5.5186767578125, 5.833740234375, 6.1488037109375, 6.4638671875, 6.7789306640625, 7.093994140625, 7.4090576171875, 7.72412109375, 8.0391845703125, 8.354248046875, 8.6693115234375, 8.984375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 21.0, 24.0, 109.0, 969.0, 2729.0, 166.0, 39.0, 18.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.65625, -1.6091156005859375, -1.561981201171875, -1.5148468017578125, -1.46771240234375, -1.4205780029296875, -1.373443603515625, -1.3263092041015625, -1.2791748046875, -1.2320404052734375, -1.184906005859375, -1.1377716064453125, -1.09063720703125, -1.0435028076171875, -0.996368408203125, -0.9492340087890625, -0.902099609375, -0.8549652099609375, -0.807830810546875, -0.7606964111328125, -0.71356201171875, -0.6664276123046875, -0.619293212890625, -0.5721588134765625, -0.5250244140625, -0.4778900146484375, -0.430755615234375, -0.3836212158203125, -0.33648681640625, -0.2893524169921875, -0.242218017578125, -0.1950836181640625, -0.14794921875, -0.1008148193359375, -0.053680419921875, -0.0065460205078125, 0.04058837890625, 0.0877227783203125, 0.134857177734375, 0.1819915771484375, 0.2291259765625, 0.2762603759765625, 0.323394775390625, 0.3705291748046875, 0.41766357421875, 0.4647979736328125, 0.511932373046875, 0.5590667724609375, 0.606201171875, 0.6533355712890625, 0.700469970703125, 0.7476043701171875, 0.79473876953125, 0.8418731689453125, 0.889007568359375, 0.9361419677734375, 0.9832763671875, 1.0304107666015625, 1.077545166015625, 1.1246795654296875, 1.17181396484375, 1.2189483642578125, 1.266082763671875, 1.3132171630859375, 1.3603515625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 36.0, 873.0, 102.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.897687911987305, -11.181527137756348, -10.46536636352539, -9.74920654296875, -9.033045768737793, -8.316884994506836, -7.600724697113037, -6.884564399719238, -6.168403625488281, -5.452242851257324, -4.736082553863525, -4.019922256469727, -3.3037614822387695, -2.5876009464263916, -1.8714404106140137, -1.1552801132202148, -0.4391193389892578, 0.2770411968231201, 0.993201732635498, 1.709362268447876, 2.425522804260254, 3.141683340072632, 3.8578438758850098, 4.574004173278809, 5.290164947509766, 6.006325721740723, 6.7224860191345215, 7.43864631652832, 8.154807090759277, 8.870967864990234, 9.587127685546875, 10.303288459777832, 11.019447326660156, 11.735608100891113, 12.45176887512207, 13.167928695678711, 13.884089469909668, 14.600250244140625, 15.316410064697266, 16.032569885253906, 16.74873161315918, 17.46489143371582, 18.181053161621094, 18.897212982177734, 19.613372802734375, 20.32953453063965, 21.04569435119629, 21.761856079101562, 22.478015899658203, 23.194175720214844, 23.910337448120117, 24.626497268676758, 25.34265899658203, 26.058818817138672, 26.774978637695312, 27.491138458251953, 28.207300186157227, 28.923460006713867, 29.63962173461914, 30.35578155517578, 31.071941375732422, 31.788103103637695, 32.50426483154297, 33.22042465209961, 33.93658447265625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 8.0, 6.0, 13.0, 11.0, 21.0, 33.0, 34.0, 44.0, 54.0, 62.0, 65.0, 70.0, 79.0, 76.0, 109.0, 55.0, 54.0, 59.0, 32.0, 30.0, 24.0, 19.0, 11.0, 10.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7233878374099731, -1.6532824039459229, -1.583177089691162, -1.5130716562271118, -1.4429662227630615, -1.3728609085083008, -1.3027554750442505, -1.2326500415802002, -1.1625447273254395, -1.0924392938613892, -1.0223339796066284, -0.9522285461425781, -0.8821231126785278, -0.8120177388191223, -0.7419123649597168, -0.6718069314956665, -0.6017014980316162, -0.5315961241722107, -0.4614906907081604, -0.3913853168487549, -0.321279913187027, -0.2511745095252991, -0.18106913566589355, -0.11096373200416565, -0.040858328342437744, 0.029247067868709564, 0.09935246407985687, 0.16945785284042358, 0.2395632565021515, 0.3096686601638794, 0.3797740340232849, 0.4498794376850128, 0.5199849605560303, 0.5900903344154358, 0.6601957678794861, 0.7303011417388916, 0.8004065752029419, 0.8705119490623474, 0.9406173229217529, 1.0107227563858032, 1.0808281898498535, 1.1509336233139038, 1.2210389375686646, 1.2911443710327148, 1.3612498044967651, 1.4313552379608154, 1.5014605522155762, 1.5715659856796265, 1.6416712999343872, 1.7117767333984375, 1.7818820476531982, 1.8519874811172485, 1.9220929145812988, 1.9921982288360596, 2.0623035430908203, 2.13240909576416, 2.202514410018921, 2.2726197242736816, 2.3427252769470215, 2.4128305912017822, 2.482935905456543, 2.553041458129883, 2.6231467723846436, 2.6932520866394043, 2.763357639312744]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 13.0, 14.0, 25.0, 39.0, 47.0, 94.0, 136.0, 227.0, 508.0, 1033.0, 2826.0, 10538.0, 61153.0, 512379.0, 400469.0, 46146.0, 8553.0, 2319.0, 912.0, 446.0, 252.0, 148.0, 110.0, 51.0, 40.0, 28.0, 11.0, 9.0, 6.0, 8.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.921875, -2.8521881103515625, -2.782501220703125, -2.7128143310546875, -2.64312744140625, -2.5734405517578125, -2.503753662109375, -2.4340667724609375, -2.3643798828125, -2.2946929931640625, -2.225006103515625, -2.1553192138671875, -2.08563232421875, -2.0159454345703125, -1.946258544921875, -1.8765716552734375, -1.806884765625, -1.7371978759765625, -1.667510986328125, -1.5978240966796875, -1.52813720703125, -1.4584503173828125, -1.388763427734375, -1.3190765380859375, -1.2493896484375, -1.1797027587890625, -1.110015869140625, -1.0403289794921875, -0.97064208984375, -0.9009552001953125, -0.831268310546875, -0.7615814208984375, -0.69189453125, -0.6222076416015625, -0.552520751953125, -0.4828338623046875, -0.41314697265625, -0.3434600830078125, -0.273773193359375, -0.2040863037109375, -0.1343994140625, -0.0647125244140625, 0.004974365234375, 0.0746612548828125, 0.14434814453125, 0.2140350341796875, 0.283721923828125, 0.3534088134765625, 0.423095703125, 0.4927825927734375, 0.562469482421875, 0.6321563720703125, 0.70184326171875, 0.7715301513671875, 0.841217041015625, 0.9109039306640625, 0.9805908203125, 1.0502777099609375, 1.119964599609375, 1.1896514892578125, 1.25933837890625, 1.3290252685546875, 1.398712158203125, 1.4683990478515625, 1.5380859375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 3.0, 10.0, 18.0, 19.0, 28.0, 42.0, 37.0, 58.0, 61.0, 67.0, 68.0, 82.0, 87.0, 82.0, 65.0, 60.0, 42.0, 51.0, 33.0, 24.0, 24.0, 12.0, 5.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.267333984375, -0.2566261291503906, -0.24591827392578125, -0.23521041870117188, -0.2245025634765625, -0.21379470825195312, -0.20308685302734375, -0.19237899780273438, -0.181671142578125, -0.17096328735351562, -0.16025543212890625, -0.14954757690429688, -0.1388397216796875, -0.12813186645507812, -0.11742401123046875, -0.10671615600585938, -0.09600830078125, -0.08530044555664062, -0.07459259033203125, -0.06388473510742188, -0.0531768798828125, -0.042469024658203125, -0.03176116943359375, -0.021053314208984375, -0.010345458984375, 0.000362396240234375, 0.01107025146484375, 0.021778106689453125, 0.0324859619140625, 0.043193817138671875, 0.05390167236328125, 0.06460952758789062, 0.0753173828125, 0.08602523803710938, 0.09673309326171875, 0.10744094848632812, 0.1181488037109375, 0.12885665893554688, 0.13956451416015625, 0.15027236938476562, 0.160980224609375, 0.17168807983398438, 0.18239593505859375, 0.19310379028320312, 0.2038116455078125, 0.21451950073242188, 0.22522735595703125, 0.23593521118164062, 0.24664306640625, 0.2573509216308594, 0.26805877685546875, 0.2787666320800781, 0.2894744873046875, 0.3001823425292969, 0.31089019775390625, 0.3215980529785156, 0.332305908203125, 0.3430137634277344, 0.35372161865234375, 0.3644294738769531, 0.3751373291015625, 0.3858451843261719, 0.39655303955078125, 0.4072608947753906, 0.41796875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 7.0, 5.0, 8.0, 19.0, 20.0, 33.0, 51.0, 110.0, 176.0, 348.0, 846.0, 2189.0, 7319.0, 36794.0, 424333.0, 518540.0, 45351.0, 8123.0, 2490.0, 916.0, 395.0, 207.0, 107.0, 60.0, 32.0, 17.0, 21.0, 7.0, 7.0, 4.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9794921875, -1.9089202880859375, -1.838348388671875, -1.7677764892578125, -1.69720458984375, -1.6266326904296875, -1.556060791015625, -1.4854888916015625, -1.4149169921875, -1.3443450927734375, -1.273773193359375, -1.2032012939453125, -1.13262939453125, -1.0620574951171875, -0.991485595703125, -0.9209136962890625, -0.850341796875, -0.7797698974609375, -0.709197998046875, -0.6386260986328125, -0.56805419921875, -0.4974822998046875, -0.426910400390625, -0.3563385009765625, -0.2857666015625, -0.2151947021484375, -0.144622802734375, -0.0740509033203125, -0.00347900390625, 0.0670928955078125, 0.137664794921875, 0.2082366943359375, 0.27880859375, 0.3493804931640625, 0.419952392578125, 0.4905242919921875, 0.56109619140625, 0.6316680908203125, 0.702239990234375, 0.7728118896484375, 0.8433837890625, 0.9139556884765625, 0.984527587890625, 1.0550994873046875, 1.12567138671875, 1.1962432861328125, 1.266815185546875, 1.3373870849609375, 1.407958984375, 1.4785308837890625, 1.549102783203125, 1.6196746826171875, 1.69024658203125, 1.7608184814453125, 1.831390380859375, 1.9019622802734375, 1.9725341796875, 2.0431060791015625, 2.113677978515625, 2.1842498779296875, 2.25482177734375, 2.3253936767578125, 2.395965576171875, 2.4665374755859375, 2.537109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 11.0, 8.0, 16.0, 19.0, 35.0, 38.0, 46.0, 44.0, 90.0, 60.0, 78.0, 78.0, 68.0, 75.0, 64.0, 57.0, 52.0, 31.0, 31.0, 14.0, 19.0, 13.0, 6.0, 8.0, 6.0, 4.0, 7.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3642578125, -1.3163909912109375, -1.268524169921875, -1.2206573486328125, -1.17279052734375, -1.1249237060546875, -1.077056884765625, -1.0291900634765625, -0.9813232421875, -0.9334564208984375, -0.885589599609375, -0.8377227783203125, -0.78985595703125, -0.7419891357421875, -0.694122314453125, -0.6462554931640625, -0.598388671875, -0.5505218505859375, -0.502655029296875, -0.4547882080078125, -0.40692138671875, -0.3590545654296875, -0.311187744140625, -0.2633209228515625, -0.2154541015625, -0.1675872802734375, -0.119720458984375, -0.0718536376953125, -0.02398681640625, 0.0238800048828125, 0.071746826171875, 0.1196136474609375, 0.16748046875, 0.2153472900390625, 0.263214111328125, 0.3110809326171875, 0.35894775390625, 0.4068145751953125, 0.454681396484375, 0.5025482177734375, 0.5504150390625, 0.5982818603515625, 0.646148681640625, 0.6940155029296875, 0.74188232421875, 0.7897491455078125, 0.837615966796875, 0.8854827880859375, 0.933349609375, 0.9812164306640625, 1.029083251953125, 1.0769500732421875, 1.12481689453125, 1.1726837158203125, 1.220550537109375, 1.2684173583984375, 1.3162841796875, 1.3641510009765625, 1.412017822265625, 1.4598846435546875, 1.50775146484375, 1.5556182861328125, 1.603485107421875, 1.6513519287109375, 1.69921875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 14.0, 14.0, 14.0, 24.0, 44.0, 62.0, 101.0, 222.0, 507.0, 1192.0, 4487.0, 50170.0, 912969.0, 70934.0, 5391.0, 1300.0, 513.0, 264.0, 123.0, 70.0, 50.0, 25.0, 15.0, 11.0, 14.0, 7.0, 2.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94873046875, -0.9047012329101562, -0.8606719970703125, -0.8166427612304688, -0.772613525390625, -0.7285842895507812, -0.6845550537109375, -0.6405258178710938, -0.59649658203125, -0.5524673461914062, -0.5084381103515625, -0.46440887451171875, -0.420379638671875, -0.37635040283203125, -0.3323211669921875, -0.28829193115234375, -0.2442626953125, -0.20023345947265625, -0.1562042236328125, -0.11217498779296875, -0.068145751953125, -0.02411651611328125, 0.0199127197265625, 0.06394195556640625, 0.10797119140625, 0.15200042724609375, 0.1960296630859375, 0.24005889892578125, 0.284088134765625, 0.32811737060546875, 0.3721466064453125, 0.41617584228515625, 0.460205078125, 0.5042343139648438, 0.5482635498046875, 0.5922927856445312, 0.636322021484375, 0.6803512573242188, 0.7243804931640625, 0.7684097290039062, 0.81243896484375, 0.8564682006835938, 0.9004974365234375, 0.9445266723632812, 0.988555908203125, 1.0325851440429688, 1.0766143798828125, 1.1206436157226562, 1.1646728515625, 1.2087020874023438, 1.2527313232421875, 1.2967605590820312, 1.340789794921875, 1.3848190307617188, 1.4288482666015625, 1.4728775024414062, 1.51690673828125, 1.5609359741210938, 1.6049652099609375, 1.6489944458007812, 1.693023681640625, 1.7370529174804688, 1.7810821533203125, 1.8251113891601562, 1.869140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 8.0, 15.0, 25.0, 50.0, 84.0, 128.0, 141.0, 183.0, 149.0, 69.0, 49.0, 37.0, 18.0, 8.0, 8.0, 6.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.000164031982421875, -0.00015936605632305145, -0.0001547001302242279, -0.00015003420412540436, -0.0001453682780265808, -0.00014070235192775726, -0.00013603642582893372, -0.00013137049973011017, -0.00012670457363128662, -0.00012203864753246307, -0.00011737272143363953, -0.00011270679533481598, -0.00010804086923599243, -0.00010337494313716888, -9.870901703834534e-05, -9.404309093952179e-05, -8.937716484069824e-05, -8.47112387418747e-05, -8.004531264305115e-05, -7.53793865442276e-05, -7.071346044540405e-05, -6.60475343465805e-05, -6.138160824775696e-05, -5.671568214893341e-05, -5.204975605010986e-05, -4.7383829951286316e-05, -4.271790385246277e-05, -3.805197775363922e-05, -3.3386051654815674e-05, -2.8720125555992126e-05, -2.405419945716858e-05, -1.9388273358345032e-05, -1.4722347259521484e-05, -1.0056421160697937e-05, -5.39049506187439e-06, -7.245689630508423e-07, 3.941357135772705e-06, 8.607283234596252e-06, 1.32732093334198e-05, 1.7939135432243347e-05, 2.2605061531066895e-05, 2.7270987629890442e-05, 3.193691372871399e-05, 3.660283982753754e-05, 4.1268765926361084e-05, 4.593469202518463e-05, 5.060061812400818e-05, 5.5266544222831726e-05, 5.9932470321655273e-05, 6.459839642047882e-05, 6.926432251930237e-05, 7.393024861812592e-05, 7.859617471694946e-05, 8.326210081577301e-05, 8.792802691459656e-05, 9.25939530134201e-05, 9.725987911224365e-05, 0.0001019258052110672, 0.00010659173130989075, 0.0001112576574087143, 0.00011592358350753784, 0.00012058950960636139, 0.00012525543570518494, 0.00012992136180400848, 0.00013458728790283203]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 8.0, 9.0, 13.0, 15.0, 16.0, 21.0, 38.0, 65.0, 115.0, 129.0, 263.0, 484.0, 962.0, 2312.0, 6105.0, 22924.0, 165251.0, 663978.0, 153525.0, 21994.0, 6022.0, 2144.0, 958.0, 509.0, 269.0, 145.0, 88.0, 54.0, 38.0, 24.0, 17.0, 12.0, 16.0, 12.0, 10.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58935546875, -0.569366455078125, -0.54937744140625, -0.529388427734375, -0.5093994140625, -0.489410400390625, -0.46942138671875, -0.449432373046875, -0.429443359375, -0.409454345703125, -0.38946533203125, -0.369476318359375, -0.3494873046875, -0.329498291015625, -0.30950927734375, -0.289520263671875, -0.26953125, -0.249542236328125, -0.22955322265625, -0.209564208984375, -0.1895751953125, -0.169586181640625, -0.14959716796875, -0.129608154296875, -0.109619140625, -0.089630126953125, -0.06964111328125, -0.049652099609375, -0.0296630859375, -0.009674072265625, 0.01031494140625, 0.030303955078125, 0.05029296875, 0.070281982421875, 0.09027099609375, 0.110260009765625, 0.1302490234375, 0.150238037109375, 0.17022705078125, 0.190216064453125, 0.210205078125, 0.230194091796875, 0.25018310546875, 0.270172119140625, 0.2901611328125, 0.310150146484375, 0.33013916015625, 0.350128173828125, 0.3701171875, 0.390106201171875, 0.41009521484375, 0.430084228515625, 0.4500732421875, 0.470062255859375, 0.49005126953125, 0.510040283203125, 0.530029296875, 0.550018310546875, 0.57000732421875, 0.589996337890625, 0.6099853515625, 0.629974365234375, 0.64996337890625, 0.669952392578125, 0.68994140625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 7.0, 13.0, 19.0, 11.0, 22.0, 29.0, 47.0, 65.0, 86.0, 107.0, 111.0, 106.0, 94.0, 77.0, 63.0, 26.0, 40.0, 21.0, 17.0, 4.0, 6.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44384765625, -0.4266510009765625, -0.409454345703125, -0.3922576904296875, -0.37506103515625, -0.3578643798828125, -0.340667724609375, -0.3234710693359375, -0.3062744140625, -0.2890777587890625, -0.271881103515625, -0.2546844482421875, -0.23748779296875, -0.2202911376953125, -0.203094482421875, -0.1858978271484375, -0.168701171875, -0.1515045166015625, -0.134307861328125, -0.1171112060546875, -0.09991455078125, -0.0827178955078125, -0.065521240234375, -0.0483245849609375, -0.0311279296875, -0.0139312744140625, 0.003265380859375, 0.0204620361328125, 0.03765869140625, 0.0548553466796875, 0.072052001953125, 0.0892486572265625, 0.1064453125, 0.1236419677734375, 0.140838623046875, 0.1580352783203125, 0.17523193359375, 0.1924285888671875, 0.209625244140625, 0.2268218994140625, 0.2440185546875, 0.2612152099609375, 0.278411865234375, 0.2956085205078125, 0.31280517578125, 0.3300018310546875, 0.347198486328125, 0.3643951416015625, 0.381591796875, 0.3987884521484375, 0.415985107421875, 0.4331817626953125, 0.45037841796875, 0.4675750732421875, 0.484771728515625, 0.5019683837890625, 0.5191650390625, 0.5363616943359375, 0.553558349609375, 0.5707550048828125, 0.58795166015625, 0.6051483154296875, 0.622344970703125, 0.6395416259765625, 0.65673828125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [5.0, 3.0, 4.0, 10.0, 41.0, 131.0, 358.0, 316.0, 101.0, 31.0, 9.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.016164779663086, -4.29005241394043, -3.5639398097991943, -2.837827205657959, -2.1117148399353027, -1.3856024742126465, -0.659489631652832, 0.06662273406982422, 0.7927350997924805, 1.5188475847244263, 2.244960069656372, 2.9710726737976074, 3.6971850395202637, 4.42329740524292, 5.149410247802734, 5.875522613525391, 6.601634979248047, 7.327747344970703, 8.05385971069336, 8.779972076416016, 9.506084442138672, 10.232196807861328, 10.9583101272583, 11.684422492980957, 12.410534858703613, 13.13664722442627, 13.862759590148926, 14.588872909545898, 15.314985275268555, 16.04109764099121, 16.767210006713867, 17.493322372436523, 18.219432830810547, 18.945545196533203, 19.67165756225586, 20.397769927978516, 21.123882293701172, 21.849994659423828, 22.576107025146484, 23.30221939086914, 24.028331756591797, 24.754444122314453, 25.48055648803711, 26.206668853759766, 26.932781219482422, 27.658893585205078, 28.385005950927734, 29.11111831665039, 29.83723258972168, 30.563344955444336, 31.289457321166992, 32.01557159423828, 32.74168395996094, 33.467796325683594, 34.19390869140625, 34.920021057128906, 35.64613342285156, 36.37224578857422, 37.098358154296875, 37.82447052001953, 38.55058288574219, 39.276695251464844, 40.0028076171875, 40.728919982910156, 41.45503234863281]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 10.0, 5.0, 3.0, 4.0, 15.0, 8.0, 20.0, 22.0, 20.0, 29.0, 32.0, 29.0, 41.0, 47.0, 44.0, 44.0, 49.0, 49.0, 37.0, 70.0, 45.0, 52.0, 38.0, 37.0, 38.0, 25.0, 32.0, 34.0, 23.0, 17.0, 7.0, 14.0, 11.0, 9.0, 12.0, 9.0, 9.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.128140449523926, -5.927555084228516, -5.7269697189331055, -5.526384353637695, -5.325798511505127, -5.125213146209717, -4.924627780914307, -4.7240424156188965, -4.523457050323486, -4.322871685028076, -4.122286319732666, -3.9217007160186768, -3.7211153507232666, -3.5205297470092773, -3.319944381713867, -3.119359016418457, -2.9187734127044678, -2.7181880474090576, -2.5176024436950684, -2.317017078399658, -2.116431713104248, -1.9158462285995483, -1.7152607440948486, -1.5146753787994385, -1.3140898942947388, -1.113504409790039, -0.9129190444946289, -0.7123335599899292, -0.5117481350898743, -0.31116271018981934, -0.11057722568511963, 0.09000813961029053, 0.29059362411499023, 0.49117904901504517, 0.6917644739151001, 0.8923499584197998, 1.09293532371521, 1.2935208082199097, 1.4941062927246094, 1.6946916580200195, 1.8952771425247192, 2.095862627029419, 2.296447992324829, 2.4970335960388184, 2.6976189613342285, 2.8982043266296387, 3.098789691925049, 3.299375057220459, 3.4999606609344482, 3.7005460262298584, 3.9011316299438477, 4.101716995239258, 4.302302360534668, 4.502887725830078, 4.703473091125488, 4.904058456420898, 5.104644298553467, 5.305229663848877, 5.505815029144287, 5.7064008712768555, 5.906986236572266, 6.107571601867676, 6.308156967163086, 6.508742332458496, 6.709327697753906]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 11.0, 12.0, 15.0, 34.0, 48.0, 87.0, 125.0, 211.0, 397.0, 718.0, 1584.0, 3839.0, 10604.0, 42147.0, 533477.0, 3481338.0, 91920.0, 17116.0, 5801.0, 2329.0, 1044.0, 507.0, 302.0, 180.0, 111.0, 84.0, 62.0, 41.0, 34.0, 24.0, 13.0, 17.0, 13.0, 9.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7373046875, -1.6683807373046875, -1.599456787109375, -1.5305328369140625, -1.46160888671875, -1.3926849365234375, -1.323760986328125, -1.2548370361328125, -1.1859130859375, -1.1169891357421875, -1.048065185546875, -0.9791412353515625, -0.91021728515625, -0.8412933349609375, -0.772369384765625, -0.7034454345703125, -0.634521484375, -0.5655975341796875, -0.496673583984375, -0.4277496337890625, -0.35882568359375, -0.2899017333984375, -0.220977783203125, -0.1520538330078125, -0.0831298828125, -0.0142059326171875, 0.054718017578125, 0.1236419677734375, 0.19256591796875, 0.2614898681640625, 0.330413818359375, 0.3993377685546875, 0.46826171875, 0.5371856689453125, 0.606109619140625, 0.6750335693359375, 0.74395751953125, 0.8128814697265625, 0.881805419921875, 0.9507293701171875, 1.0196533203125, 1.0885772705078125, 1.157501220703125, 1.2264251708984375, 1.29534912109375, 1.3642730712890625, 1.433197021484375, 1.5021209716796875, 1.571044921875, 1.6399688720703125, 1.708892822265625, 1.7778167724609375, 1.84674072265625, 1.9156646728515625, 1.984588623046875, 2.0535125732421875, 2.1224365234375, 2.1913604736328125, 2.260284423828125, 2.3292083740234375, 2.39813232421875, 2.4670562744140625, 2.535980224609375, 2.6049041748046875, 2.673828125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 6.0, 11.0, 18.0, 32.0, 27.0, 32.0, 68.0, 60.0, 63.0, 71.0, 74.0, 70.0, 100.0, 61.0, 64.0, 51.0, 52.0, 44.0, 29.0, 22.0, 14.0, 10.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30615234375, -0.29451751708984375, -0.2828826904296875, -0.27124786376953125, -0.259613037109375, -0.24797821044921875, -0.2363433837890625, -0.22470855712890625, -0.21307373046875, -0.20143890380859375, -0.1898040771484375, -0.17816925048828125, -0.166534423828125, -0.15489959716796875, -0.1432647705078125, -0.13162994384765625, -0.1199951171875, -0.10836029052734375, -0.0967254638671875, -0.08509063720703125, -0.073455810546875, -0.06182098388671875, -0.0501861572265625, -0.03855133056640625, -0.02691650390625, -0.01528167724609375, -0.0036468505859375, 0.00798797607421875, 0.019622802734375, 0.03125762939453125, 0.0428924560546875, 0.05452728271484375, 0.066162109375, 0.07779693603515625, 0.0894317626953125, 0.10106658935546875, 0.112701416015625, 0.12433624267578125, 0.1359710693359375, 0.14760589599609375, 0.15924072265625, 0.17087554931640625, 0.1825103759765625, 0.19414520263671875, 0.205780029296875, 0.21741485595703125, 0.2290496826171875, 0.24068450927734375, 0.2523193359375, 0.26395416259765625, 0.2755889892578125, 0.28722381591796875, 0.298858642578125, 0.31049346923828125, 0.3221282958984375, 0.33376312255859375, 0.34539794921875, 0.35703277587890625, 0.3686676025390625, 0.38030242919921875, 0.391937255859375, 0.40357208251953125, 0.4152069091796875, 0.42684173583984375, 0.4384765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 8.0, 7.0, 8.0, 19.0, 26.0, 40.0, 62.0, 113.0, 223.0, 439.0, 1297.0, 3882.0, 19607.0, 3241001.0, 906334.0, 15539.0, 3446.0, 1158.0, 480.0, 220.0, 128.0, 73.0, 54.0, 34.0, 20.0, 18.0, 11.0, 12.0, 3.0, 5.0, 5.0, 3.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.1640625, -4.03369140625, -3.9033203125, -3.77294921875, -3.642578125, -3.51220703125, -3.3818359375, -3.25146484375, -3.12109375, -2.99072265625, -2.8603515625, -2.72998046875, -2.599609375, -2.46923828125, -2.3388671875, -2.20849609375, -2.078125, -1.94775390625, -1.8173828125, -1.68701171875, -1.556640625, -1.42626953125, -1.2958984375, -1.16552734375, -1.03515625, -0.90478515625, -0.7744140625, -0.64404296875, -0.513671875, -0.38330078125, -0.2529296875, -0.12255859375, 0.0078125, 0.13818359375, 0.2685546875, 0.39892578125, 0.529296875, 0.65966796875, 0.7900390625, 0.92041015625, 1.05078125, 1.18115234375, 1.3115234375, 1.44189453125, 1.572265625, 1.70263671875, 1.8330078125, 1.96337890625, 2.09375, 2.22412109375, 2.3544921875, 2.48486328125, 2.615234375, 2.74560546875, 2.8759765625, 3.00634765625, 3.13671875, 3.26708984375, 3.3974609375, 3.52783203125, 3.658203125, 3.78857421875, 3.9189453125, 4.04931640625, 4.1796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 5.0, 3.0, 15.0, 26.0, 51.0, 120.0, 434.0, 2331.0, 778.0, 172.0, 57.0, 31.0, 15.0, 12.0, 3.0, 7.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90478515625, -0.8588485717773438, -0.8129119873046875, -0.7669754028320312, -0.721038818359375, -0.6751022338867188, -0.6291656494140625, -0.5832290649414062, -0.53729248046875, -0.49135589599609375, -0.4454193115234375, -0.39948272705078125, -0.353546142578125, -0.30760955810546875, -0.2616729736328125, -0.21573638916015625, -0.1697998046875, -0.12386322021484375, -0.0779266357421875, -0.03199005126953125, 0.013946533203125, 0.05988311767578125, 0.1058197021484375, 0.15175628662109375, 0.19769287109375, 0.24362945556640625, 0.2895660400390625, 0.33550262451171875, 0.381439208984375, 0.42737579345703125, 0.4733123779296875, 0.5192489624023438, 0.565185546875, 0.6111221313476562, 0.6570587158203125, 0.7029953002929688, 0.748931884765625, 0.7948684692382812, 0.8408050537109375, 0.8867416381835938, 0.93267822265625, 0.9786148071289062, 1.0245513916015625, 1.0704879760742188, 1.116424560546875, 1.1623611450195312, 1.2082977294921875, 1.2542343139648438, 1.3001708984375, 1.3461074829101562, 1.3920440673828125, 1.4379806518554688, 1.483917236328125, 1.5298538208007812, 1.5757904052734375, 1.6217269897460938, 1.66766357421875, 1.7136001586914062, 1.7595367431640625, 1.8054733276367188, 1.851409912109375, 1.8973464965820312, 1.9432830810546875, 1.9892196655273438, 2.03515625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 11.0, 23.0, 66.0, 172.0, 331.0, 235.0, 108.0, 35.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.353615760803223, -5.051947116851807, -4.750278472900391, -4.448609352111816, -4.1469407081604, -3.8452720642089844, -3.5436031818389893, -3.241934299468994, -2.940265655517578, -2.638597011566162, -2.336928129196167, -2.035259246826172, -1.7335906028747559, -1.4319218397140503, -1.1302530765533447, -0.8285841941833496, -0.5269155502319336, -0.22524678707122803, 0.07642197608947754, 0.3780907392501831, 0.6797595024108887, 0.9814282655715942, 1.2830970287322998, 1.584765911102295, 1.886434555053711, 2.188103199005127, 2.489772081375122, 2.791440963745117, 3.093109607696533, 3.394778251647949, 3.6964471340179443, 3.9981160163879395, 4.299783706665039, 4.601452350616455, 4.903120994567871, 5.204790115356445, 5.506458759307861, 5.808127403259277, 6.109796524047852, 6.411465167999268, 6.713133811950684, 7.0148024559021, 7.316471099853516, 7.61814022064209, 7.919808864593506, 8.221477508544922, 8.523146629333496, 8.82481575012207, 9.126483917236328, 9.428153038024902, 9.72982120513916, 10.031490325927734, 10.333158493041992, 10.634827613830566, 10.93649673461914, 11.238164901733398, 11.539834022521973, 11.841503143310547, 12.143171310424805, 12.444840431213379, 12.746509552001953, 13.048177719116211, 13.349846839904785, 13.65151596069336, 13.953184127807617]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 8.0, 4.0, 10.0, 19.0, 12.0, 18.0, 32.0, 31.0, 47.0, 57.0, 68.0, 66.0, 64.0, 67.0, 54.0, 82.0, 55.0, 58.0, 51.0, 48.0, 32.0, 32.0, 20.0, 16.0, 16.0, 9.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.464890956878662, -3.3439502716064453, -3.2230098247528076, -3.102069139480591, -2.981128692626953, -2.8601880073547363, -2.7392475605010986, -2.618306875228882, -2.497366428375244, -2.3764257431030273, -2.2554852962493896, -2.134544610977173, -2.013604164123535, -1.8926634788513184, -1.7717230319976807, -1.6507823467254639, -1.5298417806625366, -1.4089012145996094, -1.2879606485366821, -1.1670200824737549, -1.0460795164108276, -0.9251388907432556, -0.8041983246803284, -0.6832577586174011, -0.5623171925544739, -0.44137662649154663, -0.3204360604286194, -0.19949546456336975, -0.0785548985004425, 0.04238569736480713, 0.16332626342773438, 0.2842668294906616, 0.40520739555358887, 0.5261479616165161, 0.6470885276794434, 0.7680290937423706, 0.8889696598052979, 1.0099103450775146, 1.1308507919311523, 1.2517914772033691, 1.3727319240570068, 1.493672490119934, 1.6146130561828613, 1.7355536222457886, 1.8564941883087158, 1.9774348735809326, 2.0983753204345703, 2.219316005706787, 2.340256690979004, 2.4611973762512207, 2.5821378231048584, 2.703078508377075, 2.824018955230713, 2.9449596405029297, 3.0659000873565674, 3.186840772628784, 3.307781219482422, 3.4287219047546387, 3.5496623516082764, 3.670603036880493, 3.791543483734131, 3.9124841690063477, 4.0334248542785645, 4.154365062713623, 4.27530574798584]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 5.0, 7.0, 11.0, 14.0, 19.0, 32.0, 34.0, 37.0, 68.0, 114.0, 165.0, 262.0, 429.0, 843.0, 1709.0, 4168.0, 13281.0, 65318.0, 431817.0, 441549.0, 66953.0, 13701.0, 4242.0, 1759.0, 807.0, 451.0, 258.0, 146.0, 119.0, 66.0, 37.0, 30.0, 21.0, 14.0, 21.0, 9.0, 8.0, 6.0, 2.0, 6.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9169921875, -1.8571014404296875, -1.797210693359375, -1.7373199462890625, -1.67742919921875, -1.6175384521484375, -1.557647705078125, -1.4977569580078125, -1.4378662109375, -1.3779754638671875, -1.318084716796875, -1.2581939697265625, -1.19830322265625, -1.1384124755859375, -1.078521728515625, -1.0186309814453125, -0.958740234375, -0.8988494873046875, -0.838958740234375, -0.7790679931640625, -0.71917724609375, -0.6592864990234375, -0.599395751953125, -0.5395050048828125, -0.4796142578125, -0.4197235107421875, -0.359832763671875, -0.2999420166015625, -0.24005126953125, -0.1801605224609375, -0.120269775390625, -0.0603790283203125, -0.00048828125, 0.0594024658203125, 0.119293212890625, 0.1791839599609375, 0.23907470703125, 0.2989654541015625, 0.358856201171875, 0.4187469482421875, 0.4786376953125, 0.5385284423828125, 0.598419189453125, 0.6583099365234375, 0.71820068359375, 0.7780914306640625, 0.837982177734375, 0.8978729248046875, 0.957763671875, 1.0176544189453125, 1.077545166015625, 1.1374359130859375, 1.19732666015625, 1.2572174072265625, 1.317108154296875, 1.3769989013671875, 1.4368896484375, 1.4967803955078125, 1.556671142578125, 1.6165618896484375, 1.67645263671875, 1.7363433837890625, 1.796234130859375, 1.8561248779296875, 1.916015625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 6.0, 5.0, 19.0, 29.0, 45.0, 51.0, 59.0, 86.0, 85.0, 114.0, 100.0, 83.0, 89.0, 61.0, 55.0, 44.0, 36.0, 10.0, 7.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35693359375, -0.3426361083984375, -0.328338623046875, -0.3140411376953125, -0.29974365234375, -0.2854461669921875, -0.271148681640625, -0.2568511962890625, -0.2425537109375, -0.2282562255859375, -0.213958740234375, -0.1996612548828125, -0.18536376953125, -0.1710662841796875, -0.156768798828125, -0.1424713134765625, -0.128173828125, -0.1138763427734375, -0.099578857421875, -0.0852813720703125, -0.07098388671875, -0.0566864013671875, -0.042388916015625, -0.0280914306640625, -0.0137939453125, 0.0005035400390625, 0.014801025390625, 0.0290985107421875, 0.04339599609375, 0.0576934814453125, 0.071990966796875, 0.0862884521484375, 0.1005859375, 0.1148834228515625, 0.129180908203125, 0.1434783935546875, 0.15777587890625, 0.1720733642578125, 0.186370849609375, 0.2006683349609375, 0.2149658203125, 0.2292633056640625, 0.243560791015625, 0.2578582763671875, 0.27215576171875, 0.2864532470703125, 0.300750732421875, 0.3150482177734375, 0.329345703125, 0.3436431884765625, 0.357940673828125, 0.3722381591796875, 0.38653564453125, 0.4008331298828125, 0.415130615234375, 0.4294281005859375, 0.4437255859375, 0.4580230712890625, 0.472320556640625, 0.4866180419921875, 0.50091552734375, 0.5152130126953125, 0.529510498046875, 0.5438079833984375, 0.55810546875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 9.0, 6.0, 11.0, 16.0, 22.0, 34.0, 36.0, 77.0, 121.0, 197.0, 329.0, 526.0, 948.0, 2076.0, 4256.0, 10319.0, 28349.0, 90170.0, 289727.0, 397630.0, 150543.0, 45487.0, 15469.0, 6203.0, 2845.0, 1351.0, 740.0, 410.0, 232.0, 152.0, 102.0, 53.0, 37.0, 32.0, 19.0, 8.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98046875, -0.9490509033203125, -0.917633056640625, -0.8862152099609375, -0.85479736328125, -0.8233795166015625, -0.791961669921875, -0.7605438232421875, -0.7291259765625, -0.6977081298828125, -0.666290283203125, -0.6348724365234375, -0.60345458984375, -0.5720367431640625, -0.540618896484375, -0.5092010498046875, -0.477783203125, -0.4463653564453125, -0.414947509765625, -0.3835296630859375, -0.35211181640625, -0.3206939697265625, -0.289276123046875, -0.2578582763671875, -0.2264404296875, -0.1950225830078125, -0.163604736328125, -0.1321868896484375, -0.10076904296875, -0.0693511962890625, -0.037933349609375, -0.0065155029296875, 0.02490234375, 0.0563201904296875, 0.087738037109375, 0.1191558837890625, 0.15057373046875, 0.1819915771484375, 0.213409423828125, 0.2448272705078125, 0.2762451171875, 0.3076629638671875, 0.339080810546875, 0.3704986572265625, 0.40191650390625, 0.4333343505859375, 0.464752197265625, 0.4961700439453125, 0.527587890625, 0.5590057373046875, 0.590423583984375, 0.6218414306640625, 0.65325927734375, 0.6846771240234375, 0.716094970703125, 0.7475128173828125, 0.7789306640625, 0.8103485107421875, 0.841766357421875, 0.8731842041015625, 0.90460205078125, 0.9360198974609375, 0.967437744140625, 0.9988555908203125, 1.0302734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 7.0, 13.0, 13.0, 14.0, 11.0, 29.0, 19.0, 29.0, 27.0, 38.0, 50.0, 35.0, 58.0, 50.0, 47.0, 37.0, 51.0, 53.0, 39.0, 46.0, 52.0, 35.0, 43.0, 42.0, 32.0, 28.0, 17.0, 18.0, 16.0, 12.0, 13.0, 8.0, 4.0, 7.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.030029296875, -0.99658203125, -0.963134765625, -0.9296875, -0.896240234375, -0.86279296875, -0.829345703125, -0.7958984375, -0.762451171875, -0.72900390625, -0.695556640625, -0.662109375, -0.628662109375, -0.59521484375, -0.561767578125, -0.5283203125, -0.494873046875, -0.46142578125, -0.427978515625, -0.39453125, -0.361083984375, -0.32763671875, -0.294189453125, -0.2607421875, -0.227294921875, -0.19384765625, -0.160400390625, -0.126953125, -0.093505859375, -0.06005859375, -0.026611328125, 0.0068359375, 0.040283203125, 0.07373046875, 0.107177734375, 0.140625, 0.174072265625, 0.20751953125, 0.240966796875, 0.2744140625, 0.307861328125, 0.34130859375, 0.374755859375, 0.408203125, 0.441650390625, 0.47509765625, 0.508544921875, 0.5419921875, 0.575439453125, 0.60888671875, 0.642333984375, 0.67578125, 0.709228515625, 0.74267578125, 0.776123046875, 0.8095703125, 0.843017578125, 0.87646484375, 0.909912109375, 0.943359375, 0.976806640625, 1.01025390625, 1.043701171875, 1.0771484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 4.0, 8.0, 12.0, 11.0, 10.0, 27.0, 22.0, 25.0, 33.0, 42.0, 75.0, 135.0, 267.0, 629.0, 2060.0, 10452.0, 156184.0, 801535.0, 67945.0, 6480.0, 1478.0, 524.0, 224.0, 118.0, 69.0, 41.0, 27.0, 32.0, 17.0, 17.0, 6.0, 14.0, 10.0, 11.0, 6.0, 5.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0390625, -1.0096893310546875, -0.980316162109375, -0.9509429931640625, -0.92156982421875, -0.8921966552734375, -0.862823486328125, -0.8334503173828125, -0.8040771484375, -0.7747039794921875, -0.745330810546875, -0.7159576416015625, -0.68658447265625, -0.6572113037109375, -0.627838134765625, -0.5984649658203125, -0.569091796875, -0.5397186279296875, -0.510345458984375, -0.4809722900390625, -0.45159912109375, -0.4222259521484375, -0.392852783203125, -0.3634796142578125, -0.3341064453125, -0.3047332763671875, -0.275360107421875, -0.2459869384765625, -0.21661376953125, -0.1872406005859375, -0.157867431640625, -0.1284942626953125, -0.09912109375, -0.0697479248046875, -0.040374755859375, -0.0110015869140625, 0.01837158203125, 0.0477447509765625, 0.077117919921875, 0.1064910888671875, 0.1358642578125, 0.1652374267578125, 0.194610595703125, 0.2239837646484375, 0.25335693359375, 0.2827301025390625, 0.312103271484375, 0.3414764404296875, 0.370849609375, 0.4002227783203125, 0.429595947265625, 0.4589691162109375, 0.48834228515625, 0.5177154541015625, 0.547088623046875, 0.5764617919921875, 0.6058349609375, 0.6352081298828125, 0.664581298828125, 0.6939544677734375, 0.72332763671875, 0.7527008056640625, 0.782073974609375, 0.8114471435546875, 0.8408203125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 9.0, 9.0, 12.0, 24.0, 27.0, 46.0, 77.0, 93.0, 127.0, 131.0, 118.0, 119.0, 76.0, 46.0, 29.0, 21.0, 15.0, 5.0, 11.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00016045570373535156, -0.00015677232295274734, -0.00015308894217014313, -0.0001494055613875389, -0.0001457221806049347, -0.00014203879982233047, -0.00013835541903972626, -0.00013467203825712204, -0.00013098865747451782, -0.0001273052766919136, -0.0001236218959093094, -0.00011993851512670517, -0.00011625513434410095, -0.00011257175356149673, -0.00010888837277889252, -0.0001052049919962883, -0.00010152161121368408, -9.783823043107986e-05, -9.415484964847565e-05, -9.047146886587143e-05, -8.678808808326721e-05, -8.3104707300663e-05, -7.942132651805878e-05, -7.573794573545456e-05, -7.205456495285034e-05, -6.837118417024612e-05, -6.46878033876419e-05, -6.100442260503769e-05, -5.732104182243347e-05, -5.3637661039829254e-05, -4.995428025722504e-05, -4.627089947462082e-05, -4.25875186920166e-05, -3.8904137909412384e-05, -3.5220757126808167e-05, -3.153737634420395e-05, -2.785399556159973e-05, -2.4170614778995514e-05, -2.0487233996391296e-05, -1.680385321378708e-05, -1.3120472431182861e-05, -9.437091648578644e-06, -5.753710865974426e-06, -2.0703300833702087e-06, 1.6130506992340088e-06, 5.296431481838226e-06, 8.979812264442444e-06, 1.2663193047046661e-05, 1.634657382965088e-05, 2.0029954612255096e-05, 2.3713335394859314e-05, 2.739671617746353e-05, 3.108009696006775e-05, 3.4763477742671967e-05, 3.8446858525276184e-05, 4.21302393078804e-05, 4.581362009048462e-05, 4.949700087308884e-05, 5.3180381655693054e-05, 5.686376243829727e-05, 6.054714322090149e-05, 6.423052400350571e-05, 6.791390478610992e-05, 7.159728556871414e-05, 7.528066635131836e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 11.0, 20.0, 27.0, 35.0, 62.0, 87.0, 144.0, 300.0, 575.0, 1514.0, 5442.0, 31662.0, 344666.0, 584919.0, 66479.0, 8888.0, 2238.0, 715.0, 333.0, 139.0, 81.0, 71.0, 35.0, 28.0, 22.0, 11.0, 10.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6220703125, -0.6014480590820312, -0.5808258056640625, -0.5602035522460938, -0.539581298828125, -0.5189590454101562, -0.4983367919921875, -0.47771453857421875, -0.45709228515625, -0.43647003173828125, -0.4158477783203125, -0.39522552490234375, -0.374603271484375, -0.35398101806640625, -0.3333587646484375, -0.31273651123046875, -0.2921142578125, -0.27149200439453125, -0.2508697509765625, -0.23024749755859375, -0.209625244140625, -0.18900299072265625, -0.1683807373046875, -0.14775848388671875, -0.12713623046875, -0.10651397705078125, -0.0858917236328125, -0.06526947021484375, -0.044647216796875, -0.02402496337890625, -0.0034027099609375, 0.01721954345703125, 0.037841796875, 0.05846405029296875, 0.0790863037109375, 0.09970855712890625, 0.120330810546875, 0.14095306396484375, 0.1615753173828125, 0.18219757080078125, 0.20281982421875, 0.22344207763671875, 0.2440643310546875, 0.26468658447265625, 0.285308837890625, 0.30593109130859375, 0.3265533447265625, 0.34717559814453125, 0.3677978515625, 0.38842010498046875, 0.4090423583984375, 0.42966461181640625, 0.450286865234375, 0.47090911865234375, 0.4915313720703125, 0.5121536254882812, 0.53277587890625, 0.5533981323242188, 0.5740203857421875, 0.5946426391601562, 0.615264892578125, 0.6358871459960938, 0.6565093994140625, 0.6771316528320312, 0.69775390625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 6.0, 4.0, 16.0, 30.0, 51.0, 91.0, 128.0, 172.0, 188.0, 113.0, 83.0, 57.0, 26.0, 14.0, 11.0, 7.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39501953125, -0.36861419677734375, -0.3422088623046875, -0.31580352783203125, -0.289398193359375, -0.26299285888671875, -0.2365875244140625, -0.21018218994140625, -0.18377685546875, -0.15737152099609375, -0.1309661865234375, -0.10456085205078125, -0.078155517578125, -0.05175018310546875, -0.0253448486328125, 0.00106048583984375, 0.0274658203125, 0.05387115478515625, 0.0802764892578125, 0.10668182373046875, 0.133087158203125, 0.15949249267578125, 0.1858978271484375, 0.21230316162109375, 0.23870849609375, 0.26511383056640625, 0.2915191650390625, 0.31792449951171875, 0.344329833984375, 0.37073516845703125, 0.3971405029296875, 0.42354583740234375, 0.449951171875, 0.47635650634765625, 0.5027618408203125, 0.5291671752929688, 0.555572509765625, 0.5819778442382812, 0.6083831787109375, 0.6347885131835938, 0.66119384765625, 0.6875991821289062, 0.7140045166015625, 0.7404098510742188, 0.766815185546875, 0.7932205200195312, 0.8196258544921875, 0.8460311889648438, 0.8724365234375, 0.8988418579101562, 0.9252471923828125, 0.9516525268554688, 0.978057861328125, 1.0044631958007812, 1.0308685302734375, 1.0572738647460938, 1.08367919921875, 1.1100845336914062, 1.1364898681640625, 1.1628952026367188, 1.189300537109375, 1.2157058715820312, 1.2421112060546875, 1.2685165405273438, 1.294921875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 21.0, 34.0, 58.0, 77.0, 135.0, 197.0, 157.0, 129.0, 70.0, 51.0, 31.0, 15.0, 8.0, 7.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.331611633300781, -10.025470733642578, -9.719329833984375, -9.413188934326172, -9.107048034667969, -8.800907135009766, -8.494766235351562, -8.18862533569336, -7.882484436035156, -7.576343536376953, -7.27020263671875, -6.964061737060547, -6.657920837402344, -6.351779937744141, -6.0456390380859375, -5.739498138427734, -5.433357238769531, -5.127216339111328, -4.821075439453125, -4.514934539794922, -4.208793640136719, -3.9026527404785156, -3.5965118408203125, -3.2903709411621094, -2.9842300415039062, -2.678089141845703, -2.3719482421875, -2.065807342529297, -1.7596664428710938, -1.4535255432128906, -1.1473846435546875, -0.8412437438964844, -0.5351028442382812, -0.22896194458007812, 0.077178955078125, 0.3833198547363281, 0.6894607543945312, 0.9956016540527344, 1.3017425537109375, 1.6078834533691406, 1.9140243530273438, 2.220165252685547, 2.52630615234375, 2.832447052001953, 3.1385879516601562, 3.4447288513183594, 3.7508697509765625, 4.057010650634766, 4.363151550292969, 4.669292449951172, 4.975433349609375, 5.281574249267578, 5.587715148925781, 5.893856048583984, 6.1999969482421875, 6.506137847900391, 6.812278747558594, 7.118419647216797, 7.424560546875, 7.730701446533203, 8.036842346191406, 8.34298324584961, 8.649124145507812, 8.955265045166016, 9.261405944824219]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 9.0, 8.0, 6.0, 12.0, 17.0, 15.0, 22.0, 28.0, 25.0, 32.0, 27.0, 40.0, 33.0, 52.0, 51.0, 51.0, 39.0, 50.0, 49.0, 45.0, 39.0, 46.0, 38.0, 31.0, 33.0, 28.0, 30.0, 29.0, 14.0, 14.0, 8.0, 11.0, 12.0, 15.0, 14.0, 8.0, 2.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.056171417236328, -4.8680806159973145, -4.679989337921143, -4.491898536682129, -4.303807735443115, -4.115716934204102, -3.9276256561279297, -3.739534854888916, -3.5514438152313232, -3.3633527755737305, -3.175261974334717, -2.987170934677124, -2.7990798950195312, -2.6109890937805176, -2.422898054122925, -2.234807014465332, -2.0467162132263184, -1.8586252927780151, -1.670534372329712, -1.4824433326721191, -1.294352412223816, -1.1062614917755127, -0.9181704521179199, -0.7300795316696167, -0.5419886112213135, -0.35389766097068787, -0.16580671072006226, 0.022284269332885742, 0.21037518978118896, 0.3984661102294922, 0.586557149887085, 0.7746480703353882, 0.9627394676208496, 1.1508303880691528, 1.338921308517456, 1.5270123481750488, 1.715103268623352, 1.9031941890716553, 2.091285228729248, 2.2793760299682617, 2.4674670696258545, 2.6555581092834473, 2.843648910522461, 3.0317399501800537, 3.2198309898376465, 3.40792179107666, 3.596012830734253, 3.7841038703918457, 3.9721946716308594, 4.160285472869873, 4.348376750946045, 4.536467552185059, 4.724558353424072, 4.912649154663086, 5.100740432739258, 5.2888312339782715, 5.476922035217285, 5.665012836456299, 5.853104114532471, 6.041194915771484, 6.229285717010498, 6.417376518249512, 6.605467796325684, 6.793558597564697, 6.981649875640869]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 7.0, 7.0, 9.0, 12.0, 10.0, 16.0, 22.0, 38.0, 49.0, 71.0, 98.0, 159.0, 305.0, 717.0, 1644.0, 5410.0, 28598.0, 513871.0, 3575551.0, 54377.0, 8653.0, 2515.0, 984.0, 467.0, 257.0, 148.0, 80.0, 67.0, 34.0, 34.0, 21.0, 10.0, 15.0, 7.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.259765625, -2.1954803466796875, -2.131195068359375, -2.0669097900390625, -2.00262451171875, -1.9383392333984375, -1.874053955078125, -1.8097686767578125, -1.7454833984375, -1.6811981201171875, -1.616912841796875, -1.5526275634765625, -1.48834228515625, -1.4240570068359375, -1.359771728515625, -1.2954864501953125, -1.231201171875, -1.1669158935546875, -1.102630615234375, -1.0383453369140625, -0.97406005859375, -0.9097747802734375, -0.845489501953125, -0.7812042236328125, -0.7169189453125, -0.6526336669921875, -0.588348388671875, -0.5240631103515625, -0.45977783203125, -0.3954925537109375, -0.331207275390625, -0.2669219970703125, -0.20263671875, -0.1383514404296875, -0.074066162109375, -0.0097808837890625, 0.05450439453125, 0.1187896728515625, 0.183074951171875, 0.2473602294921875, 0.3116455078125, 0.3759307861328125, 0.440216064453125, 0.5045013427734375, 0.56878662109375, 0.6330718994140625, 0.697357177734375, 0.7616424560546875, 0.825927734375, 0.8902130126953125, 0.954498291015625, 1.0187835693359375, 1.08306884765625, 1.1473541259765625, 1.211639404296875, 1.2759246826171875, 1.3402099609375, 1.4044952392578125, 1.468780517578125, 1.5330657958984375, 1.59735107421875, 1.6616363525390625, 1.725921630859375, 1.7902069091796875, 1.8544921875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 9.0, 15.0, 26.0, 30.0, 31.0, 42.0, 77.0, 78.0, 67.0, 87.0, 55.0, 89.0, 102.0, 80.0, 48.0, 60.0, 28.0, 22.0, 23.0, 10.0, 12.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.361083984375, -0.3474464416503906, -0.33380889892578125, -0.3201713562011719, -0.3065338134765625, -0.2928962707519531, -0.27925872802734375, -0.2656211853027344, -0.251983642578125, -0.23834609985351562, -0.22470855712890625, -0.21107101440429688, -0.1974334716796875, -0.18379592895507812, -0.17015838623046875, -0.15652084350585938, -0.14288330078125, -0.12924575805664062, -0.11560821533203125, -0.10197067260742188, -0.0883331298828125, -0.07469558715820312, -0.06105804443359375, -0.047420501708984375, -0.033782958984375, -0.020145416259765625, -0.00650787353515625, 0.007129669189453125, 0.0207672119140625, 0.034404754638671875, 0.04804229736328125, 0.061679840087890625, 0.0753173828125, 0.08895492553710938, 0.10259246826171875, 0.11623001098632812, 0.1298675537109375, 0.14350509643554688, 0.15714263916015625, 0.17078018188476562, 0.184417724609375, 0.19805526733398438, 0.21169281005859375, 0.22533035278320312, 0.2389678955078125, 0.2526054382324219, 0.26624298095703125, 0.2798805236816406, 0.29351806640625, 0.3071556091308594, 0.32079315185546875, 0.3344306945800781, 0.3480682373046875, 0.3617057800292969, 0.37534332275390625, 0.3889808654785156, 0.402618408203125, 0.4162559509277344, 0.42989349365234375, 0.4435310363769531, 0.4571685791015625, 0.4708061218261719, 0.48444366455078125, 0.4980812072753906, 0.51171875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 7.0, 8.0, 21.0, 25.0, 44.0, 55.0, 86.0, 100.0, 157.0, 258.0, 491.0, 925.0, 2400.0, 7666.0, 39391.0, 823024.0, 3235909.0, 67171.0, 11045.0, 3123.0, 1108.0, 494.0, 288.0, 161.0, 107.0, 64.0, 44.0, 31.0, 27.0, 17.0, 5.0, 11.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.48828125, -1.4371795654296875, -1.386077880859375, -1.3349761962890625, -1.28387451171875, -1.2327728271484375, -1.181671142578125, -1.1305694580078125, -1.0794677734375, -1.0283660888671875, -0.977264404296875, -0.9261627197265625, -0.87506103515625, -0.8239593505859375, -0.772857666015625, -0.7217559814453125, -0.670654296875, -0.6195526123046875, -0.568450927734375, -0.5173492431640625, -0.46624755859375, -0.4151458740234375, -0.364044189453125, -0.3129425048828125, -0.2618408203125, -0.2107391357421875, -0.159637451171875, -0.1085357666015625, -0.05743408203125, -0.0063323974609375, 0.044769287109375, 0.0958709716796875, 0.14697265625, 0.1980743408203125, 0.249176025390625, 0.3002777099609375, 0.35137939453125, 0.4024810791015625, 0.453582763671875, 0.5046844482421875, 0.5557861328125, 0.6068878173828125, 0.657989501953125, 0.7090911865234375, 0.76019287109375, 0.8112945556640625, 0.862396240234375, 0.9134979248046875, 0.964599609375, 1.0157012939453125, 1.066802978515625, 1.1179046630859375, 1.16900634765625, 1.2201080322265625, 1.271209716796875, 1.3223114013671875, 1.3734130859375, 1.4245147705078125, 1.475616455078125, 1.5267181396484375, 1.57781982421875, 1.6289215087890625, 1.680023193359375, 1.7311248779296875, 1.7822265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 10.0, 21.0, 31.0, 82.0, 146.0, 370.0, 1645.0, 1202.0, 283.0, 126.0, 53.0, 34.0, 23.0, 8.0, 8.0, 7.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85498046875, -0.8335723876953125, -0.812164306640625, -0.7907562255859375, -0.76934814453125, -0.7479400634765625, -0.726531982421875, -0.7051239013671875, -0.6837158203125, -0.6623077392578125, -0.640899658203125, -0.6194915771484375, -0.59808349609375, -0.5766754150390625, -0.555267333984375, -0.5338592529296875, -0.512451171875, -0.4910430908203125, -0.469635009765625, -0.4482269287109375, -0.42681884765625, -0.4054107666015625, -0.384002685546875, -0.3625946044921875, -0.3411865234375, -0.3197784423828125, -0.298370361328125, -0.2769622802734375, -0.25555419921875, -0.2341461181640625, -0.212738037109375, -0.1913299560546875, -0.169921875, -0.1485137939453125, -0.127105712890625, -0.1056976318359375, -0.08428955078125, -0.0628814697265625, -0.041473388671875, -0.0200653076171875, 0.0013427734375, 0.0227508544921875, 0.044158935546875, 0.0655670166015625, 0.08697509765625, 0.1083831787109375, 0.129791259765625, 0.1511993408203125, 0.172607421875, 0.1940155029296875, 0.215423583984375, 0.2368316650390625, 0.25823974609375, 0.2796478271484375, 0.301055908203125, 0.3224639892578125, 0.3438720703125, 0.3652801513671875, 0.386688232421875, 0.4080963134765625, 0.42950439453125, 0.4509124755859375, 0.472320556640625, 0.4937286376953125, 0.51513671875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 1.0, 7.0, 14.0, 32.0, 91.0, 190.0, 228.0, 208.0, 120.0, 65.0, 22.0, 13.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.120685577392578, -5.9781622886657715, -5.835639476776123, -5.693116188049316, -5.55059289932251, -5.408069610595703, -5.265546798706055, -5.123023509979248, -4.980500221252441, -4.837976932525635, -4.695454120635986, -4.55293083190918, -4.410407543182373, -4.267884254455566, -4.125361442565918, -3.9828381538391113, -3.840315341949463, -3.6977922916412354, -3.5552690029144287, -3.412745952606201, -3.2702226638793945, -3.127699613571167, -2.9851765632629395, -2.842653274536133, -2.7001302242279053, -2.5576071739196777, -2.415083885192871, -2.2725608348846436, -2.130037784576416, -1.9875144958496094, -1.8449914455413818, -1.7024682760238647, -1.5599455833435059, -1.4174224138259888, -1.2748992443084717, -1.1323761940002441, -0.989853024482727, -0.84732985496521, -0.7048067450523376, -0.5622836351394653, -0.41976046562194824, -0.27723732590675354, -0.13471418619155884, 0.007808953523635864, 0.15033209323883057, 0.29285526275634766, 0.43537837266921997, 0.5779014825820923, 0.7204246520996094, 0.8629478216171265, 1.0054709911346436, 1.147994041442871, 1.2905172109603882, 1.4330403804779053, 1.5755634307861328, 1.71808660030365, 1.860609769821167, 2.0031328201293945, 2.145656108856201, 2.2881791591644287, 2.4307022094726562, 2.573225498199463, 2.7157485485076904, 2.858271598815918, 3.0007948875427246]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 9.0, 13.0, 13.0, 13.0, 29.0, 38.0, 20.0, 43.0, 32.0, 42.0, 57.0, 66.0, 52.0, 65.0, 69.0, 73.0, 48.0, 51.0, 51.0, 45.0, 36.0, 37.0, 19.0, 25.0, 11.0, 12.0, 9.0, 8.0, 6.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6215457916259766, -2.553701400756836, -2.485856771469116, -2.4180123805999756, -2.350167989730835, -2.2823235988616943, -2.2144789695739746, -2.146634578704834, -2.0787901878356934, -2.0109457969665527, -1.9431012868881226, -1.8752567768096924, -1.8074123859405518, -1.7395678758621216, -1.6717233657836914, -1.6038789749145508, -1.5360344648361206, -1.4681899547576904, -1.4003455638885498, -1.3325010538101196, -1.264656662940979, -1.1968121528625488, -1.1289677619934082, -1.061123251914978, -0.9932788014411926, -0.9254343509674072, -0.8575899004936218, -0.7897454500198364, -0.7219009399414062, -0.6540565490722656, -0.5862120389938354, -0.51836758852005, -0.4505232572555542, -0.3826788067817688, -0.3148343563079834, -0.2469898760318756, -0.1791454255580902, -0.11130097508430481, -0.04345649480819702, 0.02438795566558838, 0.09223240613937378, 0.16007685661315918, 0.22792132198810577, 0.29576578736305237, 0.36361023783683777, 0.43145468831062317, 0.49929916858673096, 0.5671436190605164, 0.6349880695343018, 0.7028325200080872, 0.7706769704818726, 0.8385214805603027, 0.9063658714294434, 0.9742103815078735, 1.0420548915863037, 1.1098992824554443, 1.177743673324585, 1.2455881834030151, 1.3134325742721558, 1.381277084350586, 1.4491214752197266, 1.5169659852981567, 1.584810495376587, 1.6526548862457275, 1.7204993963241577]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 7.0, 7.0, 15.0, 20.0, 22.0, 21.0, 41.0, 74.0, 104.0, 210.0, 385.0, 778.0, 1570.0, 4572.0, 17048.0, 88830.0, 462744.0, 384493.0, 67142.0, 13664.0, 3799.0, 1483.0, 698.0, 326.0, 188.0, 113.0, 72.0, 33.0, 26.0, 22.0, 14.0, 14.0, 12.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6689453125, -1.6149749755859375, -1.561004638671875, -1.5070343017578125, -1.45306396484375, -1.3990936279296875, -1.345123291015625, -1.2911529541015625, -1.2371826171875, -1.1832122802734375, -1.129241943359375, -1.0752716064453125, -1.02130126953125, -0.9673309326171875, -0.913360595703125, -0.8593902587890625, -0.805419921875, -0.7514495849609375, -0.697479248046875, -0.6435089111328125, -0.58953857421875, -0.5355682373046875, -0.481597900390625, -0.4276275634765625, -0.3736572265625, -0.3196868896484375, -0.265716552734375, -0.2117462158203125, -0.15777587890625, -0.1038055419921875, -0.049835205078125, 0.0041351318359375, 0.05810546875, 0.1120758056640625, 0.166046142578125, 0.2200164794921875, 0.27398681640625, 0.3279571533203125, 0.381927490234375, 0.4358978271484375, 0.4898681640625, 0.5438385009765625, 0.597808837890625, 0.6517791748046875, 0.70574951171875, 0.7597198486328125, 0.813690185546875, 0.8676605224609375, 0.921630859375, 0.9756011962890625, 1.029571533203125, 1.0835418701171875, 1.13751220703125, 1.1914825439453125, 1.245452880859375, 1.2994232177734375, 1.3533935546875, 1.4073638916015625, 1.461334228515625, 1.5153045654296875, 1.56927490234375, 1.6232452392578125, 1.677215576171875, 1.7311859130859375, 1.78515625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 10.0, 17.0, 12.0, 21.0, 32.0, 37.0, 46.0, 59.0, 63.0, 58.0, 74.0, 81.0, 81.0, 70.0, 75.0, 57.0, 48.0, 42.0, 27.0, 27.0, 24.0, 16.0, 7.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.345947265625, -0.3338470458984375, -0.321746826171875, -0.3096466064453125, -0.29754638671875, -0.2854461669921875, -0.273345947265625, -0.2612457275390625, -0.2491455078125, -0.2370452880859375, -0.224945068359375, -0.2128448486328125, -0.20074462890625, -0.1886444091796875, -0.176544189453125, -0.1644439697265625, -0.15234375, -0.1402435302734375, -0.128143310546875, -0.1160430908203125, -0.10394287109375, -0.0918426513671875, -0.079742431640625, -0.0676422119140625, -0.0555419921875, -0.0434417724609375, -0.031341552734375, -0.0192413330078125, -0.00714111328125, 0.0049591064453125, 0.017059326171875, 0.0291595458984375, 0.041259765625, 0.0533599853515625, 0.065460205078125, 0.0775604248046875, 0.08966064453125, 0.1017608642578125, 0.113861083984375, 0.1259613037109375, 0.1380615234375, 0.1501617431640625, 0.162261962890625, 0.1743621826171875, 0.18646240234375, 0.1985626220703125, 0.210662841796875, 0.2227630615234375, 0.23486328125, 0.2469635009765625, 0.259063720703125, 0.2711639404296875, 0.28326416015625, 0.2953643798828125, 0.307464599609375, 0.3195648193359375, 0.3316650390625, 0.3437652587890625, 0.355865478515625, 0.3679656982421875, 0.38006591796875, 0.3921661376953125, 0.404266357421875, 0.4163665771484375, 0.428466796875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 12.0, 9.0, 13.0, 17.0, 32.0, 31.0, 41.0, 50.0, 105.0, 135.0, 169.0, 257.0, 401.0, 636.0, 975.0, 1677.0, 3009.0, 5540.0, 10717.0, 22598.0, 50178.0, 116776.0, 247039.0, 293695.0, 161881.0, 70742.0, 30745.0, 14620.0, 7156.0, 3845.0, 2060.0, 1212.0, 723.0, 487.0, 286.0, 189.0, 137.0, 104.0, 75.0, 43.0, 36.0, 27.0, 16.0, 14.0, 8.0, 10.0, 4.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.7080078125, -0.6866836547851562, -0.6653594970703125, -0.6440353393554688, -0.622711181640625, -0.6013870239257812, -0.5800628662109375, -0.5587387084960938, -0.53741455078125, -0.5160903930664062, -0.4947662353515625, -0.47344207763671875, -0.452117919921875, -0.43079376220703125, -0.4094696044921875, -0.38814544677734375, -0.3668212890625, -0.34549713134765625, -0.3241729736328125, -0.30284881591796875, -0.281524658203125, -0.26020050048828125, -0.2388763427734375, -0.21755218505859375, -0.19622802734375, -0.17490386962890625, -0.1535797119140625, -0.13225555419921875, -0.110931396484375, -0.08960723876953125, -0.0682830810546875, -0.04695892333984375, -0.025634765625, -0.00431060791015625, 0.0170135498046875, 0.03833770751953125, 0.059661865234375, 0.08098602294921875, 0.1023101806640625, 0.12363433837890625, 0.14495849609375, 0.16628265380859375, 0.1876068115234375, 0.20893096923828125, 0.230255126953125, 0.25157928466796875, 0.2729034423828125, 0.29422760009765625, 0.3155517578125, 0.33687591552734375, 0.3582000732421875, 0.37952423095703125, 0.400848388671875, 0.42217254638671875, 0.4434967041015625, 0.46482086181640625, 0.48614501953125, 0.5074691772460938, 0.5287933349609375, 0.5501174926757812, 0.571441650390625, 0.5927658081054688, 0.6140899658203125, 0.6354141235351562, 0.65673828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 5.0, 6.0, 11.0, 8.0, 11.0, 23.0, 15.0, 21.0, 27.0, 27.0, 25.0, 23.0, 35.0, 33.0, 40.0, 36.0, 45.0, 45.0, 36.0, 42.0, 48.0, 35.0, 41.0, 35.0, 40.0, 27.0, 26.0, 28.0, 39.0, 24.0, 27.0, 17.0, 13.0, 12.0, 11.0, 9.0, 10.0, 6.0, 9.0, 6.0, 4.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.9853515625, -0.9544219970703125, -0.923492431640625, -0.8925628662109375, -0.86163330078125, -0.8307037353515625, -0.799774169921875, -0.7688446044921875, -0.7379150390625, -0.7069854736328125, -0.676055908203125, -0.6451263427734375, -0.61419677734375, -0.5832672119140625, -0.552337646484375, -0.5214080810546875, -0.490478515625, -0.4595489501953125, -0.428619384765625, -0.3976898193359375, -0.36676025390625, -0.3358306884765625, -0.304901123046875, -0.2739715576171875, -0.2430419921875, -0.2121124267578125, -0.181182861328125, -0.1502532958984375, -0.11932373046875, -0.0883941650390625, -0.057464599609375, -0.0265350341796875, 0.00439453125, 0.0353240966796875, 0.066253662109375, 0.0971832275390625, 0.12811279296875, 0.1590423583984375, 0.189971923828125, 0.2209014892578125, 0.2518310546875, 0.2827606201171875, 0.313690185546875, 0.3446197509765625, 0.37554931640625, 0.4064788818359375, 0.437408447265625, 0.4683380126953125, 0.499267578125, 0.5301971435546875, 0.561126708984375, 0.5920562744140625, 0.62298583984375, 0.6539154052734375, 0.684844970703125, 0.7157745361328125, 0.7467041015625, 0.7776336669921875, 0.808563232421875, 0.8394927978515625, 0.87042236328125, 0.9013519287109375, 0.932281494140625, 0.9632110595703125, 0.994140625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 12.0, 5.0, 14.0, 23.0, 37.0, 55.0, 95.0, 147.0, 298.0, 629.0, 1765.0, 6916.0, 61666.0, 660382.0, 291153.0, 19730.0, 3509.0, 1149.0, 448.0, 226.0, 114.0, 55.0, 30.0, 33.0, 9.0, 15.0, 12.0, 5.0, 2.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52197265625, -0.499053955078125, -0.47613525390625, -0.453216552734375, -0.4302978515625, -0.407379150390625, -0.38446044921875, -0.361541748046875, -0.338623046875, -0.315704345703125, -0.29278564453125, -0.269866943359375, -0.2469482421875, -0.224029541015625, -0.20111083984375, -0.178192138671875, -0.1552734375, -0.132354736328125, -0.10943603515625, -0.086517333984375, -0.0635986328125, -0.040679931640625, -0.01776123046875, 0.005157470703125, 0.028076171875, 0.050994873046875, 0.07391357421875, 0.096832275390625, 0.1197509765625, 0.142669677734375, 0.16558837890625, 0.188507080078125, 0.21142578125, 0.234344482421875, 0.25726318359375, 0.280181884765625, 0.3031005859375, 0.326019287109375, 0.34893798828125, 0.371856689453125, 0.394775390625, 0.417694091796875, 0.44061279296875, 0.463531494140625, 0.4864501953125, 0.509368896484375, 0.53228759765625, 0.555206298828125, 0.578125, 0.601043701171875, 0.62396240234375, 0.646881103515625, 0.6697998046875, 0.692718505859375, 0.71563720703125, 0.738555908203125, 0.761474609375, 0.784393310546875, 0.80731201171875, 0.830230712890625, 0.8531494140625, 0.876068115234375, 0.89898681640625, 0.921905517578125, 0.94482421875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 6.0, 5.0, 5.0, 13.0, 21.0, 31.0, 38.0, 55.0, 78.0, 98.0, 102.0, 103.0, 110.0, 93.0, 80.0, 58.0, 46.0, 20.0, 17.0, 12.0, 2.0, 7.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.175041198730469e-05, -5.8736652135849e-05, -5.572289228439331e-05, -5.270913243293762e-05, -4.9695372581481934e-05, -4.6681612730026245e-05, -4.366785287857056e-05, -4.065409302711487e-05, -3.764033317565918e-05, -3.462657332420349e-05, -3.16128134727478e-05, -2.8599053621292114e-05, -2.5585293769836426e-05, -2.2571533918380737e-05, -1.955777406692505e-05, -1.654401421546936e-05, -1.3530254364013672e-05, -1.0516494512557983e-05, -7.502734661102295e-06, -4.4889748096466064e-06, -1.475214958190918e-06, 1.5385448932647705e-06, 4.552304744720459e-06, 7.5660645961761475e-06, 1.0579824447631836e-05, 1.3593584299087524e-05, 1.6607344150543213e-05, 1.96211040019989e-05, 2.263486385345459e-05, 2.564862370491028e-05, 2.8662383556365967e-05, 3.1676143407821655e-05, 3.4689903259277344e-05, 3.770366311073303e-05, 4.071742296218872e-05, 4.373118281364441e-05, 4.67449426651001e-05, 4.9758702516555786e-05, 5.2772462368011475e-05, 5.578622221946716e-05, 5.879998207092285e-05, 6.181374192237854e-05, 6.482750177383423e-05, 6.784126162528992e-05, 7.08550214767456e-05, 7.38687813282013e-05, 7.688254117965698e-05, 7.989630103111267e-05, 8.291006088256836e-05, 8.592382073402405e-05, 8.893758058547974e-05, 9.195134043693542e-05, 9.496510028839111e-05, 9.79788601398468e-05, 0.00010099261999130249, 0.00010400637984275818, 0.00010702013969421387, 0.00011003389954566956, 0.00011304765939712524, 0.00011606141924858093, 0.00011907517910003662, 0.0001220889389514923, 0.000125102698802948, 0.0001281164586544037, 0.00013113021850585938]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 13.0, 5.0, 12.0, 35.0, 57.0, 80.0, 155.0, 369.0, 711.0, 1672.0, 5483.0, 28807.0, 234067.0, 607737.0, 143986.0, 18713.0, 4120.0, 1356.0, 570.0, 275.0, 139.0, 76.0, 36.0, 27.0, 16.0, 7.0, 2.0, 4.0, 4.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.66064453125, -0.6434326171875, -0.626220703125, -0.6090087890625, -0.591796875, -0.5745849609375, -0.557373046875, -0.5401611328125, -0.52294921875, -0.5057373046875, -0.488525390625, -0.4713134765625, -0.4541015625, -0.4368896484375, -0.419677734375, -0.4024658203125, -0.38525390625, -0.3680419921875, -0.350830078125, -0.3336181640625, -0.31640625, -0.2991943359375, -0.281982421875, -0.2647705078125, -0.24755859375, -0.2303466796875, -0.213134765625, -0.1959228515625, -0.1787109375, -0.1614990234375, -0.144287109375, -0.1270751953125, -0.10986328125, -0.0926513671875, -0.075439453125, -0.0582275390625, -0.041015625, -0.0238037109375, -0.006591796875, 0.0106201171875, 0.02783203125, 0.0450439453125, 0.062255859375, 0.0794677734375, 0.0966796875, 0.1138916015625, 0.131103515625, 0.1483154296875, 0.16552734375, 0.1827392578125, 0.199951171875, 0.2171630859375, 0.234375, 0.2515869140625, 0.268798828125, 0.2860107421875, 0.30322265625, 0.3204345703125, 0.337646484375, 0.3548583984375, 0.3720703125, 0.3892822265625, 0.406494140625, 0.4237060546875, 0.44091796875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 8.0, 8.0, 6.0, 14.0, 20.0, 29.0, 39.0, 38.0, 45.0, 56.0, 67.0, 70.0, 95.0, 87.0, 73.0, 63.0, 60.0, 68.0, 40.0, 25.0, 28.0, 14.0, 11.0, 11.0, 6.0, 6.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.453369140625, -0.4397125244140625, -0.426055908203125, -0.4123992919921875, -0.39874267578125, -0.3850860595703125, -0.371429443359375, -0.3577728271484375, -0.3441162109375, -0.3304595947265625, -0.316802978515625, -0.3031463623046875, -0.28948974609375, -0.2758331298828125, -0.262176513671875, -0.2485198974609375, -0.23486328125, -0.2212066650390625, -0.207550048828125, -0.1938934326171875, -0.18023681640625, -0.1665802001953125, -0.152923583984375, -0.1392669677734375, -0.1256103515625, -0.1119537353515625, -0.098297119140625, -0.0846405029296875, -0.07098388671875, -0.0573272705078125, -0.043670654296875, -0.0300140380859375, -0.016357421875, -0.0027008056640625, 0.010955810546875, 0.0246124267578125, 0.03826904296875, 0.0519256591796875, 0.065582275390625, 0.0792388916015625, 0.0928955078125, 0.1065521240234375, 0.120208740234375, 0.1338653564453125, 0.14752197265625, 0.1611785888671875, 0.174835205078125, 0.1884918212890625, 0.2021484375, 0.2158050537109375, 0.229461669921875, 0.2431182861328125, 0.25677490234375, 0.2704315185546875, 0.284088134765625, 0.2977447509765625, 0.3114013671875, 0.3250579833984375, 0.338714599609375, 0.3523712158203125, 0.36602783203125, 0.3796844482421875, 0.393341064453125, 0.4069976806640625, 0.420654296875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 10.0, 19.0, 70.0, 307.0, 423.0, 135.0, 27.0, 12.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.30960464477539, -15.541488647460938, -14.773372650146484, -14.005256652832031, -13.237139701843262, -12.469023704528809, -11.700907707214355, -10.932790756225586, -10.164674758911133, -9.39655876159668, -8.628442764282227, -7.860326290130615, -7.092209815979004, -6.324093818664551, -5.555977821350098, -4.787861347198486, -4.019745826721191, -3.251629590988159, -2.483513355255127, -1.7153973579406738, -0.9472811222076416, -0.17916488647460938, 0.5889511108398438, 1.357067584991455, 2.125183582305908, 2.8932998180389404, 3.6614160537719727, 4.429532051086426, 5.197648048400879, 5.96576452255249, 6.733880519866943, 7.501996994018555, 8.270112991333008, 9.038228988647461, 9.806344985961914, 10.574460983276367, 11.342577934265137, 12.11069393157959, 12.878809928894043, 13.646926879882812, 14.415042877197266, 15.183158874511719, 15.951274871826172, 16.719390869140625, 17.487506866455078, 18.25562286376953, 19.023738861083984, 19.79185676574707, 20.55997085571289, 21.328086853027344, 22.096202850341797, 22.86431884765625, 23.632434844970703, 24.400550842285156, 25.16866683959961, 25.936784744262695, 26.70490074157715, 27.4730167388916, 28.241132736206055, 29.009248733520508, 29.77736473083496, 30.545482635498047, 31.3135986328125, 32.08171463012695, 32.849830627441406]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 0.0, 2.0, 7.0, 4.0, 8.0, 9.0, 13.0, 10.0, 15.0, 13.0, 26.0, 33.0, 23.0, 30.0, 45.0, 39.0, 43.0, 36.0, 46.0, 49.0, 60.0, 47.0, 48.0, 44.0, 45.0, 41.0, 50.0, 31.0, 26.0, 19.0, 31.0, 24.0, 16.0, 13.0, 13.0, 12.0, 9.0, 8.0, 3.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.164831161499023, -7.949597358703613, -7.734363555908203, -7.519130229949951, -7.303896427154541, -7.088662624359131, -6.873429298400879, -6.658195495605469, -6.442961692810059, -6.227727890014648, -6.012494087219238, -5.797260761260986, -5.582026958465576, -5.366793155670166, -5.151559829711914, -4.936326026916504, -4.721092224121094, -4.505858421325684, -4.290624618530273, -4.0753912925720215, -3.8601574897766113, -3.644923686981201, -3.42969012260437, -3.214456558227539, -2.999222755432129, -2.7839889526367188, -2.5687553882598877, -2.3535218238830566, -2.1382880210876465, -1.9230543375015259, -1.7078206539154053, -1.4925869703292847, -1.277353286743164, -1.0621196031570435, -0.8468859195709229, -0.6316522359848022, -0.41641855239868164, -0.20118486881256104, 0.01404881477355957, 0.22928249835968018, 0.4445161819458008, 0.6597498655319214, 0.874983549118042, 1.0902172327041626, 1.3054509162902832, 1.5206845998764038, 1.7359182834625244, 1.951151967048645, 2.1663856506347656, 2.381619453430176, 2.596853017807007, 2.812086582183838, 3.027320384979248, 3.242554187774658, 3.4577877521514893, 3.6730213165283203, 3.8882551193237305, 4.103488922119141, 4.318722724914551, 4.533956050872803, 4.749189853668213, 4.964423656463623, 5.179656982421875, 5.394890785217285, 5.610124588012695]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 5.0, 8.0, 13.0, 22.0, 21.0, 38.0, 41.0, 66.0, 81.0, 147.0, 232.0, 416.0, 700.0, 1461.0, 3660.0, 11372.0, 55104.0, 1077043.0, 2953568.0, 69202.0, 13358.0, 4154.0, 1758.0, 796.0, 408.0, 240.0, 119.0, 77.0, 62.0, 35.0, 18.0, 16.0, 7.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5830078125, -1.53363037109375, -1.4842529296875, -1.43487548828125, -1.385498046875, -1.33612060546875, -1.2867431640625, -1.23736572265625, -1.18798828125, -1.13861083984375, -1.0892333984375, -1.03985595703125, -0.990478515625, -0.94110107421875, -0.8917236328125, -0.84234619140625, -0.79296875, -0.74359130859375, -0.6942138671875, -0.64483642578125, -0.595458984375, -0.54608154296875, -0.4967041015625, -0.44732666015625, -0.39794921875, -0.34857177734375, -0.2991943359375, -0.24981689453125, -0.200439453125, -0.15106201171875, -0.1016845703125, -0.05230712890625, -0.0029296875, 0.04644775390625, 0.0958251953125, 0.14520263671875, 0.194580078125, 0.24395751953125, 0.2933349609375, 0.34271240234375, 0.39208984375, 0.44146728515625, 0.4908447265625, 0.54022216796875, 0.589599609375, 0.63897705078125, 0.6883544921875, 0.73773193359375, 0.787109375, 0.83648681640625, 0.8858642578125, 0.93524169921875, 0.984619140625, 1.03399658203125, 1.0833740234375, 1.13275146484375, 1.18212890625, 1.23150634765625, 1.2808837890625, 1.33026123046875, 1.379638671875, 1.42901611328125, 1.4783935546875, 1.52777099609375, 1.5771484375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 7.0, 2.0, 5.0, 9.0, 9.0, 15.0, 17.0, 16.0, 27.0, 27.0, 35.0, 52.0, 62.0, 59.0, 49.0, 61.0, 66.0, 65.0, 59.0, 63.0, 55.0, 58.0, 38.0, 35.0, 30.0, 25.0, 15.0, 17.0, 12.0, 6.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.411376953125, -0.39914703369140625, -0.3869171142578125, -0.37468719482421875, -0.362457275390625, -0.35022735595703125, -0.3379974365234375, -0.32576751708984375, -0.31353759765625, -0.30130767822265625, -0.2890777587890625, -0.27684783935546875, -0.264617919921875, -0.25238800048828125, -0.2401580810546875, -0.22792816162109375, -0.2156982421875, -0.20346832275390625, -0.1912384033203125, -0.17900848388671875, -0.166778564453125, -0.15454864501953125, -0.1423187255859375, -0.13008880615234375, -0.11785888671875, -0.10562896728515625, -0.0933990478515625, -0.08116912841796875, -0.068939208984375, -0.05670928955078125, -0.0444793701171875, -0.03224945068359375, -0.02001953125, -0.00778961181640625, 0.0044403076171875, 0.01667022705078125, 0.028900146484375, 0.04113006591796875, 0.0533599853515625, 0.06558990478515625, 0.07781982421875, 0.09004974365234375, 0.1022796630859375, 0.11450958251953125, 0.126739501953125, 0.13896942138671875, 0.1511993408203125, 0.16342926025390625, 0.1756591796875, 0.18788909912109375, 0.2001190185546875, 0.21234893798828125, 0.224578857421875, 0.23680877685546875, 0.2490386962890625, 0.26126861572265625, 0.27349853515625, 0.28572845458984375, 0.2979583740234375, 0.31018829345703125, 0.322418212890625, 0.33464813232421875, 0.3468780517578125, 0.35910797119140625, 0.371337890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 11.0, 13.0, 13.0, 33.0, 44.0, 80.0, 99.0, 155.0, 261.0, 458.0, 792.0, 1735.0, 3768.0, 9641.0, 31142.0, 153158.0, 3126032.0, 760150.0, 76063.0, 18916.0, 6443.0, 2556.0, 1170.0, 657.0, 351.0, 213.0, 120.0, 69.0, 50.0, 28.0, 22.0, 18.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2421875, -1.2054443359375, -1.168701171875, -1.1319580078125, -1.09521484375, -1.0584716796875, -1.021728515625, -0.9849853515625, -0.9482421875, -0.9114990234375, -0.874755859375, -0.8380126953125, -0.80126953125, -0.7645263671875, -0.727783203125, -0.6910400390625, -0.654296875, -0.6175537109375, -0.580810546875, -0.5440673828125, -0.50732421875, -0.4705810546875, -0.433837890625, -0.3970947265625, -0.3603515625, -0.3236083984375, -0.286865234375, -0.2501220703125, -0.21337890625, -0.1766357421875, -0.139892578125, -0.1031494140625, -0.06640625, -0.0296630859375, 0.007080078125, 0.0438232421875, 0.08056640625, 0.1173095703125, 0.154052734375, 0.1907958984375, 0.2275390625, 0.2642822265625, 0.301025390625, 0.3377685546875, 0.37451171875, 0.4112548828125, 0.447998046875, 0.4847412109375, 0.521484375, 0.5582275390625, 0.594970703125, 0.6317138671875, 0.66845703125, 0.7052001953125, 0.741943359375, 0.7786865234375, 0.8154296875, 0.8521728515625, 0.888916015625, 0.9256591796875, 0.96240234375, 0.9991455078125, 1.035888671875, 1.0726318359375, 1.109375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 3.0, 2.0, 5.0, 4.0, 6.0, 8.0, 11.0, 19.0, 32.0, 38.0, 49.0, 101.0, 161.0, 298.0, 941.0, 1471.0, 436.0, 194.0, 104.0, 58.0, 36.0, 33.0, 14.0, 18.0, 9.0, 6.0, 7.0, 1.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.76708984375, -0.7469940185546875, -0.726898193359375, -0.7068023681640625, -0.68670654296875, -0.6666107177734375, -0.646514892578125, -0.6264190673828125, -0.6063232421875, -0.5862274169921875, -0.566131591796875, -0.5460357666015625, -0.52593994140625, -0.5058441162109375, -0.485748291015625, -0.4656524658203125, -0.445556640625, -0.4254608154296875, -0.405364990234375, -0.3852691650390625, -0.36517333984375, -0.3450775146484375, -0.324981689453125, -0.3048858642578125, -0.2847900390625, -0.2646942138671875, -0.244598388671875, -0.2245025634765625, -0.20440673828125, -0.1843109130859375, -0.164215087890625, -0.1441192626953125, -0.1240234375, -0.1039276123046875, -0.083831787109375, -0.0637359619140625, -0.04364013671875, -0.0235443115234375, -0.003448486328125, 0.0166473388671875, 0.0367431640625, 0.0568389892578125, 0.076934814453125, 0.0970306396484375, 0.11712646484375, 0.1372222900390625, 0.157318115234375, 0.1774139404296875, 0.197509765625, 0.2176055908203125, 0.237701416015625, 0.2577972412109375, 0.27789306640625, 0.2979888916015625, 0.318084716796875, 0.3381805419921875, 0.3582763671875, 0.3783721923828125, 0.398468017578125, 0.4185638427734375, 0.43865966796875, 0.4587554931640625, 0.478851318359375, 0.4989471435546875, 0.51904296875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 0.0, 5.0, 9.0, 9.0, 34.0, 63.0, 160.0, 286.0, 243.0, 135.0, 44.0, 10.0, 8.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.038534164428711, -7.837335586547852, -7.636137008666992, -7.434938430786133, -7.233740329742432, -7.032541751861572, -6.831343173980713, -6.6301445960998535, -6.428946018218994, -6.227747440338135, -6.026548862457275, -5.825350761413574, -5.624152183532715, -5.4229536056518555, -5.221755027770996, -5.020556449890137, -4.819357872009277, -4.618159294128418, -4.416960716247559, -4.215762138366699, -4.014564037322998, -3.8133654594421387, -3.6121668815612793, -3.41096830368042, -3.2097702026367188, -3.0085716247558594, -2.807373285293579, -2.6061747074127197, -2.4049761295318604, -2.20377779006958, -2.0025792121887207, -1.8013806343078613, -1.600182056427002, -1.3989835977554321, -1.1977850198745728, -0.9965865612030029, -0.7953880429267883, -0.5941895246505737, -0.3929910659790039, -0.19179248809814453, 0.009405970573425293, 0.2106044739484787, 0.4118029773235321, 0.6130014657974243, 0.8141999840736389, 1.0153985023498535, 1.2165969610214233, 1.4177955389022827, 1.6189939975738525, 1.8201924562454224, 2.021390914916992, 2.2225894927978516, 2.423788070678711, 2.6249866485595703, 2.8261849880218506, 3.02738356590271, 3.2285819053649902, 3.4297804832458496, 3.63097882270813, 3.8321774005889893, 4.0333757400512695, 4.234574317932129, 4.435772895812988, 4.636971473693848, 4.838170051574707]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 9.0, 3.0, 4.0, 6.0, 9.0, 17.0, 22.0, 23.0, 27.0, 42.0, 54.0, 45.0, 65.0, 60.0, 74.0, 63.0, 81.0, 53.0, 55.0, 43.0, 55.0, 43.0, 36.0, 23.0, 20.0, 21.0, 16.0, 11.0, 5.0, 6.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7592930793762207, -2.672353744506836, -2.585414409637451, -2.4984750747680664, -2.4115357398986816, -2.324596405029297, -2.237657070159912, -2.1507177352905273, -2.0637784004211426, -1.9768390655517578, -1.889899730682373, -1.8029603958129883, -1.7160210609436035, -1.6290817260742188, -1.5421425104141235, -1.4552031755447388, -1.3682639598846436, -1.2813246250152588, -1.194385290145874, -1.1074459552764893, -1.0205066204071045, -0.9335673451423645, -0.8466280698776245, -0.7596887350082397, -0.672749400138855, -0.5858100652694702, -0.49887076020240784, -0.41193145513534546, -0.3249921202659607, -0.23805278539657593, -0.15111351013183594, -0.06417417526245117, 0.022765398025512695, 0.10970471799373627, 0.19664403796195984, 0.2835833430290222, 0.370522677898407, 0.45746201276779175, 0.5444012880325317, 0.6313406229019165, 0.7182799577713013, 0.805219292640686, 0.8921586275100708, 0.9790979027748108, 1.0660371780395508, 1.1529765129089355, 1.2399158477783203, 1.326855182647705, 1.4137945175170898, 1.5007338523864746, 1.5876731872558594, 1.6746125221252441, 1.761551856994629, 1.8484911918640137, 1.9354304075241089, 2.022369861602783, 2.109309196472168, 2.1962485313415527, 2.2831878662109375, 2.3701272010803223, 2.457066535949707, 2.544005870819092, 2.6309452056884766, 2.7178845405578613, 2.804823637008667]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 12.0, 19.0, 32.0, 37.0, 69.0, 114.0, 234.0, 420.0, 945.0, 2294.0, 5813.0, 19043.0, 90385.0, 515071.0, 337941.0, 55228.0, 13287.0, 4324.0, 1715.0, 708.0, 367.0, 185.0, 101.0, 66.0, 48.0, 31.0, 18.0, 15.0, 5.0, 8.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9599609375, -1.902069091796875, -1.84417724609375, -1.786285400390625, -1.7283935546875, -1.670501708984375, -1.61260986328125, -1.554718017578125, -1.496826171875, -1.438934326171875, -1.38104248046875, -1.323150634765625, -1.2652587890625, -1.207366943359375, -1.14947509765625, -1.091583251953125, -1.03369140625, -0.975799560546875, -0.91790771484375, -0.860015869140625, -0.8021240234375, -0.744232177734375, -0.68634033203125, -0.628448486328125, -0.570556640625, -0.512664794921875, -0.45477294921875, -0.396881103515625, -0.3389892578125, -0.281097412109375, -0.22320556640625, -0.165313720703125, -0.107421875, -0.049530029296875, 0.00836181640625, 0.066253662109375, 0.1241455078125, 0.182037353515625, 0.23992919921875, 0.297821044921875, 0.355712890625, 0.413604736328125, 0.47149658203125, 0.529388427734375, 0.5872802734375, 0.645172119140625, 0.70306396484375, 0.760955810546875, 0.81884765625, 0.876739501953125, 0.93463134765625, 0.992523193359375, 1.0504150390625, 1.108306884765625, 1.16619873046875, 1.224090576171875, 1.281982421875, 1.339874267578125, 1.39776611328125, 1.455657958984375, 1.5135498046875, 1.571441650390625, 1.62933349609375, 1.687225341796875, 1.7451171875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 8.0, 7.0, 11.0, 13.0, 11.0, 14.0, 21.0, 31.0, 27.0, 32.0, 45.0, 39.0, 48.0, 52.0, 66.0, 52.0, 62.0, 56.0, 60.0, 46.0, 55.0, 55.0, 39.0, 29.0, 25.0, 19.0, 19.0, 14.0, 8.0, 8.0, 9.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.40234375, -0.3911857604980469, -0.38002777099609375, -0.3688697814941406, -0.3577117919921875, -0.3465538024902344, -0.33539581298828125, -0.3242378234863281, -0.313079833984375, -0.3019218444824219, -0.29076385498046875, -0.2796058654785156, -0.2684478759765625, -0.2572898864746094, -0.24613189697265625, -0.23497390747070312, -0.22381591796875, -0.21265792846679688, -0.20149993896484375, -0.19034194946289062, -0.1791839599609375, -0.16802597045898438, -0.15686798095703125, -0.14570999145507812, -0.134552001953125, -0.12339401245117188, -0.11223602294921875, -0.10107803344726562, -0.0899200439453125, -0.07876205444335938, -0.06760406494140625, -0.056446075439453125, -0.0452880859375, -0.034130096435546875, -0.02297210693359375, -0.011814117431640625, -0.0006561279296875, 0.010501861572265625, 0.02165985107421875, 0.032817840576171875, 0.043975830078125, 0.055133819580078125, 0.06629180908203125, 0.07744979858398438, 0.0886077880859375, 0.09976577758789062, 0.11092376708984375, 0.12208175659179688, 0.13323974609375, 0.14439773559570312, 0.15555572509765625, 0.16671371459960938, 0.1778717041015625, 0.18902969360351562, 0.20018768310546875, 0.21134567260742188, 0.222503662109375, 0.23366165161132812, 0.24481964111328125, 0.2559776306152344, 0.2671356201171875, 0.2782936096191406, 0.28945159912109375, 0.3006095886230469, 0.311767578125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 8.0, 8.0, 14.0, 25.0, 27.0, 33.0, 43.0, 58.0, 106.0, 185.0, 291.0, 497.0, 906.0, 1824.0, 3749.0, 8339.0, 21755.0, 65783.0, 246014.0, 468857.0, 157479.0, 44107.0, 15797.0, 6452.0, 2810.0, 1467.0, 788.0, 436.0, 246.0, 136.0, 114.0, 63.0, 39.0, 28.0, 15.0, 15.0, 7.0, 8.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1708984375, -1.1346893310546875, -1.098480224609375, -1.0622711181640625, -1.02606201171875, -0.9898529052734375, -0.953643798828125, -0.9174346923828125, -0.8812255859375, -0.8450164794921875, -0.808807373046875, -0.7725982666015625, -0.73638916015625, -0.7001800537109375, -0.663970947265625, -0.6277618408203125, -0.591552734375, -0.5553436279296875, -0.519134521484375, -0.4829254150390625, -0.44671630859375, -0.4105072021484375, -0.374298095703125, -0.3380889892578125, -0.3018798828125, -0.2656707763671875, -0.229461669921875, -0.1932525634765625, -0.15704345703125, -0.1208343505859375, -0.084625244140625, -0.0484161376953125, -0.01220703125, 0.0240020751953125, 0.060211181640625, 0.0964202880859375, 0.13262939453125, 0.1688385009765625, 0.205047607421875, 0.2412567138671875, 0.2774658203125, 0.3136749267578125, 0.349884033203125, 0.3860931396484375, 0.42230224609375, 0.4585113525390625, 0.494720458984375, 0.5309295654296875, 0.567138671875, 0.6033477783203125, 0.639556884765625, 0.6757659912109375, 0.71197509765625, 0.7481842041015625, 0.784393310546875, 0.8206024169921875, 0.8568115234375, 0.8930206298828125, 0.929229736328125, 0.9654388427734375, 1.00164794921875, 1.0378570556640625, 1.074066162109375, 1.1102752685546875, 1.146484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 3.0, 11.0, 11.0, 6.0, 12.0, 14.0, 21.0, 25.0, 16.0, 26.0, 22.0, 24.0, 23.0, 27.0, 32.0, 40.0, 35.0, 51.0, 40.0, 47.0, 46.0, 41.0, 38.0, 51.0, 44.0, 40.0, 30.0, 36.0, 29.0, 26.0, 17.0, 18.0, 19.0, 18.0, 13.0, 10.0, 11.0, 3.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.072265625, -1.034149169921875, -0.99603271484375, -0.957916259765625, -0.9197998046875, -0.881683349609375, -0.84356689453125, -0.805450439453125, -0.767333984375, -0.729217529296875, -0.69110107421875, -0.652984619140625, -0.6148681640625, -0.576751708984375, -0.53863525390625, -0.500518798828125, -0.46240234375, -0.424285888671875, -0.38616943359375, -0.348052978515625, -0.3099365234375, -0.271820068359375, -0.23370361328125, -0.195587158203125, -0.157470703125, -0.119354248046875, -0.08123779296875, -0.043121337890625, -0.0050048828125, 0.033111572265625, 0.07122802734375, 0.109344482421875, 0.1474609375, 0.185577392578125, 0.22369384765625, 0.261810302734375, 0.2999267578125, 0.338043212890625, 0.37615966796875, 0.414276123046875, 0.452392578125, 0.490509033203125, 0.52862548828125, 0.566741943359375, 0.6048583984375, 0.642974853515625, 0.68109130859375, 0.719207763671875, 0.75732421875, 0.795440673828125, 0.83355712890625, 0.871673583984375, 0.9097900390625, 0.947906494140625, 0.98602294921875, 1.024139404296875, 1.062255859375, 1.100372314453125, 1.13848876953125, 1.176605224609375, 1.2147216796875, 1.252838134765625, 1.29095458984375, 1.329071044921875, 1.3671875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 8.0, 5.0, 1.0, 14.0, 32.0, 43.0, 70.0, 123.0, 207.0, 374.0, 614.0, 1174.0, 2585.0, 10377.0, 119293.0, 733552.0, 161700.0, 12724.0, 2803.0, 1216.0, 679.0, 377.0, 236.0, 139.0, 85.0, 46.0, 19.0, 12.0, 16.0, 11.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.80859375, -0.7858505249023438, -0.7631072998046875, -0.7403640747070312, -0.717620849609375, -0.6948776245117188, -0.6721343994140625, -0.6493911743164062, -0.62664794921875, -0.6039047241210938, -0.5811614990234375, -0.5584182739257812, -0.535675048828125, -0.5129318237304688, -0.4901885986328125, -0.46744537353515625, -0.4447021484375, -0.42195892333984375, -0.3992156982421875, -0.37647247314453125, -0.353729248046875, -0.33098602294921875, -0.3082427978515625, -0.28549957275390625, -0.26275634765625, -0.24001312255859375, -0.2172698974609375, -0.19452667236328125, -0.171783447265625, -0.14904022216796875, -0.1262969970703125, -0.10355377197265625, -0.080810546875, -0.05806732177734375, -0.0353240966796875, -0.01258087158203125, 0.010162353515625, 0.03290557861328125, 0.0556488037109375, 0.07839202880859375, 0.10113525390625, 0.12387847900390625, 0.1466217041015625, 0.16936492919921875, 0.192108154296875, 0.21485137939453125, 0.2375946044921875, 0.26033782958984375, 0.2830810546875, 0.30582427978515625, 0.3285675048828125, 0.35131072998046875, 0.374053955078125, 0.39679718017578125, 0.4195404052734375, 0.44228363037109375, 0.46502685546875, 0.48777008056640625, 0.5105133056640625, 0.5332565307617188, 0.555999755859375, 0.5787429809570312, 0.6014862060546875, 0.6242294311523438, 0.64697265625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 10.0, 3.0, 6.0, 6.0, 12.0, 17.0, 21.0, 46.0, 57.0, 71.0, 97.0, 99.0, 116.0, 114.0, 97.0, 76.0, 45.0, 36.0, 26.0, 17.0, 12.0, 7.0, 7.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.808208465576172e-05, -7.50245526432991e-05, -7.196702063083649e-05, -6.890948861837387e-05, -6.585195660591125e-05, -6.279442459344864e-05, -5.973689258098602e-05, -5.667936056852341e-05, -5.362182855606079e-05, -5.0564296543598175e-05, -4.750676453113556e-05, -4.444923251867294e-05, -4.139170050621033e-05, -3.833416849374771e-05, -3.5276636481285095e-05, -3.221910446882248e-05, -2.9161572456359863e-05, -2.6104040443897247e-05, -2.304650843143463e-05, -1.9988976418972015e-05, -1.69314444065094e-05, -1.3873912394046783e-05, -1.0816380381584167e-05, -7.758848369121552e-06, -4.7013163566589355e-06, -1.6437843441963196e-06, 1.4137476682662964e-06, 4.471279680728912e-06, 7.528811693191528e-06, 1.0586343705654144e-05, 1.364387571811676e-05, 1.6701407730579376e-05, 1.9758939743041992e-05, 2.2816471755504608e-05, 2.5874003767967224e-05, 2.893153578042984e-05, 3.1989067792892456e-05, 3.504659980535507e-05, 3.810413181781769e-05, 4.1161663830280304e-05, 4.421919584274292e-05, 4.7276727855205536e-05, 5.033425986766815e-05, 5.339179188013077e-05, 5.6449323892593384e-05, 5.9506855905056e-05, 6.256438791751862e-05, 6.562191992998123e-05, 6.867945194244385e-05, 7.173698395490646e-05, 7.479451596736908e-05, 7.78520479798317e-05, 8.090957999229431e-05, 8.396711200475693e-05, 8.702464401721954e-05, 9.008217602968216e-05, 9.313970804214478e-05, 9.619724005460739e-05, 9.925477206707001e-05, 0.00010231230407953262, 0.00010536983609199524, 0.00010842736810445786, 0.00011148490011692047, 0.00011454243212938309, 0.0001175999641418457]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 13.0, 7.0, 11.0, 11.0, 20.0, 31.0, 37.0, 74.0, 84.0, 145.0, 289.0, 616.0, 1398.0, 4397.0, 32477.0, 516731.0, 457543.0, 27865.0, 4130.0, 1296.0, 619.0, 302.0, 178.0, 97.0, 69.0, 37.0, 22.0, 20.0, 9.0, 7.0, 2.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.712890625, -0.6898727416992188, -0.6668548583984375, -0.6438369750976562, -0.620819091796875, -0.5978012084960938, -0.5747833251953125, -0.5517654418945312, -0.52874755859375, -0.5057296752929688, -0.4827117919921875, -0.45969390869140625, -0.436676025390625, -0.41365814208984375, -0.3906402587890625, -0.36762237548828125, -0.3446044921875, -0.32158660888671875, -0.2985687255859375, -0.27555084228515625, -0.252532958984375, -0.22951507568359375, -0.2064971923828125, -0.18347930908203125, -0.16046142578125, -0.13744354248046875, -0.1144256591796875, -0.09140777587890625, -0.068389892578125, -0.04537200927734375, -0.0223541259765625, 0.00066375732421875, 0.023681640625, 0.04669952392578125, 0.0697174072265625, 0.09273529052734375, 0.115753173828125, 0.13877105712890625, 0.1617889404296875, 0.18480682373046875, 0.20782470703125, 0.23084259033203125, 0.2538604736328125, 0.27687835693359375, 0.299896240234375, 0.32291412353515625, 0.3459320068359375, 0.36894989013671875, 0.3919677734375, 0.41498565673828125, 0.4380035400390625, 0.46102142333984375, 0.484039306640625, 0.5070571899414062, 0.5300750732421875, 0.5530929565429688, 0.57611083984375, 0.5991287231445312, 0.6221466064453125, 0.6451644897460938, 0.668182373046875, 0.6912002563476562, 0.7142181396484375, 0.7372360229492188, 0.76025390625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 13.0, 12.0, 10.0, 32.0, 38.0, 39.0, 54.0, 72.0, 83.0, 103.0, 101.0, 100.0, 83.0, 75.0, 56.0, 45.0, 27.0, 24.0, 12.0, 9.0, 6.0, 5.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5283203125, -0.50830078125, -0.48828125, -0.46826171875, -0.4482421875, -0.42822265625, -0.408203125, -0.38818359375, -0.3681640625, -0.34814453125, -0.328125, -0.30810546875, -0.2880859375, -0.26806640625, -0.248046875, -0.22802734375, -0.2080078125, -0.18798828125, -0.16796875, -0.14794921875, -0.1279296875, -0.10791015625, -0.087890625, -0.06787109375, -0.0478515625, -0.02783203125, -0.0078125, 0.01220703125, 0.0322265625, 0.05224609375, 0.072265625, 0.09228515625, 0.1123046875, 0.13232421875, 0.15234375, 0.17236328125, 0.1923828125, 0.21240234375, 0.232421875, 0.25244140625, 0.2724609375, 0.29248046875, 0.3125, 0.33251953125, 0.3525390625, 0.37255859375, 0.392578125, 0.41259765625, 0.4326171875, 0.45263671875, 0.47265625, 0.49267578125, 0.5126953125, 0.53271484375, 0.552734375, 0.57275390625, 0.5927734375, 0.61279296875, 0.6328125, 0.65283203125, 0.6728515625, 0.69287109375, 0.712890625, 0.73291015625, 0.7529296875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 6.0, 5.0, 7.0, 12.0, 27.0, 39.0, 61.0, 110.0, 153.0, 187.0, 146.0, 93.0, 71.0, 36.0, 25.0, 10.0, 7.0, 8.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.999483108520508, -12.677781105041504, -12.356078147888184, -12.03437614440918, -11.712674140930176, -11.390972137451172, -11.069269180297852, -10.747567176818848, -10.425865173339844, -10.10416316986084, -9.78246021270752, -9.460758209228516, -9.139056205749512, -8.817354202270508, -8.495651245117188, -8.173949241638184, -7.8522467613220215, -7.530544281005859, -7.2088422775268555, -6.887139797210693, -6.5654377937316895, -6.243735313415527, -5.922033309936523, -5.600330829620361, -5.278628349304199, -4.956925868988037, -4.635223865509033, -4.313521385192871, -3.991819381713867, -3.670116901397705, -3.348414659500122, -3.026712417602539, -2.705010414123535, -2.383308172225952, -2.061605930328369, -1.7399035692214966, -1.4182013273239136, -1.0964990854263306, -0.774796724319458, -0.453094482421875, -0.131392240524292, 0.1903100311756134, 0.5120123028755188, 0.8337146043777466, 1.1554168462753296, 1.4771190881729126, 1.7988214492797852, 2.120523691177368, 2.442225933074951, 2.763928174972534, 3.085630416870117, 3.4073328971862793, 3.729034900665283, 4.050737380981445, 4.372439384460449, 4.694141864776611, 5.015844345092773, 5.3375468254089355, 5.6592488288879395, 5.980951309204102, 6.3026533126831055, 6.624355792999268, 6.94605827331543, 7.267760276794434, 7.5894622802734375]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 0.0, 3.0, 7.0, 13.0, 5.0, 14.0, 14.0, 15.0, 16.0, 16.0, 17.0, 24.0, 32.0, 30.0, 32.0, 32.0, 30.0, 36.0, 32.0, 38.0, 48.0, 52.0, 46.0, 45.0, 48.0, 36.0, 37.0, 31.0, 33.0, 28.0, 22.0, 31.0, 14.0, 21.0, 20.0, 16.0, 5.0, 10.0, 13.0, 7.0, 10.0, 4.0, 4.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.410104274749756, -6.220709323883057, -6.031314849853516, -5.841919898986816, -5.652524948120117, -5.463129997253418, -5.273735523223877, -5.084340572357178, -4.894946098327637, -4.7055511474609375, -4.5161566734313965, -4.326761722564697, -4.137366771697998, -3.947972059249878, -3.758577346801758, -3.5691823959350586, -3.3797874450683594, -3.1903927326202393, -3.00099778175354, -2.81160306930542, -2.6222081184387207, -2.4328134059906006, -2.2434186935424805, -2.0540237426757812, -1.8646290302276611, -1.6752341985702515, -1.4858393669128418, -1.2964446544647217, -1.107049822807312, -0.9176549911499023, -0.7282602787017822, -0.5388654470443726, -0.3494701385498047, -0.1600753366947174, 0.029319465160369873, 0.21871423721313477, 0.40810906887054443, 0.5975039005279541, 0.7868986129760742, 0.9762934446334839, 1.1656882762908936, 1.3550831079483032, 1.544477939605713, 1.733872652053833, 1.9232674837112427, 2.1126623153686523, 2.3020570278167725, 2.4914517402648926, 2.680846691131592, 2.870241403579712, 3.059636354446411, 3.2490310668945312, 3.4384260177612305, 3.6278207302093506, 3.8172154426574707, 4.00661039352417, 4.196004867553711, 4.38539981842041, 4.574794292449951, 4.76418924331665, 4.95358419418335, 5.142978668212891, 5.33237361907959, 5.521768569946289, 5.711163520812988]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 2.0, 3.0, 3.0, 5.0, 8.0, 15.0, 15.0, 18.0, 49.0, 60.0, 102.0, 132.0, 243.0, 403.0, 725.0, 1359.0, 3218.0, 8477.0, 29581.0, 210525.0, 3746237.0, 155977.0, 24701.0, 7082.0, 2708.0, 1202.0, 593.0, 305.0, 211.0, 115.0, 67.0, 42.0, 33.0, 20.0, 14.0, 13.0, 12.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6240234375, -1.5754547119140625, -1.526885986328125, -1.4783172607421875, -1.42974853515625, -1.3811798095703125, -1.332611083984375, -1.2840423583984375, -1.2354736328125, -1.1869049072265625, -1.138336181640625, -1.0897674560546875, -1.04119873046875, -0.9926300048828125, -0.944061279296875, -0.8954925537109375, -0.846923828125, -0.7983551025390625, -0.749786376953125, -0.7012176513671875, -0.65264892578125, -0.6040802001953125, -0.555511474609375, -0.5069427490234375, -0.4583740234375, -0.4098052978515625, -0.361236572265625, -0.3126678466796875, -0.26409912109375, -0.2155303955078125, -0.166961669921875, -0.1183929443359375, -0.06982421875, -0.0212554931640625, 0.027313232421875, 0.0758819580078125, 0.12445068359375, 0.1730194091796875, 0.221588134765625, 0.2701568603515625, 0.3187255859375, 0.3672943115234375, 0.415863037109375, 0.4644317626953125, 0.51300048828125, 0.5615692138671875, 0.610137939453125, 0.6587066650390625, 0.707275390625, 0.7558441162109375, 0.804412841796875, 0.8529815673828125, 0.90155029296875, 0.9501190185546875, 0.998687744140625, 1.0472564697265625, 1.0958251953125, 1.1443939208984375, 1.192962646484375, 1.2415313720703125, 1.29010009765625, 1.3386688232421875, 1.387237548828125, 1.4358062744140625, 1.484375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 11.0, 12.0, 16.0, 15.0, 10.0, 28.0, 37.0, 42.0, 35.0, 41.0, 57.0, 46.0, 68.0, 55.0, 55.0, 66.0, 54.0, 54.0, 47.0, 42.0, 39.0, 34.0, 30.0, 25.0, 22.0, 18.0, 11.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.46826171875, -0.45526123046875, -0.4422607421875, -0.42926025390625, -0.416259765625, -0.40325927734375, -0.3902587890625, -0.37725830078125, -0.3642578125, -0.35125732421875, -0.3382568359375, -0.32525634765625, -0.312255859375, -0.29925537109375, -0.2862548828125, -0.27325439453125, -0.26025390625, -0.24725341796875, -0.2342529296875, -0.22125244140625, -0.208251953125, -0.19525146484375, -0.1822509765625, -0.16925048828125, -0.15625, -0.14324951171875, -0.1302490234375, -0.11724853515625, -0.104248046875, -0.09124755859375, -0.0782470703125, -0.06524658203125, -0.05224609375, -0.03924560546875, -0.0262451171875, -0.01324462890625, -0.000244140625, 0.01275634765625, 0.0257568359375, 0.03875732421875, 0.0517578125, 0.06475830078125, 0.0777587890625, 0.09075927734375, 0.103759765625, 0.11676025390625, 0.1297607421875, 0.14276123046875, 0.15576171875, 0.16876220703125, 0.1817626953125, 0.19476318359375, 0.207763671875, 0.22076416015625, 0.2337646484375, 0.24676513671875, 0.259765625, 0.27276611328125, 0.2857666015625, 0.29876708984375, 0.311767578125, 0.32476806640625, 0.3377685546875, 0.35076904296875, 0.36376953125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 6.0, 10.0, 6.0, 16.0, 20.0, 38.0, 56.0, 92.0, 172.0, 282.0, 520.0, 821.0, 1518.0, 2804.0, 6033.0, 15083.0, 47967.0, 243056.0, 3370485.0, 407919.0, 64380.0, 18740.0, 7083.0, 3273.0, 1650.0, 918.0, 555.0, 320.0, 177.0, 100.0, 55.0, 53.0, 35.0, 13.0, 11.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.302734375, -1.268096923828125, -1.23345947265625, -1.198822021484375, -1.1641845703125, -1.129547119140625, -1.09490966796875, -1.060272216796875, -1.025634765625, -0.990997314453125, -0.95635986328125, -0.921722412109375, -0.8870849609375, -0.852447509765625, -0.81781005859375, -0.783172607421875, -0.74853515625, -0.713897705078125, -0.67926025390625, -0.644622802734375, -0.6099853515625, -0.575347900390625, -0.54071044921875, -0.506072998046875, -0.471435546875, -0.436798095703125, -0.40216064453125, -0.367523193359375, -0.3328857421875, -0.298248291015625, -0.26361083984375, -0.228973388671875, -0.1943359375, -0.159698486328125, -0.12506103515625, -0.090423583984375, -0.0557861328125, -0.021148681640625, 0.01348876953125, 0.048126220703125, 0.082763671875, 0.117401123046875, 0.15203857421875, 0.186676025390625, 0.2213134765625, 0.255950927734375, 0.29058837890625, 0.325225830078125, 0.35986328125, 0.394500732421875, 0.42913818359375, 0.463775634765625, 0.4984130859375, 0.533050537109375, 0.56768798828125, 0.602325439453125, 0.636962890625, 0.671600341796875, 0.70623779296875, 0.740875244140625, 0.7755126953125, 0.810150146484375, 0.84478759765625, 0.879425048828125, 0.9140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 10.0, 10.0, 18.0, 20.0, 31.0, 56.0, 71.0, 122.0, 252.0, 555.0, 1802.0, 545.0, 225.0, 127.0, 74.0, 45.0, 24.0, 21.0, 15.0, 11.0, 5.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59130859375, -0.5736236572265625, -0.555938720703125, -0.5382537841796875, -0.52056884765625, -0.5028839111328125, -0.485198974609375, -0.4675140380859375, -0.4498291015625, -0.4321441650390625, -0.414459228515625, -0.3967742919921875, -0.37908935546875, -0.3614044189453125, -0.343719482421875, -0.3260345458984375, -0.308349609375, -0.2906646728515625, -0.272979736328125, -0.2552947998046875, -0.23760986328125, -0.2199249267578125, -0.202239990234375, -0.1845550537109375, -0.1668701171875, -0.1491851806640625, -0.131500244140625, -0.1138153076171875, -0.09613037109375, -0.0784454345703125, -0.060760498046875, -0.0430755615234375, -0.025390625, -0.0077056884765625, 0.009979248046875, 0.0276641845703125, 0.04534912109375, 0.0630340576171875, 0.080718994140625, 0.0984039306640625, 0.1160888671875, 0.1337738037109375, 0.151458740234375, 0.1691436767578125, 0.18682861328125, 0.2045135498046875, 0.222198486328125, 0.2398834228515625, 0.257568359375, 0.2752532958984375, 0.292938232421875, 0.3106231689453125, 0.32830810546875, 0.3459930419921875, 0.363677978515625, 0.3813629150390625, 0.3990478515625, 0.4167327880859375, 0.434417724609375, 0.4521026611328125, 0.46978759765625, 0.4874725341796875, 0.505157470703125, 0.5228424072265625, 0.54052734375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 11.0, 14.0, 23.0, 68.0, 170.0, 272.0, 237.0, 133.0, 45.0, 19.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.422682762145996, -10.220623970031738, -10.01856517791748, -9.816506385803223, -9.614447593688965, -9.41238784790039, -9.210329055786133, -9.008270263671875, -8.806211471557617, -8.60415267944336, -8.402093887329102, -8.200035095214844, -7.997975826263428, -7.79591703414917, -7.593858242034912, -7.391799449920654, -7.1897406578063965, -6.987681865692139, -6.785623073577881, -6.583563804626465, -6.381505012512207, -6.179446220397949, -5.977387428283691, -5.775328636169434, -5.573269844055176, -5.371211051940918, -5.16915225982666, -4.967093467712402, -4.765034198760986, -4.5629754066467285, -4.360916614532471, -4.158857822418213, -3.956798791885376, -3.754739999771118, -3.5526809692382812, -3.3506221771240234, -3.1485633850097656, -2.9465043544769287, -2.744445562362671, -2.542386531829834, -2.340327739715576, -2.1382689476013184, -1.9362099170684814, -1.7341511249542236, -1.5320922136306763, -1.330033302307129, -1.127974510192871, -0.9259155988693237, -0.7238566875457764, -0.521797776222229, -0.3197389245033264, -0.11768007278442383, 0.08437883853912354, 0.2864377498626709, 0.4884965419769287, 0.6905554533004761, 0.8926143646240234, 1.0946732759475708, 1.2967321872711182, 1.498790979385376, 1.7008498907089233, 1.9029088020324707, 2.1049675941467285, 2.3070263862609863, 2.5090854167938232]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 8.0, 11.0, 18.0, 24.0, 25.0, 30.0, 36.0, 49.0, 57.0, 61.0, 55.0, 62.0, 68.0, 75.0, 62.0, 52.0, 60.0, 46.0, 40.0, 21.0, 34.0, 16.0, 17.0, 14.0, 11.0, 14.0, 8.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3463339805603027, -2.274996519088745, -2.2036588191986084, -2.132321357727051, -2.060983657836914, -1.9896461963653564, -1.9183086156845093, -1.846971035003662, -1.7756335735321045, -1.7042959928512573, -1.6329584121704102, -1.5616209506988525, -1.4902833700180054, -1.4189457893371582, -1.347608208656311, -1.2762706279754639, -1.2049330472946167, -1.1335954666137695, -1.0622578859329224, -0.99092036485672, -0.9195828437805176, -0.8482452630996704, -0.7769076824188232, -0.7055701017379761, -0.6342325806617737, -0.5628949999809265, -0.4915574789047241, -0.42021989822387695, -0.3488823473453522, -0.2775447964668274, -0.20620721578598022, -0.13486966490745544, -0.06353211402893066, 0.007805444300174713, 0.07914300262928009, 0.15048056840896606, 0.22181811928749084, 0.2931556701660156, 0.3644932508468628, 0.4358308017253876, 0.5071683526039124, 0.5785059332847595, 0.6498434543609619, 0.7211810350418091, 0.7925186157226562, 0.8638561367988586, 0.9351937174797058, 1.0065312385559082, 1.0778688192367554, 1.1492063999176025, 1.2205439805984497, 1.2918815612792969, 1.3632190227508545, 1.4345566034317017, 1.5058941841125488, 1.577231764793396, 1.6485693454742432, 1.7199069261550903, 1.7912445068359375, 1.8625819683074951, 1.9339195489883423, 2.0052571296691895, 2.076594829559326, 2.147932291030884, 2.2192697525024414]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 7.0, 8.0, 9.0, 12.0, 16.0, 29.0, 29.0, 50.0, 64.0, 112.0, 186.0, 360.0, 667.0, 1296.0, 2743.0, 6752.0, 20957.0, 78855.0, 313590.0, 441175.0, 131281.0, 32930.0, 10042.0, 3829.0, 1674.0, 827.0, 405.0, 223.0, 154.0, 94.0, 61.0, 35.0, 22.0, 25.0, 11.0, 4.0, 9.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.49609375, -1.4510040283203125, -1.405914306640625, -1.3608245849609375, -1.31573486328125, -1.2706451416015625, -1.225555419921875, -1.1804656982421875, -1.1353759765625, -1.0902862548828125, -1.045196533203125, -1.0001068115234375, -0.95501708984375, -0.9099273681640625, -0.864837646484375, -0.8197479248046875, -0.774658203125, -0.7295684814453125, -0.684478759765625, -0.6393890380859375, -0.59429931640625, -0.5492095947265625, -0.504119873046875, -0.4590301513671875, -0.4139404296875, -0.3688507080078125, -0.323760986328125, -0.2786712646484375, -0.23358154296875, -0.1884918212890625, -0.143402099609375, -0.0983123779296875, -0.05322265625, -0.0081329345703125, 0.036956787109375, 0.0820465087890625, 0.12713623046875, 0.1722259521484375, 0.217315673828125, 0.2624053955078125, 0.3074951171875, 0.3525848388671875, 0.397674560546875, 0.4427642822265625, 0.48785400390625, 0.5329437255859375, 0.578033447265625, 0.6231231689453125, 0.668212890625, 0.7133026123046875, 0.758392333984375, 0.8034820556640625, 0.84857177734375, 0.8936614990234375, 0.938751220703125, 0.9838409423828125, 1.0289306640625, 1.0740203857421875, 1.119110107421875, 1.1641998291015625, 1.20928955078125, 1.2543792724609375, 1.299468994140625, 1.3445587158203125, 1.3896484375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 5.0, 8.0, 8.0, 17.0, 12.0, 21.0, 23.0, 23.0, 27.0, 45.0, 39.0, 52.0, 63.0, 54.0, 64.0, 54.0, 48.0, 62.0, 52.0, 52.0, 61.0, 35.0, 39.0, 22.0, 24.0, 22.0, 17.0, 17.0, 13.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47021484375, -0.4569854736328125, -0.443756103515625, -0.4305267333984375, -0.41729736328125, -0.4040679931640625, -0.390838623046875, -0.3776092529296875, -0.3643798828125, -0.3511505126953125, -0.337921142578125, -0.3246917724609375, -0.31146240234375, -0.2982330322265625, -0.285003662109375, -0.2717742919921875, -0.258544921875, -0.2453155517578125, -0.232086181640625, -0.2188568115234375, -0.20562744140625, -0.1923980712890625, -0.179168701171875, -0.1659393310546875, -0.1527099609375, -0.1394805908203125, -0.126251220703125, -0.1130218505859375, -0.09979248046875, -0.0865631103515625, -0.073333740234375, -0.0601043701171875, -0.046875, -0.0336456298828125, -0.020416259765625, -0.0071868896484375, 0.00604248046875, 0.0192718505859375, 0.032501220703125, 0.0457305908203125, 0.0589599609375, 0.0721893310546875, 0.085418701171875, 0.0986480712890625, 0.11187744140625, 0.1251068115234375, 0.138336181640625, 0.1515655517578125, 0.164794921875, 0.1780242919921875, 0.191253662109375, 0.2044830322265625, 0.21771240234375, 0.2309417724609375, 0.244171142578125, 0.2574005126953125, 0.2706298828125, 0.2838592529296875, 0.297088623046875, 0.3103179931640625, 0.32354736328125, 0.3367767333984375, 0.350006103515625, 0.3632354736328125, 0.37646484375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 7.0, 16.0, 18.0, 25.0, 42.0, 69.0, 105.0, 212.0, 362.0, 711.0, 1353.0, 3149.0, 7436.0, 19379.0, 56659.0, 177192.0, 408071.0, 248904.0, 80245.0, 26911.0, 9977.0, 4038.0, 1794.0, 822.0, 432.0, 236.0, 136.0, 76.0, 52.0, 24.0, 20.0, 16.0, 15.0, 7.0, 9.0, 1.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89013671875, -0.8567428588867188, -0.8233489990234375, -0.7899551391601562, -0.756561279296875, -0.7231674194335938, -0.6897735595703125, -0.6563796997070312, -0.62298583984375, -0.5895919799804688, -0.5561981201171875, -0.5228042602539062, -0.489410400390625, -0.45601654052734375, -0.4226226806640625, -0.38922882080078125, -0.3558349609375, -0.32244110107421875, -0.2890472412109375, -0.25565338134765625, -0.222259521484375, -0.18886566162109375, -0.1554718017578125, -0.12207794189453125, -0.08868408203125, -0.05529022216796875, -0.0218963623046875, 0.01149749755859375, 0.044891357421875, 0.07828521728515625, 0.1116790771484375, 0.14507293701171875, 0.178466796875, 0.21186065673828125, 0.2452545166015625, 0.27864837646484375, 0.312042236328125, 0.34543609619140625, 0.3788299560546875, 0.41222381591796875, 0.44561767578125, 0.47901153564453125, 0.5124053955078125, 0.5457992553710938, 0.579193115234375, 0.6125869750976562, 0.6459808349609375, 0.6793746948242188, 0.7127685546875, 0.7461624145507812, 0.7795562744140625, 0.8129501342773438, 0.846343994140625, 0.8797378540039062, 0.9131317138671875, 0.9465255737304688, 0.97991943359375, 1.0133132934570312, 1.0467071533203125, 1.0801010131835938, 1.113494873046875, 1.1468887329101562, 1.1802825927734375, 1.2136764526367188, 1.2470703125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 17.0, 9.0, 18.0, 13.0, 12.0, 15.0, 28.0, 25.0, 27.0, 27.0, 34.0, 39.0, 45.0, 34.0, 30.0, 39.0, 44.0, 41.0, 40.0, 50.0, 47.0, 45.0, 38.0, 30.0, 40.0, 36.0, 27.0, 21.0, 15.0, 21.0, 22.0, 11.0, 14.0, 10.0, 9.0, 7.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2734375, -1.2305908203125, -1.187744140625, -1.1448974609375, -1.10205078125, -1.0592041015625, -1.016357421875, -0.9735107421875, -0.9306640625, -0.8878173828125, -0.844970703125, -0.8021240234375, -0.75927734375, -0.7164306640625, -0.673583984375, -0.6307373046875, -0.587890625, -0.5450439453125, -0.502197265625, -0.4593505859375, -0.41650390625, -0.3736572265625, -0.330810546875, -0.2879638671875, -0.2451171875, -0.2022705078125, -0.159423828125, -0.1165771484375, -0.07373046875, -0.0308837890625, 0.011962890625, 0.0548095703125, 0.09765625, 0.1405029296875, 0.183349609375, 0.2261962890625, 0.26904296875, 0.3118896484375, 0.354736328125, 0.3975830078125, 0.4404296875, 0.4832763671875, 0.526123046875, 0.5689697265625, 0.61181640625, 0.6546630859375, 0.697509765625, 0.7403564453125, 0.783203125, 0.8260498046875, 0.868896484375, 0.9117431640625, 0.95458984375, 0.9974365234375, 1.040283203125, 1.0831298828125, 1.1259765625, 1.1688232421875, 1.211669921875, 1.2545166015625, 1.29736328125, 1.3402099609375, 1.383056640625, 1.4259033203125, 1.46875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 6.0, 8.0, 15.0, 23.0, 24.0, 28.0, 56.0, 61.0, 106.0, 197.0, 373.0, 719.0, 1845.0, 5891.0, 26724.0, 175623.0, 577735.0, 215775.0, 32676.0, 6779.0, 2172.0, 788.0, 370.0, 206.0, 129.0, 81.0, 45.0, 35.0, 23.0, 16.0, 10.0, 7.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5556640625, -0.538055419921875, -0.52044677734375, -0.502838134765625, -0.4852294921875, -0.467620849609375, -0.45001220703125, -0.432403564453125, -0.414794921875, -0.397186279296875, -0.37957763671875, -0.361968994140625, -0.3443603515625, -0.326751708984375, -0.30914306640625, -0.291534423828125, -0.27392578125, -0.256317138671875, -0.23870849609375, -0.221099853515625, -0.2034912109375, -0.185882568359375, -0.16827392578125, -0.150665283203125, -0.133056640625, -0.115447998046875, -0.09783935546875, -0.080230712890625, -0.0626220703125, -0.045013427734375, -0.02740478515625, -0.009796142578125, 0.0078125, 0.025421142578125, 0.04302978515625, 0.060638427734375, 0.0782470703125, 0.095855712890625, 0.11346435546875, 0.131072998046875, 0.148681640625, 0.166290283203125, 0.18389892578125, 0.201507568359375, 0.2191162109375, 0.236724853515625, 0.25433349609375, 0.271942138671875, 0.28955078125, 0.307159423828125, 0.32476806640625, 0.342376708984375, 0.3599853515625, 0.377593994140625, 0.39520263671875, 0.412811279296875, 0.430419921875, 0.448028564453125, 0.46563720703125, 0.483245849609375, 0.5008544921875, 0.518463134765625, 0.53607177734375, 0.553680419921875, 0.5712890625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 3.0, 13.0, 15.0, 28.0, 48.0, 58.0, 93.0, 117.0, 124.0, 150.0, 114.0, 75.0, 72.0, 34.0, 17.0, 19.0, 7.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001341104507446289, -0.00013002939522266388, -0.00012594833970069885, -0.00012186728417873383, -0.0001177862286567688, -0.00011370517313480377, -0.00010962411761283875, -0.00010554306209087372, -0.00010146200656890869, -9.738095104694366e-05, -9.329989552497864e-05, -8.921884000301361e-05, -8.513778448104858e-05, -8.105672895908356e-05, -7.697567343711853e-05, -7.28946179151535e-05, -6.881356239318848e-05, -6.473250687122345e-05, -6.065145134925842e-05, -5.6570395827293396e-05, -5.248934030532837e-05, -4.840828478336334e-05, -4.4327229261398315e-05, -4.024617373943329e-05, -3.616511821746826e-05, -3.2084062695503235e-05, -2.8003007173538208e-05, -2.392195165157318e-05, -1.9840896129608154e-05, -1.5759840607643127e-05, -1.16787850856781e-05, -7.597729563713074e-06, -3.516674041748047e-06, 5.6438148021698e-07, 4.645437002182007e-06, 8.726492524147034e-06, 1.280754804611206e-05, 1.6888603568077087e-05, 2.0969659090042114e-05, 2.505071461200714e-05, 2.9131770133972168e-05, 3.3212825655937195e-05, 3.729388117790222e-05, 4.137493669986725e-05, 4.5455992221832275e-05, 4.95370477437973e-05, 5.361810326576233e-05, 5.7699158787727356e-05, 6.178021430969238e-05, 6.586126983165741e-05, 6.994232535362244e-05, 7.402338087558746e-05, 7.810443639755249e-05, 8.218549191951752e-05, 8.626654744148254e-05, 9.034760296344757e-05, 9.44286584854126e-05, 9.850971400737762e-05, 0.00010259076952934265, 0.00010667182505130768, 0.0001107528805732727, 0.00011483393609523773, 0.00011891499161720276, 0.00012299604713916779, 0.0001270771026611328]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 7.0, 13.0, 24.0, 39.0, 91.0, 171.0, 422.0, 1175.0, 3980.0, 28506.0, 431183.0, 538316.0, 37815.0, 4613.0, 1345.0, 481.0, 205.0, 82.0, 38.0, 25.0, 9.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66552734375, -0.639984130859375, -0.61444091796875, -0.588897705078125, -0.5633544921875, -0.537811279296875, -0.51226806640625, -0.486724853515625, -0.461181640625, -0.435638427734375, -0.41009521484375, -0.384552001953125, -0.3590087890625, -0.333465576171875, -0.30792236328125, -0.282379150390625, -0.2568359375, -0.231292724609375, -0.20574951171875, -0.180206298828125, -0.1546630859375, -0.129119873046875, -0.10357666015625, -0.078033447265625, -0.052490234375, -0.026947021484375, -0.00140380859375, 0.024139404296875, 0.0496826171875, 0.075225830078125, 0.10076904296875, 0.126312255859375, 0.15185546875, 0.177398681640625, 0.20294189453125, 0.228485107421875, 0.2540283203125, 0.279571533203125, 0.30511474609375, 0.330657958984375, 0.356201171875, 0.381744384765625, 0.40728759765625, 0.432830810546875, 0.4583740234375, 0.483917236328125, 0.50946044921875, 0.535003662109375, 0.560546875, 0.586090087890625, 0.61163330078125, 0.637176513671875, 0.6627197265625, 0.688262939453125, 0.71380615234375, 0.739349365234375, 0.764892578125, 0.790435791015625, 0.81597900390625, 0.841522216796875, 0.8670654296875, 0.892608642578125, 0.91815185546875, 0.943695068359375, 0.96923828125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 7.0, 8.0, 12.0, 25.0, 35.0, 37.0, 52.0, 62.0, 101.0, 120.0, 118.0, 102.0, 99.0, 84.0, 47.0, 35.0, 25.0, 17.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.8583984375, -0.8381233215332031, -0.8178482055664062, -0.7975730895996094, -0.7772979736328125, -0.7570228576660156, -0.7367477416992188, -0.7164726257324219, -0.696197509765625, -0.6759223937988281, -0.6556472778320312, -0.6353721618652344, -0.6150970458984375, -0.5948219299316406, -0.5745468139648438, -0.5542716979980469, -0.53399658203125, -0.5137214660644531, -0.49344635009765625, -0.4731712341308594, -0.4528961181640625, -0.4326210021972656, -0.41234588623046875, -0.3920707702636719, -0.371795654296875, -0.3515205383300781, -0.33124542236328125, -0.3109703063964844, -0.2906951904296875, -0.2704200744628906, -0.25014495849609375, -0.22986984252929688, -0.2095947265625, -0.18931961059570312, -0.16904449462890625, -0.14876937866210938, -0.1284942626953125, -0.10821914672851562, -0.08794403076171875, -0.06766891479492188, -0.047393798828125, -0.027118682861328125, -0.00684356689453125, 0.013431549072265625, 0.0337066650390625, 0.053981781005859375, 0.07425689697265625, 0.09453201293945312, 0.11480712890625, 0.13508224487304688, 0.15535736083984375, 0.17563247680664062, 0.1959075927734375, 0.21618270874023438, 0.23645782470703125, 0.2567329406738281, 0.277008056640625, 0.2972831726074219, 0.31755828857421875, 0.3378334045410156, 0.3581085205078125, 0.3783836364746094, 0.39865875244140625, 0.4189338684082031, 0.439208984375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 12.0, 56.0, 215.0, 433.0, 221.0, 66.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.420352935791016, -7.532642841339111, -6.644932746887207, -5.7572221755981445, -4.86951208114624, -3.981801986694336, -3.0940914154052734, -2.206381320953369, -1.3186712265014648, -0.430961012840271, 0.45674920082092285, 1.3444595336914062, 2.2321696281433105, 3.119879722595215, 4.007590293884277, 4.895300388336182, 5.783010482788086, 6.67072057723999, 7.5584306716918945, 8.446141242980957, 9.333850860595703, 10.221561431884766, 11.109272003173828, 11.99698257446289, 12.884692192077637, 13.7724027633667, 14.660112380981445, 15.547822952270508, 16.43553352355957, 17.3232421875, 18.210952758789062, 19.098663330078125, 19.986373901367188, 20.87408447265625, 21.761795043945312, 22.649505615234375, 23.537214279174805, 24.424924850463867, 25.31263542175293, 26.200345993041992, 27.088054656982422, 27.975765228271484, 28.863475799560547, 29.75118637084961, 30.63889503479004, 31.5266056060791, 32.41431427001953, 33.302024841308594, 34.189735412597656, 35.07744598388672, 35.96515655517578, 36.852867126464844, 37.740577697753906, 38.62828826904297, 39.51599884033203, 40.40370559692383, 41.291419982910156, 42.17913055419922, 43.06684112548828, 43.954551696777344, 44.842262268066406, 45.72997283935547, 46.61768341064453, 47.50539016723633, 48.39310073852539]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 9.0, 13.0, 6.0, 6.0, 17.0, 16.0, 22.0, 15.0, 26.0, 24.0, 30.0, 32.0, 33.0, 42.0, 44.0, 63.0, 54.0, 44.0, 51.0, 59.0, 56.0, 31.0, 43.0, 39.0, 30.0, 26.0, 23.0, 29.0, 17.0, 9.0, 15.0, 10.0, 13.0, 9.0, 7.0, 8.0, 11.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.35746955871582, -6.138973712921143, -5.920477867126465, -5.701982021331787, -5.483486175537109, -5.26499080657959, -5.046494483947754, -4.827999114990234, -4.609503269195557, -4.391007423400879, -4.172511577606201, -3.9540157318115234, -3.735520124435425, -3.517024278640747, -3.2985284328460693, -3.0800328254699707, -2.861536741256714, -2.643040895462036, -2.4245450496673584, -2.2060494422912598, -1.987553596496582, -1.7690577507019043, -1.5505619049072266, -1.3320661783218384, -1.1135703325271606, -0.8950745463371277, -0.6765787601470947, -0.458082914352417, -0.23958712816238403, -0.021091341972351074, 0.19740450382232666, 0.41590023040771484, 0.6343960762023926, 0.8528918623924255, 1.0713876485824585, 1.2898834943771362, 1.5083792209625244, 1.7268750667572021, 1.9453709125518799, 2.1638665199279785, 2.3823623657226562, 2.600858211517334, 2.8193540573120117, 3.0378499031066895, 3.256345510482788, 3.474841356277466, 3.6933372020721436, 3.911832809448242, 4.130329132080078, 4.348824977874756, 4.567320823669434, 4.785816669464111, 5.004312515258789, 5.222807884216309, 5.4413042068481445, 5.659799575805664, 5.878295421600342, 6.0967912673950195, 6.315287113189697, 6.533782958984375, 6.752278804779053, 6.9707746505737305, 7.18927001953125, 7.407765865325928, 7.6262617111206055]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 5.0, 7.0, 7.0, 7.0, 15.0, 22.0, 22.0, 28.0, 31.0, 45.0, 61.0, 75.0, 98.0, 191.0, 246.0, 392.0, 564.0, 961.0, 1618.0, 3195.0, 6641.0, 15657.0, 46183.0, 266953.0, 3667510.0, 130034.0, 31173.0, 11293.0, 5071.0, 2612.0, 1415.0, 776.0, 472.0, 271.0, 196.0, 104.0, 89.0, 71.0, 38.0, 37.0, 24.0, 18.0, 10.0, 7.0, 12.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.4638671875, -1.419952392578125, -1.37603759765625, -1.332122802734375, -1.2882080078125, -1.244293212890625, -1.20037841796875, -1.156463623046875, -1.112548828125, -1.068634033203125, -1.02471923828125, -0.980804443359375, -0.9368896484375, -0.892974853515625, -0.84906005859375, -0.805145263671875, -0.76123046875, -0.717315673828125, -0.67340087890625, -0.629486083984375, -0.5855712890625, -0.541656494140625, -0.49774169921875, -0.453826904296875, -0.409912109375, -0.365997314453125, -0.32208251953125, -0.278167724609375, -0.2342529296875, -0.190338134765625, -0.14642333984375, -0.102508544921875, -0.05859375, -0.014678955078125, 0.02923583984375, 0.073150634765625, 0.1170654296875, 0.160980224609375, 0.20489501953125, 0.248809814453125, 0.292724609375, 0.336639404296875, 0.38055419921875, 0.424468994140625, 0.4683837890625, 0.512298583984375, 0.55621337890625, 0.600128173828125, 0.64404296875, 0.687957763671875, 0.73187255859375, 0.775787353515625, 0.8197021484375, 0.863616943359375, 0.90753173828125, 0.951446533203125, 0.995361328125, 1.039276123046875, 1.08319091796875, 1.127105712890625, 1.1710205078125, 1.214935302734375, 1.25885009765625, 1.302764892578125, 1.3466796875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 5.0, 7.0, 8.0, 17.0, 12.0, 9.0, 16.0, 27.0, 50.0, 44.0, 45.0, 36.0, 53.0, 54.0, 47.0, 62.0, 56.0, 64.0, 50.0, 42.0, 46.0, 49.0, 37.0, 30.0, 31.0, 18.0, 15.0, 8.0, 13.0, 9.0, 13.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.465576171875, -0.452178955078125, -0.43878173828125, -0.425384521484375, -0.4119873046875, -0.398590087890625, -0.38519287109375, -0.371795654296875, -0.3583984375, -0.345001220703125, -0.33160400390625, -0.318206787109375, -0.3048095703125, -0.291412353515625, -0.27801513671875, -0.264617919921875, -0.251220703125, -0.237823486328125, -0.22442626953125, -0.211029052734375, -0.1976318359375, -0.184234619140625, -0.17083740234375, -0.157440185546875, -0.14404296875, -0.130645751953125, -0.11724853515625, -0.103851318359375, -0.0904541015625, -0.077056884765625, -0.06365966796875, -0.050262451171875, -0.036865234375, -0.023468017578125, -0.01007080078125, 0.003326416015625, 0.0167236328125, 0.030120849609375, 0.04351806640625, 0.056915283203125, 0.0703125, 0.083709716796875, 0.09710693359375, 0.110504150390625, 0.1239013671875, 0.137298583984375, 0.15069580078125, 0.164093017578125, 0.177490234375, 0.190887451171875, 0.20428466796875, 0.217681884765625, 0.2310791015625, 0.244476318359375, 0.25787353515625, 0.271270751953125, 0.28466796875, 0.298065185546875, 0.31146240234375, 0.324859619140625, 0.3382568359375, 0.351654052734375, 0.36505126953125, 0.378448486328125, 0.391845703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 10.0, 9.0, 11.0, 7.0, 11.0, 15.0, 19.0, 26.0, 35.0, 46.0, 73.0, 92.0, 127.0, 173.0, 293.0, 479.0, 820.0, 1537.0, 3380.0, 9219.0, 35773.0, 317717.0, 3688656.0, 104941.0, 19354.0, 5998.0, 2387.0, 1196.0, 666.0, 416.0, 247.0, 138.0, 98.0, 71.0, 58.0, 45.0, 37.0, 28.0, 27.0, 16.0, 9.0, 5.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5576171875, -1.5025634765625, -1.447509765625, -1.3924560546875, -1.33740234375, -1.2823486328125, -1.227294921875, -1.1722412109375, -1.1171875, -1.0621337890625, -1.007080078125, -0.9520263671875, -0.89697265625, -0.8419189453125, -0.786865234375, -0.7318115234375, -0.6767578125, -0.6217041015625, -0.566650390625, -0.5115966796875, -0.45654296875, -0.4014892578125, -0.346435546875, -0.2913818359375, -0.236328125, -0.1812744140625, -0.126220703125, -0.0711669921875, -0.01611328125, 0.0389404296875, 0.093994140625, 0.1490478515625, 0.2041015625, 0.2591552734375, 0.314208984375, 0.3692626953125, 0.42431640625, 0.4793701171875, 0.534423828125, 0.5894775390625, 0.64453125, 0.6995849609375, 0.754638671875, 0.8096923828125, 0.86474609375, 0.9197998046875, 0.974853515625, 1.0299072265625, 1.0849609375, 1.1400146484375, 1.195068359375, 1.2501220703125, 1.30517578125, 1.3602294921875, 1.415283203125, 1.4703369140625, 1.525390625, 1.5804443359375, 1.635498046875, 1.6905517578125, 1.74560546875, 1.8006591796875, 1.855712890625, 1.9107666015625, 1.9658203125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 3.0, 9.0, 9.0, 19.0, 17.0, 29.0, 50.0, 105.0, 272.0, 1729.0, 1351.0, 213.0, 113.0, 53.0, 30.0, 19.0, 14.0, 12.0, 8.0, 3.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8623046875, -0.8376617431640625, -0.813018798828125, -0.7883758544921875, -0.76373291015625, -0.7390899658203125, -0.714447021484375, -0.6898040771484375, -0.6651611328125, -0.6405181884765625, -0.615875244140625, -0.5912322998046875, -0.56658935546875, -0.5419464111328125, -0.517303466796875, -0.4926605224609375, -0.468017578125, -0.4433746337890625, -0.418731689453125, -0.3940887451171875, -0.36944580078125, -0.3448028564453125, -0.320159912109375, -0.2955169677734375, -0.2708740234375, -0.2462310791015625, -0.221588134765625, -0.1969451904296875, -0.17230224609375, -0.1476593017578125, -0.123016357421875, -0.0983734130859375, -0.07373046875, -0.0490875244140625, -0.024444580078125, 0.0001983642578125, 0.02484130859375, 0.0494842529296875, 0.074127197265625, 0.0987701416015625, 0.1234130859375, 0.1480560302734375, 0.172698974609375, 0.1973419189453125, 0.22198486328125, 0.2466278076171875, 0.271270751953125, 0.2959136962890625, 0.320556640625, 0.3451995849609375, 0.369842529296875, 0.3944854736328125, 0.41912841796875, 0.4437713623046875, 0.468414306640625, 0.4930572509765625, 0.5177001953125, 0.5423431396484375, 0.566986083984375, 0.5916290283203125, 0.61627197265625, 0.6409149169921875, 0.665557861328125, 0.6902008056640625, 0.71484375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 9.0, 11.0, 72.0, 411.0, 421.0, 75.0, 12.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.539602279663086, -18.117950439453125, -17.696298599243164, -17.274646759033203, -16.852996826171875, -16.431344985961914, -16.009693145751953, -15.588041305541992, -15.166389465332031, -14.74473762512207, -14.323086738586426, -13.901434898376465, -13.479783058166504, -13.05813217163086, -12.636480331420898, -12.214828491210938, -11.793177604675293, -11.371525764465332, -10.949874877929688, -10.528223037719727, -10.106571197509766, -9.684919357299805, -9.26326847076416, -8.8416166305542, -8.419965744018555, -7.998314380645752, -7.576662540435791, -7.155011177062988, -6.733359336853027, -6.311707973480225, -5.890056610107422, -5.468404769897461, -5.046751976013184, -4.625100612640381, -4.20344877243042, -3.781797409057617, -3.3601458072662354, -2.9384942054748535, -2.516842842102051, -2.095191240310669, -1.673539638519287, -1.2518880367279053, -0.830236554145813, -0.4085850715637207, 0.013066530227661133, 0.43471813201904297, 0.8563694953918457, 1.2780210971832275, 1.6996726989746094, 2.121324300765991, 2.542975902557373, 2.964627265930176, 3.3862788677215576, 3.8079304695129395, 4.229581832885742, 4.651233673095703, 5.072885036468506, 5.494536399841309, 5.9161882400512695, 6.337839603424072, 6.759490966796875, 7.181142807006836, 7.602794170379639, 8.024445533752441, 8.446097373962402]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 8.0, 7.0, 4.0, 15.0, 15.0, 16.0, 26.0, 21.0, 25.0, 24.0, 34.0, 37.0, 49.0, 42.0, 58.0, 39.0, 46.0, 42.0, 55.0, 44.0, 51.0, 47.0, 49.0, 28.0, 37.0, 37.0, 38.0, 26.0, 25.0, 9.0, 12.0, 11.0, 8.0, 2.0, 5.0, 1.0, 5.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5370347499847412, -1.4825516939163208, -1.4280686378479004, -1.3735857009887695, -1.3191026449203491, -1.2646195888519287, -1.2101365327835083, -1.155653476715088, -1.101170539855957, -1.0466874837875366, -0.992204487323761, -0.9377214312553406, -0.8832384347915649, -0.8287553787231445, -0.7742723226547241, -0.7197892665863037, -0.6653062105178833, -0.6108231544494629, -0.5563401579856873, -0.5018571019172668, -0.4473740756511688, -0.3928910493850708, -0.3384079933166504, -0.28392496705055237, -0.22944194078445435, -0.17495891451835632, -0.1204758733510971, -0.06599283218383789, -0.011509805917739868, 0.042973220348358154, 0.09745627641677856, 0.1519393026828766, 0.2064223289489746, 0.26090535521507263, 0.31538838148117065, 0.36987143754959106, 0.4243544638156891, 0.4788374900817871, 0.5333205461502075, 0.5878036022186279, 0.6422865986824036, 0.696769654750824, 0.7512526512145996, 0.80573570728302, 0.8602187633514404, 0.9147017598152161, 0.9691848158836365, 1.023667812347412, 1.0781508684158325, 1.132633924484253, 1.1871169805526733, 1.2416000366210938, 1.2960829734802246, 1.350566029548645, 1.4050490856170654, 1.4595321416854858, 1.5140151977539062, 1.5684982538223267, 1.622981309890747, 1.677464246749878, 1.7319473028182983, 1.7864303588867188, 1.8409134149551392, 1.8953964710235596, 1.9498794078826904]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 14.0, 19.0, 15.0, 29.0, 43.0, 73.0, 99.0, 143.0, 232.0, 395.0, 643.0, 1189.0, 2214.0, 4289.0, 9037.0, 20423.0, 49708.0, 126645.0, 279111.0, 303040.0, 148355.0, 57990.0, 23617.0, 10718.0, 4822.0, 2494.0, 1241.0, 748.0, 427.0, 246.0, 163.0, 111.0, 85.0, 50.0, 27.0, 19.0, 21.0, 14.0, 14.0, 3.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0849609375, -1.0511474609375, -1.017333984375, -0.9835205078125, -0.94970703125, -0.9158935546875, -0.882080078125, -0.8482666015625, -0.814453125, -0.7806396484375, -0.746826171875, -0.7130126953125, -0.67919921875, -0.6453857421875, -0.611572265625, -0.5777587890625, -0.5439453125, -0.5101318359375, -0.476318359375, -0.4425048828125, -0.40869140625, -0.3748779296875, -0.341064453125, -0.3072509765625, -0.2734375, -0.2396240234375, -0.205810546875, -0.1719970703125, -0.13818359375, -0.1043701171875, -0.070556640625, -0.0367431640625, -0.0029296875, 0.0308837890625, 0.064697265625, 0.0985107421875, 0.13232421875, 0.1661376953125, 0.199951171875, 0.2337646484375, 0.267578125, 0.3013916015625, 0.335205078125, 0.3690185546875, 0.40283203125, 0.4366455078125, 0.470458984375, 0.5042724609375, 0.5380859375, 0.5718994140625, 0.605712890625, 0.6395263671875, 0.67333984375, 0.7071533203125, 0.740966796875, 0.7747802734375, 0.80859375, 0.8424072265625, 0.876220703125, 0.9100341796875, 0.94384765625, 0.9776611328125, 1.011474609375, 1.0452880859375, 1.0791015625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 0.0, 6.0, 7.0, 4.0, 9.0, 10.0, 10.0, 11.0, 18.0, 17.0, 24.0, 24.0, 35.0, 23.0, 53.0, 45.0, 42.0, 51.0, 47.0, 58.0, 49.0, 57.0, 57.0, 43.0, 42.0, 45.0, 47.0, 27.0, 22.0, 27.0, 31.0, 18.0, 11.0, 9.0, 7.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.465576171875, -0.451812744140625, -0.43804931640625, -0.424285888671875, -0.4105224609375, -0.396759033203125, -0.38299560546875, -0.369232177734375, -0.35546875, -0.341705322265625, -0.32794189453125, -0.314178466796875, -0.3004150390625, -0.286651611328125, -0.27288818359375, -0.259124755859375, -0.245361328125, -0.231597900390625, -0.21783447265625, -0.204071044921875, -0.1903076171875, -0.176544189453125, -0.16278076171875, -0.149017333984375, -0.13525390625, -0.121490478515625, -0.10772705078125, -0.093963623046875, -0.0802001953125, -0.066436767578125, -0.05267333984375, -0.038909912109375, -0.025146484375, -0.011383056640625, 0.00238037109375, 0.016143798828125, 0.0299072265625, 0.043670654296875, 0.05743408203125, 0.071197509765625, 0.0849609375, 0.098724365234375, 0.11248779296875, 0.126251220703125, 0.1400146484375, 0.153778076171875, 0.16754150390625, 0.181304931640625, 0.195068359375, 0.208831787109375, 0.22259521484375, 0.236358642578125, 0.2501220703125, 0.263885498046875, 0.27764892578125, 0.291412353515625, 0.30517578125, 0.318939208984375, 0.33270263671875, 0.346466064453125, 0.3602294921875, 0.373992919921875, 0.38775634765625, 0.401519775390625, 0.415283203125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 7.0, 7.0, 6.0, 6.0, 13.0, 13.0, 27.0, 23.0, 37.0, 54.0, 95.0, 129.0, 179.0, 339.0, 578.0, 1087.0, 1983.0, 4427.0, 10485.0, 29614.0, 96821.0, 314870.0, 387444.0, 135699.0, 40227.0, 13733.0, 5313.0, 2491.0, 1165.0, 666.0, 349.0, 210.0, 146.0, 104.0, 58.0, 41.0, 39.0, 22.0, 14.0, 14.0, 5.0, 8.0, 7.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.28125, -1.24371337890625, -1.2061767578125, -1.16864013671875, -1.131103515625, -1.09356689453125, -1.0560302734375, -1.01849365234375, -0.98095703125, -0.94342041015625, -0.9058837890625, -0.86834716796875, -0.830810546875, -0.79327392578125, -0.7557373046875, -0.71820068359375, -0.6806640625, -0.64312744140625, -0.6055908203125, -0.56805419921875, -0.530517578125, -0.49298095703125, -0.4554443359375, -0.41790771484375, -0.38037109375, -0.34283447265625, -0.3052978515625, -0.26776123046875, -0.230224609375, -0.19268798828125, -0.1551513671875, -0.11761474609375, -0.080078125, -0.04254150390625, -0.0050048828125, 0.03253173828125, 0.070068359375, 0.10760498046875, 0.1451416015625, 0.18267822265625, 0.22021484375, 0.25775146484375, 0.2952880859375, 0.33282470703125, 0.370361328125, 0.40789794921875, 0.4454345703125, 0.48297119140625, 0.5205078125, 0.55804443359375, 0.5955810546875, 0.63311767578125, 0.670654296875, 0.70819091796875, 0.7457275390625, 0.78326416015625, 0.82080078125, 0.85833740234375, 0.8958740234375, 0.93341064453125, 0.970947265625, 1.00848388671875, 1.0460205078125, 1.08355712890625, 1.12109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 6.0, 3.0, 5.0, 8.0, 5.0, 13.0, 12.0, 7.0, 12.0, 17.0, 14.0, 26.0, 26.0, 36.0, 32.0, 30.0, 43.0, 49.0, 49.0, 40.0, 41.0, 38.0, 41.0, 41.0, 43.0, 36.0, 46.0, 25.0, 39.0, 36.0, 20.0, 20.0, 33.0, 19.0, 25.0, 15.0, 12.0, 10.0, 7.0, 5.0, 4.0, 8.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.87890625, -1.8277435302734375, -1.776580810546875, -1.7254180908203125, -1.67425537109375, -1.6230926513671875, -1.571929931640625, -1.5207672119140625, -1.4696044921875, -1.4184417724609375, -1.367279052734375, -1.3161163330078125, -1.26495361328125, -1.2137908935546875, -1.162628173828125, -1.1114654541015625, -1.060302734375, -1.0091400146484375, -0.957977294921875, -0.9068145751953125, -0.85565185546875, -0.8044891357421875, -0.753326416015625, -0.7021636962890625, -0.6510009765625, -0.5998382568359375, -0.548675537109375, -0.4975128173828125, -0.44635009765625, -0.3951873779296875, -0.344024658203125, -0.2928619384765625, -0.24169921875, -0.1905364990234375, -0.139373779296875, -0.0882110595703125, -0.03704833984375, 0.0141143798828125, 0.065277099609375, 0.1164398193359375, 0.1676025390625, 0.2187652587890625, 0.269927978515625, 0.3210906982421875, 0.37225341796875, 0.4234161376953125, 0.474578857421875, 0.5257415771484375, 0.576904296875, 0.6280670166015625, 0.679229736328125, 0.7303924560546875, 0.78155517578125, 0.8327178955078125, 0.883880615234375, 0.9350433349609375, 0.9862060546875, 1.0373687744140625, 1.088531494140625, 1.1396942138671875, 1.19085693359375, 1.2420196533203125, 1.293182373046875, 1.3443450927734375, 1.3955078125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 7.0, 5.0, 7.0, 11.0, 22.0, 30.0, 50.0, 102.0, 205.0, 469.0, 1177.0, 3852.0, 21713.0, 258483.0, 674848.0, 75198.0, 8934.0, 2059.0, 758.0, 272.0, 139.0, 86.0, 43.0, 29.0, 13.0, 11.0, 10.0, 8.0, 4.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.025390625, -0.9963150024414062, -0.9672393798828125, -0.9381637573242188, -0.909088134765625, -0.8800125122070312, -0.8509368896484375, -0.8218612670898438, -0.79278564453125, -0.7637100219726562, -0.7346343994140625, -0.7055587768554688, -0.676483154296875, -0.6474075317382812, -0.6183319091796875, -0.5892562866210938, -0.5601806640625, -0.5311050415039062, -0.5020294189453125, -0.47295379638671875, -0.443878173828125, -0.41480255126953125, -0.3857269287109375, -0.35665130615234375, -0.32757568359375, -0.29850006103515625, -0.2694244384765625, -0.24034881591796875, -0.211273193359375, -0.18219757080078125, -0.1531219482421875, -0.12404632568359375, -0.094970703125, -0.06589508056640625, -0.0368194580078125, -0.00774383544921875, 0.021331787109375, 0.05040740966796875, 0.0794830322265625, 0.10855865478515625, 0.13763427734375, 0.16670989990234375, 0.1957855224609375, 0.22486114501953125, 0.253936767578125, 0.28301239013671875, 0.3120880126953125, 0.34116363525390625, 0.3702392578125, 0.39931488037109375, 0.4283905029296875, 0.45746612548828125, 0.486541748046875, 0.5156173706054688, 0.5446929931640625, 0.5737686157226562, 0.60284423828125, 0.6319198608398438, 0.6609954833984375, 0.6900711059570312, 0.719146728515625, 0.7482223510742188, 0.7772979736328125, 0.8063735961914062, 0.83544921875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 6.0, 5.0, 7.0, 11.0, 24.0, 25.0, 25.0, 38.0, 51.0, 55.0, 77.0, 91.0, 104.0, 89.0, 85.0, 79.0, 58.0, 47.0, 29.0, 29.0, 16.0, 12.0, 8.0, 10.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.828805923461914e-05, -9.500980377197266e-05, -9.173154830932617e-05, -8.845329284667969e-05, -8.51750373840332e-05, -8.189678192138672e-05, -7.861852645874023e-05, -7.534027099609375e-05, -7.206201553344727e-05, -6.878376007080078e-05, -6.55055046081543e-05, -6.222724914550781e-05, -5.894899368286133e-05, -5.5670738220214844e-05, -5.239248275756836e-05, -4.9114227294921875e-05, -4.583597183227539e-05, -4.2557716369628906e-05, -3.927946090698242e-05, -3.600120544433594e-05, -3.272294998168945e-05, -2.944469451904297e-05, -2.6166439056396484e-05, -2.288818359375e-05, -1.9609928131103516e-05, -1.633167266845703e-05, -1.3053417205810547e-05, -9.775161743164062e-06, -6.496906280517578e-06, -3.2186508178710938e-06, 5.960464477539063e-08, 3.337860107421875e-06, 6.616115570068359e-06, 9.894371032714844e-06, 1.3172626495361328e-05, 1.6450881958007812e-05, 1.9729137420654297e-05, 2.300739288330078e-05, 2.6285648345947266e-05, 2.956390380859375e-05, 3.2842159271240234e-05, 3.612041473388672e-05, 3.93986701965332e-05, 4.267692565917969e-05, 4.595518112182617e-05, 4.9233436584472656e-05, 5.251169204711914e-05, 5.5789947509765625e-05, 5.906820297241211e-05, 6.23464584350586e-05, 6.562471389770508e-05, 6.890296936035156e-05, 7.218122482299805e-05, 7.545948028564453e-05, 7.873773574829102e-05, 8.20159912109375e-05, 8.529424667358398e-05, 8.857250213623047e-05, 9.185075759887695e-05, 9.512901306152344e-05, 9.840726852416992e-05, 0.0001016855239868164, 0.00010496377944946289, 0.00010824203491210938, 0.00011152029037475586]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 10.0, 10.0, 15.0, 24.0, 9.0, 22.0, 31.0, 33.0, 72.0, 86.0, 156.0, 310.0, 670.0, 1857.0, 6881.0, 38366.0, 285305.0, 577042.0, 114876.0, 16917.0, 3723.0, 1107.0, 448.0, 197.0, 113.0, 57.0, 52.0, 32.0, 23.0, 24.0, 19.0, 16.0, 10.0, 9.0, 8.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.88671875, -0.8615798950195312, -0.8364410400390625, -0.8113021850585938, -0.786163330078125, -0.7610244750976562, -0.7358856201171875, -0.7107467651367188, -0.68560791015625, -0.6604690551757812, -0.6353302001953125, -0.6101913452148438, -0.585052490234375, -0.5599136352539062, -0.5347747802734375, -0.5096359252929688, -0.4844970703125, -0.45935821533203125, -0.4342193603515625, -0.40908050537109375, -0.383941650390625, -0.35880279541015625, -0.3336639404296875, -0.30852508544921875, -0.28338623046875, -0.25824737548828125, -0.2331085205078125, -0.20796966552734375, -0.182830810546875, -0.15769195556640625, -0.1325531005859375, -0.10741424560546875, -0.082275390625, -0.05713653564453125, -0.0319976806640625, -0.00685882568359375, 0.018280029296875, 0.04341888427734375, 0.0685577392578125, 0.09369659423828125, 0.11883544921875, 0.14397430419921875, 0.1691131591796875, 0.19425201416015625, 0.219390869140625, 0.24452972412109375, 0.2696685791015625, 0.29480743408203125, 0.3199462890625, 0.34508514404296875, 0.3702239990234375, 0.39536285400390625, 0.420501708984375, 0.44564056396484375, 0.4707794189453125, 0.49591827392578125, 0.52105712890625, 0.5461959838867188, 0.5713348388671875, 0.5964736938476562, 0.621612548828125, 0.6467514038085938, 0.6718902587890625, 0.6970291137695312, 0.72216796875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 5.0, 25.0, 36.0, 52.0, 68.0, 105.0, 132.0, 128.0, 115.0, 107.0, 75.0, 49.0, 36.0, 30.0, 11.0, 9.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.462890625, -1.4300079345703125, -1.397125244140625, -1.3642425537109375, -1.33135986328125, -1.2984771728515625, -1.265594482421875, -1.2327117919921875, -1.1998291015625, -1.1669464111328125, -1.134063720703125, -1.1011810302734375, -1.06829833984375, -1.0354156494140625, -1.002532958984375, -0.9696502685546875, -0.936767578125, -0.9038848876953125, -0.871002197265625, -0.8381195068359375, -0.80523681640625, -0.7723541259765625, -0.739471435546875, -0.7065887451171875, -0.6737060546875, -0.6408233642578125, -0.607940673828125, -0.5750579833984375, -0.54217529296875, -0.5092926025390625, -0.476409912109375, -0.4435272216796875, -0.41064453125, -0.3777618408203125, -0.344879150390625, -0.3119964599609375, -0.27911376953125, -0.2462310791015625, -0.213348388671875, -0.1804656982421875, -0.1475830078125, -0.1147003173828125, -0.081817626953125, -0.0489349365234375, -0.01605224609375, 0.0168304443359375, 0.049713134765625, 0.0825958251953125, 0.115478515625, 0.1483612060546875, 0.181243896484375, 0.2141265869140625, 0.24700927734375, 0.2798919677734375, 0.312774658203125, 0.3456573486328125, 0.3785400390625, 0.4114227294921875, 0.444305419921875, 0.4771881103515625, 0.51007080078125, 0.5429534912109375, 0.575836181640625, 0.6087188720703125, 0.6416015625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 7.0, 14.0, 20.0, 54.0, 76.0, 128.0, 182.0, 142.0, 121.0, 104.0, 55.0, 51.0, 27.0, 14.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-21.69822120666504, -21.273588180541992, -20.848957061767578, -20.42432403564453, -19.999691009521484, -19.57505989074707, -19.150426864624023, -18.725793838500977, -18.301162719726562, -17.876529693603516, -17.4518985748291, -17.027265548706055, -16.602632522583008, -16.178001403808594, -15.753368377685547, -15.328736305236816, -14.90410327911377, -14.479471206665039, -14.054838180541992, -13.630206108093262, -13.205574035644531, -12.780941009521484, -12.356308937072754, -11.931676864624023, -11.507043838500977, -11.082411766052246, -10.6577787399292, -10.233146667480469, -9.808514595031738, -9.383882522583008, -8.959249496459961, -8.53461742401123, -8.109986305236816, -7.685353755950928, -7.260721683502197, -6.836089134216309, -6.411457061767578, -5.9868245124816895, -5.562191963195801, -5.13755989074707, -4.712927341461182, -4.288294792175293, -3.8636627197265625, -3.439030170440674, -3.0143978595733643, -2.5897655487060547, -2.165132999420166, -1.7405006885528564, -1.3158683776855469, -0.8912360072135925, -0.4666036367416382, -0.04197120666503906, 0.3826611042022705, 0.8072934150695801, 1.2319259643554688, 1.6565582752227783, 2.081190586090088, 2.5058228969573975, 2.930455207824707, 3.3550877571105957, 3.7797200679779053, 4.204352378845215, 4.6289849281311035, 5.053617477416992, 5.478249549865723]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 9.0, 5.0, 2.0, 14.0, 8.0, 15.0, 12.0, 12.0, 25.0, 19.0, 21.0, 25.0, 30.0, 30.0, 23.0, 28.0, 33.0, 61.0, 40.0, 46.0, 57.0, 57.0, 51.0, 50.0, 31.0, 39.0, 33.0, 32.0, 25.0, 19.0, 21.0, 18.0, 25.0, 11.0, 15.0, 13.0, 13.0, 10.0, 7.0, 10.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-10.004802703857422, -9.733983993530273, -9.463165283203125, -9.19234561920166, -8.921526908874512, -8.650708198547363, -8.379888534545898, -8.10906982421875, -7.838251113891602, -7.567432403564453, -7.2966132164001465, -7.02579402923584, -6.754975318908691, -6.484156608581543, -6.213337421417236, -5.94251823425293, -5.671699523925781, -5.400880813598633, -5.130061626434326, -4.8592424392700195, -4.588423728942871, -4.317605018615723, -4.046785831451416, -3.7759668827056885, -3.505147933959961, -3.2343289852142334, -2.963510036468506, -2.6926910877227783, -2.421872138977051, -2.1510531902313232, -1.8802342414855957, -1.6094152927398682, -1.3385963439941406, -1.067777395248413, -0.7969584465026855, -0.526139497756958, -0.25532054901123047, 0.01549839973449707, 0.2863173484802246, 0.5571362972259521, 0.8279552459716797, 1.0987741947174072, 1.3695931434631348, 1.6404120922088623, 1.9112310409545898, 2.1820499897003174, 2.452868938446045, 2.7236878871917725, 2.9945068359375, 3.2653257846832275, 3.536144733428955, 3.8069636821746826, 4.07778263092041, 4.348601341247559, 4.619420528411865, 4.890239715576172, 5.16105842590332, 5.431877136230469, 5.702696323394775, 5.973515510559082, 6.2443342208862305, 6.515152931213379, 6.7859721183776855, 7.056791305541992, 7.327610015869141]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 6.0, 7.0, 2.0, 7.0, 11.0, 18.0, 35.0, 28.0, 44.0, 69.0, 79.0, 129.0, 191.0, 245.0, 391.0, 562.0, 936.0, 1474.0, 2657.0, 5063.0, 11460.0, 31483.0, 143923.0, 3673498.0, 250999.0, 43162.0, 14351.0, 6029.0, 3043.0, 1748.0, 924.0, 585.0, 407.0, 217.0, 141.0, 114.0, 84.0, 57.0, 37.0, 27.0, 11.0, 7.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5, -1.4525604248046875, -1.405120849609375, -1.3576812744140625, -1.31024169921875, -1.2628021240234375, -1.215362548828125, -1.1679229736328125, -1.1204833984375, -1.0730438232421875, -1.025604248046875, -0.9781646728515625, -0.93072509765625, -0.8832855224609375, -0.835845947265625, -0.7884063720703125, -0.740966796875, -0.6935272216796875, -0.646087646484375, -0.5986480712890625, -0.55120849609375, -0.5037689208984375, -0.456329345703125, -0.4088897705078125, -0.3614501953125, -0.3140106201171875, -0.266571044921875, -0.2191314697265625, -0.17169189453125, -0.1242523193359375, -0.076812744140625, -0.0293731689453125, 0.01806640625, 0.0655059814453125, 0.112945556640625, 0.1603851318359375, 0.20782470703125, 0.2552642822265625, 0.302703857421875, 0.3501434326171875, 0.3975830078125, 0.4450225830078125, 0.492462158203125, 0.5399017333984375, 0.58734130859375, 0.6347808837890625, 0.682220458984375, 0.7296600341796875, 0.777099609375, 0.8245391845703125, 0.871978759765625, 0.9194183349609375, 0.96685791015625, 1.0142974853515625, 1.061737060546875, 1.1091766357421875, 1.1566162109375, 1.2040557861328125, 1.251495361328125, 1.2989349365234375, 1.34637451171875, 1.3938140869140625, 1.441253662109375, 1.4886932373046875, 1.5361328125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 7.0, 7.0, 13.0, 12.0, 11.0, 23.0, 7.0, 19.0, 24.0, 29.0, 33.0, 40.0, 44.0, 55.0, 34.0, 49.0, 53.0, 52.0, 49.0, 53.0, 44.0, 45.0, 35.0, 42.0, 44.0, 34.0, 25.0, 12.0, 27.0, 20.0, 10.0, 16.0, 15.0, 5.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.471435546875, -0.4569664001464844, -0.44249725341796875, -0.4280281066894531, -0.4135589599609375, -0.3990898132324219, -0.38462066650390625, -0.3701515197753906, -0.355682373046875, -0.3412132263183594, -0.32674407958984375, -0.3122749328613281, -0.2978057861328125, -0.2833366394042969, -0.26886749267578125, -0.2543983459472656, -0.23992919921875, -0.22546005249023438, -0.21099090576171875, -0.19652175903320312, -0.1820526123046875, -0.16758346557617188, -0.15311431884765625, -0.13864517211914062, -0.124176025390625, -0.10970687866210938, -0.09523773193359375, -0.08076858520507812, -0.0662994384765625, -0.051830291748046875, -0.03736114501953125, -0.022891998291015625, -0.0084228515625, 0.006046295166015625, 0.02051544189453125, 0.034984588623046875, 0.0494537353515625, 0.06392288208007812, 0.07839202880859375, 0.09286117553710938, 0.107330322265625, 0.12179946899414062, 0.13626861572265625, 0.15073776245117188, 0.1652069091796875, 0.17967605590820312, 0.19414520263671875, 0.20861434936523438, 0.22308349609375, 0.23755264282226562, 0.25202178955078125, 0.2664909362792969, 0.2809600830078125, 0.2954292297363281, 0.30989837646484375, 0.3243675231933594, 0.338836669921875, 0.3533058166503906, 0.36777496337890625, 0.3822441101074219, 0.3967132568359375, 0.4111824035644531, 0.42565155029296875, 0.4401206970214844, 0.45458984375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 7.0, 9.0, 16.0, 23.0, 34.0, 46.0, 70.0, 107.0, 164.0, 236.0, 357.0, 599.0, 940.0, 1505.0, 2718.0, 5077.0, 11613.0, 33843.0, 181537.0, 3625493.0, 262508.0, 41107.0, 13127.0, 5738.0, 2866.0, 1702.0, 968.0, 666.0, 440.0, 260.0, 156.0, 123.0, 81.0, 48.0, 28.0, 16.0, 19.0, 10.0, 10.0, 10.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.7744140625, -1.7271881103515625, -1.679962158203125, -1.6327362060546875, -1.58551025390625, -1.5382843017578125, -1.491058349609375, -1.4438323974609375, -1.3966064453125, -1.3493804931640625, -1.302154541015625, -1.2549285888671875, -1.20770263671875, -1.1604766845703125, -1.113250732421875, -1.0660247802734375, -1.018798828125, -0.9715728759765625, -0.924346923828125, -0.8771209716796875, -0.82989501953125, -0.7826690673828125, -0.735443115234375, -0.6882171630859375, -0.6409912109375, -0.5937652587890625, -0.546539306640625, -0.4993133544921875, -0.45208740234375, -0.4048614501953125, -0.357635498046875, -0.3104095458984375, -0.26318359375, -0.2159576416015625, -0.168731689453125, -0.1215057373046875, -0.07427978515625, -0.0270538330078125, 0.020172119140625, 0.0673980712890625, 0.1146240234375, 0.1618499755859375, 0.209075927734375, 0.2563018798828125, 0.30352783203125, 0.3507537841796875, 0.397979736328125, 0.4452056884765625, 0.492431640625, 0.5396575927734375, 0.586883544921875, 0.6341094970703125, 0.68133544921875, 0.7285614013671875, 0.775787353515625, 0.8230133056640625, 0.8702392578125, 0.9174652099609375, 0.964691162109375, 1.0119171142578125, 1.05914306640625, 1.1063690185546875, 1.153594970703125, 1.2008209228515625, 1.248046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 6.0, 9.0, 5.0, 15.0, 12.0, 14.0, 29.0, 40.0, 47.0, 107.0, 195.0, 690.0, 2189.0, 368.0, 137.0, 62.0, 38.0, 27.0, 19.0, 17.0, 11.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.935546875, -0.9074478149414062, -0.8793487548828125, -0.8512496948242188, -0.823150634765625, -0.7950515747070312, -0.7669525146484375, -0.7388534545898438, -0.71075439453125, -0.6826553344726562, -0.6545562744140625, -0.6264572143554688, -0.598358154296875, -0.5702590942382812, -0.5421600341796875, -0.5140609741210938, -0.4859619140625, -0.45786285400390625, -0.4297637939453125, -0.40166473388671875, -0.373565673828125, -0.34546661376953125, -0.3173675537109375, -0.28926849365234375, -0.26116943359375, -0.23307037353515625, -0.2049713134765625, -0.17687225341796875, -0.148773193359375, -0.12067413330078125, -0.0925750732421875, -0.06447601318359375, -0.036376953125, -0.00827789306640625, 0.0198211669921875, 0.04792022705078125, 0.076019287109375, 0.10411834716796875, 0.1322174072265625, 0.16031646728515625, 0.18841552734375, 0.21651458740234375, 0.2446136474609375, 0.27271270751953125, 0.300811767578125, 0.32891082763671875, 0.3570098876953125, 0.38510894775390625, 0.4132080078125, 0.44130706787109375, 0.4694061279296875, 0.49750518798828125, 0.525604248046875, 0.5537033081054688, 0.5818023681640625, 0.6099014282226562, 0.63800048828125, 0.6660995483398438, 0.6941986083984375, 0.7222976684570312, 0.750396728515625, 0.7784957885742188, 0.8065948486328125, 0.8346939086914062, 0.86279296875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 17.0, 162.0, 513.0, 282.0, 31.0, 5.0, 1.0, 1.0], "bins": [-41.62603759765625, -40.91968536376953, -40.21333312988281, -39.50697708129883, -38.80062484741211, -38.09427261352539, -37.38792037963867, -36.68156433105469, -35.97521209716797, -35.26885986328125, -34.56250762939453, -33.85615158081055, -33.14979934692383, -32.44344711303711, -31.73709487915039, -31.03074073791504, -30.32438850402832, -29.6180362701416, -28.91168212890625, -28.20532989501953, -27.49897575378418, -26.79262351989746, -26.08626937866211, -25.37991714477539, -24.673564910888672, -23.967212677001953, -23.2608585357666, -22.554506301879883, -21.84815216064453, -21.141799926757812, -20.435447692871094, -19.729093551635742, -19.022741317749023, -18.316389083862305, -17.610034942626953, -16.903682708740234, -16.197328567504883, -15.490976333618164, -14.784623146057129, -14.078269958496094, -13.371915817260742, -12.665562629699707, -11.959209442138672, -11.252857208251953, -10.546503067016602, -9.840150833129883, -9.133797645568848, -8.427444458007812, -7.7210917472839355, -7.0147385597229, -6.308385848999023, -5.602032661437988, -4.895679473876953, -4.189326286315918, -3.482973575592041, -2.776620388031006, -2.0702672004699707, -1.363914132118225, -0.6575610637664795, 0.04879188537597656, 0.7551450729370117, 1.4614982604980469, 2.167850971221924, 2.874204158782959, 3.580557346343994]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 8.0, 2.0, 11.0, 12.0, 13.0, 22.0, 14.0, 28.0, 30.0, 35.0, 30.0, 47.0, 32.0, 39.0, 33.0, 45.0, 46.0, 39.0, 40.0, 51.0, 47.0, 29.0, 45.0, 35.0, 31.0, 30.0, 23.0, 34.0, 31.0, 20.0, 24.0, 18.0, 9.0, 15.0, 10.0, 8.0, 8.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.381999969482422, -3.291018009185791, -3.2000362873077393, -3.1090543270111084, -3.0180726051330566, -2.927090644836426, -2.836108684539795, -2.745126962661743, -2.6541452407836914, -2.5631632804870605, -2.472181558609009, -2.381199598312378, -2.290217876434326, -2.1992359161376953, -2.1082539558410645, -2.0172722339630127, -1.9262902736663818, -1.8353084325790405, -1.7443265914916992, -1.6533446311950684, -1.5623629093170166, -1.4713809490203857, -1.3803991079330444, -1.2894172668457031, -1.1984354257583618, -1.1074535846710205, -1.0164717435836792, -0.9254898428916931, -0.8345080018043518, -0.7435261607170105, -0.6525442600250244, -0.5615624189376831, -0.4705808162689209, -0.3795989751815796, -0.2886171042919159, -0.1976352334022522, -0.10665339231491089, -0.01567155122756958, 0.0753103494644165, 0.1662921905517578, 0.2572740316390991, 0.34825587272644043, 0.4392377436161041, 0.5302196145057678, 0.6212014555931091, 0.7121832966804504, 0.8031651973724365, 0.8941470384597778, 0.9851288795471191, 1.0761107206344604, 1.1670925617218018, 1.2580745220184326, 1.3490562438964844, 1.4400382041931152, 1.5310200452804565, 1.6220018863677979, 1.7129837274551392, 1.8039655685424805, 1.8949474096298218, 1.985929250717163, 2.076911211013794, 2.1678929328918457, 2.2588748931884766, 2.3498568534851074, 2.440838575363159]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 23.0, 27.0, 39.0, 61.0, 84.0, 110.0, 177.0, 317.0, 496.0, 877.0, 1627.0, 3205.0, 6434.0, 14279.0, 34197.0, 90082.0, 247820.0, 368963.0, 172521.0, 61698.0, 24378.0, 10604.0, 4933.0, 2469.0, 1259.0, 712.0, 448.0, 242.0, 175.0, 106.0, 54.0, 38.0, 32.0, 27.0, 11.0, 9.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.26953125, -1.2289886474609375, -1.188446044921875, -1.1479034423828125, -1.10736083984375, -1.0668182373046875, -1.026275634765625, -0.9857330322265625, -0.9451904296875, -0.9046478271484375, -0.864105224609375, -0.8235626220703125, -0.78302001953125, -0.7424774169921875, -0.701934814453125, -0.6613922119140625, -0.620849609375, -0.5803070068359375, -0.539764404296875, -0.4992218017578125, -0.45867919921875, -0.4181365966796875, -0.377593994140625, -0.3370513916015625, -0.2965087890625, -0.2559661865234375, -0.215423583984375, -0.1748809814453125, -0.13433837890625, -0.0937957763671875, -0.053253173828125, -0.0127105712890625, 0.02783203125, 0.0683746337890625, 0.108917236328125, 0.1494598388671875, 0.19000244140625, 0.2305450439453125, 0.271087646484375, 0.3116302490234375, 0.3521728515625, 0.3927154541015625, 0.433258056640625, 0.4738006591796875, 0.51434326171875, 0.5548858642578125, 0.595428466796875, 0.6359710693359375, 0.676513671875, 0.7170562744140625, 0.757598876953125, 0.7981414794921875, 0.83868408203125, 0.8792266845703125, 0.919769287109375, 0.9603118896484375, 1.0008544921875, 1.0413970947265625, 1.081939697265625, 1.1224822998046875, 1.16302490234375, 1.2035675048828125, 1.244110107421875, 1.2846527099609375, 1.3251953125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 5.0, 9.0, 9.0, 5.0, 9.0, 12.0, 13.0, 26.0, 22.0, 29.0, 22.0, 29.0, 45.0, 42.0, 43.0, 60.0, 51.0, 39.0, 46.0, 48.0, 53.0, 39.0, 42.0, 44.0, 34.0, 35.0, 37.0, 25.0, 31.0, 19.0, 18.0, 16.0, 15.0, 10.0, 8.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.513671875, -0.49832916259765625, -0.4829864501953125, -0.46764373779296875, -0.452301025390625, -0.43695831298828125, -0.4216156005859375, -0.40627288818359375, -0.39093017578125, -0.37558746337890625, -0.3602447509765625, -0.34490203857421875, -0.329559326171875, -0.31421661376953125, -0.2988739013671875, -0.28353118896484375, -0.2681884765625, -0.25284576416015625, -0.2375030517578125, -0.22216033935546875, -0.206817626953125, -0.19147491455078125, -0.1761322021484375, -0.16078948974609375, -0.14544677734375, -0.13010406494140625, -0.1147613525390625, -0.09941864013671875, -0.084075927734375, -0.06873321533203125, -0.0533905029296875, -0.03804779052734375, -0.022705078125, -0.00736236572265625, 0.0079803466796875, 0.02332305908203125, 0.038665771484375, 0.05400848388671875, 0.0693511962890625, 0.08469390869140625, 0.10003662109375, 0.11537933349609375, 0.1307220458984375, 0.14606475830078125, 0.161407470703125, 0.17675018310546875, 0.1920928955078125, 0.20743560791015625, 0.2227783203125, 0.23812103271484375, 0.2534637451171875, 0.26880645751953125, 0.284149169921875, 0.29949188232421875, 0.3148345947265625, 0.33017730712890625, 0.34552001953125, 0.36086273193359375, 0.3762054443359375, 0.39154815673828125, 0.406890869140625, 0.42223358154296875, 0.4375762939453125, 0.45291900634765625, 0.46826171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 8.0, 9.0, 11.0, 12.0, 20.0, 18.0, 30.0, 48.0, 49.0, 86.0, 116.0, 177.0, 275.0, 476.0, 784.0, 1471.0, 3008.0, 6927.0, 17788.0, 55691.0, 223516.0, 502914.0, 166062.0, 43046.0, 14363.0, 5750.0, 2635.0, 1332.0, 752.0, 395.0, 245.0, 162.0, 118.0, 66.0, 46.0, 45.0, 33.0, 22.0, 14.0, 9.0, 8.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.6875, -1.6384429931640625, -1.589385986328125, -1.5403289794921875, -1.49127197265625, -1.4422149658203125, -1.393157958984375, -1.3441009521484375, -1.2950439453125, -1.2459869384765625, -1.196929931640625, -1.1478729248046875, -1.09881591796875, -1.0497589111328125, -1.000701904296875, -0.9516448974609375, -0.902587890625, -0.8535308837890625, -0.804473876953125, -0.7554168701171875, -0.70635986328125, -0.6573028564453125, -0.608245849609375, -0.5591888427734375, -0.5101318359375, -0.4610748291015625, -0.412017822265625, -0.3629608154296875, -0.31390380859375, -0.2648468017578125, -0.215789794921875, -0.1667327880859375, -0.11767578125, -0.0686187744140625, -0.019561767578125, 0.0294952392578125, 0.07855224609375, 0.1276092529296875, 0.176666259765625, 0.2257232666015625, 0.2747802734375, 0.3238372802734375, 0.372894287109375, 0.4219512939453125, 0.47100830078125, 0.5200653076171875, 0.569122314453125, 0.6181793212890625, 0.667236328125, 0.7162933349609375, 0.765350341796875, 0.8144073486328125, 0.86346435546875, 0.9125213623046875, 0.961578369140625, 1.0106353759765625, 1.0596923828125, 1.1087493896484375, 1.157806396484375, 1.2068634033203125, 1.25592041015625, 1.3049774169921875, 1.354034423828125, 1.4030914306640625, 1.4521484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 5.0, 11.0, 10.0, 13.0, 16.0, 16.0, 28.0, 31.0, 26.0, 47.0, 49.0, 51.0, 36.0, 42.0, 63.0, 67.0, 47.0, 57.0, 63.0, 36.0, 37.0, 42.0, 38.0, 33.0, 27.0, 28.0, 17.0, 10.0, 6.0, 13.0, 14.0, 9.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.318359375, -3.2392425537109375, -3.160125732421875, -3.0810089111328125, -3.00189208984375, -2.9227752685546875, -2.843658447265625, -2.7645416259765625, -2.6854248046875, -2.6063079833984375, -2.527191162109375, -2.4480743408203125, -2.36895751953125, -2.2898406982421875, -2.210723876953125, -2.1316070556640625, -2.052490234375, -1.9733734130859375, -1.894256591796875, -1.8151397705078125, -1.73602294921875, -1.6569061279296875, -1.577789306640625, -1.4986724853515625, -1.4195556640625, -1.3404388427734375, -1.261322021484375, -1.1822052001953125, -1.10308837890625, -1.0239715576171875, -0.944854736328125, -0.8657379150390625, -0.78662109375, -0.7075042724609375, -0.628387451171875, -0.5492706298828125, -0.47015380859375, -0.3910369873046875, -0.311920166015625, -0.2328033447265625, -0.1536865234375, -0.0745697021484375, 0.004547119140625, 0.0836639404296875, 0.16278076171875, 0.2418975830078125, 0.321014404296875, 0.4001312255859375, 0.479248046875, 0.5583648681640625, 0.637481689453125, 0.7165985107421875, 0.79571533203125, 0.8748321533203125, 0.953948974609375, 1.0330657958984375, 1.1121826171875, 1.1912994384765625, 1.270416259765625, 1.3495330810546875, 1.42864990234375, 1.5077667236328125, 1.586883544921875, 1.6660003662109375, 1.7451171875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 16.0, 16.0, 29.0, 44.0, 82.0, 169.0, 268.0, 419.0, 879.0, 2596.0, 11998.0, 98048.0, 788334.0, 126473.0, 14165.0, 2942.0, 985.0, 463.0, 260.0, 133.0, 95.0, 48.0, 33.0, 23.0, 8.0, 9.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2216796875, -1.1816864013671875, -1.141693115234375, -1.1016998291015625, -1.06170654296875, -1.0217132568359375, -0.981719970703125, -0.9417266845703125, -0.9017333984375, -0.8617401123046875, -0.821746826171875, -0.7817535400390625, -0.74176025390625, -0.7017669677734375, -0.661773681640625, -0.6217803955078125, -0.581787109375, -0.5417938232421875, -0.501800537109375, -0.4618072509765625, -0.42181396484375, -0.3818206787109375, -0.341827392578125, -0.3018341064453125, -0.2618408203125, -0.2218475341796875, -0.181854248046875, -0.1418609619140625, -0.10186767578125, -0.0618743896484375, -0.021881103515625, 0.0181121826171875, 0.05810546875, 0.0980987548828125, 0.138092041015625, 0.1780853271484375, 0.21807861328125, 0.2580718994140625, 0.298065185546875, 0.3380584716796875, 0.3780517578125, 0.4180450439453125, 0.458038330078125, 0.4980316162109375, 0.53802490234375, 0.5780181884765625, 0.618011474609375, 0.6580047607421875, 0.697998046875, 0.7379913330078125, 0.777984619140625, 0.8179779052734375, 0.85797119140625, 0.8979644775390625, 0.937957763671875, 0.9779510498046875, 1.0179443359375, 1.0579376220703125, 1.097930908203125, 1.1379241943359375, 1.17791748046875, 1.2179107666015625, 1.257904052734375, 1.2978973388671875, 1.337890625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 13.0, 9.0, 13.0, 13.0, 21.0, 44.0, 71.0, 101.0, 141.0, 163.0, 113.0, 98.0, 71.0, 48.0, 28.0, 17.0, 11.0, 14.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00024139881134033203, -0.00023528560996055603, -0.00022917240858078003, -0.00022305920720100403, -0.00021694600582122803, -0.00021083280444145203, -0.00020471960306167603, -0.00019860640168190002, -0.00019249320030212402, -0.00018637999892234802, -0.00018026679754257202, -0.00017415359616279602, -0.00016804039478302002, -0.00016192719340324402, -0.00015581399202346802, -0.00014970079064369202, -0.00014358758926391602, -0.00013747438788414001, -0.00013136118650436401, -0.000125247985124588, -0.00011913478374481201, -0.00011302158236503601, -0.00010690838098526001, -0.00010079517960548401, -9.468197822570801e-05, -8.856877684593201e-05, -8.2455575466156e-05, -7.634237408638e-05, -7.0229172706604e-05, -6.4115971326828e-05, -5.8002769947052e-05, -5.1889568567276e-05, -4.57763671875e-05, -3.9663165807724e-05, -3.3549964427948e-05, -2.7436763048171997e-05, -2.1323561668395996e-05, -1.5210360288619995e-05, -9.097158908843994e-06, -2.983957529067993e-06, 3.129243850708008e-06, 9.242445230484009e-06, 1.535564661026001e-05, 2.146884799003601e-05, 2.7582049369812012e-05, 3.369525074958801e-05, 3.9808452129364014e-05, 4.5921653509140015e-05, 5.2034854888916016e-05, 5.8148056268692017e-05, 6.426125764846802e-05, 7.037445902824402e-05, 7.648766040802002e-05, 8.260086178779602e-05, 8.871406316757202e-05, 9.482726454734802e-05, 0.00010094046592712402, 0.00010705366730690002, 0.00011316686868667603, 0.00011928007006645203, 0.00012539327144622803, 0.00013150647282600403, 0.00013761967420578003, 0.00014373287558555603, 0.00014984607696533203]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 7.0, 6.0, 7.0, 13.0, 12.0, 25.0, 31.0, 41.0, 56.0, 87.0, 196.0, 261.0, 493.0, 965.0, 2123.0, 5073.0, 16428.0, 77442.0, 457139.0, 399230.0, 65557.0, 14787.0, 4633.0, 1833.0, 914.0, 503.0, 292.0, 132.0, 104.0, 71.0, 35.0, 24.0, 13.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79638671875, -0.7714614868164062, -0.7465362548828125, -0.7216110229492188, -0.696685791015625, -0.6717605590820312, -0.6468353271484375, -0.6219100952148438, -0.59698486328125, -0.5720596313476562, -0.5471343994140625, -0.5222091674804688, -0.497283935546875, -0.47235870361328125, -0.4474334716796875, -0.42250823974609375, -0.3975830078125, -0.37265777587890625, -0.3477325439453125, -0.32280731201171875, -0.297882080078125, -0.27295684814453125, -0.2480316162109375, -0.22310638427734375, -0.19818115234375, -0.17325592041015625, -0.1483306884765625, -0.12340545654296875, -0.098480224609375, -0.07355499267578125, -0.0486297607421875, -0.02370452880859375, 0.001220703125, 0.02614593505859375, 0.0510711669921875, 0.07599639892578125, 0.100921630859375, 0.12584686279296875, 0.1507720947265625, 0.17569732666015625, 0.20062255859375, 0.22554779052734375, 0.2504730224609375, 0.27539825439453125, 0.300323486328125, 0.32524871826171875, 0.3501739501953125, 0.37509918212890625, 0.4000244140625, 0.42494964599609375, 0.4498748779296875, 0.47480010986328125, 0.499725341796875, 0.5246505737304688, 0.5495758056640625, 0.5745010375976562, 0.59942626953125, 0.6243515014648438, 0.6492767333984375, 0.6742019653320312, 0.699127197265625, 0.7240524291992188, 0.7489776611328125, 0.7739028930664062, 0.798828125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 8.0, 6.0, 8.0, 15.0, 30.0, 32.0, 62.0, 90.0, 114.0, 134.0, 137.0, 117.0, 77.0, 55.0, 31.0, 17.0, 20.0, 10.0, 6.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0029296875, -0.962677001953125, -0.92242431640625, -0.882171630859375, -0.8419189453125, -0.801666259765625, -0.76141357421875, -0.721160888671875, -0.680908203125, -0.640655517578125, -0.60040283203125, -0.560150146484375, -0.5198974609375, -0.479644775390625, -0.43939208984375, -0.399139404296875, -0.35888671875, -0.318634033203125, -0.27838134765625, -0.238128662109375, -0.1978759765625, -0.157623291015625, -0.11737060546875, -0.077117919921875, -0.036865234375, 0.003387451171875, 0.04364013671875, 0.083892822265625, 0.1241455078125, 0.164398193359375, 0.20465087890625, 0.244903564453125, 0.28515625, 0.325408935546875, 0.36566162109375, 0.405914306640625, 0.4461669921875, 0.486419677734375, 0.52667236328125, 0.566925048828125, 0.607177734375, 0.647430419921875, 0.68768310546875, 0.727935791015625, 0.7681884765625, 0.808441162109375, 0.84869384765625, 0.888946533203125, 0.92919921875, 0.969451904296875, 1.00970458984375, 1.049957275390625, 1.0902099609375, 1.130462646484375, 1.17071533203125, 1.210968017578125, 1.251220703125, 1.291473388671875, 1.33172607421875, 1.371978759765625, 1.4122314453125, 1.452484130859375, 1.49273681640625, 1.532989501953125, 1.5732421875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 10.0, 26.0, 39.0, 61.0, 99.0, 143.0, 171.0, 155.0, 113.0, 72.0, 51.0, 26.0, 22.0, 9.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.57172679901123, -12.040033340454102, -11.508339881896973, -10.976646423339844, -10.444953918457031, -9.913260459899902, -9.381567001342773, -8.849873542785645, -8.318180084228516, -7.786486625671387, -7.254793643951416, -6.723100185394287, -6.191407203674316, -5.6597137451171875, -5.128020286560059, -4.59632682800293, -4.064634323120117, -3.5329411029815674, -3.0012478828430176, -2.4695544242858887, -1.9378612041473389, -1.406167984008789, -0.8744745254516602, -0.34278130531311035, 0.18891191482543945, 0.720605194568634, 1.2522984743118286, 1.783991813659668, 2.3156850337982178, 2.8473782539367676, 3.3790717124938965, 3.9107649326324463, 4.44245719909668, 4.974150657653809, 5.505843639373779, 6.037537097930908, 6.569230079650879, 7.100923538208008, 7.632616996765137, 8.164310455322266, 8.696002960205078, 9.227696418762207, 9.759389877319336, 10.291082382202148, 10.822775840759277, 11.354469299316406, 11.886162757873535, 12.417856216430664, 12.949549674987793, 13.481243133544922, 14.01293659210205, 14.54463005065918, 15.076322555541992, 15.608016014099121, 16.13970947265625, 16.671401977539062, 17.203096389770508, 17.73478889465332, 18.266483306884766, 18.798175811767578, 19.329870223999023, 19.861562728881836, 20.39325714111328, 20.924949645996094, 21.456642150878906]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 9.0, 10.0, 8.0, 10.0, 12.0, 9.0, 14.0, 12.0, 25.0, 25.0, 21.0, 31.0, 39.0, 34.0, 27.0, 37.0, 47.0, 56.0, 44.0, 36.0, 63.0, 43.0, 38.0, 45.0, 36.0, 38.0, 37.0, 26.0, 24.0, 22.0, 24.0, 19.0, 17.0, 11.0, 16.0, 6.0, 9.0, 3.0, 7.0, 2.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.329910278320312, -10.9769926071167, -10.624074935913086, -10.271157264709473, -9.91823959350586, -9.565321922302246, -9.212404251098633, -8.859485626220703, -8.506568908691406, -8.153651237487793, -7.80073356628418, -7.447815895080566, -7.094898223876953, -6.74198055267334, -6.389062404632568, -6.036144733428955, -5.683226585388184, -5.33030891418457, -4.977391242980957, -4.624473571777344, -4.2715559005737305, -3.918637990951538, -3.5657200813293457, -3.2128024101257324, -2.859884738922119, -2.506967067718506, -2.1540493965148926, -1.8011314868927002, -1.448213815689087, -1.0952961444854736, -0.7423782348632812, -0.38946056365966797, -0.03654193878173828, 0.3163757920265198, 0.6692935228347778, 1.0222113132476807, 1.375128984451294, 1.7280466556549072, 2.0809645652770996, 2.433882236480713, 2.786799907684326, 3.1397175788879395, 3.4926352500915527, 3.845553159713745, 4.1984710693359375, 4.551388740539551, 4.904306411743164, 5.257224082946777, 5.610141754150391, 5.963059425354004, 6.315977096557617, 6.6688947677612305, 7.021812438964844, 7.374730110168457, 7.7276482582092285, 8.08056640625, 8.433483123779297, 8.78640079498291, 9.139318466186523, 9.492236137390137, 9.84515380859375, 10.198071479797363, 10.550989151000977, 10.903907775878906, 11.25682544708252]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 3.0, 8.0, 14.0, 28.0, 45.0, 43.0, 39.0, 81.0, 102.0, 180.0, 328.0, 522.0, 911.0, 1710.0, 3643.0, 8661.0, 34477.0, 4070557.0, 53385.0, 10694.0, 4296.0, 2034.0, 1029.0, 580.0, 328.0, 183.0, 115.0, 84.0, 64.0, 36.0, 25.0, 13.0, 15.0, 9.0, 8.0, 7.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.06640625, -2.001007080078125, -1.93560791015625, -1.870208740234375, -1.8048095703125, -1.739410400390625, -1.67401123046875, -1.608612060546875, -1.543212890625, -1.477813720703125, -1.41241455078125, -1.347015380859375, -1.2816162109375, -1.216217041015625, -1.15081787109375, -1.085418701171875, -1.02001953125, -0.954620361328125, -0.88922119140625, -0.823822021484375, -0.7584228515625, -0.693023681640625, -0.62762451171875, -0.562225341796875, -0.496826171875, -0.431427001953125, -0.36602783203125, -0.300628662109375, -0.2352294921875, -0.169830322265625, -0.10443115234375, -0.039031982421875, 0.0263671875, 0.091766357421875, 0.15716552734375, 0.222564697265625, 0.2879638671875, 0.353363037109375, 0.41876220703125, 0.484161376953125, 0.549560546875, 0.614959716796875, 0.68035888671875, 0.745758056640625, 0.8111572265625, 0.876556396484375, 0.94195556640625, 1.007354736328125, 1.07275390625, 1.138153076171875, 1.20355224609375, 1.268951416015625, 1.3343505859375, 1.399749755859375, 1.46514892578125, 1.530548095703125, 1.595947265625, 1.661346435546875, 1.72674560546875, 1.792144775390625, 1.8575439453125, 1.922943115234375, 1.98834228515625, 2.053741455078125, 2.119140625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 4.0, 4.0, 9.0, 6.0, 15.0, 12.0, 13.0, 14.0, 14.0, 25.0, 24.0, 35.0, 30.0, 35.0, 33.0, 40.0, 37.0, 52.0, 53.0, 53.0, 42.0, 55.0, 53.0, 47.0, 44.0, 37.0, 33.0, 31.0, 23.0, 19.0, 20.0, 12.0, 18.0, 15.0, 16.0, 8.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54248046875, -0.5247344970703125, -0.506988525390625, -0.4892425537109375, -0.47149658203125, -0.4537506103515625, -0.436004638671875, -0.4182586669921875, -0.4005126953125, -0.3827667236328125, -0.365020751953125, -0.3472747802734375, -0.32952880859375, -0.3117828369140625, -0.294036865234375, -0.2762908935546875, -0.258544921875, -0.2407989501953125, -0.223052978515625, -0.2053070068359375, -0.18756103515625, -0.1698150634765625, -0.152069091796875, -0.1343231201171875, -0.1165771484375, -0.0988311767578125, -0.081085205078125, -0.0633392333984375, -0.04559326171875, -0.0278472900390625, -0.010101318359375, 0.0076446533203125, 0.025390625, 0.0431365966796875, 0.060882568359375, 0.0786285400390625, 0.09637451171875, 0.1141204833984375, 0.131866455078125, 0.1496124267578125, 0.1673583984375, 0.1851043701171875, 0.202850341796875, 0.2205963134765625, 0.23834228515625, 0.2560882568359375, 0.273834228515625, 0.2915802001953125, 0.309326171875, 0.3270721435546875, 0.344818115234375, 0.3625640869140625, 0.38031005859375, 0.3980560302734375, 0.415802001953125, 0.4335479736328125, 0.4512939453125, 0.4690399169921875, 0.486785888671875, 0.5045318603515625, 0.52227783203125, 0.5400238037109375, 0.557769775390625, 0.5755157470703125, 0.59326171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 8.0, 4.0, 3.0, 9.0, 12.0, 14.0, 17.0, 21.0, 37.0, 35.0, 62.0, 98.0, 136.0, 246.0, 437.0, 842.0, 1773.0, 4277.0, 14062.0, 106874.0, 4016489.0, 34985.0, 8157.0, 2850.0, 1289.0, 608.0, 355.0, 206.0, 129.0, 81.0, 50.0, 30.0, 29.0, 18.0, 14.0, 7.0, 9.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.087890625, -2.021148681640625, -1.95440673828125, -1.887664794921875, -1.8209228515625, -1.754180908203125, -1.68743896484375, -1.620697021484375, -1.553955078125, -1.487213134765625, -1.42047119140625, -1.353729248046875, -1.2869873046875, -1.220245361328125, -1.15350341796875, -1.086761474609375, -1.02001953125, -0.953277587890625, -0.88653564453125, -0.819793701171875, -0.7530517578125, -0.686309814453125, -0.61956787109375, -0.552825927734375, -0.486083984375, -0.419342041015625, -0.35260009765625, -0.285858154296875, -0.2191162109375, -0.152374267578125, -0.08563232421875, -0.018890380859375, 0.0478515625, 0.114593505859375, 0.18133544921875, 0.248077392578125, 0.3148193359375, 0.381561279296875, 0.44830322265625, 0.515045166015625, 0.581787109375, 0.648529052734375, 0.71527099609375, 0.782012939453125, 0.8487548828125, 0.915496826171875, 0.98223876953125, 1.048980712890625, 1.11572265625, 1.182464599609375, 1.24920654296875, 1.315948486328125, 1.3826904296875, 1.449432373046875, 1.51617431640625, 1.582916259765625, 1.649658203125, 1.716400146484375, 1.78314208984375, 1.849884033203125, 1.9166259765625, 1.983367919921875, 2.05010986328125, 2.116851806640625, 2.18359375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 6.0, 5.0, 15.0, 23.0, 58.0, 144.0, 3537.0, 160.0, 52.0, 22.0, 16.0, 6.0, 11.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4853515625, -0.47042083740234375, -0.4554901123046875, -0.44055938720703125, -0.425628662109375, -0.41069793701171875, -0.3957672119140625, -0.38083648681640625, -0.36590576171875, -0.35097503662109375, -0.3360443115234375, -0.32111358642578125, -0.306182861328125, -0.29125213623046875, -0.2763214111328125, -0.26139068603515625, -0.2464599609375, -0.23152923583984375, -0.2165985107421875, -0.20166778564453125, -0.186737060546875, -0.17180633544921875, -0.1568756103515625, -0.14194488525390625, -0.12701416015625, -0.11208343505859375, -0.0971527099609375, -0.08222198486328125, -0.067291259765625, -0.05236053466796875, -0.0374298095703125, -0.02249908447265625, -0.007568359375, 0.00736236572265625, 0.0222930908203125, 0.03722381591796875, 0.052154541015625, 0.06708526611328125, 0.0820159912109375, 0.09694671630859375, 0.11187744140625, 0.12680816650390625, 0.1417388916015625, 0.15666961669921875, 0.171600341796875, 0.18653106689453125, 0.2014617919921875, 0.21639251708984375, 0.2313232421875, 0.24625396728515625, 0.2611846923828125, 0.27611541748046875, 0.291046142578125, 0.30597686767578125, 0.3209075927734375, 0.33583831787109375, 0.35076904296875, 0.36569976806640625, 0.3806304931640625, 0.39556121826171875, 0.410491943359375, 0.42542266845703125, 0.4403533935546875, 0.45528411865234375, 0.47021484375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 10.0, 35.0, 66.0, 79.0, 149.0, 168.0, 178.0, 142.0, 79.0, 49.0, 25.0, 9.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6465842723846436, -1.589664340019226, -1.5327444076538086, -1.4758244752883911, -1.4189045429229736, -1.3619846105575562, -1.3050646781921387, -1.2481447458267212, -1.1912248134613037, -1.1343048810958862, -1.0773849487304688, -1.0204650163650513, -0.9635450839996338, -0.9066251516342163, -0.8497052192687988, -0.7927852869033813, -0.7358652949333191, -0.6789453625679016, -0.6220254302024841, -0.5651054978370667, -0.5081855654716492, -0.4512656033039093, -0.3943456709384918, -0.33742573857307434, -0.28050580620765686, -0.22358587384223938, -0.1666659414768219, -0.10974599421024323, -0.052826061844825745, 0.00409388542175293, 0.06101381778717041, 0.11793375015258789, 0.17485368251800537, 0.23177361488342285, 0.28869354724884033, 0.3456134796142578, 0.4025334119796753, 0.45945337414741516, 0.5163732767105103, 0.5732932090759277, 0.6302131414413452, 0.6871330738067627, 0.7440530061721802, 0.8009729385375977, 0.8578928709030151, 0.9148128032684326, 0.9717327356338501, 1.0286526679992676, 1.0855727195739746, 1.142492651939392, 1.1994125843048096, 1.256332516670227, 1.3132524490356445, 1.370172381401062, 1.4270923137664795, 1.484012246131897, 1.5409321784973145, 1.597852110862732, 1.6547720432281494, 1.711691975593567, 1.7686119079589844, 1.8255318403244019, 1.8824517726898193, 1.9393717050552368, 1.9962916374206543]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 5.0, 8.0, 11.0, 11.0, 11.0, 16.0, 9.0, 15.0, 18.0, 17.0, 21.0, 22.0, 24.0, 34.0, 32.0, 39.0, 42.0, 38.0, 54.0, 40.0, 37.0, 48.0, 41.0, 36.0, 37.0, 45.0, 29.0, 33.0, 38.0, 23.0, 24.0, 26.0, 17.0, 13.0, 14.0, 20.0, 15.0, 10.0, 7.0, 1.0, 4.0, 5.0, 6.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5965712070465088, -0.5762914419174194, -0.5560117363929749, -0.5357319712638855, -0.5154522657394409, -0.49517250061035156, -0.4748927354812622, -0.45461300015449524, -0.43433326482772827, -0.4140535295009613, -0.39377379417419434, -0.373494029045105, -0.353214293718338, -0.33293455839157104, -0.3126547932624817, -0.2923750579357147, -0.27209532260894775, -0.2518155872821808, -0.23153583705425262, -0.21125608682632446, -0.1909763514995575, -0.17069661617279053, -0.15041686594486237, -0.1301371157169342, -0.10985738039016724, -0.08957763761281967, -0.0692978948354721, -0.04901815205812454, -0.028738409280776978, -0.008458666503429413, 0.011821076273918152, 0.032100826501846313, 0.052380502223968506, 0.07266024500131607, 0.09293998777866364, 0.1132197305560112, 0.13349947333335876, 0.15377920866012573, 0.1740589588880539, 0.19433870911598206, 0.21461844444274902, 0.234898179769516, 0.25517791509628296, 0.2754576802253723, 0.2957374155521393, 0.31601715087890625, 0.3362969160079956, 0.3565766513347626, 0.37685638666152954, 0.3971361219882965, 0.4174158573150635, 0.43769562244415283, 0.4579753577709198, 0.47825509309768677, 0.4985348582267761, 0.5188145637512207, 0.5390943288803101, 0.5593740940093994, 0.579653799533844, 0.5999335646629333, 0.6202132701873779, 0.6404930353164673, 0.6607728004455566, 0.681052565574646, 0.7013322710990906]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 5.0, 5.0, 15.0, 8.0, 15.0, 20.0, 31.0, 41.0, 62.0, 78.0, 117.0, 209.0, 294.0, 413.0, 640.0, 974.0, 1520.0, 2495.0, 4184.0, 7432.0, 13872.0, 27025.0, 54844.0, 114480.0, 226695.0, 272324.0, 162539.0, 77550.0, 37514.0, 19029.0, 9959.0, 5613.0, 3194.0, 1935.0, 1171.0, 759.0, 471.0, 334.0, 223.0, 162.0, 103.0, 55.0, 39.0, 28.0, 20.0, 20.0, 16.0, 4.0, 4.0, 8.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0], "bins": [-1.0595703125, -1.0256500244140625, -0.991729736328125, -0.9578094482421875, -0.92388916015625, -0.8899688720703125, -0.856048583984375, -0.8221282958984375, -0.7882080078125, -0.7542877197265625, -0.720367431640625, -0.6864471435546875, -0.65252685546875, -0.6186065673828125, -0.584686279296875, -0.5507659912109375, -0.516845703125, -0.4829254150390625, -0.449005126953125, -0.4150848388671875, -0.38116455078125, -0.3472442626953125, -0.313323974609375, -0.2794036865234375, -0.2454833984375, -0.2115631103515625, -0.177642822265625, -0.1437225341796875, -0.10980224609375, -0.0758819580078125, -0.041961669921875, -0.0080413818359375, 0.02587890625, 0.0597991943359375, 0.093719482421875, 0.1276397705078125, 0.16156005859375, 0.1954803466796875, 0.229400634765625, 0.2633209228515625, 0.2972412109375, 0.3311614990234375, 0.365081787109375, 0.3990020751953125, 0.43292236328125, 0.4668426513671875, 0.500762939453125, 0.5346832275390625, 0.568603515625, 0.6025238037109375, 0.636444091796875, 0.6703643798828125, 0.70428466796875, 0.7382049560546875, 0.772125244140625, 0.8060455322265625, 0.8399658203125, 0.8738861083984375, 0.907806396484375, 0.9417266845703125, 0.97564697265625, 1.0095672607421875, 1.043487548828125, 1.0774078369140625, 1.111328125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 8.0, 9.0, 17.0, 11.0, 14.0, 17.0, 15.0, 16.0, 20.0, 38.0, 43.0, 26.0, 40.0, 46.0, 46.0, 53.0, 45.0, 54.0, 68.0, 46.0, 48.0, 37.0, 37.0, 36.0, 42.0, 30.0, 22.0, 23.0, 14.0, 13.0, 16.0, 10.0, 4.0, 12.0, 6.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.564453125, -0.5450515747070312, -0.5256500244140625, -0.5062484741210938, -0.486846923828125, -0.46744537353515625, -0.4480438232421875, -0.42864227294921875, -0.40924072265625, -0.38983917236328125, -0.3704376220703125, -0.35103607177734375, -0.331634521484375, -0.31223297119140625, -0.2928314208984375, -0.27342987060546875, -0.2540283203125, -0.23462677001953125, -0.2152252197265625, -0.19582366943359375, -0.176422119140625, -0.15702056884765625, -0.1376190185546875, -0.11821746826171875, -0.09881591796875, -0.07941436767578125, -0.0600128173828125, -0.04061126708984375, -0.021209716796875, -0.00180816650390625, 0.0175933837890625, 0.03699493408203125, 0.056396484375, 0.07579803466796875, 0.0951995849609375, 0.11460113525390625, 0.134002685546875, 0.15340423583984375, 0.1728057861328125, 0.19220733642578125, 0.21160888671875, 0.23101043701171875, 0.2504119873046875, 0.26981353759765625, 0.289215087890625, 0.30861663818359375, 0.3280181884765625, 0.34741973876953125, 0.3668212890625, 0.38622283935546875, 0.4056243896484375, 0.42502593994140625, 0.444427490234375, 0.46382904052734375, 0.4832305908203125, 0.5026321411132812, 0.52203369140625, 0.5414352416992188, 0.5608367919921875, 0.5802383422851562, 0.599639892578125, 0.6190414428710938, 0.6384429931640625, 0.6578445434570312, 0.67724609375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 1.0, 1.0, 4.0, 10.0, 14.0, 13.0, 11.0, 23.0, 44.0, 36.0, 53.0, 81.0, 117.0, 256.0, 481.0, 1146.0, 3489.0, 13080.0, 79087.0, 669904.0, 242477.0, 28410.0, 6299.0, 1912.0, 722.0, 325.0, 185.0, 109.0, 82.0, 53.0, 33.0, 20.0, 26.0, 8.0, 10.0, 7.0, 5.0, 0.0, 5.0, 5.0, 1.0, 3.0, 6.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.55859375, -3.46173095703125, -3.3648681640625, -3.26800537109375, -3.171142578125, -3.07427978515625, -2.9774169921875, -2.88055419921875, -2.78369140625, -2.68682861328125, -2.5899658203125, -2.49310302734375, -2.396240234375, -2.29937744140625, -2.2025146484375, -2.10565185546875, -2.0087890625, -1.91192626953125, -1.8150634765625, -1.71820068359375, -1.621337890625, -1.52447509765625, -1.4276123046875, -1.33074951171875, -1.23388671875, -1.13702392578125, -1.0401611328125, -0.94329833984375, -0.846435546875, -0.74957275390625, -0.6527099609375, -0.55584716796875, -0.458984375, -0.36212158203125, -0.2652587890625, -0.16839599609375, -0.071533203125, 0.02532958984375, 0.1221923828125, 0.21905517578125, 0.31591796875, 0.41278076171875, 0.5096435546875, 0.60650634765625, 0.703369140625, 0.80023193359375, 0.8970947265625, 0.99395751953125, 1.0908203125, 1.18768310546875, 1.2845458984375, 1.38140869140625, 1.478271484375, 1.57513427734375, 1.6719970703125, 1.76885986328125, 1.86572265625, 1.96258544921875, 2.0594482421875, 2.15631103515625, 2.253173828125, 2.35003662109375, 2.4468994140625, 2.54376220703125, 2.640625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 6.0, 6.0, 11.0, 13.0, 25.0, 27.0, 51.0, 47.0, 59.0, 70.0, 94.0, 86.0, 85.0, 84.0, 65.0, 60.0, 68.0, 38.0, 29.0, 23.0, 24.0, 12.0, 10.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.767578125, -3.602569580078125, -3.43756103515625, -3.272552490234375, -3.1075439453125, -2.942535400390625, -2.77752685546875, -2.612518310546875, -2.447509765625, -2.282501220703125, -2.11749267578125, -1.952484130859375, -1.7874755859375, -1.622467041015625, -1.45745849609375, -1.292449951171875, -1.12744140625, -0.962432861328125, -0.79742431640625, -0.632415771484375, -0.4674072265625, -0.302398681640625, -0.13739013671875, 0.027618408203125, 0.192626953125, 0.357635498046875, 0.52264404296875, 0.687652587890625, 0.8526611328125, 1.017669677734375, 1.18267822265625, 1.347686767578125, 1.5126953125, 1.677703857421875, 1.84271240234375, 2.007720947265625, 2.1727294921875, 2.337738037109375, 2.50274658203125, 2.667755126953125, 2.832763671875, 2.997772216796875, 3.16278076171875, 3.327789306640625, 3.4927978515625, 3.657806396484375, 3.82281494140625, 3.987823486328125, 4.15283203125, 4.317840576171875, 4.48284912109375, 4.647857666015625, 4.8128662109375, 4.977874755859375, 5.14288330078125, 5.307891845703125, 5.472900390625, 5.637908935546875, 5.80291748046875, 5.967926025390625, 6.1329345703125, 6.297943115234375, 6.46295166015625, 6.627960205078125, 6.79296875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 5.0, 11.0, 22.0, 23.0, 63.0, 107.0, 224.0, 612.0, 2439.0, 43621.0, 996024.0, 3948.0, 879.0, 295.0, 145.0, 56.0, 40.0, 23.0, 8.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3203125, -10.978759765625, -10.63720703125, -10.295654296875, -9.9541015625, -9.612548828125, -9.27099609375, -8.929443359375, -8.587890625, -8.246337890625, -7.90478515625, -7.563232421875, -7.2216796875, -6.880126953125, -6.53857421875, -6.197021484375, -5.85546875, -5.513916015625, -5.17236328125, -4.830810546875, -4.4892578125, -4.147705078125, -3.80615234375, -3.464599609375, -3.123046875, -2.781494140625, -2.43994140625, -2.098388671875, -1.7568359375, -1.415283203125, -1.07373046875, -0.732177734375, -0.390625, -0.049072265625, 0.29248046875, 0.634033203125, 0.9755859375, 1.317138671875, 1.65869140625, 2.000244140625, 2.341796875, 2.683349609375, 3.02490234375, 3.366455078125, 3.7080078125, 4.049560546875, 4.39111328125, 4.732666015625, 5.07421875, 5.415771484375, 5.75732421875, 6.098876953125, 6.4404296875, 6.781982421875, 7.12353515625, 7.465087890625, 7.806640625, 8.148193359375, 8.48974609375, 8.831298828125, 9.1728515625, 9.514404296875, 9.85595703125, 10.197509765625, 10.5390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 6.0, 13.0, 50.0, 189.0, 386.0, 255.0, 82.0, 16.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00028252601623535156, -0.0002632327377796173, -0.00024393945932388306, -0.0002246461808681488, -0.00020535290241241455, -0.0001860596239566803, -0.00016676634550094604, -0.0001474730670452118, -0.00012817978858947754, -0.00010888651013374329, -8.959323167800903e-05, -7.029995322227478e-05, -5.100667476654053e-05, -3.1713396310806274e-05, -1.2420117855072021e-05, 6.8731606006622314e-06, 2.6166439056396484e-05, 4.545971751213074e-05, 6.475299596786499e-05, 8.404627442359924e-05, 0.0001033395528793335, 0.00012263283133506775, 0.000141926109790802, 0.00016121938824653625, 0.0001805126667022705, 0.00019980594515800476, 0.00021909922361373901, 0.00023839250206947327, 0.0002576857805252075, 0.00027697905898094177, 0.000296272337436676, 0.0003155656158924103, 0.00033485889434814453, 0.0003541521728038788, 0.00037344545125961304, 0.0003927387297153473, 0.00041203200817108154, 0.0004313252866268158, 0.00045061856508255005, 0.0004699118435382843, 0.0004892051219940186, 0.0005084984004497528, 0.0005277916789054871, 0.0005470849573612213, 0.0005663782358169556, 0.0005856715142726898, 0.0006049647927284241, 0.0006242580711841583, 0.0006435513496398926, 0.0006628446280956268, 0.0006821379065513611, 0.0007014311850070953, 0.0007207244634628296, 0.0007400177419185638, 0.0007593110203742981, 0.0007786042988300323, 0.0007978975772857666, 0.0008171908557415009, 0.0008364841341972351, 0.0008557774126529694, 0.0008750706911087036, 0.0008943639695644379, 0.0009136572480201721, 0.0009329505264759064, 0.0009522438049316406]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 7.0, 7.0, 8.0, 13.0, 22.0, 44.0, 61.0, 78.0, 128.0, 264.0, 447.0, 897.0, 1822.0, 4140.0, 14939.0, 493940.0, 508381.0, 15468.0, 4031.0, 1901.0, 913.0, 398.0, 280.0, 118.0, 74.0, 54.0, 44.0, 20.0, 15.0, 13.0, 11.0, 7.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.845703125, -2.76666259765625, -2.6876220703125, -2.60858154296875, -2.529541015625, -2.45050048828125, -2.3714599609375, -2.29241943359375, -2.21337890625, -2.13433837890625, -2.0552978515625, -1.97625732421875, -1.897216796875, -1.81817626953125, -1.7391357421875, -1.66009521484375, -1.5810546875, -1.50201416015625, -1.4229736328125, -1.34393310546875, -1.264892578125, -1.18585205078125, -1.1068115234375, -1.02777099609375, -0.94873046875, -0.86968994140625, -0.7906494140625, -0.71160888671875, -0.632568359375, -0.55352783203125, -0.4744873046875, -0.39544677734375, -0.31640625, -0.23736572265625, -0.1583251953125, -0.07928466796875, -0.000244140625, 0.07879638671875, 0.1578369140625, 0.23687744140625, 0.31591796875, 0.39495849609375, 0.4739990234375, 0.55303955078125, 0.632080078125, 0.71112060546875, 0.7901611328125, 0.86920166015625, 0.9482421875, 1.02728271484375, 1.1063232421875, 1.18536376953125, 1.264404296875, 1.34344482421875, 1.4224853515625, 1.50152587890625, 1.58056640625, 1.65960693359375, 1.7386474609375, 1.81768798828125, 1.896728515625, 1.97576904296875, 2.0548095703125, 2.13385009765625, 2.212890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 7.0, 2.0, 15.0, 16.0, 76.0, 202.0, 362.0, 187.0, 68.0, 20.0, 13.0, 9.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.00390625, -5.851654052734375, -5.69940185546875, -5.547149658203125, -5.3948974609375, -5.242645263671875, -5.09039306640625, -4.938140869140625, -4.785888671875, -4.633636474609375, -4.48138427734375, -4.329132080078125, -4.1768798828125, -4.024627685546875, -3.87237548828125, -3.720123291015625, -3.56787109375, -3.415618896484375, -3.26336669921875, -3.111114501953125, -2.9588623046875, -2.806610107421875, -2.65435791015625, -2.502105712890625, -2.349853515625, -2.197601318359375, -2.04534912109375, -1.893096923828125, -1.7408447265625, -1.588592529296875, -1.43634033203125, -1.284088134765625, -1.1318359375, -0.979583740234375, -0.82733154296875, -0.675079345703125, -0.5228271484375, -0.370574951171875, -0.21832275390625, -0.066070556640625, 0.086181640625, 0.238433837890625, 0.39068603515625, 0.542938232421875, 0.6951904296875, 0.847442626953125, 0.99969482421875, 1.151947021484375, 1.30419921875, 1.456451416015625, 1.60870361328125, 1.760955810546875, 1.9132080078125, 2.065460205078125, 2.21771240234375, 2.369964599609375, 2.522216796875, 2.674468994140625, 2.82672119140625, 2.978973388671875, 3.1312255859375, 3.283477783203125, 3.43572998046875, 3.587982177734375, 3.740234375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 9.0, 22.0, 66.0, 142.0, 298.0, 278.0, 121.0, 47.0, 17.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.88834381103516, -63.996337890625, -62.10433578491211, -60.21232986450195, -58.32032775878906, -56.428321838378906, -54.53631591796875, -52.644309997558594, -50.7523078918457, -48.86030197143555, -46.968299865722656, -45.0762939453125, -43.184288024902344, -41.29228591918945, -39.4002799987793, -37.508277893066406, -35.61627197265625, -33.724266052246094, -31.832263946533203, -29.940258026123047, -28.048254013061523, -26.15625, -24.264244079589844, -22.37224006652832, -20.480236053466797, -18.588232040405273, -16.69622802734375, -14.804222106933594, -12.91221809387207, -11.020214080810547, -9.128209114074707, -7.236204147338867, -5.344203948974609, -3.4521994590759277, -1.560194969177246, 0.33180952072143555, 2.223814010620117, 4.115818023681641, 6.0078229904174805, 7.89982795715332, 9.791831970214844, 11.683835983276367, 13.575840950012207, 15.467845916748047, 17.35984992980957, 19.251853942871094, 21.14385986328125, 23.035863876342773, 24.927867889404297, 26.81987190246582, 28.711875915527344, 30.6038818359375, 32.495887756347656, 34.38788986206055, 36.2798957824707, 38.171897888183594, 40.06390380859375, 41.955909729003906, 43.8479118347168, 45.73991775512695, 47.631919860839844, 49.52392578125, 51.415931701660156, 53.30793762207031, 55.1999397277832]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 7.0, 6.0, 8.0, 10.0, 16.0, 15.0, 22.0, 16.0, 31.0, 33.0, 28.0, 31.0, 43.0, 43.0, 58.0, 45.0, 45.0, 54.0, 43.0, 52.0, 53.0, 43.0, 35.0, 32.0, 39.0, 23.0, 20.0, 30.0, 21.0, 11.0, 20.0, 7.0, 15.0, 15.0, 5.0, 5.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.40088653564453, -17.84254264831543, -17.28420066833496, -16.72585678100586, -16.167512893676758, -15.609169960021973, -15.050827026367188, -14.492483139038086, -13.9341402053833, -13.375797271728516, -12.817453384399414, -12.259110450744629, -11.700767517089844, -11.142423629760742, -10.584080696105957, -10.025737762451172, -9.46739387512207, -8.909050941467285, -8.350707054138184, -7.792364120483398, -7.234020709991455, -6.675677299499512, -6.117334365844727, -5.558990955352783, -5.00064754486084, -4.4423041343688965, -3.8839609622955322, -3.325617790222168, -2.7672743797302246, -2.2089309692382812, -1.650587797164917, -1.0922446250915527, -0.5339012145996094, 0.024442076683044434, 0.5827853679656982, 1.141128659248352, 1.6994719505310059, 2.257815361022949, 2.8161585330963135, 3.3745017051696777, 3.932845115661621, 4.4911885261535645, 5.049531936645508, 5.607874870300293, 6.166218280792236, 6.72456169128418, 7.282904624938965, 7.841248035430908, 8.399591445922852, 8.957934379577637, 9.516278266906738, 10.074621200561523, 10.632965087890625, 11.19130802154541, 11.749650955200195, 12.307994842529297, 12.866337776184082, 13.424680709838867, 13.983024597167969, 14.541367530822754, 15.099710464477539, 15.65805435180664, 16.216398239135742, 16.77474021911621, 17.333084106445312]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 9.0, 7.0, 9.0, 9.0, 19.0, 24.0, 38.0, 54.0, 97.0, 127.0, 284.0, 584.0, 1394.0, 4391.0, 30312.0, 4137252.0, 14662.0, 3033.0, 1052.0, 432.0, 220.0, 103.0, 69.0, 36.0, 23.0, 15.0, 11.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8046875, -8.5968017578125, -8.388916015625, -8.1810302734375, -7.97314453125, -7.7652587890625, -7.557373046875, -7.3494873046875, -7.1416015625, -6.9337158203125, -6.725830078125, -6.5179443359375, -6.31005859375, -6.1021728515625, -5.894287109375, -5.6864013671875, -5.478515625, -5.2706298828125, -5.062744140625, -4.8548583984375, -4.64697265625, -4.4390869140625, -4.231201171875, -4.0233154296875, -3.8154296875, -3.6075439453125, -3.399658203125, -3.1917724609375, -2.98388671875, -2.7760009765625, -2.568115234375, -2.3602294921875, -2.15234375, -1.9444580078125, -1.736572265625, -1.5286865234375, -1.32080078125, -1.1129150390625, -0.905029296875, -0.6971435546875, -0.4892578125, -0.2813720703125, -0.073486328125, 0.1343994140625, 0.34228515625, 0.5501708984375, 0.758056640625, 0.9659423828125, 1.173828125, 1.3817138671875, 1.589599609375, 1.7974853515625, 2.00537109375, 2.2132568359375, 2.421142578125, 2.6290283203125, 2.8369140625, 3.0447998046875, 3.252685546875, 3.4605712890625, 3.66845703125, 3.8763427734375, 4.084228515625, 4.2921142578125, 4.5]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 7.0, 9.0, 14.0, 28.0, 23.0, 33.0, 46.0, 42.0, 68.0, 58.0, 51.0, 62.0, 93.0, 89.0, 66.0, 65.0, 54.0, 41.0, 33.0, 29.0, 22.0, 20.0, 15.0, 12.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2060546875, -1.1736297607421875, -1.141204833984375, -1.1087799072265625, -1.07635498046875, -1.0439300537109375, -1.011505126953125, -0.9790802001953125, -0.9466552734375, -0.9142303466796875, -0.881805419921875, -0.8493804931640625, -0.81695556640625, -0.7845306396484375, -0.752105712890625, -0.7196807861328125, -0.687255859375, -0.6548309326171875, -0.622406005859375, -0.5899810791015625, -0.55755615234375, -0.5251312255859375, -0.492706298828125, -0.4602813720703125, -0.4278564453125, -0.3954315185546875, -0.363006591796875, -0.3305816650390625, -0.29815673828125, -0.2657318115234375, -0.233306884765625, -0.2008819580078125, -0.16845703125, -0.1360321044921875, -0.103607177734375, -0.0711822509765625, -0.03875732421875, -0.0063323974609375, 0.026092529296875, 0.0585174560546875, 0.0909423828125, 0.1233673095703125, 0.155792236328125, 0.1882171630859375, 0.22064208984375, 0.2530670166015625, 0.285491943359375, 0.3179168701171875, 0.350341796875, 0.3827667236328125, 0.415191650390625, 0.4476165771484375, 0.48004150390625, 0.5124664306640625, 0.544891357421875, 0.5773162841796875, 0.6097412109375, 0.6421661376953125, 0.674591064453125, 0.7070159912109375, 0.73944091796875, 0.7718658447265625, 0.804290771484375, 0.8367156982421875, 0.869140625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 6.0, 7.0, 11.0, 10.0, 8.0, 17.0, 13.0, 22.0, 32.0, 43.0, 43.0, 77.0, 108.0, 144.0, 339.0, 796.0, 3062.0, 20014.0, 4112128.0, 49953.0, 5207.0, 1172.0, 408.0, 206.0, 131.0, 57.0, 60.0, 49.0, 28.0, 26.0, 22.0, 12.0, 11.0, 16.0, 11.0, 7.0, 3.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.2890625, -7.0433349609375, -6.797607421875, -6.5518798828125, -6.30615234375, -6.0604248046875, -5.814697265625, -5.5689697265625, -5.3232421875, -5.0775146484375, -4.831787109375, -4.5860595703125, -4.34033203125, -4.0946044921875, -3.848876953125, -3.6031494140625, -3.357421875, -3.1116943359375, -2.865966796875, -2.6202392578125, -2.37451171875, -2.1287841796875, -1.883056640625, -1.6373291015625, -1.3916015625, -1.1458740234375, -0.900146484375, -0.6544189453125, -0.40869140625, -0.1629638671875, 0.082763671875, 0.3284912109375, 0.57421875, 0.8199462890625, 1.065673828125, 1.3114013671875, 1.55712890625, 1.8028564453125, 2.048583984375, 2.2943115234375, 2.5400390625, 2.7857666015625, 3.031494140625, 3.2772216796875, 3.52294921875, 3.7686767578125, 4.014404296875, 4.2601318359375, 4.505859375, 4.7515869140625, 4.997314453125, 5.2430419921875, 5.48876953125, 5.7344970703125, 5.980224609375, 6.2259521484375, 6.4716796875, 6.7174072265625, 6.963134765625, 7.2088623046875, 7.45458984375, 7.7003173828125, 7.946044921875, 8.1917724609375, 8.4375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 11.0, 20.0, 12.0, 53.0, 339.0, 3503.0, 75.0, 31.0, 15.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.65234375, -2.5960311889648438, -2.5397186279296875, -2.4834060668945312, -2.427093505859375, -2.3707809448242188, -2.3144683837890625, -2.2581558227539062, -2.20184326171875, -2.1455307006835938, -2.0892181396484375, -2.0329055786132812, -1.976593017578125, -1.9202804565429688, -1.8639678955078125, -1.8076553344726562, -1.7513427734375, -1.6950302124023438, -1.6387176513671875, -1.5824050903320312, -1.526092529296875, -1.4697799682617188, -1.4134674072265625, -1.3571548461914062, -1.30084228515625, -1.2445297241210938, -1.1882171630859375, -1.1319046020507812, -1.075592041015625, -1.0192794799804688, -0.9629669189453125, -0.9066543579101562, -0.850341796875, -0.7940292358398438, -0.7377166748046875, -0.6814041137695312, -0.625091552734375, -0.5687789916992188, -0.5124664306640625, -0.45615386962890625, -0.39984130859375, -0.34352874755859375, -0.2872161865234375, -0.23090362548828125, -0.174591064453125, -0.11827850341796875, -0.0619659423828125, -0.00565338134765625, 0.0506591796875, 0.10697174072265625, 0.1632843017578125, 0.21959686279296875, 0.275909423828125, 0.33222198486328125, 0.3885345458984375, 0.44484710693359375, 0.50115966796875, 0.5574722290039062, 0.6137847900390625, 0.6700973510742188, 0.726409912109375, 0.7827224731445312, 0.8390350341796875, 0.8953475952148438, 0.95166015625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 8.0, 9.0, 11.0, 20.0, 27.0, 42.0, 46.0, 80.0, 102.0, 114.0, 123.0, 119.0, 80.0, 64.0, 50.0, 34.0, 21.0, 20.0, 14.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8842575550079346, -1.775377631187439, -1.6664977073669434, -1.5576176643371582, -1.4487377405166626, -1.339857816696167, -1.2309777736663818, -1.1220978498458862, -1.0132179260253906, -0.904338002204895, -0.7954580187797546, -0.6865780353546143, -0.5776981115341187, -0.46881818771362305, -0.35993820428848267, -0.2510582208633423, -0.14217829704284668, -0.033298343420028687, 0.0755816102027893, 0.1844615638256073, 0.2933415174484253, 0.4022214412689209, 0.5111014246940613, 0.6199814081192017, 0.7288613319396973, 0.8377412557601929, 0.9466212391853333, 1.0555012226104736, 1.1643811464309692, 1.2732610702514648, 1.38214111328125, 1.4910210371017456, 1.599900722503662, 1.7087806463241577, 1.8176605701446533, 1.9265406131744385, 2.0354204177856445, 2.1443004608154297, 2.253180503845215, 2.362060546875, 2.470940351486206, 2.579820394515991, 2.6887001991271973, 2.7975802421569824, 2.9064602851867676, 3.0153400897979736, 3.124220132827759, 3.233099937438965, 3.34197998046875, 3.450860023498535, 3.559739828109741, 3.6686198711395264, 3.7774996757507324, 3.8863797187805176, 3.9952597618103027, 4.104139804840088, 4.213019371032715, 4.3218994140625, 4.430779457092285, 4.539659023284912, 4.648539066314697, 4.757419109344482, 4.866299152374268, 4.975179195404053, 5.084059238433838]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 6.0, 10.0, 7.0, 7.0, 6.0, 12.0, 17.0, 19.0, 17.0, 22.0, 27.0, 23.0, 28.0, 37.0, 31.0, 38.0, 35.0, 40.0, 45.0, 51.0, 35.0, 40.0, 43.0, 44.0, 41.0, 36.0, 37.0, 41.0, 37.0, 31.0, 23.0, 17.0, 22.0, 17.0, 14.0, 14.0, 10.0, 9.0, 9.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.229278087615967, -2.1545631885528564, -2.079848527908325, -2.005133628845215, -1.9304189682006836, -1.8557040691375732, -1.7809892892837524, -1.7062745094299316, -1.6315597295761108, -1.55684494972229, -1.4821301698684692, -1.4074153900146484, -1.332700490951538, -1.2579858303070068, -1.1832709312438965, -1.1085561513900757, -1.0338413715362549, -0.9591265916824341, -0.8844118118286133, -0.8096969723701477, -0.7349821925163269, -0.6602674126625061, -0.5855525732040405, -0.5108377933502197, -0.4361230134963989, -0.3614082336425781, -0.28669342398643494, -0.21197862923145294, -0.13726383447647095, -0.06254905462265015, 0.012165755033493042, 0.08688056468963623, 0.16159534454345703, 0.23631013929843903, 0.311024934053421, 0.3857397437095642, 0.460454523563385, 0.5351693034172058, 0.6098841428756714, 0.6845989227294922, 0.759313702583313, 0.8340284824371338, 0.9087432622909546, 0.9834581017494202, 1.0581729412078857, 1.132887601852417, 1.2076025009155273, 1.2823172807693481, 1.357032060623169, 1.4317468404769897, 1.5064616203308105, 1.5811764001846313, 1.6558911800384521, 1.7306060791015625, 1.8053208589553833, 1.880035638809204, 1.954750418663025, 2.0294651985168457, 2.104180097579956, 2.1788947582244873, 2.2536096572875977, 2.328324317932129, 2.4030392169952393, 2.4777541160583496, 2.552468776702881]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 9.0, 3.0, 9.0, 23.0, 28.0, 34.0, 52.0, 81.0, 119.0, 193.0, 286.0, 488.0, 977.0, 1731.0, 3434.0, 7385.0, 17119.0, 44720.0, 130028.0, 344723.0, 315516.0, 113362.0, 39085.0, 15559.0, 6644.0, 3140.0, 1592.0, 841.0, 528.0, 310.0, 172.0, 118.0, 81.0, 53.0, 30.0, 28.0, 9.0, 13.0, 13.0, 2.0, 7.0, 7.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8408203125, -1.7772064208984375, -1.713592529296875, -1.6499786376953125, -1.58636474609375, -1.5227508544921875, -1.459136962890625, -1.3955230712890625, -1.3319091796875, -1.2682952880859375, -1.204681396484375, -1.1410675048828125, -1.07745361328125, -1.0138397216796875, -0.950225830078125, -0.8866119384765625, -0.822998046875, -0.7593841552734375, -0.695770263671875, -0.6321563720703125, -0.56854248046875, -0.5049285888671875, -0.441314697265625, -0.3777008056640625, -0.3140869140625, -0.2504730224609375, -0.186859130859375, -0.1232452392578125, -0.05963134765625, 0.0039825439453125, 0.067596435546875, 0.1312103271484375, 0.19482421875, 0.2584381103515625, 0.322052001953125, 0.3856658935546875, 0.44927978515625, 0.5128936767578125, 0.576507568359375, 0.6401214599609375, 0.7037353515625, 0.7673492431640625, 0.830963134765625, 0.8945770263671875, 0.95819091796875, 1.0218048095703125, 1.085418701171875, 1.1490325927734375, 1.212646484375, 1.2762603759765625, 1.339874267578125, 1.4034881591796875, 1.46710205078125, 1.5307159423828125, 1.594329833984375, 1.6579437255859375, 1.7215576171875, 1.7851715087890625, 1.848785400390625, 1.9123992919921875, 1.97601318359375, 2.0396270751953125, 2.103240966796875, 2.1668548583984375, 2.23046875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 9.0, 12.0, 20.0, 22.0, 30.0, 31.0, 33.0, 47.0, 37.0, 50.0, 53.0, 59.0, 71.0, 69.0, 50.0, 50.0, 53.0, 42.0, 42.0, 38.0, 44.0, 39.0, 24.0, 16.0, 16.0, 10.0, 6.0, 4.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1201171875, -1.0883560180664062, -1.0565948486328125, -1.0248336791992188, -0.993072509765625, -0.9613113403320312, -0.9295501708984375, -0.8977890014648438, -0.86602783203125, -0.8342666625976562, -0.8025054931640625, -0.7707443237304688, -0.738983154296875, -0.7072219848632812, -0.6754608154296875, -0.6436996459960938, -0.6119384765625, -0.5801773071289062, -0.5484161376953125, -0.5166549682617188, -0.484893798828125, -0.45313262939453125, -0.4213714599609375, -0.38961029052734375, -0.35784912109375, -0.32608795166015625, -0.2943267822265625, -0.26256561279296875, -0.230804443359375, -0.19904327392578125, -0.1672821044921875, -0.13552093505859375, -0.103759765625, -0.07199859619140625, -0.0402374267578125, -0.00847625732421875, 0.023284912109375, 0.05504608154296875, 0.0868072509765625, 0.11856842041015625, 0.15032958984375, 0.18209075927734375, 0.2138519287109375, 0.24561309814453125, 0.277374267578125, 0.30913543701171875, 0.3408966064453125, 0.37265777587890625, 0.4044189453125, 0.43618011474609375, 0.4679412841796875, 0.49970245361328125, 0.531463623046875, 0.5632247924804688, 0.5949859619140625, 0.6267471313476562, 0.65850830078125, 0.6902694702148438, 0.7220306396484375, 0.7537918090820312, 0.785552978515625, 0.8173141479492188, 0.8490753173828125, 0.8808364868164062, 0.91259765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 8.0, 15.0, 9.0, 29.0, 39.0, 93.0, 160.0, 388.0, 1195.0, 4779.0, 55332.0, 932432.0, 47613.0, 4566.0, 1103.0, 406.0, 170.0, 85.0, 39.0, 23.0, 14.0, 11.0, 8.0, 6.0, 2.0, 5.0, 0.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.203125, -11.885986328125, -11.56884765625, -11.251708984375, -10.9345703125, -10.617431640625, -10.30029296875, -9.983154296875, -9.666015625, -9.348876953125, -9.03173828125, -8.714599609375, -8.3974609375, -8.080322265625, -7.76318359375, -7.446044921875, -7.12890625, -6.811767578125, -6.49462890625, -6.177490234375, -5.8603515625, -5.543212890625, -5.22607421875, -4.908935546875, -4.591796875, -4.274658203125, -3.95751953125, -3.640380859375, -3.3232421875, -3.006103515625, -2.68896484375, -2.371826171875, -2.0546875, -1.737548828125, -1.42041015625, -1.103271484375, -0.7861328125, -0.468994140625, -0.15185546875, 0.165283203125, 0.482421875, 0.799560546875, 1.11669921875, 1.433837890625, 1.7509765625, 2.068115234375, 2.38525390625, 2.702392578125, 3.01953125, 3.336669921875, 3.65380859375, 3.970947265625, 4.2880859375, 4.605224609375, 4.92236328125, 5.239501953125, 5.556640625, 5.873779296875, 6.19091796875, 6.508056640625, 6.8251953125, 7.142333984375, 7.45947265625, 7.776611328125, 8.09375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 12.0, 4.0, 7.0, 8.0, 20.0, 18.0, 20.0, 29.0, 34.0, 42.0, 54.0, 61.0, 62.0, 50.0, 61.0, 52.0, 63.0, 56.0, 58.0, 46.0, 49.0, 31.0, 25.0, 36.0, 25.0, 16.0, 17.0, 10.0, 4.0, 7.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-6.3984375, -6.22637939453125, -6.0543212890625, -5.88226318359375, -5.710205078125, -5.53814697265625, -5.3660888671875, -5.19403076171875, -5.02197265625, -4.84991455078125, -4.6778564453125, -4.50579833984375, -4.333740234375, -4.16168212890625, -3.9896240234375, -3.81756591796875, -3.6455078125, -3.47344970703125, -3.3013916015625, -3.12933349609375, -2.957275390625, -2.78521728515625, -2.6131591796875, -2.44110107421875, -2.26904296875, -2.09698486328125, -1.9249267578125, -1.75286865234375, -1.580810546875, -1.40875244140625, -1.2366943359375, -1.06463623046875, -0.892578125, -0.72052001953125, -0.5484619140625, -0.37640380859375, -0.204345703125, -0.03228759765625, 0.1397705078125, 0.31182861328125, 0.48388671875, 0.65594482421875, 0.8280029296875, 1.00006103515625, 1.172119140625, 1.34417724609375, 1.5162353515625, 1.68829345703125, 1.8603515625, 2.03240966796875, 2.2044677734375, 2.37652587890625, 2.548583984375, 2.72064208984375, 2.8927001953125, 3.06475830078125, 3.23681640625, 3.40887451171875, 3.5809326171875, 3.75299072265625, 3.925048828125, 4.09710693359375, 4.2691650390625, 4.44122314453125, 4.61328125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 5.0, 11.0, 15.0, 14.0, 14.0, 27.0, 48.0, 72.0, 121.0, 170.0, 282.0, 564.0, 1390.0, 4746.0, 33327.0, 888088.0, 107527.0, 8351.0, 2092.0, 765.0, 337.0, 227.0, 113.0, 75.0, 46.0, 28.0, 32.0, 11.0, 13.0, 8.0, 7.0, 7.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.8828125, -3.77398681640625, -3.6651611328125, -3.55633544921875, -3.447509765625, -3.33868408203125, -3.2298583984375, -3.12103271484375, -3.01220703125, -2.90338134765625, -2.7945556640625, -2.68572998046875, -2.576904296875, -2.46807861328125, -2.3592529296875, -2.25042724609375, -2.1416015625, -2.03277587890625, -1.9239501953125, -1.81512451171875, -1.706298828125, -1.59747314453125, -1.4886474609375, -1.37982177734375, -1.27099609375, -1.16217041015625, -1.0533447265625, -0.94451904296875, -0.835693359375, -0.72686767578125, -0.6180419921875, -0.50921630859375, -0.400390625, -0.29156494140625, -0.1827392578125, -0.07391357421875, 0.034912109375, 0.14373779296875, 0.2525634765625, 0.36138916015625, 0.47021484375, 0.57904052734375, 0.6878662109375, 0.79669189453125, 0.905517578125, 1.01434326171875, 1.1231689453125, 1.23199462890625, 1.3408203125, 1.44964599609375, 1.5584716796875, 1.66729736328125, 1.776123046875, 1.88494873046875, 1.9937744140625, 2.10260009765625, 2.21142578125, 2.32025146484375, 2.4290771484375, 2.53790283203125, 2.646728515625, 2.75555419921875, 2.8643798828125, 2.97320556640625, 3.08203125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 9.0, 5.0, 17.0, 30.0, 80.0, 169.0, 313.0, 218.0, 90.0, 40.0, 15.0, 8.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000644683837890625, -0.0006243214011192322, -0.0006039589643478394, -0.0005835965275764465, -0.0005632340908050537, -0.0005428716540336609, -0.0005225092172622681, -0.0005021467804908752, -0.0004817843437194824, -0.0004614219069480896, -0.0004410594701766968, -0.00042069703340530396, -0.00040033459663391113, -0.0003799721598625183, -0.0003596097230911255, -0.00033924728631973267, -0.00031888484954833984, -0.000298522412776947, -0.0002781599760055542, -0.0002577975392341614, -0.00023743510246276855, -0.00021707266569137573, -0.0001967102289199829, -0.0001763477921485901, -0.00015598535537719727, -0.00013562291860580444, -0.00011526048183441162, -9.48980450630188e-05, -7.453560829162598e-05, -5.4173171520233154e-05, -3.381073474884033e-05, -1.344829797744751e-05, 6.9141387939453125e-06, 2.7276575565338135e-05, 4.763901233673096e-05, 6.800144910812378e-05, 8.83638858795166e-05, 0.00010872632265090942, 0.00012908875942230225, 0.00014945119619369507, 0.0001698136329650879, 0.0001901760697364807, 0.00021053850650787354, 0.00023090094327926636, 0.0002512633800506592, 0.000271625816822052, 0.0002919882535934448, 0.00031235069036483765, 0.00033271312713623047, 0.0003530755639076233, 0.0003734380006790161, 0.00039380043745040894, 0.00041416287422180176, 0.0004345253109931946, 0.0004548877477645874, 0.0004752501845359802, 0.000495612621307373, 0.0005159750580787659, 0.0005363374948501587, 0.0005566999316215515, 0.0005770623683929443, 0.0005974248051643372, 0.00061778724193573, 0.0006381496787071228, 0.0006585121154785156]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 3.0, 3.0, 6.0, 13.0, 13.0, 21.0, 26.0, 35.0, 54.0, 138.0, 256.0, 695.0, 2848.0, 45819.0, 964436.0, 30677.0, 2348.0, 638.0, 255.0, 115.0, 68.0, 30.0, 17.0, 8.0, 15.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.09375, -4.964630126953125, -4.83551025390625, -4.706390380859375, -4.5772705078125, -4.448150634765625, -4.31903076171875, -4.189910888671875, -4.060791015625, -3.931671142578125, -3.80255126953125, -3.673431396484375, -3.5443115234375, -3.415191650390625, -3.28607177734375, -3.156951904296875, -3.02783203125, -2.898712158203125, -2.76959228515625, -2.640472412109375, -2.5113525390625, -2.382232666015625, -2.25311279296875, -2.123992919921875, -1.994873046875, -1.865753173828125, -1.73663330078125, -1.607513427734375, -1.4783935546875, -1.349273681640625, -1.22015380859375, -1.091033935546875, -0.9619140625, -0.832794189453125, -0.70367431640625, -0.574554443359375, -0.4454345703125, -0.316314697265625, -0.18719482421875, -0.058074951171875, 0.071044921875, 0.200164794921875, 0.32928466796875, 0.458404541015625, 0.5875244140625, 0.716644287109375, 0.84576416015625, 0.974884033203125, 1.10400390625, 1.233123779296875, 1.36224365234375, 1.491363525390625, 1.6204833984375, 1.749603271484375, 1.87872314453125, 2.007843017578125, 2.136962890625, 2.266082763671875, 2.39520263671875, 2.524322509765625, 2.6534423828125, 2.782562255859375, 2.91168212890625, 3.040802001953125, 3.169921875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 9.0, 17.0, 21.0, 51.0, 154.0, 275.0, 250.0, 127.0, 56.0, 21.0, 9.0, 7.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2734375, -7.10772705078125, -6.9420166015625, -6.77630615234375, -6.610595703125, -6.44488525390625, -6.2791748046875, -6.11346435546875, -5.94775390625, -5.78204345703125, -5.6163330078125, -5.45062255859375, -5.284912109375, -5.11920166015625, -4.9534912109375, -4.78778076171875, -4.6220703125, -4.45635986328125, -4.2906494140625, -4.12493896484375, -3.959228515625, -3.79351806640625, -3.6278076171875, -3.46209716796875, -3.29638671875, -3.13067626953125, -2.9649658203125, -2.79925537109375, -2.633544921875, -2.46783447265625, -2.3021240234375, -2.13641357421875, -1.970703125, -1.80499267578125, -1.6392822265625, -1.47357177734375, -1.307861328125, -1.14215087890625, -0.9764404296875, -0.81072998046875, -0.64501953125, -0.47930908203125, -0.3135986328125, -0.14788818359375, 0.017822265625, 0.18353271484375, 0.3492431640625, 0.51495361328125, 0.6806640625, 0.84637451171875, 1.0120849609375, 1.17779541015625, 1.343505859375, 1.50921630859375, 1.6749267578125, 1.84063720703125, 2.00634765625, 2.17205810546875, 2.3377685546875, 2.50347900390625, 2.669189453125, 2.83489990234375, 3.0006103515625, 3.16632080078125, 3.33203125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 8.0, 9.0, 13.0, 32.0, 45.0, 77.0, 122.0, 206.0, 202.0, 148.0, 67.0, 32.0, 20.0, 13.0, 11.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.12327194213867, -32.422733306884766, -30.72219467163086, -29.021656036376953, -27.321117401123047, -25.62057876586914, -23.920040130615234, -22.219501495361328, -20.518962860107422, -18.818424224853516, -17.11788558959961, -15.417346954345703, -13.716808319091797, -12.01626968383789, -10.315731048583984, -8.615192413330078, -6.914653778076172, -5.214115142822266, -3.5135765075683594, -1.8130378723144531, -0.11249923706054688, 1.5880393981933594, 3.2885780334472656, 4.989116668701172, 6.689655303955078, 8.390193939208984, 10.09073257446289, 11.791271209716797, 13.491809844970703, 15.19234848022461, 16.892887115478516, 18.593425750732422, 20.293968200683594, 21.9945068359375, 23.695045471191406, 25.395584106445312, 27.09612274169922, 28.796661376953125, 30.49720001220703, 32.19773864746094, 33.898277282714844, 35.59881591796875, 37.299354553222656, 38.99989318847656, 40.70043182373047, 42.400970458984375, 44.10150909423828, 45.80204772949219, 47.502586364746094, 49.203125, 50.903663635253906, 52.60420227050781, 54.30474090576172, 56.005279541015625, 57.70581817626953, 59.40635681152344, 61.106895446777344, 62.80743408203125, 64.50797271728516, 66.20851135253906, 67.90904998779297, 69.60958862304688, 71.31012725830078, 73.01066589355469, 74.7112045288086]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 6.0, 6.0, 9.0, 9.0, 7.0, 17.0, 15.0, 20.0, 34.0, 31.0, 25.0, 36.0, 44.0, 39.0, 51.0, 59.0, 49.0, 60.0, 62.0, 53.0, 49.0, 50.0, 39.0, 40.0, 36.0, 29.0, 23.0, 19.0, 25.0, 14.0, 12.0, 4.0, 10.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.43669891357422, -18.67520523071289, -17.913711547851562, -17.152217864990234, -16.390724182128906, -15.629229545593262, -14.867734909057617, -14.106241226196289, -13.344747543334961, -12.583253860473633, -11.821760177612305, -11.06026554107666, -10.298771858215332, -9.537278175354004, -8.77578353881836, -8.014289855957031, -7.252796173095703, -6.491302490234375, -5.729808330535889, -4.968314170837402, -4.206820487976074, -3.445326566696167, -2.6838326454162598, -1.9223384857177734, -1.1608448028564453, -0.3993508815765381, 0.36214303970336914, 1.1236369609832764, 1.8851308822631836, 2.646624803543091, 3.408118724822998, 4.169612884521484, 4.93110466003418, 5.692598342895508, 6.454092502593994, 7.2155866622924805, 7.977080345153809, 8.738574028015137, 9.500068664550781, 10.26156234741211, 11.023056030273438, 11.784549713134766, 12.546043395996094, 13.307538032531738, 14.069031715393066, 14.830525398254395, 15.592020034790039, 16.353513717651367, 17.115007400512695, 17.876501083374023, 18.63799476623535, 19.39948844909668, 20.16098403930664, 20.92247772216797, 21.683971405029297, 22.445465087890625, 23.206958770751953, 23.96845245361328, 24.72994613647461, 25.491439819335938, 26.252933502197266, 27.014429092407227, 27.775922775268555, 28.537416458129883, 29.29891014099121]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 8.0, 8.0, 8.0, 10.0, 9.0, 23.0, 29.0, 34.0, 54.0, 83.0, 135.0, 212.0, 461.0, 1006.0, 3365.0, 4122775.0, 61269.0, 2808.0, 972.0, 424.0, 207.0, 133.0, 72.0, 47.0, 26.0, 24.0, 15.0, 15.0, 10.0, 8.0, 7.0, 5.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.421875, -14.0206298828125, -13.619384765625, -13.2181396484375, -12.81689453125, -12.4156494140625, -12.014404296875, -11.6131591796875, -11.2119140625, -10.8106689453125, -10.409423828125, -10.0081787109375, -9.60693359375, -9.2056884765625, -8.804443359375, -8.4031982421875, -8.001953125, -7.6007080078125, -7.199462890625, -6.7982177734375, -6.39697265625, -5.9957275390625, -5.594482421875, -5.1932373046875, -4.7919921875, -4.3907470703125, -3.989501953125, -3.5882568359375, -3.18701171875, -2.7857666015625, -2.384521484375, -1.9832763671875, -1.58203125, -1.1807861328125, -0.779541015625, -0.3782958984375, 0.02294921875, 0.4241943359375, 0.825439453125, 1.2266845703125, 1.6279296875, 2.0291748046875, 2.430419921875, 2.8316650390625, 3.23291015625, 3.6341552734375, 4.035400390625, 4.4366455078125, 4.837890625, 5.2391357421875, 5.640380859375, 6.0416259765625, 6.44287109375, 6.8441162109375, 7.245361328125, 7.6466064453125, 8.0478515625, 8.4490966796875, 8.850341796875, 9.2515869140625, 9.65283203125, 10.0540771484375, 10.455322265625, 10.8565673828125, 11.2578125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 4.0, 11.0, 19.0, 17.0, 27.0, 31.0, 51.0, 64.0, 68.0, 84.0, 96.0, 96.0, 87.0, 79.0, 73.0, 56.0, 39.0, 32.0, 16.0, 15.0, 10.0, 9.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7197265625, -1.6608428955078125, -1.601959228515625, -1.5430755615234375, -1.48419189453125, -1.4253082275390625, -1.366424560546875, -1.3075408935546875, -1.2486572265625, -1.1897735595703125, -1.130889892578125, -1.0720062255859375, -1.01312255859375, -0.9542388916015625, -0.895355224609375, -0.8364715576171875, -0.777587890625, -0.7187042236328125, -0.659820556640625, -0.6009368896484375, -0.54205322265625, -0.4831695556640625, -0.424285888671875, -0.3654022216796875, -0.3065185546875, -0.2476348876953125, -0.188751220703125, -0.1298675537109375, -0.07098388671875, -0.0121002197265625, 0.046783447265625, 0.1056671142578125, 0.16455078125, 0.2234344482421875, 0.282318115234375, 0.3412017822265625, 0.40008544921875, 0.4589691162109375, 0.517852783203125, 0.5767364501953125, 0.6356201171875, 0.6945037841796875, 0.753387451171875, 0.8122711181640625, 0.87115478515625, 0.9300384521484375, 0.988922119140625, 1.0478057861328125, 1.106689453125, 1.1655731201171875, 1.224456787109375, 1.2833404541015625, 1.34222412109375, 1.4011077880859375, 1.459991455078125, 1.5188751220703125, 1.5777587890625, 1.6366424560546875, 1.695526123046875, 1.7544097900390625, 1.81329345703125, 1.8721771240234375, 1.931060791015625, 1.9899444580078125, 2.048828125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 4.0, 9.0, 12.0, 11.0, 14.0, 17.0, 19.0, 21.0, 47.0, 33.0, 54.0, 74.0, 127.0, 239.0, 604.0, 2885.0, 63305.0, 4120776.0, 4419.0, 840.0, 249.0, 137.0, 94.0, 59.0, 55.0, 30.0, 21.0, 20.0, 16.0, 21.0, 8.0, 14.0, 8.0, 7.0, 11.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.5625, -19.005126953125, -18.44775390625, -17.890380859375, -17.3330078125, -16.775634765625, -16.21826171875, -15.660888671875, -15.103515625, -14.546142578125, -13.98876953125, -13.431396484375, -12.8740234375, -12.316650390625, -11.75927734375, -11.201904296875, -10.64453125, -10.087158203125, -9.52978515625, -8.972412109375, -8.4150390625, -7.857666015625, -7.30029296875, -6.742919921875, -6.185546875, -5.628173828125, -5.07080078125, -4.513427734375, -3.9560546875, -3.398681640625, -2.84130859375, -2.283935546875, -1.7265625, -1.169189453125, -0.61181640625, -0.054443359375, 0.5029296875, 1.060302734375, 1.61767578125, 2.175048828125, 2.732421875, 3.289794921875, 3.84716796875, 4.404541015625, 4.9619140625, 5.519287109375, 6.07666015625, 6.634033203125, 7.19140625, 7.748779296875, 8.30615234375, 8.863525390625, 9.4208984375, 9.978271484375, 10.53564453125, 11.093017578125, 11.650390625, 12.207763671875, 12.76513671875, 13.322509765625, 13.8798828125, 14.437255859375, 14.99462890625, 15.552001953125, 16.109375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 10.0, 11.0, 28.0, 3769.0, 209.0, 27.0, 10.0, 4.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9990234375, -0.8983306884765625, -0.797637939453125, -0.6969451904296875, -0.59625244140625, -0.4955596923828125, -0.394866943359375, -0.2941741943359375, -0.1934814453125, -0.0927886962890625, 0.007904052734375, 0.1085968017578125, 0.20928955078125, 0.3099822998046875, 0.410675048828125, 0.5113677978515625, 0.612060546875, 0.7127532958984375, 0.813446044921875, 0.9141387939453125, 1.01483154296875, 1.1155242919921875, 1.216217041015625, 1.3169097900390625, 1.4176025390625, 1.5182952880859375, 1.618988037109375, 1.7196807861328125, 1.82037353515625, 1.9210662841796875, 2.021759033203125, 2.1224517822265625, 2.22314453125, 2.3238372802734375, 2.424530029296875, 2.5252227783203125, 2.62591552734375, 2.7266082763671875, 2.827301025390625, 2.9279937744140625, 3.0286865234375, 3.1293792724609375, 3.230072021484375, 3.3307647705078125, 3.43145751953125, 3.5321502685546875, 3.632843017578125, 3.7335357666015625, 3.834228515625, 3.9349212646484375, 4.035614013671875, 4.1363067626953125, 4.23699951171875, 4.3376922607421875, 4.438385009765625, 4.5390777587890625, 4.6397705078125, 4.7404632568359375, 4.841156005859375, 4.9418487548828125, 5.04254150390625, 5.1432342529296875, 5.243927001953125, 5.3446197509765625, 5.4453125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 6.0, 9.0, 11.0, 14.0, 33.0, 68.0, 95.0, 134.0, 141.0, 146.0, 132.0, 64.0, 47.0, 21.0, 24.0, 14.0, 17.0, 9.0, 4.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.269191741943359, -4.069043159484863, -3.868894100189209, -3.668745517730713, -3.4685964584350586, -3.2684478759765625, -3.0682990550994873, -2.868150234222412, -2.668001413345337, -2.4678525924682617, -2.2677037715911865, -2.0675549507141113, -1.8674062490463257, -1.6672574281692505, -1.4671087265014648, -1.2669599056243896, -1.0668110847473145, -0.8666622638702393, -0.6665135025978088, -0.4663647413253784, -0.2662159204483032, -0.06606709957122803, 0.13408160209655762, 0.3342304229736328, 0.534379243850708, 0.7345280647277832, 0.9346768260002136, 1.134825587272644, 1.3349744081497192, 1.5351232290267944, 1.73527193069458, 1.9354207515716553, 2.1355695724487305, 2.3357183933258057, 2.535867214202881, 2.736015796661377, 2.9361648559570312, 3.1363134384155273, 3.3364622592926025, 3.5366110801696777, 3.736759901046753, 3.936908721923828, 4.137057304382324, 4.3372063636779785, 4.537354946136475, 4.737504005432129, 4.937652587890625, 5.137801170349121, 5.337950229644775, 5.5380988121032715, 5.738247871398926, 5.938396453857422, 6.138545513153076, 6.338694095611572, 6.538843154907227, 6.738991737365723, 6.939140319824219, 7.139288902282715, 7.339437961578369, 7.539586544036865, 7.7397356033325195, 7.939884185791016, 8.140032768249512, 8.340181350708008, 8.54033088684082]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 11.0, 3.0, 5.0, 7.0, 22.0, 14.0, 16.0, 25.0, 29.0, 28.0, 30.0, 28.0, 38.0, 29.0, 38.0, 45.0, 35.0, 42.0, 42.0, 51.0, 53.0, 46.0, 43.0, 43.0, 35.0, 43.0, 25.0, 37.0, 23.0, 16.0, 12.0, 15.0, 14.0, 6.0, 14.0, 5.0, 10.0, 5.0, 3.0, 1.0, 5.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.0690839290618896, -2.960240364074707, -2.8513965606689453, -2.7425529956817627, -2.63370943069458, -2.5248656272888184, -2.4160220623016357, -2.307178497314453, -2.1983346939086914, -2.089491128921509, -1.9806474447250366, -1.8718037605285645, -1.7629601955413818, -1.6541165113449097, -1.5452728271484375, -1.4364292621612549, -1.3275856971740723, -1.2187420129776, -1.1098984479904175, -1.0010547637939453, -0.8922111392021179, -0.7833675146102905, -0.6745238304138184, -0.565680205821991, -0.4568365812301636, -0.3479929566383362, -0.2391493022441864, -0.13030564785003662, -0.02146202325820923, 0.08738160133361816, 0.19622528553009033, 0.3050689101219177, 0.4139125347137451, 0.5227561593055725, 0.6315997838973999, 0.7404434680938721, 0.8492870926856995, 0.9581307172775269, 1.066974401473999, 1.1758179664611816, 1.2846616506576538, 1.393505334854126, 1.5023488998413086, 1.6111925840377808, 1.720036268234253, 1.8288798332214355, 1.9377235174179077, 2.04656720161438, 2.1554107666015625, 2.264254331588745, 2.373098134994507, 2.4819416999816895, 2.590785264968872, 2.6996288299560547, 2.8084726333618164, 2.917316198348999, 3.0261597633361816, 3.1350033283233643, 3.243847131729126, 3.3526906967163086, 3.461534261703491, 3.570377826690674, 3.6792216300964355, 3.788065195083618, 3.89690899848938]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 4.0, 15.0, 14.0, 14.0, 35.0, 53.0, 75.0, 122.0, 181.0, 312.0, 515.0, 897.0, 1842.0, 4016.0, 10785.0, 48367.0, 516018.0, 407407.0, 40846.0, 9604.0, 3623.0, 1691.0, 897.0, 452.0, 271.0, 179.0, 114.0, 58.0, 45.0, 27.0, 18.0, 13.0, 11.0, 9.0, 9.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.21484375, -6.02032470703125, -5.8258056640625, -5.63128662109375, -5.436767578125, -5.24224853515625, -5.0477294921875, -4.85321044921875, -4.65869140625, -4.46417236328125, -4.2696533203125, -4.07513427734375, -3.880615234375, -3.68609619140625, -3.4915771484375, -3.29705810546875, -3.1025390625, -2.90802001953125, -2.7135009765625, -2.51898193359375, -2.324462890625, -2.12994384765625, -1.9354248046875, -1.74090576171875, -1.54638671875, -1.35186767578125, -1.1573486328125, -0.96282958984375, -0.768310546875, -0.57379150390625, -0.3792724609375, -0.18475341796875, 0.009765625, 0.20428466796875, 0.3988037109375, 0.59332275390625, 0.787841796875, 0.98236083984375, 1.1768798828125, 1.37139892578125, 1.56591796875, 1.76043701171875, 1.9549560546875, 2.14947509765625, 2.343994140625, 2.53851318359375, 2.7330322265625, 2.92755126953125, 3.1220703125, 3.31658935546875, 3.5111083984375, 3.70562744140625, 3.900146484375, 4.09466552734375, 4.2891845703125, 4.48370361328125, 4.67822265625, 4.87274169921875, 5.0672607421875, 5.26177978515625, 5.456298828125, 5.65081787109375, 5.8453369140625, 6.03985595703125, 6.234375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 14.0, 13.0, 15.0, 25.0, 29.0, 28.0, 35.0, 49.0, 60.0, 64.0, 64.0, 55.0, 86.0, 69.0, 86.0, 58.0, 49.0, 49.0, 28.0, 31.0, 17.0, 20.0, 17.0, 11.0, 9.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.552734375, -1.4959716796875, -1.439208984375, -1.3824462890625, -1.32568359375, -1.2689208984375, -1.212158203125, -1.1553955078125, -1.0986328125, -1.0418701171875, -0.985107421875, -0.9283447265625, -0.87158203125, -0.8148193359375, -0.758056640625, -0.7012939453125, -0.64453125, -0.5877685546875, -0.531005859375, -0.4742431640625, -0.41748046875, -0.3607177734375, -0.303955078125, -0.2471923828125, -0.1904296875, -0.1336669921875, -0.076904296875, -0.0201416015625, 0.03662109375, 0.0933837890625, 0.150146484375, 0.2069091796875, 0.263671875, 0.3204345703125, 0.377197265625, 0.4339599609375, 0.49072265625, 0.5474853515625, 0.604248046875, 0.6610107421875, 0.7177734375, 0.7745361328125, 0.831298828125, 0.8880615234375, 0.94482421875, 1.0015869140625, 1.058349609375, 1.1151123046875, 1.171875, 1.2286376953125, 1.285400390625, 1.3421630859375, 1.39892578125, 1.4556884765625, 1.512451171875, 1.5692138671875, 1.6259765625, 1.6827392578125, 1.739501953125, 1.7962646484375, 1.85302734375, 1.9097900390625, 1.966552734375, 2.0233154296875, 2.080078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 9.0, 15.0, 20.0, 26.0, 46.0, 87.0, 183.0, 465.0, 1391.0, 6498.0, 132997.0, 884803.0, 18287.0, 2494.0, 692.0, 247.0, 112.0, 62.0, 35.0, 29.0, 8.0, 12.0, 9.0, 8.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-18.609375, -18.157958984375, -17.70654296875, -17.255126953125, -16.8037109375, -16.352294921875, -15.90087890625, -15.449462890625, -14.998046875, -14.546630859375, -14.09521484375, -13.643798828125, -13.1923828125, -12.740966796875, -12.28955078125, -11.838134765625, -11.38671875, -10.935302734375, -10.48388671875, -10.032470703125, -9.5810546875, -9.129638671875, -8.67822265625, -8.226806640625, -7.775390625, -7.323974609375, -6.87255859375, -6.421142578125, -5.9697265625, -5.518310546875, -5.06689453125, -4.615478515625, -4.1640625, -3.712646484375, -3.26123046875, -2.809814453125, -2.3583984375, -1.906982421875, -1.45556640625, -1.004150390625, -0.552734375, -0.101318359375, 0.35009765625, 0.801513671875, 1.2529296875, 1.704345703125, 2.15576171875, 2.607177734375, 3.05859375, 3.510009765625, 3.96142578125, 4.412841796875, 4.8642578125, 5.315673828125, 5.76708984375, 6.218505859375, 6.669921875, 7.121337890625, 7.57275390625, 8.024169921875, 8.4755859375, 8.927001953125, 9.37841796875, 9.829833984375, 10.28125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 6.0, 3.0, 8.0, 9.0, 7.0, 11.0, 10.0, 19.0, 17.0, 25.0, 42.0, 31.0, 33.0, 41.0, 51.0, 43.0, 63.0, 74.0, 60.0, 51.0, 60.0, 51.0, 54.0, 35.0, 42.0, 31.0, 30.0, 25.0, 15.0, 9.0, 11.0, 13.0, 11.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.9921875, -8.72265625, -8.453125, -8.18359375, -7.9140625, -7.64453125, -7.375, -7.10546875, -6.8359375, -6.56640625, -6.296875, -6.02734375, -5.7578125, -5.48828125, -5.21875, -4.94921875, -4.6796875, -4.41015625, -4.140625, -3.87109375, -3.6015625, -3.33203125, -3.0625, -2.79296875, -2.5234375, -2.25390625, -1.984375, -1.71484375, -1.4453125, -1.17578125, -0.90625, -0.63671875, -0.3671875, -0.09765625, 0.171875, 0.44140625, 0.7109375, 0.98046875, 1.25, 1.51953125, 1.7890625, 2.05859375, 2.328125, 2.59765625, 2.8671875, 3.13671875, 3.40625, 3.67578125, 3.9453125, 4.21484375, 4.484375, 4.75390625, 5.0234375, 5.29296875, 5.5625, 5.83203125, 6.1015625, 6.37109375, 6.640625, 6.91015625, 7.1796875, 7.44921875, 7.71875, 7.98828125, 8.2578125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 10.0, 24.0, 31.0, 54.0, 149.0, 317.0, 1286.0, 27270.0, 1006998.0, 10998.0, 895.0, 260.0, 128.0, 55.0, 25.0, 18.0, 8.0, 9.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.4765625, -8.188232421875, -7.89990234375, -7.611572265625, -7.3232421875, -7.034912109375, -6.74658203125, -6.458251953125, -6.169921875, -5.881591796875, -5.59326171875, -5.304931640625, -5.0166015625, -4.728271484375, -4.43994140625, -4.151611328125, -3.86328125, -3.574951171875, -3.28662109375, -2.998291015625, -2.7099609375, -2.421630859375, -2.13330078125, -1.844970703125, -1.556640625, -1.268310546875, -0.97998046875, -0.691650390625, -0.4033203125, -0.114990234375, 0.17333984375, 0.461669921875, 0.75, 1.038330078125, 1.32666015625, 1.614990234375, 1.9033203125, 2.191650390625, 2.47998046875, 2.768310546875, 3.056640625, 3.344970703125, 3.63330078125, 3.921630859375, 4.2099609375, 4.498291015625, 4.78662109375, 5.074951171875, 5.36328125, 5.651611328125, 5.93994140625, 6.228271484375, 6.5166015625, 6.804931640625, 7.09326171875, 7.381591796875, 7.669921875, 7.958251953125, 8.24658203125, 8.534912109375, 8.8232421875, 9.111572265625, 9.39990234375, 9.688232421875, 9.9765625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 3.0, 7.0, 11.0, 13.0, 18.0, 17.0, 54.0, 59.0, 81.0, 116.0, 148.0, 135.0, 87.0, 81.0, 54.0, 34.0, 28.0, 17.0, 14.0, 2.0, 5.0, 6.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0005021095275878906, -0.0004867725074291229, -0.0004714354872703552, -0.0004560984671115875, -0.0004407614469528198, -0.0004254244267940521, -0.0004100874066352844, -0.0003947503864765167, -0.000379413366317749, -0.0003640763461589813, -0.0003487393260002136, -0.0003334023058414459, -0.0003180652856826782, -0.0003027282655239105, -0.0002873912453651428, -0.0002720542252063751, -0.0002567172050476074, -0.00024138018488883972, -0.00022604316473007202, -0.00021070614457130432, -0.00019536912441253662, -0.00018003210425376892, -0.00016469508409500122, -0.00014935806393623352, -0.00013402104377746582, -0.00011868402361869812, -0.00010334700345993042, -8.800998330116272e-05, -7.267296314239502e-05, -5.733594298362732e-05, -4.199892282485962e-05, -2.666190266609192e-05, -1.1324882507324219e-05, 4.0121376514434814e-06, 1.934915781021118e-05, 3.468617796897888e-05, 5.002319812774658e-05, 6.536021828651428e-05, 8.069723844528198e-05, 9.603425860404968e-05, 0.00011137127876281738, 0.00012670829892158508, 0.00014204531908035278, 0.00015738233923912048, 0.00017271935939788818, 0.00018805637955665588, 0.00020339339971542358, 0.00021873041987419128, 0.00023406744003295898, 0.0002494044601917267, 0.0002647414803504944, 0.0002800785005092621, 0.0002954155206680298, 0.0003107525408267975, 0.0003260895609855652, 0.0003414265811443329, 0.0003567636013031006, 0.0003721006214618683, 0.000387437641620636, 0.0004027746617794037, 0.0004181116819381714, 0.0004334487020969391, 0.0004487857222557068, 0.0004641227424144745, 0.0004794597625732422]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 4.0, 13.0, 15.0, 23.0, 32.0, 66.0, 147.0, 393.0, 1282.0, 6430.0, 97758.0, 902864.0, 34417.0, 3655.0, 877.0, 303.0, 118.0, 46.0, 31.0, 26.0, 14.0, 5.0, 7.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.015625, -3.86322021484375, -3.7108154296875, -3.55841064453125, -3.406005859375, -3.25360107421875, -3.1011962890625, -2.94879150390625, -2.79638671875, -2.64398193359375, -2.4915771484375, -2.33917236328125, -2.186767578125, -2.03436279296875, -1.8819580078125, -1.72955322265625, -1.5771484375, -1.42474365234375, -1.2723388671875, -1.11993408203125, -0.967529296875, -0.81512451171875, -0.6627197265625, -0.51031494140625, -0.35791015625, -0.20550537109375, -0.0531005859375, 0.09930419921875, 0.251708984375, 0.40411376953125, 0.5565185546875, 0.70892333984375, 0.861328125, 1.01373291015625, 1.1661376953125, 1.31854248046875, 1.470947265625, 1.62335205078125, 1.7757568359375, 1.92816162109375, 2.08056640625, 2.23297119140625, 2.3853759765625, 2.53778076171875, 2.690185546875, 2.84259033203125, 2.9949951171875, 3.14739990234375, 3.2998046875, 3.45220947265625, 3.6046142578125, 3.75701904296875, 3.909423828125, 4.06182861328125, 4.2142333984375, 4.36663818359375, 4.51904296875, 4.67144775390625, 4.8238525390625, 4.97625732421875, 5.128662109375, 5.28106689453125, 5.4334716796875, 5.58587646484375, 5.73828125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 4.0, 8.0, 11.0, 10.0, 22.0, 29.0, 36.0, 77.0, 108.0, 141.0, 159.0, 116.0, 89.0, 66.0, 35.0, 26.0, 18.0, 8.0, 7.0, 10.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.62890625, -3.519927978515625, -3.41094970703125, -3.301971435546875, -3.1929931640625, -3.084014892578125, -2.97503662109375, -2.866058349609375, -2.757080078125, -2.648101806640625, -2.53912353515625, -2.430145263671875, -2.3211669921875, -2.212188720703125, -2.10321044921875, -1.994232177734375, -1.88525390625, -1.776275634765625, -1.66729736328125, -1.558319091796875, -1.4493408203125, -1.340362548828125, -1.23138427734375, -1.122406005859375, -1.013427734375, -0.904449462890625, -0.79547119140625, -0.686492919921875, -0.5775146484375, -0.468536376953125, -0.35955810546875, -0.250579833984375, -0.1416015625, -0.032623291015625, 0.07635498046875, 0.185333251953125, 0.2943115234375, 0.403289794921875, 0.51226806640625, 0.621246337890625, 0.730224609375, 0.839202880859375, 0.94818115234375, 1.057159423828125, 1.1661376953125, 1.275115966796875, 1.38409423828125, 1.493072509765625, 1.60205078125, 1.711029052734375, 1.82000732421875, 1.928985595703125, 2.0379638671875, 2.146942138671875, 2.25592041015625, 2.364898681640625, 2.473876953125, 2.582855224609375, 2.69183349609375, 2.800811767578125, 2.9097900390625, 3.018768310546875, 3.12774658203125, 3.236724853515625, 3.345703125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 16.0, 23.0, 68.0, 162.0, 313.0, 257.0, 103.0, 40.0, 16.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-147.29241943359375, -144.28326416015625, -141.2740936279297, -138.2649383544922, -135.2557830810547, -132.2466278076172, -129.23745727539062, -126.22830200195312, -123.21914672851562, -120.2099838256836, -117.2008285522461, -114.19166564941406, -111.18251037597656, -108.17334747314453, -105.16419219970703, -102.155029296875, -99.1458740234375, -96.13671112060547, -93.12755584716797, -90.11839294433594, -87.10923767089844, -84.1000747680664, -81.0909194946289, -78.08175659179688, -75.07259368896484, -72.06343078613281, -69.05427551269531, -66.04511260986328, -63.03595733642578, -60.026798248291016, -57.01763916015625, -54.00847625732422, -50.999324798583984, -47.99016571044922, -44.98100662231445, -41.97184753417969, -38.96268844604492, -35.953529357910156, -32.944366455078125, -29.935209274291992, -26.926050186157227, -23.91689109802246, -20.907732009887695, -17.898571014404297, -14.889412879943848, -11.880253791809082, -8.87109375, -5.861934661865234, -2.8527755737304688, 0.15638375282287598, 3.1655430793762207, 6.1747026443481445, 9.18386173248291, 12.193020820617676, 15.202180862426758, 18.211339950561523, 21.22049903869629, 24.229658126831055, 27.23881721496582, 30.24797821044922, 33.257137298583984, 36.26629638671875, 39.275455474853516, 42.28461456298828, 45.29377365112305]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 2.0, 5.0, 8.0, 9.0, 15.0, 19.0, 22.0, 31.0, 22.0, 40.0, 32.0, 55.0, 51.0, 57.0, 72.0, 75.0, 54.0, 72.0, 52.0, 47.0, 39.0, 43.0, 43.0, 25.0, 27.0, 16.0, 13.0, 9.0, 10.0, 6.0, 10.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.90699768066406, -42.6846923828125, -41.46238708496094, -40.240081787109375, -39.01777648925781, -37.795467376708984, -36.57316207885742, -35.35085678100586, -34.1285514831543, -32.906246185302734, -31.683940887451172, -30.461633682250977, -29.239328384399414, -28.01702308654785, -26.794715881347656, -25.572410583496094, -24.35010528564453, -23.12779998779297, -21.905494689941406, -20.68318748474121, -19.46088218688965, -18.238576889038086, -17.01626968383789, -15.793964385986328, -14.571659088134766, -13.349353790283203, -12.127047538757324, -10.904741287231445, -9.682435989379883, -8.46013069152832, -7.237824440002441, -6.0155181884765625, -4.793212890625, -3.5709071159362793, -2.3486013412475586, -1.126295566558838, 0.09601020812988281, 1.3183159828186035, 2.540621757507324, 3.762928009033203, 4.985233306884766, 6.207539081573486, 7.429844856262207, 8.652151107788086, 9.874456405639648, 11.096761703491211, 12.31906795501709, 13.541374206542969, 14.763679504394531, 15.985984802246094, 17.208290100097656, 18.43059730529785, 19.652902603149414, 20.875207901000977, 22.097515106201172, 23.319820404052734, 24.542125701904297, 25.76443099975586, 26.986736297607422, 28.209043502807617, 29.43134880065918, 30.653654098510742, 31.875961303710938, 33.0982666015625, 34.32057189941406]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 5.0, 3.0, 14.0, 13.0, 17.0, 17.0, 33.0, 51.0, 91.0, 128.0, 248.0, 533.0, 1367.0, 5789.0, 4137034.0, 43820.0, 3227.0, 959.0, 407.0, 200.0, 97.0, 57.0, 44.0, 34.0, 17.0, 15.0, 14.0, 9.0, 4.0, 4.0, 7.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5078125, -15.086669921875, -14.66552734375, -14.244384765625, -13.8232421875, -13.402099609375, -12.98095703125, -12.559814453125, -12.138671875, -11.717529296875, -11.29638671875, -10.875244140625, -10.4541015625, -10.032958984375, -9.61181640625, -9.190673828125, -8.76953125, -8.348388671875, -7.92724609375, -7.506103515625, -7.0849609375, -6.663818359375, -6.24267578125, -5.821533203125, -5.400390625, -4.979248046875, -4.55810546875, -4.136962890625, -3.7158203125, -3.294677734375, -2.87353515625, -2.452392578125, -2.03125, -1.610107421875, -1.18896484375, -0.767822265625, -0.3466796875, 0.074462890625, 0.49560546875, 0.916748046875, 1.337890625, 1.759033203125, 2.18017578125, 2.601318359375, 3.0224609375, 3.443603515625, 3.86474609375, 4.285888671875, 4.70703125, 5.128173828125, 5.54931640625, 5.970458984375, 6.3916015625, 6.812744140625, 7.23388671875, 7.655029296875, 8.076171875, 8.497314453125, 8.91845703125, 9.339599609375, 9.7607421875, 10.181884765625, 10.60302734375, 11.024169921875, 11.4453125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 5.0, 4.0, 20.0, 39.0, 64.0, 117.0, 179.0, 184.0, 167.0, 102.0, 51.0, 34.0, 14.0, 9.0, 7.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.59375, -6.43035888671875, -6.2669677734375, -6.10357666015625, -5.940185546875, -5.77679443359375, -5.6134033203125, -5.45001220703125, -5.28662109375, -5.12322998046875, -4.9598388671875, -4.79644775390625, -4.633056640625, -4.46966552734375, -4.3062744140625, -4.14288330078125, -3.9794921875, -3.81610107421875, -3.6527099609375, -3.48931884765625, -3.325927734375, -3.16253662109375, -2.9991455078125, -2.83575439453125, -2.67236328125, -2.50897216796875, -2.3455810546875, -2.18218994140625, -2.018798828125, -1.85540771484375, -1.6920166015625, -1.52862548828125, -1.365234375, -1.20184326171875, -1.0384521484375, -0.87506103515625, -0.711669921875, -0.54827880859375, -0.3848876953125, -0.22149658203125, -0.05810546875, 0.10528564453125, 0.2686767578125, 0.43206787109375, 0.595458984375, 0.75885009765625, 0.9222412109375, 1.08563232421875, 1.2490234375, 1.41241455078125, 1.5758056640625, 1.73919677734375, 1.902587890625, 2.06597900390625, 2.2293701171875, 2.39276123046875, 2.55615234375, 2.71954345703125, 2.8829345703125, 3.04632568359375, 3.209716796875, 3.37310791015625, 3.5364990234375, 3.69989013671875, 3.86328125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 14.0, 16.0, 27.0, 63.0, 60.0, 111.0, 162.0, 276.0, 408.0, 794.0, 1851.0, 6087.0, 56556.0, 4108338.0, 13773.0, 3081.0, 1160.0, 556.0, 332.0, 227.0, 138.0, 89.0, 56.0, 35.0, 14.0, 16.0, 12.0, 14.0, 7.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -11.8621826171875, -11.372802734375, -10.8834228515625, -10.39404296875, -9.9046630859375, -9.415283203125, -8.9259033203125, -8.4365234375, -7.9471435546875, -7.457763671875, -6.9683837890625, -6.47900390625, -5.9896240234375, -5.500244140625, -5.0108642578125, -4.521484375, -4.0321044921875, -3.542724609375, -3.0533447265625, -2.56396484375, -2.0745849609375, -1.585205078125, -1.0958251953125, -0.6064453125, -0.1170654296875, 0.372314453125, 0.8616943359375, 1.35107421875, 1.8404541015625, 2.329833984375, 2.8192138671875, 3.30859375, 3.7979736328125, 4.287353515625, 4.7767333984375, 5.26611328125, 5.7554931640625, 6.244873046875, 6.7342529296875, 7.2236328125, 7.7130126953125, 8.202392578125, 8.6917724609375, 9.18115234375, 9.6705322265625, 10.159912109375, 10.6492919921875, 11.138671875, 11.6280517578125, 12.117431640625, 12.6068115234375, 13.09619140625, 13.5855712890625, 14.074951171875, 14.5643310546875, 15.0537109375, 15.5430908203125, 16.032470703125, 16.5218505859375, 17.01123046875, 17.5006103515625, 17.989990234375, 18.4793701171875, 18.96875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 8.0, 8.0, 25.0, 60.0, 3436.0, 433.0, 46.0, 15.0, 14.0, 5.0, 10.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.890625, -3.70458984375, -3.5185546875, -3.33251953125, -3.146484375, -2.96044921875, -2.7744140625, -2.58837890625, -2.40234375, -2.21630859375, -2.0302734375, -1.84423828125, -1.658203125, -1.47216796875, -1.2861328125, -1.10009765625, -0.9140625, -0.72802734375, -0.5419921875, -0.35595703125, -0.169921875, 0.01611328125, 0.2021484375, 0.38818359375, 0.57421875, 0.76025390625, 0.9462890625, 1.13232421875, 1.318359375, 1.50439453125, 1.6904296875, 1.87646484375, 2.0625, 2.24853515625, 2.4345703125, 2.62060546875, 2.806640625, 2.99267578125, 3.1787109375, 3.36474609375, 3.55078125, 3.73681640625, 3.9228515625, 4.10888671875, 4.294921875, 4.48095703125, 4.6669921875, 4.85302734375, 5.0390625, 5.22509765625, 5.4111328125, 5.59716796875, 5.783203125, 5.96923828125, 6.1552734375, 6.34130859375, 6.52734375, 6.71337890625, 6.8994140625, 7.08544921875, 7.271484375, 7.45751953125, 7.6435546875, 7.82958984375, 8.015625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 9.0, 10.0, 28.0, 36.0, 57.0, 100.0, 118.0, 176.0, 140.0, 125.0, 81.0, 45.0, 20.0, 19.0, 10.0, 6.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.007283210754395, -8.506633758544922, -8.005985260009766, -7.505335807800293, -7.00468635559082, -6.504036903381348, -6.003387928009033, -5.502738952636719, -5.002089500427246, -4.501440048217773, -4.000791072845459, -3.5001418590545654, -2.999492645263672, -2.4988434314727783, -1.9981942176818848, -1.4975450038909912, -0.9968957901000977, -0.4962465763092041, 0.004402637481689453, 0.505051851272583, 1.0057010650634766, 1.5063502788543701, 2.0069994926452637, 2.5076487064361572, 3.008297920227051, 3.5089471340179443, 4.009596347808838, 4.510245323181152, 5.010894775390625, 5.511544227600098, 6.012193202972412, 6.512842178344727, 7.013490676879883, 7.5141401290893555, 8.014789581298828, 8.515438079833984, 9.016087532043457, 9.51673698425293, 10.017385482788086, 10.518034934997559, 11.018684387207031, 11.519333839416504, 12.019983291625977, 12.520631790161133, 13.021281242370605, 13.521930694580078, 14.022579193115234, 14.523228645324707, 15.02387809753418, 15.524527549743652, 16.025177001953125, 16.52582550048828, 17.026473999023438, 17.527124404907227, 18.027772903442383, 18.528423309326172, 19.029071807861328, 19.529720306396484, 20.030370712280273, 20.53101921081543, 21.03166961669922, 21.532318115234375, 22.03296661376953, 22.53361701965332, 23.034265518188477]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 7.0, 7.0, 5.0, 14.0, 17.0, 19.0, 26.0, 28.0, 30.0, 45.0, 40.0, 34.0, 59.0, 45.0, 49.0, 48.0, 54.0, 47.0, 56.0, 48.0, 47.0, 55.0, 30.0, 31.0, 31.0, 20.0, 12.0, 15.0, 14.0, 13.0, 10.0, 6.0, 7.0, 9.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.218850135803223, -10.889863967895508, -10.560877799987793, -10.231891632080078, -9.90290641784668, -9.573920249938965, -9.24493408203125, -8.915947914123535, -8.58696174621582, -8.257975578308105, -7.928989410400391, -7.600003719329834, -7.271017551422119, -6.942031383514404, -6.613045692443848, -6.284059524536133, -5.955073356628418, -5.626087188720703, -5.297101020812988, -4.968115329742432, -4.639129161834717, -4.310142993927002, -3.981157064437866, -3.6521711349487305, -3.3231849670410156, -2.994198799133301, -2.665212869644165, -2.3362269401550293, -2.0072407722473145, -1.6782547235488892, -1.3492686748504639, -1.0202827453613281, -0.6912975311279297, -0.3623114824295044, -0.0333254337310791, 0.2956606149673462, 0.6246466636657715, 0.9536327123641968, 1.282618761062622, 1.6116046905517578, 1.9405908584594727, 2.2695770263671875, 2.5985629558563232, 2.927548885345459, 3.256535053253174, 3.5855212211608887, 3.9145071506500244, 4.24349308013916, 4.572479248046875, 4.90146541595459, 5.230451583862305, 5.559437274932861, 5.888423442840576, 6.217409610748291, 6.546395301818848, 6.8753814697265625, 7.204367637634277, 7.533353805541992, 7.862339973449707, 8.191326141357422, 8.52031135559082, 8.849297523498535, 9.17828369140625, 9.507269859313965, 9.83625602722168]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 11.0, 12.0, 22.0, 41.0, 69.0, 117.0, 229.0, 550.0, 1569.0, 6698.0, 85290.0, 891986.0, 54311.0, 5313.0, 1337.0, 488.0, 240.0, 102.0, 67.0, 35.0, 22.0, 11.0, 8.0, 11.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.0859375, -9.6363525390625, -9.186767578125, -8.7371826171875, -8.28759765625, -7.8380126953125, -7.388427734375, -6.9388427734375, -6.4892578125, -6.0396728515625, -5.590087890625, -5.1405029296875, -4.69091796875, -4.2413330078125, -3.791748046875, -3.3421630859375, -2.892578125, -2.4429931640625, -1.993408203125, -1.5438232421875, -1.09423828125, -0.6446533203125, -0.195068359375, 0.2545166015625, 0.7041015625, 1.1536865234375, 1.603271484375, 2.0528564453125, 2.50244140625, 2.9520263671875, 3.401611328125, 3.8511962890625, 4.30078125, 4.7503662109375, 5.199951171875, 5.6495361328125, 6.09912109375, 6.5487060546875, 6.998291015625, 7.4478759765625, 7.8974609375, 8.3470458984375, 8.796630859375, 9.2462158203125, 9.69580078125, 10.1453857421875, 10.594970703125, 11.0445556640625, 11.494140625, 11.9437255859375, 12.393310546875, 12.8428955078125, 13.29248046875, 13.7420654296875, 14.191650390625, 14.6412353515625, 15.0908203125, 15.5404052734375, 15.989990234375, 16.4395751953125, 16.88916015625, 17.3387451171875, 17.788330078125, 18.2379150390625, 18.6875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 12.0, 14.0, 19.0, 23.0, 68.0, 61.0, 88.0, 103.0, 117.0, 102.0, 111.0, 102.0, 46.0, 38.0, 29.0, 26.0, 10.0, 10.0, 11.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.43359375, -4.31011962890625, -4.1866455078125, -4.06317138671875, -3.939697265625, -3.81622314453125, -3.6927490234375, -3.56927490234375, -3.44580078125, -3.32232666015625, -3.1988525390625, -3.07537841796875, -2.951904296875, -2.82843017578125, -2.7049560546875, -2.58148193359375, -2.4580078125, -2.33453369140625, -2.2110595703125, -2.08758544921875, -1.964111328125, -1.84063720703125, -1.7171630859375, -1.59368896484375, -1.47021484375, -1.34674072265625, -1.2232666015625, -1.09979248046875, -0.976318359375, -0.85284423828125, -0.7293701171875, -0.60589599609375, -0.482421875, -0.35894775390625, -0.2354736328125, -0.11199951171875, 0.011474609375, 0.13494873046875, 0.2584228515625, 0.38189697265625, 0.50537109375, 0.62884521484375, 0.7523193359375, 0.87579345703125, 0.999267578125, 1.12274169921875, 1.2462158203125, 1.36968994140625, 1.4931640625, 1.61663818359375, 1.7401123046875, 1.86358642578125, 1.987060546875, 2.11053466796875, 2.2340087890625, 2.35748291015625, 2.48095703125, 2.60443115234375, 2.7279052734375, 2.85137939453125, 2.974853515625, 3.09832763671875, 3.2218017578125, 3.34527587890625, 3.46875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 3.0, 4.0, 4.0, 9.0, 21.0, 22.0, 33.0, 62.0, 118.0, 189.0, 396.0, 832.0, 2562.0, 13317.0, 279643.0, 720921.0, 24602.0, 3794.0, 1053.0, 472.0, 190.0, 106.0, 61.0, 50.0, 21.0, 10.0, 13.0, 12.0, 9.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.7578125, -13.31591796875, -12.8740234375, -12.43212890625, -11.990234375, -11.54833984375, -11.1064453125, -10.66455078125, -10.22265625, -9.78076171875, -9.3388671875, -8.89697265625, -8.455078125, -8.01318359375, -7.5712890625, -7.12939453125, -6.6875, -6.24560546875, -5.8037109375, -5.36181640625, -4.919921875, -4.47802734375, -4.0361328125, -3.59423828125, -3.15234375, -2.71044921875, -2.2685546875, -1.82666015625, -1.384765625, -0.94287109375, -0.5009765625, -0.05908203125, 0.3828125, 0.82470703125, 1.2666015625, 1.70849609375, 2.150390625, 2.59228515625, 3.0341796875, 3.47607421875, 3.91796875, 4.35986328125, 4.8017578125, 5.24365234375, 5.685546875, 6.12744140625, 6.5693359375, 7.01123046875, 7.453125, 7.89501953125, 8.3369140625, 8.77880859375, 9.220703125, 9.66259765625, 10.1044921875, 10.54638671875, 10.98828125, 11.43017578125, 11.8720703125, 12.31396484375, 12.755859375, 13.19775390625, 13.6396484375, 14.08154296875, 14.5234375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 3.0, 8.0, 8.0, 18.0, 22.0, 22.0, 35.0, 37.0, 64.0, 62.0, 79.0, 101.0, 94.0, 79.0, 83.0, 72.0, 58.0, 53.0, 29.0, 19.0, 21.0, 14.0, 14.0, 3.0, 1.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-20.796875, -20.294677734375, -19.79248046875, -19.290283203125, -18.7880859375, -18.285888671875, -17.78369140625, -17.281494140625, -16.779296875, -16.277099609375, -15.77490234375, -15.272705078125, -14.7705078125, -14.268310546875, -13.76611328125, -13.263916015625, -12.76171875, -12.259521484375, -11.75732421875, -11.255126953125, -10.7529296875, -10.250732421875, -9.74853515625, -9.246337890625, -8.744140625, -8.241943359375, -7.73974609375, -7.237548828125, -6.7353515625, -6.233154296875, -5.73095703125, -5.228759765625, -4.7265625, -4.224365234375, -3.72216796875, -3.219970703125, -2.7177734375, -2.215576171875, -1.71337890625, -1.211181640625, -0.708984375, -0.206787109375, 0.29541015625, 0.797607421875, 1.2998046875, 1.802001953125, 2.30419921875, 2.806396484375, 3.30859375, 3.810791015625, 4.31298828125, 4.815185546875, 5.3173828125, 5.819580078125, 6.32177734375, 6.823974609375, 7.326171875, 7.828369140625, 8.33056640625, 8.832763671875, 9.3349609375, 9.837158203125, 10.33935546875, 10.841552734375, 11.34375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 6.0, 4.0, 17.0, 21.0, 53.0, 92.0, 304.0, 862.0, 5487.0, 644763.0, 391095.0, 4648.0, 744.0, 234.0, 106.0, 39.0, 31.0, 21.0, 10.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7109375, -7.45361328125, -7.1962890625, -6.93896484375, -6.681640625, -6.42431640625, -6.1669921875, -5.90966796875, -5.65234375, -5.39501953125, -5.1376953125, -4.88037109375, -4.623046875, -4.36572265625, -4.1083984375, -3.85107421875, -3.59375, -3.33642578125, -3.0791015625, -2.82177734375, -2.564453125, -2.30712890625, -2.0498046875, -1.79248046875, -1.53515625, -1.27783203125, -1.0205078125, -0.76318359375, -0.505859375, -0.24853515625, 0.0087890625, 0.26611328125, 0.5234375, 0.78076171875, 1.0380859375, 1.29541015625, 1.552734375, 1.81005859375, 2.0673828125, 2.32470703125, 2.58203125, 2.83935546875, 3.0966796875, 3.35400390625, 3.611328125, 3.86865234375, 4.1259765625, 4.38330078125, 4.640625, 4.89794921875, 5.1552734375, 5.41259765625, 5.669921875, 5.92724609375, 6.1845703125, 6.44189453125, 6.69921875, 6.95654296875, 7.2138671875, 7.47119140625, 7.728515625, 7.98583984375, 8.2431640625, 8.50048828125, 8.7578125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 5.0, 7.0, 10.0, 12.0, 16.0, 13.0, 23.0, 40.0, 58.0, 67.0, 93.0, 120.0, 99.0, 102.0, 79.0, 72.0, 39.0, 32.0, 35.0, 21.0, 14.0, 6.0, 10.0, 6.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00046825408935546875, -0.00045337900519371033, -0.0004385039210319519, -0.0004236288368701935, -0.00040875375270843506, -0.00039387866854667664, -0.0003790035843849182, -0.0003641285002231598, -0.00034925341606140137, -0.00033437833189964294, -0.0003195032477378845, -0.0003046281635761261, -0.0002897530794143677, -0.00027487799525260925, -0.00026000291109085083, -0.0002451278269290924, -0.00023025274276733398, -0.00021537765860557556, -0.00020050257444381714, -0.00018562749028205872, -0.0001707524061203003, -0.00015587732195854187, -0.00014100223779678345, -0.00012612715363502502, -0.0001112520694732666, -9.637698531150818e-05, -8.150190114974976e-05, -6.662681698799133e-05, -5.175173282623291e-05, -3.687664866447449e-05, -2.2001564502716064e-05, -7.126480340957642e-06, 7.748603820800781e-06, 2.2623687982559204e-05, 3.749877214431763e-05, 5.237385630607605e-05, 6.724894046783447e-05, 8.21240246295929e-05, 9.699910879135132e-05, 0.00011187419295310974, 0.00012674927711486816, 0.0001416243612766266, 0.000156499445438385, 0.00017137452960014343, 0.00018624961376190186, 0.00020112469792366028, 0.0002159997820854187, 0.00023087486624717712, 0.00024574995040893555, 0.00026062503457069397, 0.0002755001187324524, 0.0002903752028942108, 0.00030525028705596924, 0.00032012537121772766, 0.0003350004553794861, 0.0003498755395412445, 0.00036475062370300293, 0.00037962570786476135, 0.0003945007920265198, 0.0004093758761882782, 0.0004242509603500366, 0.00043912604451179504, 0.00045400112867355347, 0.0004688762128353119, 0.0004837512969970703]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 5.0, 4.0, 8.0, 11.0, 15.0, 44.0, 92.0, 284.0, 1022.0, 11189.0, 1012234.0, 21797.0, 1318.0, 321.0, 102.0, 62.0, 22.0, 16.0, 8.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.7880859375, -11.490234375, -11.1923828125, -10.89453125, -10.5966796875, -10.298828125, -10.0009765625, -9.703125, -9.4052734375, -9.107421875, -8.8095703125, -8.51171875, -8.2138671875, -7.916015625, -7.6181640625, -7.3203125, -7.0224609375, -6.724609375, -6.4267578125, -6.12890625, -5.8310546875, -5.533203125, -5.2353515625, -4.9375, -4.6396484375, -4.341796875, -4.0439453125, -3.74609375, -3.4482421875, -3.150390625, -2.8525390625, -2.5546875, -2.2568359375, -1.958984375, -1.6611328125, -1.36328125, -1.0654296875, -0.767578125, -0.4697265625, -0.171875, 0.1259765625, 0.423828125, 0.7216796875, 1.01953125, 1.3173828125, 1.615234375, 1.9130859375, 2.2109375, 2.5087890625, 2.806640625, 3.1044921875, 3.40234375, 3.7001953125, 3.998046875, 4.2958984375, 4.59375, 4.8916015625, 5.189453125, 5.4873046875, 5.78515625, 6.0830078125, 6.380859375, 6.6787109375, 6.9765625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 11.0, 16.0, 30.0, 70.0, 109.0, 222.0, 257.0, 150.0, 59.0, 40.0, 17.0, 11.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.796875, -10.562744140625, -10.32861328125, -10.094482421875, -9.8603515625, -9.626220703125, -9.39208984375, -9.157958984375, -8.923828125, -8.689697265625, -8.45556640625, -8.221435546875, -7.9873046875, -7.753173828125, -7.51904296875, -7.284912109375, -7.05078125, -6.816650390625, -6.58251953125, -6.348388671875, -6.1142578125, -5.880126953125, -5.64599609375, -5.411865234375, -5.177734375, -4.943603515625, -4.70947265625, -4.475341796875, -4.2412109375, -4.007080078125, -3.77294921875, -3.538818359375, -3.3046875, -3.070556640625, -2.83642578125, -2.602294921875, -2.3681640625, -2.134033203125, -1.89990234375, -1.665771484375, -1.431640625, -1.197509765625, -0.96337890625, -0.729248046875, -0.4951171875, -0.260986328125, -0.02685546875, 0.207275390625, 0.44140625, 0.675537109375, 0.90966796875, 1.143798828125, 1.3779296875, 1.612060546875, 1.84619140625, 2.080322265625, 2.314453125, 2.548583984375, 2.78271484375, 3.016845703125, 3.2509765625, 3.485107421875, 3.71923828125, 3.953369140625, 4.1875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 11.0, 37.0, 103.0, 257.0, 294.0, 166.0, 83.0, 26.0, 12.0, 8.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.48255920410156, -165.64224243164062, -161.8019256591797, -157.96160888671875, -154.12127685546875, -150.2809600830078, -146.44064331054688, -142.60032653808594, -138.760009765625, -134.91969299316406, -131.07937622070312, -127.23905181884766, -123.39873504638672, -119.55841064453125, -115.71809387207031, -111.87777709960938, -108.0374526977539, -104.19713592529297, -100.3568115234375, -96.51649475097656, -92.67617797851562, -88.83586120605469, -84.99553680419922, -81.15522003173828, -77.31489562988281, -73.47457885742188, -69.6342544555664, -65.79393768310547, -61.95362091064453, -58.11330032348633, -54.272979736328125, -50.43266296386719, -46.59235382080078, -42.75203323364258, -38.91171646118164, -35.07139587402344, -31.231077194213867, -27.390758514404297, -23.550437927246094, -19.710119247436523, -15.869800567626953, -12.029481887817383, -8.189162254333496, -4.348842620849609, -0.5085239410400391, 3.3317947387695312, 7.172115325927734, 11.012434005737305, 14.852752685546875, 18.693071365356445, 22.533390045166016, 26.37371063232422, 30.21402931213379, 34.05434799194336, 37.89466857910156, 41.7349853515625, 45.5753059387207, 49.415626525878906, 53.255943298339844, 57.09626388549805, 60.93658447265625, 64.77690124511719, 68.61721801757812, 72.4575424194336, 76.29785919189453]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 2.0, 5.0, 12.0, 9.0, 11.0, 15.0, 25.0, 28.0, 35.0, 43.0, 61.0, 55.0, 66.0, 71.0, 58.0, 80.0, 65.0, 58.0, 36.0, 47.0, 42.0, 45.0, 25.0, 19.0, 24.0, 12.0, 20.0, 10.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.77496337890625, -43.11726760864258, -41.459571838378906, -39.80187225341797, -38.1441764831543, -36.486480712890625, -34.82878494262695, -33.17108917236328, -31.513391494750977, -29.855695724487305, -28.197998046875, -26.540302276611328, -24.882606506347656, -23.22490882873535, -21.56721305847168, -19.909515380859375, -18.251819610595703, -16.59412384033203, -14.936426162719727, -13.278730392456055, -11.621033668518066, -9.963336944580078, -8.305641174316406, -6.647944450378418, -4.99024772644043, -3.3325512409210205, -1.6748547554016113, -0.01715850830078125, 1.640538215637207, 3.2982349395751953, 4.955930709838867, 6.6136274337768555, 8.271324157714844, 9.929020881652832, 11.58671760559082, 13.244413375854492, 14.90211009979248, 16.55980682373047, 18.21750259399414, 19.875198364257812, 21.532896041870117, 23.19059181213379, 24.848289489746094, 26.505985260009766, 28.163681030273438, 29.821378707885742, 31.479074478149414, 33.13677215576172, 34.79446792602539, 36.45216369628906, 38.109859466552734, 39.767555236816406, 41.425254821777344, 43.082950592041016, 44.74064636230469, 46.39834213256836, 48.05603790283203, 49.7137336730957, 51.371429443359375, 53.02912902832031, 54.686824798583984, 56.344520568847656, 58.00221633911133, 59.659912109375, 61.31761169433594]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 14.0, 5.0, 15.0, 19.0, 20.0, 24.0, 48.0, 69.0, 93.0, 174.0, 316.0, 681.0, 1613.0, 4288.0, 14459.0, 81579.0, 3741583.0, 310820.0, 26250.0, 7072.0, 2709.0, 1127.0, 544.0, 281.0, 173.0, 116.0, 64.0, 35.0, 32.0, 20.0, 17.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.08984375, -5.8978271484375, -5.705810546875, -5.5137939453125, -5.32177734375, -5.1297607421875, -4.937744140625, -4.7457275390625, -4.5537109375, -4.3616943359375, -4.169677734375, -3.9776611328125, -3.78564453125, -3.5936279296875, -3.401611328125, -3.2095947265625, -3.017578125, -2.8255615234375, -2.633544921875, -2.4415283203125, -2.24951171875, -2.0574951171875, -1.865478515625, -1.6734619140625, -1.4814453125, -1.2894287109375, -1.097412109375, -0.9053955078125, -0.71337890625, -0.5213623046875, -0.329345703125, -0.1373291015625, 0.0546875, 0.2467041015625, 0.438720703125, 0.6307373046875, 0.82275390625, 1.0147705078125, 1.206787109375, 1.3988037109375, 1.5908203125, 1.7828369140625, 1.974853515625, 2.1668701171875, 2.35888671875, 2.5509033203125, 2.742919921875, 2.9349365234375, 3.126953125, 3.3189697265625, 3.510986328125, 3.7030029296875, 3.89501953125, 4.0870361328125, 4.279052734375, 4.4710693359375, 4.6630859375, 4.8551025390625, 5.047119140625, 5.2391357421875, 5.43115234375, 5.6231689453125, 5.815185546875, 6.0072021484375, 6.19921875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 14.0, 16.0, 16.0, 31.0, 51.0, 70.0, 96.0, 95.0, 101.0, 130.0, 104.0, 86.0, 57.0, 51.0, 29.0, 16.0, 14.0, 5.0, 4.0, 3.0, 3.0, 5.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.732421875, -3.622528076171875, -3.51263427734375, -3.402740478515625, -3.2928466796875, -3.182952880859375, -3.07305908203125, -2.963165283203125, -2.853271484375, -2.743377685546875, -2.63348388671875, -2.523590087890625, -2.4136962890625, -2.303802490234375, -2.19390869140625, -2.084014892578125, -1.97412109375, -1.864227294921875, -1.75433349609375, -1.644439697265625, -1.5345458984375, -1.424652099609375, -1.31475830078125, -1.204864501953125, -1.094970703125, -0.985076904296875, -0.87518310546875, -0.765289306640625, -0.6553955078125, -0.545501708984375, -0.43560791015625, -0.325714111328125, -0.2158203125, -0.105926513671875, 0.00396728515625, 0.113861083984375, 0.2237548828125, 0.333648681640625, 0.44354248046875, 0.553436279296875, 0.663330078125, 0.773223876953125, 0.88311767578125, 0.993011474609375, 1.1029052734375, 1.212799072265625, 1.32269287109375, 1.432586669921875, 1.54248046875, 1.652374267578125, 1.76226806640625, 1.872161865234375, 1.9820556640625, 2.091949462890625, 2.20184326171875, 2.311737060546875, 2.421630859375, 2.531524658203125, 2.64141845703125, 2.751312255859375, 2.8612060546875, 2.971099853515625, 3.08099365234375, 3.190887451171875, 3.30078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 7.0, 11.0, 13.0, 14.0, 37.0, 32.0, 48.0, 71.0, 120.0, 205.0, 417.0, 916.0, 1896.0, 5075.0, 16164.0, 68937.0, 2119893.0, 1889643.0, 66727.0, 15590.0, 4804.0, 1862.0, 815.0, 404.0, 222.0, 107.0, 75.0, 53.0, 31.0, 30.0, 12.0, 13.0, 4.0, 5.0, 8.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-7.20703125, -7.017333984375, -6.82763671875, -6.637939453125, -6.4482421875, -6.258544921875, -6.06884765625, -5.879150390625, -5.689453125, -5.499755859375, -5.31005859375, -5.120361328125, -4.9306640625, -4.740966796875, -4.55126953125, -4.361572265625, -4.171875, -3.982177734375, -3.79248046875, -3.602783203125, -3.4130859375, -3.223388671875, -3.03369140625, -2.843994140625, -2.654296875, -2.464599609375, -2.27490234375, -2.085205078125, -1.8955078125, -1.705810546875, -1.51611328125, -1.326416015625, -1.13671875, -0.947021484375, -0.75732421875, -0.567626953125, -0.3779296875, -0.188232421875, 0.00146484375, 0.191162109375, 0.380859375, 0.570556640625, 0.76025390625, 0.949951171875, 1.1396484375, 1.329345703125, 1.51904296875, 1.708740234375, 1.8984375, 2.088134765625, 2.27783203125, 2.467529296875, 2.6572265625, 2.846923828125, 3.03662109375, 3.226318359375, 3.416015625, 3.605712890625, 3.79541015625, 3.985107421875, 4.1748046875, 4.364501953125, 4.55419921875, 4.743896484375, 4.93359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 9.0, 2.0, 4.0, 8.0, 6.0, 11.0, 12.0, 12.0, 19.0, 24.0, 37.0, 56.0, 87.0, 136.0, 295.0, 859.0, 1375.0, 594.0, 211.0, 94.0, 53.0, 42.0, 35.0, 20.0, 15.0, 13.0, 11.0, 10.0, 11.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.65625, -5.4697265625, -5.283203125, -5.0966796875, -4.91015625, -4.7236328125, -4.537109375, -4.3505859375, -4.1640625, -3.9775390625, -3.791015625, -3.6044921875, -3.41796875, -3.2314453125, -3.044921875, -2.8583984375, -2.671875, -2.4853515625, -2.298828125, -2.1123046875, -1.92578125, -1.7392578125, -1.552734375, -1.3662109375, -1.1796875, -0.9931640625, -0.806640625, -0.6201171875, -0.43359375, -0.2470703125, -0.060546875, 0.1259765625, 0.3125, 0.4990234375, 0.685546875, 0.8720703125, 1.05859375, 1.2451171875, 1.431640625, 1.6181640625, 1.8046875, 1.9912109375, 2.177734375, 2.3642578125, 2.55078125, 2.7373046875, 2.923828125, 3.1103515625, 3.296875, 3.4833984375, 3.669921875, 3.8564453125, 4.04296875, 4.2294921875, 4.416015625, 4.6025390625, 4.7890625, 4.9755859375, 5.162109375, 5.3486328125, 5.53515625, 5.7216796875, 5.908203125, 6.0947265625, 6.28125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 5.0, 10.0, 7.0, 15.0, 21.0, 47.0, 98.0, 191.0, 219.0, 176.0, 116.0, 49.0, 26.0, 5.0, 7.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-90.4795913696289, -88.65483093261719, -86.830078125, -85.00531768798828, -83.18055725097656, -81.35579681396484, -79.53104400634766, -77.70628356933594, -75.88152313232422, -74.0567626953125, -72.23200988769531, -70.4072494506836, -68.58248901367188, -66.75772857666016, -64.93297576904297, -63.10821533203125, -61.2834587097168, -59.458702087402344, -57.633941650390625, -55.80918502807617, -53.98442459106445, -52.15966796875, -50.33490753173828, -48.51015090942383, -46.685394287109375, -44.86063766479492, -43.0358772277832, -41.21112060546875, -39.38636016845703, -37.56160354614258, -35.736846923828125, -33.912086486816406, -32.08732986450195, -30.262571334838867, -28.43781280517578, -26.613056182861328, -24.78829574584961, -22.963539123535156, -21.13878059387207, -19.314022064208984, -17.4892635345459, -15.664505004882812, -13.839746475219727, -12.014988899230957, -10.190230369567871, -8.365471839904785, -6.540714263916016, -4.71595573425293, -2.8911972045898438, -1.066438913345337, 0.7583193778991699, 2.5830774307250977, 4.407835960388184, 6.2325944900512695, 8.057352066040039, 9.882110595703125, 11.706869125366211, 13.531627655029297, 15.356386184692383, 17.18114471435547, 19.005901336669922, 20.83066177368164, 22.655418395996094, 24.48017692565918, 26.304935455322266]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 11.0, 9.0, 9.0, 14.0, 17.0, 26.0, 29.0, 31.0, 28.0, 42.0, 28.0, 33.0, 42.0, 52.0, 39.0, 44.0, 47.0, 47.0, 56.0, 42.0, 41.0, 38.0, 37.0, 29.0, 28.0, 28.0, 27.0, 19.0, 16.0, 16.0, 13.0, 16.0, 6.0, 6.0, 7.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.22383689880371, -22.50770378112793, -21.791568756103516, -21.075435638427734, -20.359302520751953, -19.64316749572754, -18.927034378051758, -18.210899353027344, -17.494766235351562, -16.77863311767578, -16.062498092651367, -15.346364974975586, -14.630230903625488, -13.91409683227539, -13.19796371459961, -12.481829643249512, -11.76569652557373, -11.049562454223633, -10.333429336547852, -9.617295265197754, -8.901161193847656, -8.185028076171875, -7.468894004821777, -6.75275993347168, -6.03662633895874, -5.320492744445801, -4.604358673095703, -3.8882250785827637, -3.172091245651245, -2.4559574127197266, -1.739823818206787, -1.0236897468566895, -0.30755615234375, 0.4085776209831238, 1.1247113943099976, 1.8408451080322266, 2.556978940963745, 3.2731127738952637, 3.989246368408203, 4.705380439758301, 5.42151403427124, 6.13764762878418, 6.853781700134277, 7.569915294647217, 8.286048889160156, 9.002182960510254, 9.718317031860352, 10.434450149536133, 11.15058422088623, 11.866718292236328, 12.58285140991211, 13.298985481262207, 14.015119552612305, 14.731252670288086, 15.447386741638184, 16.16352081298828, 16.879653930664062, 17.595787048339844, 18.311922073364258, 19.02805519104004, 19.74418830871582, 20.460323333740234, 21.176456451416016, 21.892589569091797, 22.60872459411621]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 8.0, 9.0, 16.0, 14.0, 17.0, 44.0, 51.0, 68.0, 104.0, 175.0, 354.0, 518.0, 954.0, 1943.0, 4084.0, 9840.0, 26653.0, 83983.0, 306284.0, 423270.0, 128154.0, 38113.0, 13314.0, 5344.0, 2486.0, 1134.0, 646.0, 351.0, 215.0, 146.0, 77.0, 57.0, 42.0, 20.0, 18.0, 18.0, 10.0, 5.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.478515625, -3.355010986328125, -3.23150634765625, -3.108001708984375, -2.9844970703125, -2.860992431640625, -2.73748779296875, -2.613983154296875, -2.490478515625, -2.366973876953125, -2.24346923828125, -2.119964599609375, -1.9964599609375, -1.872955322265625, -1.74945068359375, -1.625946044921875, -1.50244140625, -1.378936767578125, -1.25543212890625, -1.131927490234375, -1.0084228515625, -0.884918212890625, -0.76141357421875, -0.637908935546875, -0.514404296875, -0.390899658203125, -0.26739501953125, -0.143890380859375, -0.0203857421875, 0.103118896484375, 0.22662353515625, 0.350128173828125, 0.4736328125, 0.597137451171875, 0.72064208984375, 0.844146728515625, 0.9676513671875, 1.091156005859375, 1.21466064453125, 1.338165283203125, 1.461669921875, 1.585174560546875, 1.70867919921875, 1.832183837890625, 1.9556884765625, 2.079193115234375, 2.20269775390625, 2.326202392578125, 2.44970703125, 2.573211669921875, 2.69671630859375, 2.820220947265625, 2.9437255859375, 3.067230224609375, 3.19073486328125, 3.314239501953125, 3.437744140625, 3.561248779296875, 3.68475341796875, 3.808258056640625, 3.9317626953125, 4.055267333984375, 4.17877197265625, 4.302276611328125, 4.42578125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 11.0, 13.0, 29.0, 29.0, 42.0, 65.0, 62.0, 84.0, 107.0, 106.0, 89.0, 80.0, 64.0, 61.0, 38.0, 34.0, 27.0, 18.0, 7.0, 12.0, 5.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.05078125, -3.953521728515625, -3.85626220703125, -3.759002685546875, -3.6617431640625, -3.564483642578125, -3.46722412109375, -3.369964599609375, -3.272705078125, -3.175445556640625, -3.07818603515625, -2.980926513671875, -2.8836669921875, -2.786407470703125, -2.68914794921875, -2.591888427734375, -2.49462890625, -2.397369384765625, -2.30010986328125, -2.202850341796875, -2.1055908203125, -2.008331298828125, -1.91107177734375, -1.813812255859375, -1.716552734375, -1.619293212890625, -1.52203369140625, -1.424774169921875, -1.3275146484375, -1.230255126953125, -1.13299560546875, -1.035736083984375, -0.9384765625, -0.841217041015625, -0.74395751953125, -0.646697998046875, -0.5494384765625, -0.452178955078125, -0.35491943359375, -0.257659912109375, -0.160400390625, -0.063140869140625, 0.03411865234375, 0.131378173828125, 0.2286376953125, 0.325897216796875, 0.42315673828125, 0.520416259765625, 0.61767578125, 0.714935302734375, 0.81219482421875, 0.909454345703125, 1.0067138671875, 1.103973388671875, 1.20123291015625, 1.298492431640625, 1.395751953125, 1.493011474609375, 1.59027099609375, 1.687530517578125, 1.7847900390625, 1.882049560546875, 1.97930908203125, 2.076568603515625, 2.173828125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 8.0, 6.0, 19.0, 26.0, 26.0, 36.0, 51.0, 89.0, 138.0, 204.0, 318.0, 496.0, 918.0, 1788.0, 4482.0, 15001.0, 88375.0, 681173.0, 214901.0, 28238.0, 6761.0, 2575.0, 1164.0, 611.0, 397.0, 242.0, 164.0, 94.0, 68.0, 46.0, 43.0, 22.0, 23.0, 10.0, 9.0, 7.0, 6.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46875, -5.2781982421875, -5.087646484375, -4.8970947265625, -4.70654296875, -4.5159912109375, -4.325439453125, -4.1348876953125, -3.9443359375, -3.7537841796875, -3.563232421875, -3.3726806640625, -3.18212890625, -2.9915771484375, -2.801025390625, -2.6104736328125, -2.419921875, -2.2293701171875, -2.038818359375, -1.8482666015625, -1.65771484375, -1.4671630859375, -1.276611328125, -1.0860595703125, -0.8955078125, -0.7049560546875, -0.514404296875, -0.3238525390625, -0.13330078125, 0.0572509765625, 0.247802734375, 0.4383544921875, 0.62890625, 0.8194580078125, 1.010009765625, 1.2005615234375, 1.39111328125, 1.5816650390625, 1.772216796875, 1.9627685546875, 2.1533203125, 2.3438720703125, 2.534423828125, 2.7249755859375, 2.91552734375, 3.1060791015625, 3.296630859375, 3.4871826171875, 3.677734375, 3.8682861328125, 4.058837890625, 4.2493896484375, 4.43994140625, 4.6304931640625, 4.821044921875, 5.0115966796875, 5.2021484375, 5.3927001953125, 5.583251953125, 5.7738037109375, 5.96435546875, 6.1549072265625, 6.345458984375, 6.5360107421875, 6.7265625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 5.0, 9.0, 8.0, 12.0, 16.0, 12.0, 15.0, 15.0, 18.0, 24.0, 27.0, 21.0, 34.0, 48.0, 29.0, 34.0, 44.0, 49.0, 48.0, 36.0, 40.0, 37.0, 50.0, 43.0, 44.0, 33.0, 36.0, 28.0, 22.0, 24.0, 25.0, 15.0, 15.0, 14.0, 12.0, 6.0, 6.0, 9.0, 7.0, 5.0, 1.0, 9.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.08203125, -6.8609619140625, -6.639892578125, -6.4188232421875, -6.19775390625, -5.9766845703125, -5.755615234375, -5.5345458984375, -5.3134765625, -5.0924072265625, -4.871337890625, -4.6502685546875, -4.42919921875, -4.2081298828125, -3.987060546875, -3.7659912109375, -3.544921875, -3.3238525390625, -3.102783203125, -2.8817138671875, -2.66064453125, -2.4395751953125, -2.218505859375, -1.9974365234375, -1.7763671875, -1.5552978515625, -1.334228515625, -1.1131591796875, -0.89208984375, -0.6710205078125, -0.449951171875, -0.2288818359375, -0.0078125, 0.2132568359375, 0.434326171875, 0.6553955078125, 0.87646484375, 1.0975341796875, 1.318603515625, 1.5396728515625, 1.7607421875, 1.9818115234375, 2.202880859375, 2.4239501953125, 2.64501953125, 2.8660888671875, 3.087158203125, 3.3082275390625, 3.529296875, 3.7503662109375, 3.971435546875, 4.1925048828125, 4.41357421875, 4.6346435546875, 4.855712890625, 5.0767822265625, 5.2978515625, 5.5189208984375, 5.739990234375, 5.9610595703125, 6.18212890625, 6.4031982421875, 6.624267578125, 6.8453369140625, 7.06640625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 11.0, 6.0, 7.0, 18.0, 23.0, 38.0, 65.0, 112.0, 188.0, 498.0, 1432.0, 6104.0, 53240.0, 874400.0, 100825.0, 8656.0, 1849.0, 569.0, 225.0, 113.0, 61.0, 33.0, 30.0, 11.0, 9.0, 10.0, 6.0, 5.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19140625, -4.07366943359375, -3.9559326171875, -3.83819580078125, -3.720458984375, -3.60272216796875, -3.4849853515625, -3.36724853515625, -3.24951171875, -3.13177490234375, -3.0140380859375, -2.89630126953125, -2.778564453125, -2.66082763671875, -2.5430908203125, -2.42535400390625, -2.3076171875, -2.18988037109375, -2.0721435546875, -1.95440673828125, -1.836669921875, -1.71893310546875, -1.6011962890625, -1.48345947265625, -1.36572265625, -1.24798583984375, -1.1302490234375, -1.01251220703125, -0.894775390625, -0.77703857421875, -0.6593017578125, -0.54156494140625, -0.423828125, -0.30609130859375, -0.1883544921875, -0.07061767578125, 0.047119140625, 0.16485595703125, 0.2825927734375, 0.40032958984375, 0.51806640625, 0.63580322265625, 0.7535400390625, 0.87127685546875, 0.989013671875, 1.10675048828125, 1.2244873046875, 1.34222412109375, 1.4599609375, 1.57769775390625, 1.6954345703125, 1.81317138671875, 1.930908203125, 2.04864501953125, 2.1663818359375, 2.28411865234375, 2.40185546875, 2.51959228515625, 2.6373291015625, 2.75506591796875, 2.872802734375, 2.99053955078125, 3.1082763671875, 3.22601318359375, 3.34375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 0.0, 7.0, 10.0, 6.0, 9.0, 21.0, 30.0, 60.0, 75.0, 106.0, 131.0, 142.0, 123.0, 91.0, 68.0, 49.0, 26.0, 14.0, 8.0, 12.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005488395690917969, -0.0005294755101203918, -0.0005101114511489868, -0.0004907473921775818, -0.00047138333320617676, -0.00045201927423477173, -0.0004326552152633667, -0.00041329115629196167, -0.00039392709732055664, -0.0003745630383491516, -0.0003551989793777466, -0.00033583492040634155, -0.0003164708614349365, -0.0002971068024635315, -0.00027774274349212646, -0.00025837868452072144, -0.0002390146255493164, -0.00021965056657791138, -0.00020028650760650635, -0.00018092244863510132, -0.0001615583896636963, -0.00014219433069229126, -0.00012283027172088623, -0.0001034662127494812, -8.410215377807617e-05, -6.473809480667114e-05, -4.537403583526611e-05, -2.6009976863861084e-05, -6.645917892456055e-06, 1.2718141078948975e-05, 3.2082200050354004e-05, 5.144625902175903e-05, 7.081031799316406e-05, 9.017437696456909e-05, 0.00010953843593597412, 0.00012890249490737915, 0.00014826655387878418, 0.0001676306128501892, 0.00018699467182159424, 0.00020635873079299927, 0.0002257227897644043, 0.0002450868487358093, 0.00026445090770721436, 0.0002838149666786194, 0.0003031790256500244, 0.00032254308462142944, 0.00034190714359283447, 0.0003612712025642395, 0.00038063526153564453, 0.00039999932050704956, 0.0004193633794784546, 0.0004387274384498596, 0.00045809149742126465, 0.0004774555563926697, 0.0004968196153640747, 0.0005161836743354797, 0.0005355477333068848, 0.0005549117922782898, 0.0005742758512496948, 0.0005936399102210999, 0.0006130039691925049, 0.0006323680281639099, 0.0006517320871353149, 0.00067109614610672, 0.000690460205078125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 6.0, 15.0, 11.0, 20.0, 31.0, 50.0, 106.0, 154.0, 315.0, 661.0, 1737.0, 6111.0, 49220.0, 835162.0, 139889.0, 10884.0, 2497.0, 841.0, 362.0, 201.0, 101.0, 62.0, 36.0, 22.0, 17.0, 9.0, 10.0, 4.0, 1.0, 3.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.33984375, -4.233123779296875, -4.12640380859375, -4.019683837890625, -3.9129638671875, -3.806243896484375, -3.69952392578125, -3.592803955078125, -3.486083984375, -3.379364013671875, -3.27264404296875, -3.165924072265625, -3.0592041015625, -2.952484130859375, -2.84576416015625, -2.739044189453125, -2.63232421875, -2.525604248046875, -2.41888427734375, -2.312164306640625, -2.2054443359375, -2.098724365234375, -1.99200439453125, -1.885284423828125, -1.778564453125, -1.671844482421875, -1.56512451171875, -1.458404541015625, -1.3516845703125, -1.244964599609375, -1.13824462890625, -1.031524658203125, -0.9248046875, -0.818084716796875, -0.71136474609375, -0.604644775390625, -0.4979248046875, -0.391204833984375, -0.28448486328125, -0.177764892578125, -0.071044921875, 0.035675048828125, 0.14239501953125, 0.249114990234375, 0.3558349609375, 0.462554931640625, 0.56927490234375, 0.675994873046875, 0.78271484375, 0.889434814453125, 0.99615478515625, 1.102874755859375, 1.2095947265625, 1.316314697265625, 1.42303466796875, 1.529754638671875, 1.636474609375, 1.743194580078125, 1.84991455078125, 1.956634521484375, 2.0633544921875, 2.170074462890625, 2.27679443359375, 2.383514404296875, 2.490234375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 4.0, 4.0, 14.0, 8.0, 20.0, 16.0, 29.0, 41.0, 55.0, 61.0, 66.0, 89.0, 97.0, 88.0, 80.0, 91.0, 54.0, 33.0, 33.0, 26.0, 19.0, 26.0, 7.0, 12.0, 9.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.330078125, -2.24981689453125, -2.1695556640625, -2.08929443359375, -2.009033203125, -1.92877197265625, -1.8485107421875, -1.76824951171875, -1.68798828125, -1.60772705078125, -1.5274658203125, -1.44720458984375, -1.366943359375, -1.28668212890625, -1.2064208984375, -1.12615966796875, -1.0458984375, -0.96563720703125, -0.8853759765625, -0.80511474609375, -0.724853515625, -0.64459228515625, -0.5643310546875, -0.48406982421875, -0.40380859375, -0.32354736328125, -0.2432861328125, -0.16302490234375, -0.082763671875, -0.00250244140625, 0.0777587890625, 0.15802001953125, 0.23828125, 0.31854248046875, 0.3988037109375, 0.47906494140625, 0.559326171875, 0.63958740234375, 0.7198486328125, 0.80010986328125, 0.88037109375, 0.96063232421875, 1.0408935546875, 1.12115478515625, 1.201416015625, 1.28167724609375, 1.3619384765625, 1.44219970703125, 1.5224609375, 1.60272216796875, 1.6829833984375, 1.76324462890625, 1.843505859375, 1.92376708984375, 2.0040283203125, 2.08428955078125, 2.16455078125, 2.24481201171875, 2.3250732421875, 2.40533447265625, 2.485595703125, 2.56585693359375, 2.6461181640625, 2.72637939453125, 2.806640625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 10.0, 11.0, 18.0, 48.0, 89.0, 132.0, 206.0, 178.0, 131.0, 83.0, 37.0, 22.0, 10.0, 10.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-66.2761459350586, -64.80431365966797, -63.33247375488281, -61.86063766479492, -60.38880157470703, -58.91696548461914, -57.44512939453125, -55.973297119140625, -54.50145721435547, -53.02962112426758, -51.55778503417969, -50.0859489440918, -48.614112854003906, -47.142276763916016, -45.670440673828125, -44.1986083984375, -42.72677230834961, -41.25493621826172, -39.78310012817383, -38.31126403808594, -36.83942794799805, -35.367591857910156, -33.89575958251953, -32.423919677734375, -30.952085494995117, -29.480249404907227, -28.008413314819336, -26.536579132080078, -25.064743041992188, -23.592906951904297, -22.121070861816406, -20.649234771728516, -19.177400588989258, -17.705564498901367, -16.233728408813477, -14.761893272399902, -13.290057182312012, -11.818221092224121, -10.346385955810547, -8.874549865722656, -7.402713775634766, -5.930877685546875, -4.459042072296143, -2.98720645904541, -1.5153703689575195, -0.043534278869628906, 1.4283008575439453, 2.900136947631836, 4.371973037719727, 5.843809127807617, 7.31564474105835, 8.787480354309082, 10.259316444396973, 11.731152534484863, 13.202987670898438, 14.674823760986328, 16.14665985107422, 17.61849594116211, 19.09033203125, 20.56216812133789, 22.03400421142578, 23.505840301513672, 24.97767448425293, 26.44951057434082, 27.92134666442871]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 11.0, 11.0, 16.0, 17.0, 24.0, 33.0, 18.0, 26.0, 23.0, 39.0, 30.0, 43.0, 47.0, 49.0, 61.0, 59.0, 59.0, 53.0, 43.0, 52.0, 35.0, 32.0, 28.0, 30.0, 24.0, 16.0, 19.0, 14.0, 16.0, 10.0, 8.0, 6.0, 9.0, 7.0, 7.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-36.75929641723633, -35.75376892089844, -34.74824523925781, -33.74272155761719, -32.7371940612793, -31.73166847229004, -30.72614288330078, -29.720617294311523, -28.715091705322266, -27.709566116333008, -26.70404052734375, -25.698514938354492, -24.692989349365234, -23.687463760375977, -22.68193817138672, -21.67641258239746, -20.670886993408203, -19.665361404418945, -18.659835815429688, -17.65431022644043, -16.648784637451172, -15.643259048461914, -14.637733459472656, -13.632207870483398, -12.62668228149414, -11.621156692504883, -10.615631103515625, -9.610105514526367, -8.60457992553711, -7.599054336547852, -6.593528747558594, -5.588003158569336, -4.582479476928711, -3.576953887939453, -2.5714282989501953, -1.5659027099609375, -0.5603771209716797, 0.4451484680175781, 1.450674057006836, 2.4561996459960938, 3.4617252349853516, 4.467250823974609, 5.472776412963867, 6.478302001953125, 7.483827590942383, 8.48935317993164, 9.494878768920898, 10.500404357910156, 11.505929946899414, 12.511455535888672, 13.51698112487793, 14.522506713867188, 15.528032302856445, 16.533557891845703, 17.53908348083496, 18.54460906982422, 19.550134658813477, 20.555660247802734, 21.561185836791992, 22.56671142578125, 23.572237014770508, 24.577762603759766, 25.583288192749023, 26.58881378173828, 27.59433937072754]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 10.0, 5.0, 12.0, 19.0, 26.0, 34.0, 70.0, 108.0, 250.0, 659.0, 2788.0, 19752.0, 3564967.0, 591225.0, 11696.0, 1798.0, 423.0, 188.0, 95.0, 48.0, 29.0, 30.0, 14.0, 7.0, 7.0, 2.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.78125, -10.51092529296875, -10.2406005859375, -9.97027587890625, -9.699951171875, -9.42962646484375, -9.1593017578125, -8.88897705078125, -8.61865234375, -8.34832763671875, -8.0780029296875, -7.80767822265625, -7.537353515625, -7.26702880859375, -6.9967041015625, -6.72637939453125, -6.4560546875, -6.18572998046875, -5.9154052734375, -5.64508056640625, -5.374755859375, -5.10443115234375, -4.8341064453125, -4.56378173828125, -4.29345703125, -4.02313232421875, -3.7528076171875, -3.48248291015625, -3.212158203125, -2.94183349609375, -2.6715087890625, -2.40118408203125, -2.130859375, -1.86053466796875, -1.5902099609375, -1.31988525390625, -1.049560546875, -0.77923583984375, -0.5089111328125, -0.23858642578125, 0.03173828125, 0.30206298828125, 0.5723876953125, 0.84271240234375, 1.113037109375, 1.38336181640625, 1.6536865234375, 1.92401123046875, 2.1943359375, 2.46466064453125, 2.7349853515625, 3.00531005859375, 3.275634765625, 3.54595947265625, 3.8162841796875, 4.08660888671875, 4.35693359375, 4.62725830078125, 4.8975830078125, 5.16790771484375, 5.438232421875, 5.70855712890625, 5.9788818359375, 6.24920654296875, 6.51953125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 12.0, 15.0, 11.0, 24.0, 21.0, 29.0, 35.0, 58.0, 57.0, 65.0, 55.0, 73.0, 78.0, 69.0, 83.0, 54.0, 53.0, 46.0, 34.0, 39.0, 15.0, 19.0, 9.0, 10.0, 10.0, 5.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-3.177734375, -3.103851318359375, -3.02996826171875, -2.956085205078125, -2.8822021484375, -2.808319091796875, -2.73443603515625, -2.660552978515625, -2.586669921875, -2.512786865234375, -2.43890380859375, -2.365020751953125, -2.2911376953125, -2.217254638671875, -2.14337158203125, -2.069488525390625, -1.99560546875, -1.921722412109375, -1.84783935546875, -1.773956298828125, -1.7000732421875, -1.626190185546875, -1.55230712890625, -1.478424072265625, -1.404541015625, -1.330657958984375, -1.25677490234375, -1.182891845703125, -1.1090087890625, -1.035125732421875, -0.96124267578125, -0.887359619140625, -0.8134765625, -0.739593505859375, -0.66571044921875, -0.591827392578125, -0.5179443359375, -0.444061279296875, -0.37017822265625, -0.296295166015625, -0.222412109375, -0.148529052734375, -0.07464599609375, -0.000762939453125, 0.0731201171875, 0.147003173828125, 0.22088623046875, 0.294769287109375, 0.36865234375, 0.442535400390625, 0.51641845703125, 0.590301513671875, 0.6641845703125, 0.738067626953125, 0.81195068359375, 0.885833740234375, 0.959716796875, 1.033599853515625, 1.10748291015625, 1.181365966796875, 1.2552490234375, 1.329132080078125, 1.40301513671875, 1.476898193359375, 1.55078125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 4.0, 1.0, 5.0, 5.0, 8.0, 21.0, 27.0, 49.0, 87.0, 130.0, 229.0, 439.0, 971.0, 2623.0, 7226.0, 23409.0, 121110.0, 3424324.0, 545831.0, 48033.0, 12805.0, 4203.0, 1561.0, 624.0, 256.0, 150.0, 71.0, 32.0, 17.0, 16.0, 12.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.16015625, -3.01483154296875, -2.8695068359375, -2.72418212890625, -2.578857421875, -2.43353271484375, -2.2882080078125, -2.14288330078125, -1.99755859375, -1.85223388671875, -1.7069091796875, -1.56158447265625, -1.416259765625, -1.27093505859375, -1.1256103515625, -0.98028564453125, -0.8349609375, -0.68963623046875, -0.5443115234375, -0.39898681640625, -0.253662109375, -0.10833740234375, 0.0369873046875, 0.18231201171875, 0.32763671875, 0.47296142578125, 0.6182861328125, 0.76361083984375, 0.908935546875, 1.05426025390625, 1.1995849609375, 1.34490966796875, 1.490234375, 1.63555908203125, 1.7808837890625, 1.92620849609375, 2.071533203125, 2.21685791015625, 2.3621826171875, 2.50750732421875, 2.65283203125, 2.79815673828125, 2.9434814453125, 3.08880615234375, 3.234130859375, 3.37945556640625, 3.5247802734375, 3.67010498046875, 3.8154296875, 3.96075439453125, 4.1060791015625, 4.25140380859375, 4.396728515625, 4.54205322265625, 4.6873779296875, 4.83270263671875, 4.97802734375, 5.12335205078125, 5.2686767578125, 5.41400146484375, 5.559326171875, 5.70465087890625, 5.8499755859375, 5.99530029296875, 6.140625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 5.0, 10.0, 6.0, 5.0, 7.0, 13.0, 14.0, 9.0, 19.0, 16.0, 30.0, 54.0, 67.0, 127.0, 218.0, 476.0, 862.0, 966.0, 507.0, 241.0, 134.0, 78.0, 54.0, 41.0, 28.0, 15.0, 15.0, 5.0, 10.0, 7.0, 7.0, 7.0, 2.0, 7.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.35546875, -4.23468017578125, -4.1138916015625, -3.99310302734375, -3.872314453125, -3.75152587890625, -3.6307373046875, -3.50994873046875, -3.38916015625, -3.26837158203125, -3.1475830078125, -3.02679443359375, -2.906005859375, -2.78521728515625, -2.6644287109375, -2.54364013671875, -2.4228515625, -2.30206298828125, -2.1812744140625, -2.06048583984375, -1.939697265625, -1.81890869140625, -1.6981201171875, -1.57733154296875, -1.45654296875, -1.33575439453125, -1.2149658203125, -1.09417724609375, -0.973388671875, -0.85260009765625, -0.7318115234375, -0.61102294921875, -0.490234375, -0.36944580078125, -0.2486572265625, -0.12786865234375, -0.007080078125, 0.11370849609375, 0.2344970703125, 0.35528564453125, 0.47607421875, 0.59686279296875, 0.7176513671875, 0.83843994140625, 0.959228515625, 1.08001708984375, 1.2008056640625, 1.32159423828125, 1.4423828125, 1.56317138671875, 1.6839599609375, 1.80474853515625, 1.925537109375, 2.04632568359375, 2.1671142578125, 2.28790283203125, 2.40869140625, 2.52947998046875, 2.6502685546875, 2.77105712890625, 2.891845703125, 3.01263427734375, 3.1334228515625, 3.25421142578125, 3.375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 4.0, 3.0, 8.0, 22.0, 37.0, 84.0, 196.0, 245.0, 204.0, 109.0, 49.0, 17.0, 7.0, 3.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.01259994506836, -45.69345474243164, -44.374305725097656, -43.05516052246094, -41.73601531982422, -40.416866302490234, -39.097721099853516, -37.77857208251953, -36.45942687988281, -35.140281677246094, -33.82113265991211, -32.50198745727539, -31.18284034729004, -29.863693237304688, -28.54454803466797, -27.225400924682617, -25.906253814697266, -24.587106704711914, -23.267959594726562, -21.948814392089844, -20.629667282104492, -19.31052017211914, -17.991374969482422, -16.67222785949707, -15.353080749511719, -14.033933639526367, -12.714787483215332, -11.395641326904297, -10.076494216918945, -8.757347106933594, -7.438200950622559, -6.119054794311523, -4.7999114990234375, -3.480764865875244, -2.161618232727051, -0.8424715995788574, 0.47667503356933594, 1.7958216667175293, 3.1149682998657227, 4.434114456176758, 5.753261566162109, 7.072408199310303, 8.391554832458496, 9.710700988769531, 11.029848098754883, 12.348995208740234, 13.66814136505127, 14.987287521362305, 16.306434631347656, 17.625581741333008, 18.94472885131836, 20.263874053955078, 21.58302116394043, 22.90216827392578, 24.2213134765625, 25.54046058654785, 26.859607696533203, 28.178754806518555, 29.497901916503906, 30.817047119140625, 32.136192321777344, 33.45534133911133, 34.77448654174805, 36.09363555908203, 37.41278076171875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 5.0, 9.0, 4.0, 13.0, 21.0, 17.0, 15.0, 28.0, 26.0, 32.0, 38.0, 44.0, 44.0, 61.0, 46.0, 51.0, 50.0, 47.0, 73.0, 53.0, 49.0, 49.0, 52.0, 36.0, 36.0, 32.0, 15.0, 10.0, 10.0, 11.0, 6.0, 2.0, 4.0, 7.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.146295547485352, -14.520027160644531, -13.893758773803711, -13.26749038696289, -12.64122200012207, -12.01495361328125, -11.388684272766113, -10.762415885925293, -10.136147499084473, -9.509879112243652, -8.883610725402832, -8.257342338562012, -7.631073474884033, -7.004805088043213, -6.378536224365234, -5.752267837524414, -5.125999450683594, -4.499731063842773, -3.873462438583374, -3.2471938133239746, -2.6209254264831543, -1.994657039642334, -1.3683884143829346, -0.7421197891235352, -0.11585140228271484, 0.510417103767395, 1.1366856098175049, 1.7629541158676147, 2.3892226219177246, 3.015491008758545, 3.6417596340179443, 4.268028259277344, 4.894298553466797, 5.520566940307617, 6.1468353271484375, 6.773104190826416, 7.399372577667236, 8.025640487670898, 8.651909828186035, 9.278178215026855, 9.904446601867676, 10.530714988708496, 11.156983375549316, 11.783251762390137, 12.409521102905273, 13.035789489746094, 13.662057876586914, 14.288326263427734, 14.914594650268555, 15.540863037109375, 16.167131423950195, 16.793399810791016, 17.419668197631836, 18.045936584472656, 18.672204971313477, 19.298473358154297, 19.92474365234375, 20.55101203918457, 21.17728042602539, 21.80354881286621, 22.42981719970703, 23.05608558654785, 23.682353973388672, 24.308624267578125, 24.934890747070312]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 10.0, 14.0, 18.0, 20.0, 29.0, 58.0, 76.0, 123.0, 201.0, 329.0, 564.0, 926.0, 1702.0, 3249.0, 6486.0, 14098.0, 32757.0, 83807.0, 231636.0, 381644.0, 177394.0, 64292.0, 26108.0, 11316.0, 5416.0, 2784.0, 1389.0, 814.0, 485.0, 281.0, 200.0, 113.0, 61.0, 49.0, 36.0, 25.0, 12.0, 9.0, 11.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.630859375, -2.53472900390625, -2.4385986328125, -2.34246826171875, -2.246337890625, -2.15020751953125, -2.0540771484375, -1.95794677734375, -1.86181640625, -1.76568603515625, -1.6695556640625, -1.57342529296875, -1.477294921875, -1.38116455078125, -1.2850341796875, -1.18890380859375, -1.0927734375, -0.99664306640625, -0.9005126953125, -0.80438232421875, -0.708251953125, -0.61212158203125, -0.5159912109375, -0.41986083984375, -0.32373046875, -0.22760009765625, -0.1314697265625, -0.03533935546875, 0.060791015625, 0.15692138671875, 0.2530517578125, 0.34918212890625, 0.4453125, 0.54144287109375, 0.6375732421875, 0.73370361328125, 0.829833984375, 0.92596435546875, 1.0220947265625, 1.11822509765625, 1.21435546875, 1.31048583984375, 1.4066162109375, 1.50274658203125, 1.598876953125, 1.69500732421875, 1.7911376953125, 1.88726806640625, 1.9833984375, 2.07952880859375, 2.1756591796875, 2.27178955078125, 2.367919921875, 2.46405029296875, 2.5601806640625, 2.65631103515625, 2.75244140625, 2.84857177734375, 2.9447021484375, 3.04083251953125, 3.136962890625, 3.23309326171875, 3.3292236328125, 3.42535400390625, 3.521484375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 11.0, 15.0, 11.0, 17.0, 10.0, 17.0, 20.0, 29.0, 20.0, 28.0, 21.0, 28.0, 37.0, 42.0, 45.0, 71.0, 52.0, 55.0, 48.0, 38.0, 47.0, 45.0, 44.0, 42.0, 36.0, 24.0, 27.0, 22.0, 16.0, 10.0, 10.0, 16.0, 6.0, 10.0, 3.0, 4.0, 4.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6572265625, -1.60723876953125, -1.5572509765625, -1.50726318359375, -1.457275390625, -1.40728759765625, -1.3572998046875, -1.30731201171875, -1.25732421875, -1.20733642578125, -1.1573486328125, -1.10736083984375, -1.057373046875, -1.00738525390625, -0.9573974609375, -0.90740966796875, -0.857421875, -0.80743408203125, -0.7574462890625, -0.70745849609375, -0.657470703125, -0.60748291015625, -0.5574951171875, -0.50750732421875, -0.45751953125, -0.40753173828125, -0.3575439453125, -0.30755615234375, -0.257568359375, -0.20758056640625, -0.1575927734375, -0.10760498046875, -0.0576171875, -0.00762939453125, 0.0423583984375, 0.09234619140625, 0.142333984375, 0.19232177734375, 0.2423095703125, 0.29229736328125, 0.34228515625, 0.39227294921875, 0.4422607421875, 0.49224853515625, 0.542236328125, 0.59222412109375, 0.6422119140625, 0.69219970703125, 0.7421875, 0.79217529296875, 0.8421630859375, 0.89215087890625, 0.942138671875, 0.99212646484375, 1.0421142578125, 1.09210205078125, 1.14208984375, 1.19207763671875, 1.2420654296875, 1.29205322265625, 1.342041015625, 1.39202880859375, 1.4420166015625, 1.49200439453125, 1.5419921875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 10.0, 12.0, 15.0, 21.0, 27.0, 35.0, 69.0, 105.0, 205.0, 408.0, 843.0, 2357.0, 9223.0, 67610.0, 737654.0, 203335.0, 20212.0, 3918.0, 1286.0, 530.0, 267.0, 135.0, 94.0, 65.0, 34.0, 24.0, 12.0, 14.0, 4.0, 6.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-7.671875, -7.4373779296875, -7.202880859375, -6.9683837890625, -6.73388671875, -6.4993896484375, -6.264892578125, -6.0303955078125, -5.7958984375, -5.5614013671875, -5.326904296875, -5.0924072265625, -4.85791015625, -4.6234130859375, -4.388916015625, -4.1544189453125, -3.919921875, -3.6854248046875, -3.450927734375, -3.2164306640625, -2.98193359375, -2.7474365234375, -2.512939453125, -2.2784423828125, -2.0439453125, -1.8094482421875, -1.574951171875, -1.3404541015625, -1.10595703125, -0.8714599609375, -0.636962890625, -0.4024658203125, -0.16796875, 0.0665283203125, 0.301025390625, 0.5355224609375, 0.77001953125, 1.0045166015625, 1.239013671875, 1.4735107421875, 1.7080078125, 1.9425048828125, 2.177001953125, 2.4114990234375, 2.64599609375, 2.8804931640625, 3.114990234375, 3.3494873046875, 3.583984375, 3.8184814453125, 4.052978515625, 4.2874755859375, 4.52197265625, 4.7564697265625, 4.990966796875, 5.2254638671875, 5.4599609375, 5.6944580078125, 5.928955078125, 6.1634521484375, 6.39794921875, 6.6324462890625, 6.866943359375, 7.1014404296875, 7.3359375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 10.0, 15.0, 13.0, 15.0, 21.0, 20.0, 35.0, 42.0, 56.0, 49.0, 55.0, 65.0, 61.0, 98.0, 55.0, 55.0, 54.0, 54.0, 42.0, 36.0, 31.0, 28.0, 18.0, 18.0, 14.0, 12.0, 10.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.20703125, -6.93597412109375, -6.6649169921875, -6.39385986328125, -6.122802734375, -5.85174560546875, -5.5806884765625, -5.30963134765625, -5.03857421875, -4.76751708984375, -4.4964599609375, -4.22540283203125, -3.954345703125, -3.68328857421875, -3.4122314453125, -3.14117431640625, -2.8701171875, -2.59906005859375, -2.3280029296875, -2.05694580078125, -1.785888671875, -1.51483154296875, -1.2437744140625, -0.97271728515625, -0.70166015625, -0.43060302734375, -0.1595458984375, 0.11151123046875, 0.382568359375, 0.65362548828125, 0.9246826171875, 1.19573974609375, 1.466796875, 1.73785400390625, 2.0089111328125, 2.27996826171875, 2.551025390625, 2.82208251953125, 3.0931396484375, 3.36419677734375, 3.63525390625, 3.90631103515625, 4.1773681640625, 4.44842529296875, 4.719482421875, 4.99053955078125, 5.2615966796875, 5.53265380859375, 5.8037109375, 6.07476806640625, 6.3458251953125, 6.61688232421875, 6.887939453125, 7.15899658203125, 7.4300537109375, 7.70111083984375, 7.97216796875, 8.24322509765625, 8.5142822265625, 8.78533935546875, 9.056396484375, 9.32745361328125, 9.5985107421875, 9.86956787109375, 10.140625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 2.0, 3.0, 3.0, 7.0, 6.0, 8.0, 12.0, 27.0, 20.0, 38.0, 92.0, 188.0, 533.0, 1951.0, 13122.0, 382638.0, 629544.0, 16986.0, 2259.0, 636.0, 230.0, 111.0, 45.0, 28.0, 21.0, 14.0, 10.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76171875, -4.629638671875, -4.49755859375, -4.365478515625, -4.2333984375, -4.101318359375, -3.96923828125, -3.837158203125, -3.705078125, -3.572998046875, -3.44091796875, -3.308837890625, -3.1767578125, -3.044677734375, -2.91259765625, -2.780517578125, -2.6484375, -2.516357421875, -2.38427734375, -2.252197265625, -2.1201171875, -1.988037109375, -1.85595703125, -1.723876953125, -1.591796875, -1.459716796875, -1.32763671875, -1.195556640625, -1.0634765625, -0.931396484375, -0.79931640625, -0.667236328125, -0.53515625, -0.403076171875, -0.27099609375, -0.138916015625, -0.0068359375, 0.125244140625, 0.25732421875, 0.389404296875, 0.521484375, 0.653564453125, 0.78564453125, 0.917724609375, 1.0498046875, 1.181884765625, 1.31396484375, 1.446044921875, 1.578125, 1.710205078125, 1.84228515625, 1.974365234375, 2.1064453125, 2.238525390625, 2.37060546875, 2.502685546875, 2.634765625, 2.766845703125, 2.89892578125, 3.031005859375, 3.1630859375, 3.295166015625, 3.42724609375, 3.559326171875, 3.69140625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 7.0, 7.0, 8.0, 13.0, 23.0, 17.0, 27.0, 34.0, 55.0, 71.0, 79.0, 105.0, 106.0, 84.0, 72.0, 81.0, 41.0, 45.0, 26.0, 28.0, 16.0, 10.0, 10.0, 11.0, 10.0, 5.0, 1.0, 2.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00035119056701660156, -0.00033744052052497864, -0.0003236904740333557, -0.0003099404275417328, -0.00029619038105010986, -0.00028244033455848694, -0.000268690288066864, -0.0002549402415752411, -0.00024119019508361816, -0.00022744014859199524, -0.00021369010210037231, -0.0001999400556087494, -0.00018619000911712646, -0.00017243996262550354, -0.00015868991613388062, -0.0001449398696422577, -0.00013118982315063477, -0.00011743977665901184, -0.00010368973016738892, -8.993968367576599e-05, -7.618963718414307e-05, -6.243959069252014e-05, -4.868954420089722e-05, -3.493949770927429e-05, -2.1189451217651367e-05, -7.439404726028442e-06, 6.310641765594482e-06, 2.0060688257217407e-05, 3.381073474884033e-05, 4.756078124046326e-05, 6.131082773208618e-05, 7.50608742237091e-05, 8.881092071533203e-05, 0.00010256096720695496, 0.00011631101369857788, 0.0001300610601902008, 0.00014381110668182373, 0.00015756115317344666, 0.00017131119966506958, 0.0001850612461566925, 0.00019881129264831543, 0.00021256133913993835, 0.00022631138563156128, 0.0002400614321231842, 0.00025381147861480713, 0.00026756152510643005, 0.000281311571598053, 0.0002950616180896759, 0.00030881166458129883, 0.00032256171107292175, 0.0003363117575645447, 0.0003500618040561676, 0.00036381185054779053, 0.00037756189703941345, 0.0003913119435310364, 0.0004050619900226593, 0.0004188120365142822, 0.00043256208300590515, 0.0004463121294975281, 0.000460062175989151, 0.0004738122224807739, 0.00048756226897239685, 0.0005013123154640198, 0.0005150623619556427, 0.0005288124084472656]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 6.0, 12.0, 11.0, 16.0, 41.0, 56.0, 100.0, 187.0, 367.0, 815.0, 2294.0, 9558.0, 98263.0, 827520.0, 96019.0, 9359.0, 2300.0, 817.0, 350.0, 177.0, 109.0, 61.0, 37.0, 24.0, 19.0, 13.0, 4.0, 4.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.787109375, -3.69122314453125, -3.5953369140625, -3.49945068359375, -3.403564453125, -3.30767822265625, -3.2117919921875, -3.11590576171875, -3.02001953125, -2.92413330078125, -2.8282470703125, -2.73236083984375, -2.636474609375, -2.54058837890625, -2.4447021484375, -2.34881591796875, -2.2529296875, -2.15704345703125, -2.0611572265625, -1.96527099609375, -1.869384765625, -1.77349853515625, -1.6776123046875, -1.58172607421875, -1.48583984375, -1.38995361328125, -1.2940673828125, -1.19818115234375, -1.102294921875, -1.00640869140625, -0.9105224609375, -0.81463623046875, -0.71875, -0.62286376953125, -0.5269775390625, -0.43109130859375, -0.335205078125, -0.23931884765625, -0.1434326171875, -0.04754638671875, 0.04833984375, 0.14422607421875, 0.2401123046875, 0.33599853515625, 0.431884765625, 0.52777099609375, 0.6236572265625, 0.71954345703125, 0.8154296875, 0.91131591796875, 1.0072021484375, 1.10308837890625, 1.198974609375, 1.29486083984375, 1.3907470703125, 1.48663330078125, 1.58251953125, 1.67840576171875, 1.7742919921875, 1.87017822265625, 1.966064453125, 2.06195068359375, 2.1578369140625, 2.25372314453125, 2.349609375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 6.0, 6.0, 11.0, 20.0, 32.0, 43.0, 60.0, 83.0, 129.0, 114.0, 146.0, 110.0, 93.0, 55.0, 32.0, 17.0, 9.0, 10.0, 6.0, 10.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.40625, -4.292633056640625, -4.17901611328125, -4.065399169921875, -3.9517822265625, -3.838165283203125, -3.72454833984375, -3.610931396484375, -3.497314453125, -3.383697509765625, -3.27008056640625, -3.156463623046875, -3.0428466796875, -2.929229736328125, -2.81561279296875, -2.701995849609375, -2.58837890625, -2.474761962890625, -2.36114501953125, -2.247528076171875, -2.1339111328125, -2.020294189453125, -1.90667724609375, -1.793060302734375, -1.679443359375, -1.565826416015625, -1.45220947265625, -1.338592529296875, -1.2249755859375, -1.111358642578125, -0.99774169921875, -0.884124755859375, -0.7705078125, -0.656890869140625, -0.54327392578125, -0.429656982421875, -0.3160400390625, -0.202423095703125, -0.08880615234375, 0.024810791015625, 0.138427734375, 0.252044677734375, 0.36566162109375, 0.479278564453125, 0.5928955078125, 0.706512451171875, 0.82012939453125, 0.933746337890625, 1.04736328125, 1.160980224609375, 1.27459716796875, 1.388214111328125, 1.5018310546875, 1.615447998046875, 1.72906494140625, 1.842681884765625, 1.956298828125, 2.069915771484375, 2.18353271484375, 2.297149658203125, 2.4107666015625, 2.524383544921875, 2.63800048828125, 2.751617431640625, 2.865234375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 23.0, 57.0, 180.0, 349.0, 246.0, 95.0, 29.0, 8.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.92223358154297, -72.48037719726562, -70.03852081298828, -67.59667205810547, -65.15481567382812, -62.71295928955078, -60.27110290527344, -57.829246520996094, -55.387393951416016, -52.94553756713867, -50.503684997558594, -48.06182861328125, -45.619972229003906, -43.17811965942383, -40.736263275146484, -38.294410705566406, -35.85255432128906, -33.41069793701172, -30.96884536743164, -28.526988983154297, -26.085134506225586, -23.643280029296875, -21.20142364501953, -18.75956916809082, -16.31771469116211, -13.875860214233398, -11.434004783630371, -8.992149353027344, -6.550294876098633, -4.108440399169922, -1.6665849685668945, 0.7752704620361328, 3.2171173095703125, 5.658972263336182, 8.10082721710205, 10.542682647705078, 12.984537124633789, 15.4263916015625, 17.868247985839844, 20.310102462768555, 22.751956939697266, 25.193811416625977, 27.635665893554688, 30.07752227783203, 32.519378662109375, 34.96123123168945, 37.4030876159668, 39.844940185546875, 42.28679656982422, 44.72865295410156, 47.17050552368164, 49.612361907958984, 52.05421447753906, 54.496070861816406, 56.93792724609375, 59.379783630371094, 61.82163619995117, 64.26348876953125, 66.7053451538086, 69.14720153808594, 71.58905792236328, 74.03091430664062, 76.47276306152344, 78.91461944580078, 81.35647583007812]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 10.0, 10.0, 8.0, 14.0, 20.0, 17.0, 23.0, 28.0, 31.0, 30.0, 31.0, 41.0, 58.0, 56.0, 68.0, 65.0, 75.0, 70.0, 54.0, 49.0, 40.0, 33.0, 22.0, 25.0, 22.0, 25.0, 19.0, 10.0, 8.0, 10.0, 11.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.30786895751953, -26.287111282348633, -25.266353607177734, -24.245595932006836, -23.224838256835938, -22.204082489013672, -21.183324813842773, -20.162567138671875, -19.141809463500977, -18.121051788330078, -17.10029411315918, -16.07953643798828, -15.0587797164917, -14.0380220413208, -13.017265319824219, -11.99650764465332, -10.975749969482422, -9.954992294311523, -8.934234619140625, -7.913477897644043, -6.8927202224731445, -5.871962547302246, -4.851205348968506, -3.8304481506347656, -2.809690475463867, -1.7889330387115479, -0.7681756019592285, 0.2525818347930908, 1.2733392715454102, 2.2940969467163086, 3.314854145050049, 4.335611343383789, 5.356372833251953, 6.377130508422852, 7.397887706756592, 8.418644905090332, 9.43940258026123, 10.460160255432129, 11.480916976928711, 12.50167465209961, 13.522432327270508, 14.543190002441406, 15.563947677612305, 16.584705352783203, 17.60546112060547, 18.626220703125, 19.646976470947266, 20.667734146118164, 21.688491821289062, 22.70924949645996, 23.73000717163086, 24.750764846801758, 25.771522521972656, 26.792278289794922, 27.81303596496582, 28.83379364013672, 29.854551315307617, 30.875308990478516, 31.896066665649414, 32.91682434082031, 33.93758010864258, 34.95833969116211, 35.979095458984375, 36.999855041503906, 38.02061080932617]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 9.0, 10.0, 14.0, 11.0, 17.0, 28.0, 51.0, 64.0, 138.0, 259.0, 547.0, 1268.0, 3530.0, 10761.0, 42709.0, 294387.0, 2893180.0, 840783.0, 79681.0, 18198.0, 5287.0, 1893.0, 733.0, 316.0, 166.0, 93.0, 43.0, 32.0, 20.0, 18.0, 17.0, 9.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3515625, -2.263458251953125, -2.17535400390625, -2.087249755859375, -1.9991455078125, -1.911041259765625, -1.82293701171875, -1.734832763671875, -1.646728515625, -1.558624267578125, -1.47052001953125, -1.382415771484375, -1.2943115234375, -1.206207275390625, -1.11810302734375, -1.029998779296875, -0.94189453125, -0.853790283203125, -0.76568603515625, -0.677581787109375, -0.5894775390625, -0.501373291015625, -0.41326904296875, -0.325164794921875, -0.237060546875, -0.148956298828125, -0.06085205078125, 0.027252197265625, 0.1153564453125, 0.203460693359375, 0.29156494140625, 0.379669189453125, 0.4677734375, 0.555877685546875, 0.64398193359375, 0.732086181640625, 0.8201904296875, 0.908294677734375, 0.99639892578125, 1.084503173828125, 1.172607421875, 1.260711669921875, 1.34881591796875, 1.436920166015625, 1.5250244140625, 1.613128662109375, 1.70123291015625, 1.789337158203125, 1.87744140625, 1.965545654296875, 2.05364990234375, 2.141754150390625, 2.2298583984375, 2.317962646484375, 2.40606689453125, 2.494171142578125, 2.582275390625, 2.670379638671875, 2.75848388671875, 2.846588134765625, 2.9346923828125, 3.022796630859375, 3.11090087890625, 3.199005126953125, 3.287109375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 7.0, 11.0, 11.0, 20.0, 27.0, 19.0, 36.0, 46.0, 55.0, 56.0, 76.0, 63.0, 56.0, 80.0, 71.0, 67.0, 65.0, 50.0, 39.0, 42.0, 29.0, 22.0, 18.0, 15.0, 15.0, 7.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.14453125, -2.077728271484375, -2.01092529296875, -1.944122314453125, -1.8773193359375, -1.810516357421875, -1.74371337890625, -1.676910400390625, -1.610107421875, -1.543304443359375, -1.47650146484375, -1.409698486328125, -1.3428955078125, -1.276092529296875, -1.20928955078125, -1.142486572265625, -1.07568359375, -1.008880615234375, -0.94207763671875, -0.875274658203125, -0.8084716796875, -0.741668701171875, -0.67486572265625, -0.608062744140625, -0.541259765625, -0.474456787109375, -0.40765380859375, -0.340850830078125, -0.2740478515625, -0.207244873046875, -0.14044189453125, -0.073638916015625, -0.0068359375, 0.059967041015625, 0.12677001953125, 0.193572998046875, 0.2603759765625, 0.327178955078125, 0.39398193359375, 0.460784912109375, 0.527587890625, 0.594390869140625, 0.66119384765625, 0.727996826171875, 0.7947998046875, 0.861602783203125, 0.92840576171875, 0.995208740234375, 1.06201171875, 1.128814697265625, 1.19561767578125, 1.262420654296875, 1.3292236328125, 1.396026611328125, 1.46282958984375, 1.529632568359375, 1.596435546875, 1.663238525390625, 1.73004150390625, 1.796844482421875, 1.8636474609375, 1.930450439453125, 1.99725341796875, 2.064056396484375, 2.130859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 6.0, 4.0, 5.0, 13.0, 12.0, 18.0, 34.0, 42.0, 65.0, 77.0, 132.0, 230.0, 414.0, 839.0, 1830.0, 5361.0, 17424.0, 70469.0, 548451.0, 3219698.0, 267841.0, 43897.0, 10951.0, 3511.0, 1391.0, 653.0, 347.0, 183.0, 139.0, 72.0, 50.0, 44.0, 19.0, 20.0, 13.0, 9.0, 1.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.21875, -3.109130859375, -2.99951171875, -2.889892578125, -2.7802734375, -2.670654296875, -2.56103515625, -2.451416015625, -2.341796875, -2.232177734375, -2.12255859375, -2.012939453125, -1.9033203125, -1.793701171875, -1.68408203125, -1.574462890625, -1.46484375, -1.355224609375, -1.24560546875, -1.135986328125, -1.0263671875, -0.916748046875, -0.80712890625, -0.697509765625, -0.587890625, -0.478271484375, -0.36865234375, -0.259033203125, -0.1494140625, -0.039794921875, 0.06982421875, 0.179443359375, 0.2890625, 0.398681640625, 0.50830078125, 0.617919921875, 0.7275390625, 0.837158203125, 0.94677734375, 1.056396484375, 1.166015625, 1.275634765625, 1.38525390625, 1.494873046875, 1.6044921875, 1.714111328125, 1.82373046875, 1.933349609375, 2.04296875, 2.152587890625, 2.26220703125, 2.371826171875, 2.4814453125, 2.591064453125, 2.70068359375, 2.810302734375, 2.919921875, 3.029541015625, 3.13916015625, 3.248779296875, 3.3583984375, 3.468017578125, 3.57763671875, 3.687255859375, 3.796875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 10.0, 14.0, 6.0, 20.0, 20.0, 31.0, 33.0, 50.0, 63.0, 116.0, 143.0, 252.0, 491.0, 746.0, 777.0, 515.0, 280.0, 150.0, 100.0, 80.0, 39.0, 43.0, 25.0, 18.0, 13.0, 9.0, 10.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0234375, -3.8895263671875, -3.755615234375, -3.6217041015625, -3.48779296875, -3.3538818359375, -3.219970703125, -3.0860595703125, -2.9521484375, -2.8182373046875, -2.684326171875, -2.5504150390625, -2.41650390625, -2.2825927734375, -2.148681640625, -2.0147705078125, -1.880859375, -1.7469482421875, -1.613037109375, -1.4791259765625, -1.34521484375, -1.2113037109375, -1.077392578125, -0.9434814453125, -0.8095703125, -0.6756591796875, -0.541748046875, -0.4078369140625, -0.27392578125, -0.1400146484375, -0.006103515625, 0.1278076171875, 0.26171875, 0.3956298828125, 0.529541015625, 0.6634521484375, 0.79736328125, 0.9312744140625, 1.065185546875, 1.1990966796875, 1.3330078125, 1.4669189453125, 1.600830078125, 1.7347412109375, 1.86865234375, 2.0025634765625, 2.136474609375, 2.2703857421875, 2.404296875, 2.5382080078125, 2.672119140625, 2.8060302734375, 2.93994140625, 3.0738525390625, 3.207763671875, 3.3416748046875, 3.4755859375, 3.6094970703125, 3.743408203125, 3.8773193359375, 4.01123046875, 4.1451416015625, 4.279052734375, 4.4129638671875, 4.546875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 3.0, 6.0, 6.0, 7.0, 16.0, 28.0, 78.0, 139.0, 183.0, 217.0, 146.0, 89.0, 39.0, 17.0, 8.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-51.05595397949219, -49.683258056640625, -48.31056213378906, -46.9378662109375, -45.56516647338867, -44.19247055053711, -42.81977462768555, -41.447078704833984, -40.074378967285156, -38.701683044433594, -37.32898712158203, -35.95629119873047, -34.58359146118164, -33.21089553833008, -31.838199615478516, -30.465503692626953, -29.09280776977539, -27.720111846923828, -26.347414016723633, -24.97471809387207, -23.602020263671875, -22.229324340820312, -20.85662841796875, -19.483932495117188, -18.111234664916992, -16.73853874206543, -15.365840911865234, -13.993144989013672, -12.620448112487793, -11.247751235961914, -9.875055313110352, -8.502358436584473, -7.129657745361328, -5.756960868835449, -4.3842644691467285, -3.011568069458008, -1.638871192932129, -0.26617431640625, 1.1065216064453125, 2.4792184829711914, 3.8519153594970703, 5.224612236022949, 6.59730863571167, 7.970005035400391, 9.34270191192627, 10.715398788452148, 12.088094711303711, 13.46079158782959, 14.833488464355469, 16.20618438720703, 17.578882217407227, 18.95157814025879, 20.324275970458984, 21.696971893310547, 23.06966781616211, 24.442363739013672, 25.815061569213867, 27.18775749206543, 28.560455322265625, 29.933151245117188, 31.30584716796875, 32.67854309082031, 34.051239013671875, 35.4239387512207, 36.796634674072266]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 5.0, 5.0, 6.0, 5.0, 9.0, 5.0, 10.0, 9.0, 15.0, 12.0, 23.0, 30.0, 18.0, 26.0, 28.0, 42.0, 36.0, 37.0, 40.0, 41.0, 40.0, 49.0, 42.0, 56.0, 54.0, 35.0, 49.0, 31.0, 35.0, 29.0, 19.0, 21.0, 30.0, 18.0, 16.0, 12.0, 9.0, 10.0, 13.0, 4.0, 8.0, 5.0, 2.0, 6.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-19.68364143371582, -19.091108322143555, -18.49857521057129, -17.906042098999023, -17.313507080078125, -16.72097396850586, -16.128440856933594, -15.535907745361328, -14.943374633789062, -14.350841522216797, -13.758308410644531, -13.16577434539795, -12.573241233825684, -11.980708122253418, -11.388174057006836, -10.79564094543457, -10.203107833862305, -9.610574722290039, -9.018041610717773, -8.425507545471191, -7.832974433898926, -7.24044132232666, -6.647907733917236, -6.0553741455078125, -5.462841033935547, -4.870307922363281, -4.277774333953857, -3.6852409839630127, -3.092707633972168, -2.5001742839813232, -1.9076409339904785, -1.3151073455810547, -0.7225723266601562, -0.13003897666931152, 0.4624943733215332, 1.055027723312378, 1.6475610733032227, 2.2400944232940674, 2.832627773284912, 3.425161361694336, 4.017694473266602, 4.610227584838867, 5.202761173248291, 5.795294761657715, 6.3878278732299805, 6.980360984802246, 7.57289457321167, 8.165428161621094, 8.75796127319336, 9.350494384765625, 9.94302749633789, 10.535561561584473, 11.128094673156738, 11.720627784729004, 12.313161849975586, 12.905694961547852, 13.498228073120117, 14.090761184692383, 14.683294296264648, 15.27582836151123, 15.868361473083496, 16.460895538330078, 17.053428649902344, 17.64596176147461, 18.238494873046875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 10.0, 11.0, 22.0, 26.0, 36.0, 74.0, 111.0, 143.0, 259.0, 422.0, 628.0, 1016.0, 1663.0, 2919.0, 4961.0, 8693.0, 14819.0, 25679.0, 43752.0, 74208.0, 123567.0, 188830.0, 204235.0, 142356.0, 86483.0, 51435.0, 29874.0, 17409.0, 10197.0, 5952.0, 3485.0, 2057.0, 1228.0, 745.0, 454.0, 271.0, 176.0, 115.0, 75.0, 55.0, 34.0, 24.0, 16.0, 11.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.59765625, -1.550872802734375, -1.50408935546875, -1.457305908203125, -1.4105224609375, -1.363739013671875, -1.31695556640625, -1.270172119140625, -1.223388671875, -1.176605224609375, -1.12982177734375, -1.083038330078125, -1.0362548828125, -0.989471435546875, -0.94268798828125, -0.895904541015625, -0.84912109375, -0.802337646484375, -0.75555419921875, -0.708770751953125, -0.6619873046875, -0.615203857421875, -0.56842041015625, -0.521636962890625, -0.474853515625, -0.428070068359375, -0.38128662109375, -0.334503173828125, -0.2877197265625, -0.240936279296875, -0.19415283203125, -0.147369384765625, -0.1005859375, -0.053802490234375, -0.00701904296875, 0.039764404296875, 0.0865478515625, 0.133331298828125, 0.18011474609375, 0.226898193359375, 0.273681640625, 0.320465087890625, 0.36724853515625, 0.414031982421875, 0.4608154296875, 0.507598876953125, 0.55438232421875, 0.601165771484375, 0.64794921875, 0.694732666015625, 0.74151611328125, 0.788299560546875, 0.8350830078125, 0.881866455078125, 0.92864990234375, 0.975433349609375, 1.022216796875, 1.069000244140625, 1.11578369140625, 1.162567138671875, 1.2093505859375, 1.256134033203125, 1.30291748046875, 1.349700927734375, 1.396484375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 6.0, 11.0, 9.0, 13.0, 16.0, 22.0, 35.0, 14.0, 19.0, 21.0, 34.0, 35.0, 38.0, 46.0, 44.0, 43.0, 45.0, 48.0, 45.0, 48.0, 39.0, 36.0, 39.0, 40.0, 26.0, 33.0, 21.0, 28.0, 25.0, 14.0, 18.0, 14.0, 15.0, 9.0, 12.0, 11.0, 5.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.068359375, -1.026885986328125, -0.98541259765625, -0.943939208984375, -0.9024658203125, -0.860992431640625, -0.81951904296875, -0.778045654296875, -0.736572265625, -0.695098876953125, -0.65362548828125, -0.612152099609375, -0.5706787109375, -0.529205322265625, -0.48773193359375, -0.446258544921875, -0.40478515625, -0.363311767578125, -0.32183837890625, -0.280364990234375, -0.2388916015625, -0.197418212890625, -0.15594482421875, -0.114471435546875, -0.072998046875, -0.031524658203125, 0.00994873046875, 0.051422119140625, 0.0928955078125, 0.134368896484375, 0.17584228515625, 0.217315673828125, 0.2587890625, 0.300262451171875, 0.34173583984375, 0.383209228515625, 0.4246826171875, 0.466156005859375, 0.50762939453125, 0.549102783203125, 0.590576171875, 0.632049560546875, 0.67352294921875, 0.714996337890625, 0.7564697265625, 0.797943115234375, 0.83941650390625, 0.880889892578125, 0.92236328125, 0.963836669921875, 1.00531005859375, 1.046783447265625, 1.0882568359375, 1.129730224609375, 1.17120361328125, 1.212677001953125, 1.254150390625, 1.295623779296875, 1.33709716796875, 1.378570556640625, 1.4200439453125, 1.461517333984375, 1.50299072265625, 1.544464111328125, 1.5859375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 10.0, 12.0, 15.0, 30.0, 50.0, 63.0, 85.0, 120.0, 182.0, 238.0, 451.0, 653.0, 1131.0, 2422.0, 6584.0, 30370.0, 243862.0, 663898.0, 78057.0, 12634.0, 3689.0, 1657.0, 854.0, 546.0, 303.0, 187.0, 138.0, 82.0, 64.0, 37.0, 34.0, 20.0, 14.0, 18.0, 12.0, 7.0, 3.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5546875, -5.38238525390625, -5.2100830078125, -5.03778076171875, -4.865478515625, -4.69317626953125, -4.5208740234375, -4.34857177734375, -4.17626953125, -4.00396728515625, -3.8316650390625, -3.65936279296875, -3.487060546875, -3.31475830078125, -3.1424560546875, -2.97015380859375, -2.7978515625, -2.62554931640625, -2.4532470703125, -2.28094482421875, -2.108642578125, -1.93634033203125, -1.7640380859375, -1.59173583984375, -1.41943359375, -1.24713134765625, -1.0748291015625, -0.90252685546875, -0.730224609375, -0.55792236328125, -0.3856201171875, -0.21331787109375, -0.041015625, 0.13128662109375, 0.3035888671875, 0.47589111328125, 0.648193359375, 0.82049560546875, 0.9927978515625, 1.16510009765625, 1.33740234375, 1.50970458984375, 1.6820068359375, 1.85430908203125, 2.026611328125, 2.19891357421875, 2.3712158203125, 2.54351806640625, 2.7158203125, 2.88812255859375, 3.0604248046875, 3.23272705078125, 3.405029296875, 3.57733154296875, 3.7496337890625, 3.92193603515625, 4.09423828125, 4.26654052734375, 4.4388427734375, 4.61114501953125, 4.783447265625, 4.95574951171875, 5.1280517578125, 5.30035400390625, 5.47265625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 9.0, 8.0, 16.0, 22.0, 11.0, 33.0, 25.0, 35.0, 34.0, 40.0, 40.0, 51.0, 51.0, 50.0, 57.0, 68.0, 52.0, 55.0, 52.0, 43.0, 42.0, 33.0, 32.0, 27.0, 23.0, 21.0, 13.0, 15.0, 13.0, 1.0, 7.0, 5.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.9091796875, -7.677734375, -7.4462890625, -7.21484375, -6.9833984375, -6.751953125, -6.5205078125, -6.2890625, -6.0576171875, -5.826171875, -5.5947265625, -5.36328125, -5.1318359375, -4.900390625, -4.6689453125, -4.4375, -4.2060546875, -3.974609375, -3.7431640625, -3.51171875, -3.2802734375, -3.048828125, -2.8173828125, -2.5859375, -2.3544921875, -2.123046875, -1.8916015625, -1.66015625, -1.4287109375, -1.197265625, -0.9658203125, -0.734375, -0.5029296875, -0.271484375, -0.0400390625, 0.19140625, 0.4228515625, 0.654296875, 0.8857421875, 1.1171875, 1.3486328125, 1.580078125, 1.8115234375, 2.04296875, 2.2744140625, 2.505859375, 2.7373046875, 2.96875, 3.2001953125, 3.431640625, 3.6630859375, 3.89453125, 4.1259765625, 4.357421875, 4.5888671875, 4.8203125, 5.0517578125, 5.283203125, 5.5146484375, 5.74609375, 5.9775390625, 6.208984375, 6.4404296875, 6.671875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 9.0, 9.0, 12.0, 24.0, 25.0, 47.0, 60.0, 115.0, 181.0, 390.0, 762.0, 1802.0, 4850.0, 16857.0, 154874.0, 803843.0, 49807.0, 9201.0, 3124.0, 1302.0, 574.0, 276.0, 149.0, 78.0, 55.0, 42.0, 29.0, 11.0, 17.0, 9.0, 7.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.263671875, -3.173736572265625, -3.08380126953125, -2.993865966796875, -2.9039306640625, -2.813995361328125, -2.72406005859375, -2.634124755859375, -2.544189453125, -2.454254150390625, -2.36431884765625, -2.274383544921875, -2.1844482421875, -2.094512939453125, -2.00457763671875, -1.914642333984375, -1.82470703125, -1.734771728515625, -1.64483642578125, -1.554901123046875, -1.4649658203125, -1.375030517578125, -1.28509521484375, -1.195159912109375, -1.105224609375, -1.015289306640625, -0.92535400390625, -0.835418701171875, -0.7454833984375, -0.655548095703125, -0.56561279296875, -0.475677490234375, -0.3857421875, -0.295806884765625, -0.20587158203125, -0.115936279296875, -0.0260009765625, 0.063934326171875, 0.15386962890625, 0.243804931640625, 0.333740234375, 0.423675537109375, 0.51361083984375, 0.603546142578125, 0.6934814453125, 0.783416748046875, 0.87335205078125, 0.963287353515625, 1.05322265625, 1.143157958984375, 1.23309326171875, 1.323028564453125, 1.4129638671875, 1.502899169921875, 1.59283447265625, 1.682769775390625, 1.772705078125, 1.862640380859375, 1.95257568359375, 2.042510986328125, 2.1324462890625, 2.222381591796875, 2.31231689453125, 2.402252197265625, 2.4921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 7.0, 3.0, 11.0, 15.0, 12.0, 34.0, 65.0, 78.0, 153.0, 209.0, 160.0, 99.0, 58.0, 24.0, 15.0, 13.0, 11.0, 9.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.001018524169921875, -0.0009897947311401367, -0.0009610652923583984, -0.0009323358535766602, -0.0009036064147949219, -0.0008748769760131836, -0.0008461475372314453, -0.000817418098449707, -0.0007886886596679688, -0.0007599592208862305, -0.0007312297821044922, -0.0007025003433227539, -0.0006737709045410156, -0.0006450414657592773, -0.0006163120269775391, -0.0005875825881958008, -0.0005588531494140625, -0.0005301237106323242, -0.0005013942718505859, -0.00047266483306884766, -0.0004439353942871094, -0.0004152059555053711, -0.0003864765167236328, -0.00035774707794189453, -0.00032901763916015625, -0.00030028820037841797, -0.0002715587615966797, -0.0002428293228149414, -0.00021409988403320312, -0.00018537044525146484, -0.00015664100646972656, -0.00012791156768798828, -9.918212890625e-05, -7.045269012451172e-05, -4.172325134277344e-05, -1.2993812561035156e-05, 1.5735626220703125e-05, 4.4465065002441406e-05, 7.319450378417969e-05, 0.00010192394256591797, 0.00013065338134765625, 0.00015938282012939453, 0.0001881122589111328, 0.0002168416976928711, 0.0002455711364746094, 0.00027430057525634766, 0.00030303001403808594, 0.0003317594528198242, 0.0003604888916015625, 0.0003892183303833008, 0.00041794776916503906, 0.00044667720794677734, 0.0004754066467285156, 0.0005041360855102539, 0.0005328655242919922, 0.0005615949630737305, 0.0005903244018554688, 0.000619053840637207, 0.0006477832794189453, 0.0006765127182006836, 0.0007052421569824219, 0.0007339715957641602, 0.0007627010345458984, 0.0007914304733276367, 0.000820159912109375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 9.0, 18.0, 14.0, 33.0, 63.0, 83.0, 201.0, 462.0, 1283.0, 4017.0, 17955.0, 660463.0, 343783.0, 14733.0, 3425.0, 1168.0, 430.0, 195.0, 88.0, 40.0, 28.0, 19.0, 13.0, 10.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.638671875, -3.517181396484375, -3.39569091796875, -3.274200439453125, -3.1527099609375, -3.031219482421875, -2.90972900390625, -2.788238525390625, -2.666748046875, -2.545257568359375, -2.42376708984375, -2.302276611328125, -2.1807861328125, -2.059295654296875, -1.93780517578125, -1.816314697265625, -1.69482421875, -1.573333740234375, -1.45184326171875, -1.330352783203125, -1.2088623046875, -1.087371826171875, -0.96588134765625, -0.844390869140625, -0.722900390625, -0.601409912109375, -0.47991943359375, -0.358428955078125, -0.2369384765625, -0.115447998046875, 0.00604248046875, 0.127532958984375, 0.2490234375, 0.370513916015625, 0.49200439453125, 0.613494873046875, 0.7349853515625, 0.856475830078125, 0.97796630859375, 1.099456787109375, 1.220947265625, 1.342437744140625, 1.46392822265625, 1.585418701171875, 1.7069091796875, 1.828399658203125, 1.94989013671875, 2.071380615234375, 2.19287109375, 2.314361572265625, 2.43585205078125, 2.557342529296875, 2.6788330078125, 2.800323486328125, 2.92181396484375, 3.043304443359375, 3.164794921875, 3.286285400390625, 3.40777587890625, 3.529266357421875, 3.6507568359375, 3.772247314453125, 3.89373779296875, 4.015228271484375, 4.13671875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 7.0, 12.0, 15.0, 22.0, 19.0, 43.0, 48.0, 72.0, 85.0, 102.0, 100.0, 106.0, 89.0, 64.0, 57.0, 38.0, 23.0, 26.0, 17.0, 14.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.205078125, -2.130859375, -2.056640625, -1.982421875, -1.908203125, -1.833984375, -1.759765625, -1.685546875, -1.611328125, -1.537109375, -1.462890625, -1.388671875, -1.314453125, -1.240234375, -1.166015625, -1.091796875, -1.017578125, -0.943359375, -0.869140625, -0.794921875, -0.720703125, -0.646484375, -0.572265625, -0.498046875, -0.423828125, -0.349609375, -0.275390625, -0.201171875, -0.126953125, -0.052734375, 0.021484375, 0.095703125, 0.169921875, 0.244140625, 0.318359375, 0.392578125, 0.466796875, 0.541015625, 0.615234375, 0.689453125, 0.763671875, 0.837890625, 0.912109375, 0.986328125, 1.060546875, 1.134765625, 1.208984375, 1.283203125, 1.357421875, 1.431640625, 1.505859375, 1.580078125, 1.654296875, 1.728515625, 1.802734375, 1.876953125, 1.951171875, 2.025390625, 2.099609375, 2.173828125, 2.248046875, 2.322265625, 2.396484375, 2.470703125, 2.544921875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 26.0, 71.0, 161.0, 374.0, 226.0, 83.0, 29.0, 16.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.24414825439453, -56.93902587890625, -54.633907318115234, -52.32878494262695, -50.02366638183594, -47.718544006347656, -45.413421630859375, -43.108299255371094, -40.80318069458008, -38.4980583190918, -36.19293975830078, -33.8878173828125, -31.58269691467285, -29.277576446533203, -26.972454071044922, -24.667333602905273, -22.362213134765625, -20.057092666625977, -17.751972198486328, -15.446849822998047, -13.141729354858398, -10.83660888671875, -8.531487464904785, -6.22636604309082, -3.921245574951172, -1.6161246299743652, 0.6889963150024414, 2.994117259979248, 5.299238204956055, 7.604358673095703, 9.909480094909668, 12.214601516723633, 14.519729614257812, 16.82485008239746, 19.12997055053711, 21.43509292602539, 23.74021339416504, 26.045333862304688, 28.35045623779297, 30.655576705932617, 32.960697174072266, 35.26581954956055, 37.57093811035156, 39.876060485839844, 42.181182861328125, 44.48630142211914, 46.79142379760742, 49.09654235839844, 51.40166473388672, 53.706787109375, 56.011905670166016, 58.3170280456543, 60.62214660644531, 62.927268981933594, 65.23239135742188, 67.53751373291016, 69.84263610839844, 72.14775848388672, 74.452880859375, 76.75799560546875, 79.06311798095703, 81.36824035644531, 83.6733627319336, 85.97848510742188, 88.28359985351562]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 9.0, 9.0, 3.0, 4.0, 10.0, 9.0, 14.0, 20.0, 21.0, 30.0, 23.0, 27.0, 28.0, 29.0, 31.0, 44.0, 50.0, 41.0, 67.0, 79.0, 68.0, 51.0, 42.0, 37.0, 29.0, 28.0, 26.0, 23.0, 23.0, 22.0, 19.0, 9.0, 12.0, 11.0, 9.0, 9.0, 9.0, 4.0, 2.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.85352325439453, -22.10639190673828, -21.35926055908203, -20.61212730407715, -19.8649959564209, -19.11786460876465, -18.370731353759766, -17.623600006103516, -16.876468658447266, -16.129337310791016, -15.38220500946045, -14.635072708129883, -13.887941360473633, -13.140810012817383, -12.393677711486816, -11.64654541015625, -10.8994140625, -10.15228271484375, -9.405150413513184, -8.658018112182617, -7.910886764526367, -7.163754940032959, -6.416623115539551, -5.669491291046143, -4.922359466552734, -4.175227642059326, -3.428095817565918, -2.6809639930725098, -1.9338321685791016, -1.1867003440856934, -0.43956851959228516, 0.30756330490112305, 1.0546932220458984, 1.8018250465393066, 2.548956871032715, 3.296088695526123, 4.043220520019531, 4.7903523445129395, 5.537484169006348, 6.284615993499756, 7.031747817993164, 7.778879642486572, 8.52601146697998, 9.273143768310547, 10.020275115966797, 10.767406463623047, 11.514538764953613, 12.26167106628418, 13.00880241394043, 13.75593376159668, 14.503066062927246, 15.250198364257812, 15.997329711914062, 16.744461059570312, 17.491592407226562, 18.238725662231445, 18.985857009887695, 19.732988357543945, 20.480121612548828, 21.227252960205078, 21.974384307861328, 22.721515655517578, 23.468647003173828, 24.21578025817871, 24.96291160583496]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 12.0, 11.0, 16.0, 27.0, 42.0, 63.0, 93.0, 129.0, 208.0, 409.0, 628.0, 1239.0, 2510.0, 4965.0, 12495.0, 36458.0, 157138.0, 1032011.0, 2317199.0, 499719.0, 87865.0, 24205.0, 8800.0, 3898.0, 1877.0, 963.0, 513.0, 296.0, 148.0, 107.0, 80.0, 50.0, 29.0, 27.0, 13.0, 9.0, 6.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-2.171875, -2.1151885986328125, -2.058502197265625, -2.0018157958984375, -1.94512939453125, -1.8884429931640625, -1.831756591796875, -1.7750701904296875, -1.7183837890625, -1.6616973876953125, -1.605010986328125, -1.5483245849609375, -1.49163818359375, -1.4349517822265625, -1.378265380859375, -1.3215789794921875, -1.264892578125, -1.2082061767578125, -1.151519775390625, -1.0948333740234375, -1.03814697265625, -0.9814605712890625, -0.924774169921875, -0.8680877685546875, -0.8114013671875, -0.7547149658203125, -0.698028564453125, -0.6413421630859375, -0.58465576171875, -0.5279693603515625, -0.471282958984375, -0.4145965576171875, -0.35791015625, -0.3012237548828125, -0.244537353515625, -0.1878509521484375, -0.13116455078125, -0.0744781494140625, -0.017791748046875, 0.0388946533203125, 0.0955810546875, 0.1522674560546875, 0.208953857421875, 0.2656402587890625, 0.32232666015625, 0.3790130615234375, 0.435699462890625, 0.4923858642578125, 0.549072265625, 0.6057586669921875, 0.662445068359375, 0.7191314697265625, 0.77581787109375, 0.8325042724609375, 0.889190673828125, 0.9458770751953125, 1.0025634765625, 1.0592498779296875, 1.115936279296875, 1.1726226806640625, 1.22930908203125, 1.2859954833984375, 1.342681884765625, 1.3993682861328125, 1.4560546875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 6.0, 9.0, 6.0, 9.0, 8.0, 9.0, 17.0, 13.0, 22.0, 19.0, 24.0, 25.0, 39.0, 24.0, 31.0, 43.0, 40.0, 35.0, 42.0, 56.0, 37.0, 46.0, 32.0, 39.0, 49.0, 36.0, 35.0, 36.0, 29.0, 33.0, 17.0, 20.0, 19.0, 15.0, 20.0, 17.0, 7.0, 10.0, 3.0, 9.0, 8.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.29296875, -1.25457763671875, -1.2161865234375, -1.17779541015625, -1.139404296875, -1.10101318359375, -1.0626220703125, -1.02423095703125, -0.98583984375, -0.94744873046875, -0.9090576171875, -0.87066650390625, -0.832275390625, -0.79388427734375, -0.7554931640625, -0.71710205078125, -0.6787109375, -0.64031982421875, -0.6019287109375, -0.56353759765625, -0.525146484375, -0.48675537109375, -0.4483642578125, -0.40997314453125, -0.37158203125, -0.33319091796875, -0.2947998046875, -0.25640869140625, -0.218017578125, -0.17962646484375, -0.1412353515625, -0.10284423828125, -0.064453125, -0.02606201171875, 0.0123291015625, 0.05072021484375, 0.089111328125, 0.12750244140625, 0.1658935546875, 0.20428466796875, 0.24267578125, 0.28106689453125, 0.3194580078125, 0.35784912109375, 0.396240234375, 0.43463134765625, 0.4730224609375, 0.51141357421875, 0.5498046875, 0.58819580078125, 0.6265869140625, 0.66497802734375, 0.703369140625, 0.74176025390625, 0.7801513671875, 0.81854248046875, 0.85693359375, 0.89532470703125, 0.9337158203125, 0.97210693359375, 1.010498046875, 1.04888916015625, 1.0872802734375, 1.12567138671875, 1.1640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 9.0, 6.0, 6.0, 11.0, 21.0, 18.0, 34.0, 64.0, 88.0, 148.0, 217.0, 521.0, 1325.0, 4517.0, 25546.0, 315492.0, 3627223.0, 193021.0, 19952.0, 3876.0, 1173.0, 458.0, 217.0, 127.0, 82.0, 49.0, 40.0, 15.0, 18.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.7265625, -5.58489990234375, -5.4432373046875, -5.30157470703125, -5.159912109375, -5.01824951171875, -4.8765869140625, -4.73492431640625, -4.59326171875, -4.45159912109375, -4.3099365234375, -4.16827392578125, -4.026611328125, -3.88494873046875, -3.7432861328125, -3.60162353515625, -3.4599609375, -3.31829833984375, -3.1766357421875, -3.03497314453125, -2.893310546875, -2.75164794921875, -2.6099853515625, -2.46832275390625, -2.32666015625, -2.18499755859375, -2.0433349609375, -1.90167236328125, -1.760009765625, -1.61834716796875, -1.4766845703125, -1.33502197265625, -1.193359375, -1.05169677734375, -0.9100341796875, -0.76837158203125, -0.626708984375, -0.48504638671875, -0.3433837890625, -0.20172119140625, -0.06005859375, 0.08160400390625, 0.2232666015625, 0.36492919921875, 0.506591796875, 0.64825439453125, 0.7899169921875, 0.93157958984375, 1.0732421875, 1.21490478515625, 1.3565673828125, 1.49822998046875, 1.639892578125, 1.78155517578125, 1.9232177734375, 2.06488037109375, 2.20654296875, 2.34820556640625, 2.4898681640625, 2.63153076171875, 2.773193359375, 2.91485595703125, 3.0565185546875, 3.19818115234375, 3.33984375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 8.0, 13.0, 11.0, 14.0, 19.0, 26.0, 35.0, 55.0, 75.0, 94.0, 135.0, 207.0, 352.0, 496.0, 643.0, 574.0, 433.0, 269.0, 184.0, 117.0, 75.0, 63.0, 34.0, 33.0, 18.0, 22.0, 12.0, 15.0, 8.0, 6.0, 5.0, 2.0, 9.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0], "bins": [-3.625, -3.52899169921875, -3.4329833984375, -3.33697509765625, -3.240966796875, -3.14495849609375, -3.0489501953125, -2.95294189453125, -2.85693359375, -2.76092529296875, -2.6649169921875, -2.56890869140625, -2.472900390625, -2.37689208984375, -2.2808837890625, -2.18487548828125, -2.0888671875, -1.99285888671875, -1.8968505859375, -1.80084228515625, -1.704833984375, -1.60882568359375, -1.5128173828125, -1.41680908203125, -1.32080078125, -1.22479248046875, -1.1287841796875, -1.03277587890625, -0.936767578125, -0.84075927734375, -0.7447509765625, -0.64874267578125, -0.552734375, -0.45672607421875, -0.3607177734375, -0.26470947265625, -0.168701171875, -0.07269287109375, 0.0233154296875, 0.11932373046875, 0.21533203125, 0.31134033203125, 0.4073486328125, 0.50335693359375, 0.599365234375, 0.69537353515625, 0.7913818359375, 0.88739013671875, 0.9833984375, 1.07940673828125, 1.1754150390625, 1.27142333984375, 1.367431640625, 1.46343994140625, 1.5594482421875, 1.65545654296875, 1.75146484375, 1.84747314453125, 1.9434814453125, 2.03948974609375, 2.135498046875, 2.23150634765625, 2.3275146484375, 2.42352294921875, 2.51953125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 13.0, 16.0, 40.0, 80.0, 194.0, 258.0, 225.0, 100.0, 47.0, 16.0, 8.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.52568817138672, -38.99300003051758, -37.46031188964844, -35.9276237487793, -34.394935607910156, -32.86225128173828, -31.32956314086914, -29.796875, -28.26418685913086, -26.73149871826172, -25.198810577392578, -23.66612434387207, -22.13343620300293, -20.60074806213379, -19.06806182861328, -17.53537368774414, -16.002685546875, -14.46999740600586, -12.937310218811035, -11.404623031616211, -9.87193489074707, -8.33924674987793, -6.8065595626831055, -5.273872375488281, -3.7411842346191406, -2.208496570587158, -0.6758089065551758, 0.8568787574768066, 2.389566421508789, 3.9222540855407715, 5.454941749572754, 6.987628936767578, 8.520317077636719, 10.05300521850586, 11.585692405700684, 13.118379592895508, 14.651067733764648, 16.18375587463379, 17.716442108154297, 19.249130249023438, 20.781818389892578, 22.31450653076172, 23.84719467163086, 25.379880905151367, 26.912569046020508, 28.44525718688965, 29.977943420410156, 31.510631561279297, 33.04331970214844, 34.57600784301758, 36.10869598388672, 37.64138412475586, 39.174072265625, 40.706756591796875, 42.239444732666016, 43.772132873535156, 45.3048210144043, 46.83750915527344, 48.37019729614258, 49.90288543701172, 51.435569763183594, 52.968257904052734, 54.500946044921875, 56.033634185791016, 57.566322326660156]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 8.0, 9.0, 4.0, 4.0, 11.0, 11.0, 15.0, 21.0, 16.0, 27.0, 19.0, 28.0, 35.0, 34.0, 42.0, 39.0, 37.0, 45.0, 55.0, 43.0, 57.0, 34.0, 47.0, 46.0, 37.0, 28.0, 33.0, 32.0, 23.0, 19.0, 14.0, 20.0, 20.0, 24.0, 14.0, 10.0, 7.0, 8.0, 4.0, 5.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.267934799194336, -13.815223693847656, -13.362512588500977, -12.909801483154297, -12.4570894241333, -12.004378318786621, -11.551667213439941, -11.098956108093262, -10.646244049072266, -10.193532943725586, -9.740821838378906, -9.288110733032227, -8.83539867401123, -8.38268756866455, -7.929976463317871, -7.477265357971191, -7.024554252624512, -6.571843147277832, -6.119131565093994, -5.6664204597473145, -5.213708877563477, -4.760997772216797, -4.308286666870117, -3.8555753231048584, -3.4028639793395996, -2.950152635574341, -2.497441291809082, -2.0447301864624023, -1.5920188426971436, -1.1393074989318848, -0.6865963935852051, -0.2338850498199463, 0.2188262939453125, 0.6715375781059265, 1.1242488622665405, 1.5769600868225098, 2.0296714305877686, 2.4823827743530273, 2.935093879699707, 3.387805223464966, 3.8405165672302246, 4.293227672576904, 4.745939254760742, 5.198650360107422, 5.651361465454102, 6.1040730476379395, 6.556784152984619, 7.009495735168457, 7.462206840515137, 7.914917945861816, 8.367629051208496, 8.820341110229492, 9.273052215576172, 9.725763320922852, 10.178474426269531, 10.631185531616211, 11.08389663696289, 11.53660774230957, 11.98931884765625, 12.44202995300293, 12.894742012023926, 13.347453117370605, 13.800164222717285, 14.252875328063965, 14.705587387084961]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 6.0, 6.0, 6.0, 7.0, 11.0, 17.0, 29.0, 29.0, 40.0, 67.0, 76.0, 125.0, 192.0, 327.0, 434.0, 651.0, 1035.0, 1629.0, 2582.0, 4115.0, 6663.0, 10919.0, 18572.0, 31107.0, 53342.0, 89883.0, 148838.0, 209744.0, 182234.0, 115606.0, 69208.0, 40442.0, 23905.0, 14068.0, 8531.0, 5099.0, 3252.0, 1948.0, 1314.0, 882.0, 532.0, 342.0, 240.0, 134.0, 129.0, 82.0, 43.0, 41.0, 28.0, 23.0, 16.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4541015625, -1.40521240234375, -1.3563232421875, -1.30743408203125, -1.258544921875, -1.20965576171875, -1.1607666015625, -1.11187744140625, -1.06298828125, -1.01409912109375, -0.9652099609375, -0.91632080078125, -0.867431640625, -0.81854248046875, -0.7696533203125, -0.72076416015625, -0.671875, -0.62298583984375, -0.5740966796875, -0.52520751953125, -0.476318359375, -0.42742919921875, -0.3785400390625, -0.32965087890625, -0.28076171875, -0.23187255859375, -0.1829833984375, -0.13409423828125, -0.085205078125, -0.03631591796875, 0.0125732421875, 0.06146240234375, 0.1103515625, 0.15924072265625, 0.2081298828125, 0.25701904296875, 0.305908203125, 0.35479736328125, 0.4036865234375, 0.45257568359375, 0.50146484375, 0.55035400390625, 0.5992431640625, 0.64813232421875, 0.697021484375, 0.74591064453125, 0.7947998046875, 0.84368896484375, 0.892578125, 0.94146728515625, 0.9903564453125, 1.03924560546875, 1.088134765625, 1.13702392578125, 1.1859130859375, 1.23480224609375, 1.28369140625, 1.33258056640625, 1.3814697265625, 1.43035888671875, 1.479248046875, 1.52813720703125, 1.5770263671875, 1.62591552734375, 1.6748046875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 3.0, 4.0, 6.0, 7.0, 9.0, 11.0, 13.0, 18.0, 26.0, 15.0, 14.0, 25.0, 27.0, 37.0, 36.0, 44.0, 49.0, 50.0, 36.0, 46.0, 37.0, 40.0, 52.0, 35.0, 36.0, 34.0, 46.0, 32.0, 31.0, 32.0, 17.0, 18.0, 18.0, 12.0, 14.0, 20.0, 10.0, 7.0, 11.0, 5.0, 5.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.171875, -1.132354736328125, -1.09283447265625, -1.053314208984375, -1.0137939453125, -0.974273681640625, -0.93475341796875, -0.895233154296875, -0.855712890625, -0.816192626953125, -0.77667236328125, -0.737152099609375, -0.6976318359375, -0.658111572265625, -0.61859130859375, -0.579071044921875, -0.53955078125, -0.500030517578125, -0.46051025390625, -0.420989990234375, -0.3814697265625, -0.341949462890625, -0.30242919921875, -0.262908935546875, -0.223388671875, -0.183868408203125, -0.14434814453125, -0.104827880859375, -0.0653076171875, -0.025787353515625, 0.01373291015625, 0.053253173828125, 0.0927734375, 0.132293701171875, 0.17181396484375, 0.211334228515625, 0.2508544921875, 0.290374755859375, 0.32989501953125, 0.369415283203125, 0.408935546875, 0.448455810546875, 0.48797607421875, 0.527496337890625, 0.5670166015625, 0.606536865234375, 0.64605712890625, 0.685577392578125, 0.72509765625, 0.764617919921875, 0.80413818359375, 0.843658447265625, 0.8831787109375, 0.922698974609375, 0.96221923828125, 1.001739501953125, 1.041259765625, 1.080780029296875, 1.12030029296875, 1.159820556640625, 1.1993408203125, 1.238861083984375, 1.27838134765625, 1.317901611328125, 1.357421875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 11.0, 10.0, 24.0, 14.0, 28.0, 41.0, 58.0, 105.0, 135.0, 243.0, 344.0, 563.0, 1048.0, 2069.0, 5388.0, 21434.0, 141198.0, 712288.0, 133076.0, 20659.0, 5258.0, 2025.0, 994.0, 522.0, 351.0, 217.0, 146.0, 82.0, 56.0, 54.0, 33.0, 20.0, 22.0, 13.0, 9.0, 2.0, 2.0, 7.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.90625, -5.7349853515625, -5.563720703125, -5.3924560546875, -5.22119140625, -5.0499267578125, -4.878662109375, -4.7073974609375, -4.5361328125, -4.3648681640625, -4.193603515625, -4.0223388671875, -3.85107421875, -3.6798095703125, -3.508544921875, -3.3372802734375, -3.166015625, -2.9947509765625, -2.823486328125, -2.6522216796875, -2.48095703125, -2.3096923828125, -2.138427734375, -1.9671630859375, -1.7958984375, -1.6246337890625, -1.453369140625, -1.2821044921875, -1.11083984375, -0.9395751953125, -0.768310546875, -0.5970458984375, -0.42578125, -0.2545166015625, -0.083251953125, 0.0880126953125, 0.25927734375, 0.4305419921875, 0.601806640625, 0.7730712890625, 0.9443359375, 1.1156005859375, 1.286865234375, 1.4581298828125, 1.62939453125, 1.8006591796875, 1.971923828125, 2.1431884765625, 2.314453125, 2.4857177734375, 2.656982421875, 2.8282470703125, 2.99951171875, 3.1707763671875, 3.342041015625, 3.5133056640625, 3.6845703125, 3.8558349609375, 4.027099609375, 4.1983642578125, 4.36962890625, 4.5408935546875, 4.712158203125, 4.8834228515625, 5.0546875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 8.0, 6.0, 7.0, 7.0, 17.0, 9.0, 11.0, 14.0, 25.0, 18.0, 32.0, 37.0, 41.0, 41.0, 46.0, 52.0, 55.0, 43.0, 48.0, 51.0, 58.0, 44.0, 43.0, 50.0, 37.0, 46.0, 36.0, 27.0, 21.0, 11.0, 17.0, 11.0, 10.0, 10.0, 5.0, 4.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78125, -5.60400390625, -5.4267578125, -5.24951171875, -5.072265625, -4.89501953125, -4.7177734375, -4.54052734375, -4.36328125, -4.18603515625, -4.0087890625, -3.83154296875, -3.654296875, -3.47705078125, -3.2998046875, -3.12255859375, -2.9453125, -2.76806640625, -2.5908203125, -2.41357421875, -2.236328125, -2.05908203125, -1.8818359375, -1.70458984375, -1.52734375, -1.35009765625, -1.1728515625, -0.99560546875, -0.818359375, -0.64111328125, -0.4638671875, -0.28662109375, -0.109375, 0.06787109375, 0.2451171875, 0.42236328125, 0.599609375, 0.77685546875, 0.9541015625, 1.13134765625, 1.30859375, 1.48583984375, 1.6630859375, 1.84033203125, 2.017578125, 2.19482421875, 2.3720703125, 2.54931640625, 2.7265625, 2.90380859375, 3.0810546875, 3.25830078125, 3.435546875, 3.61279296875, 3.7900390625, 3.96728515625, 4.14453125, 4.32177734375, 4.4990234375, 4.67626953125, 4.853515625, 5.03076171875, 5.2080078125, 5.38525390625, 5.5625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 5.0, 12.0, 16.0, 22.0, 24.0, 47.0, 88.0, 126.0, 204.0, 397.0, 705.0, 1426.0, 2873.0, 6676.0, 17765.0, 64486.0, 337850.0, 511276.0, 72276.0, 18915.0, 7167.0, 3024.0, 1390.0, 765.0, 416.0, 216.0, 126.0, 94.0, 48.0, 30.0, 26.0, 13.0, 15.0, 3.0, 3.0, 10.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7587890625, -1.708587646484375, -1.65838623046875, -1.608184814453125, -1.5579833984375, -1.507781982421875, -1.45758056640625, -1.407379150390625, -1.357177734375, -1.306976318359375, -1.25677490234375, -1.206573486328125, -1.1563720703125, -1.106170654296875, -1.05596923828125, -1.005767822265625, -0.95556640625, -0.905364990234375, -0.85516357421875, -0.804962158203125, -0.7547607421875, -0.704559326171875, -0.65435791015625, -0.604156494140625, -0.553955078125, -0.503753662109375, -0.45355224609375, -0.403350830078125, -0.3531494140625, -0.302947998046875, -0.25274658203125, -0.202545166015625, -0.15234375, -0.102142333984375, -0.05194091796875, -0.001739501953125, 0.0484619140625, 0.098663330078125, 0.14886474609375, 0.199066162109375, 0.249267578125, 0.299468994140625, 0.34967041015625, 0.399871826171875, 0.4500732421875, 0.500274658203125, 0.55047607421875, 0.600677490234375, 0.65087890625, 0.701080322265625, 0.75128173828125, 0.801483154296875, 0.8516845703125, 0.901885986328125, 0.95208740234375, 1.002288818359375, 1.052490234375, 1.102691650390625, 1.15289306640625, 1.203094482421875, 1.2532958984375, 1.303497314453125, 1.35369873046875, 1.403900146484375, 1.4541015625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 12.0, 5.0, 14.0, 24.0, 32.0, 41.0, 72.0, 69.0, 133.0, 126.0, 124.0, 94.0, 62.0, 47.0, 33.0, 20.0, 15.0, 11.0, 11.0, 9.0, 5.0, 9.0, 0.0, 3.0, 7.0, 1.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0007138252258300781, -0.0006913244724273682, -0.0006688237190246582, -0.0006463229656219482, -0.0006238222122192383, -0.0006013214588165283, -0.0005788207054138184, -0.0005563199520111084, -0.0005338191986083984, -0.0005113184452056885, -0.0004888176918029785, -0.00046631693840026855, -0.0004438161849975586, -0.00042131543159484863, -0.00039881467819213867, -0.0003763139247894287, -0.00035381317138671875, -0.0003313124179840088, -0.00030881166458129883, -0.00028631091117858887, -0.0002638101577758789, -0.00024130940437316895, -0.00021880865097045898, -0.00019630789756774902, -0.00017380714416503906, -0.0001513063907623291, -0.00012880563735961914, -0.00010630488395690918, -8.380413055419922e-05, -6.130337715148926e-05, -3.88026237487793e-05, -1.6301870346069336e-05, 6.198883056640625e-06, 2.8699636459350586e-05, 5.120038986206055e-05, 7.370114326477051e-05, 9.620189666748047e-05, 0.00011870265007019043, 0.0001412034034729004, 0.00016370415687561035, 0.0001862049102783203, 0.00020870566368103027, 0.00023120641708374023, 0.0002537071704864502, 0.00027620792388916016, 0.0002987086772918701, 0.0003212094306945801, 0.00034371018409729004, 0.0003662109375, 0.00038871169090270996, 0.0004112124443054199, 0.0004337131977081299, 0.00045621395111083984, 0.0004787147045135498, 0.0005012154579162598, 0.0005237162113189697, 0.0005462169647216797, 0.0005687177181243896, 0.0005912184715270996, 0.0006137192249298096, 0.0006362199783325195, 0.0006587207317352295, 0.0006812214851379395, 0.0007037222385406494, 0.0007262229919433594]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 6.0, 9.0, 9.0, 12.0, 21.0, 17.0, 35.0, 51.0, 72.0, 128.0, 208.0, 342.0, 590.0, 1139.0, 2556.0, 6649.0, 20329.0, 97238.0, 646836.0, 217831.0, 37030.0, 10167.0, 3763.0, 1714.0, 740.0, 416.0, 222.0, 132.0, 92.0, 61.0, 44.0, 27.0, 19.0, 18.0, 9.0, 7.0, 2.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5048828125, -1.4524688720703125, -1.400054931640625, -1.3476409912109375, -1.29522705078125, -1.2428131103515625, -1.190399169921875, -1.1379852294921875, -1.0855712890625, -1.0331573486328125, -0.980743408203125, -0.9283294677734375, -0.87591552734375, -0.8235015869140625, -0.771087646484375, -0.7186737060546875, -0.666259765625, -0.6138458251953125, -0.561431884765625, -0.5090179443359375, -0.45660400390625, -0.4041900634765625, -0.351776123046875, -0.2993621826171875, -0.2469482421875, -0.1945343017578125, -0.142120361328125, -0.0897064208984375, -0.03729248046875, 0.0151214599609375, 0.067535400390625, 0.1199493408203125, 0.17236328125, 0.2247772216796875, 0.277191162109375, 0.3296051025390625, 0.38201904296875, 0.4344329833984375, 0.486846923828125, 0.5392608642578125, 0.5916748046875, 0.6440887451171875, 0.696502685546875, 0.7489166259765625, 0.80133056640625, 0.8537445068359375, 0.906158447265625, 0.9585723876953125, 1.010986328125, 1.0634002685546875, 1.115814208984375, 1.1682281494140625, 1.22064208984375, 1.2730560302734375, 1.325469970703125, 1.3778839111328125, 1.4302978515625, 1.4827117919921875, 1.535125732421875, 1.5875396728515625, 1.63995361328125, 1.6923675537109375, 1.744781494140625, 1.7971954345703125, 1.849609375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 9.0, 7.0, 10.0, 6.0, 4.0, 11.0, 18.0, 21.0, 19.0, 21.0, 29.0, 35.0, 36.0, 37.0, 47.0, 52.0, 61.0, 49.0, 64.0, 60.0, 55.0, 61.0, 52.0, 38.0, 48.0, 32.0, 17.0, 22.0, 20.0, 19.0, 3.0, 3.0, 6.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0], "bins": [-1.4814453125, -1.440399169921875, -1.39935302734375, -1.358306884765625, -1.3172607421875, -1.276214599609375, -1.23516845703125, -1.194122314453125, -1.153076171875, -1.112030029296875, -1.07098388671875, -1.029937744140625, -0.9888916015625, -0.947845458984375, -0.90679931640625, -0.865753173828125, -0.82470703125, -0.783660888671875, -0.74261474609375, -0.701568603515625, -0.6605224609375, -0.619476318359375, -0.57843017578125, -0.537384033203125, -0.496337890625, -0.455291748046875, -0.41424560546875, -0.373199462890625, -0.3321533203125, -0.291107177734375, -0.25006103515625, -0.209014892578125, -0.16796875, -0.126922607421875, -0.08587646484375, -0.044830322265625, -0.0037841796875, 0.037261962890625, 0.07830810546875, 0.119354248046875, 0.160400390625, 0.201446533203125, 0.24249267578125, 0.283538818359375, 0.3245849609375, 0.365631103515625, 0.40667724609375, 0.447723388671875, 0.48876953125, 0.529815673828125, 0.57086181640625, 0.611907958984375, 0.6529541015625, 0.694000244140625, 0.73504638671875, 0.776092529296875, 0.817138671875, 0.858184814453125, 0.89923095703125, 0.940277099609375, 0.9813232421875, 1.022369384765625, 1.06341552734375, 1.104461669921875, 1.1455078125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 6.0, 10.0, 13.0, 32.0, 59.0, 102.0, 158.0, 297.0, 155.0, 83.0, 44.0, 12.0, 9.0, 7.0, 7.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.77064514160156, -32.26698303222656, -30.76331901550293, -29.25965690612793, -27.75599479675293, -26.252330780029297, -24.748668670654297, -23.245006561279297, -21.741344451904297, -20.237682342529297, -18.734018325805664, -17.230356216430664, -15.726694107055664, -14.223031044006348, -12.719367980957031, -11.215705871582031, -9.712041854858398, -8.208378791809082, -6.704716682434082, -5.201053619384766, -3.6973910331726074, -2.193728446960449, -0.6900653839111328, 0.8135967254638672, 2.3172597885131836, 3.820922374725342, 5.3245849609375, 6.828248023986816, 8.331911087036133, 9.835573196411133, 11.33923625946045, 12.84289836883545, 14.346561431884766, 15.850224494934082, 17.3538875579834, 18.8575496673584, 20.3612117767334, 21.86487579345703, 23.36853790283203, 24.87220001220703, 26.37586212158203, 27.87952423095703, 29.383188247680664, 30.886850357055664, 32.3905143737793, 33.8941764831543, 35.3978385925293, 36.9015007019043, 38.40516662597656, 39.90882873535156, 41.41249084472656, 42.91615295410156, 44.41981887817383, 45.92348098754883, 47.42714309692383, 48.93080520629883, 50.43446731567383, 51.93812942504883, 53.44179153442383, 54.945457458496094, 56.449119567871094, 57.952781677246094, 59.456443786621094, 60.960105895996094, 62.463768005371094]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 2.0, 5.0, 6.0, 11.0, 8.0, 8.0, 14.0, 18.0, 16.0, 31.0, 33.0, 29.0, 44.0, 40.0, 34.0, 51.0, 67.0, 76.0, 80.0, 80.0, 53.0, 32.0, 41.0, 43.0, 24.0, 24.0, 17.0, 19.0, 22.0, 14.0, 10.0, 12.0, 11.0, 5.0, 4.0, 6.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.14849853515625, -26.375289916992188, -25.602079391479492, -24.82887077331543, -24.055660247802734, -23.282451629638672, -22.509241104125977, -21.736032485961914, -20.96282196044922, -20.189613342285156, -19.41640281677246, -18.6431941986084, -17.869983673095703, -17.09677505493164, -16.323564529418945, -15.550355911254883, -14.777146339416504, -14.003936767578125, -13.230727195739746, -12.457517623901367, -11.684308052062988, -10.91109848022461, -10.137889862060547, -9.364679336547852, -8.591470718383789, -7.81826114654541, -7.045051574707031, -6.271842002868652, -5.498632431030273, -4.7254228591918945, -3.952213764190674, -3.179004192352295, -2.405794143676758, -1.632584571838379, -0.8593751192092896, -0.0861656665802002, 0.6870439052581787, 1.4602534770965576, 2.2334628105163574, 3.0066723823547363, 3.7798819541931152, 4.553091526031494, 5.326301097869873, 6.099510192871094, 6.872719764709473, 7.645929336547852, 8.41913890838623, 9.19234848022461, 9.965558052062988, 10.738767623901367, 11.511977195739746, 12.285186767578125, 13.058396339416504, 13.831605911254883, 14.604814529418945, 15.37802505493164, 16.151233673095703, 16.924442291259766, 17.69765281677246, 18.470861434936523, 19.24407196044922, 20.01728057861328, 20.790491104125977, 21.56369972229004, 22.336910247802734]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 4.0, 5.0, 11.0, 6.0, 24.0, 22.0, 28.0, 38.0, 43.0, 58.0, 79.0, 124.0, 166.0, 266.0, 410.0, 690.0, 1222.0, 2465.0, 5433.0, 13438.0, 41329.0, 197415.0, 1253281.0, 2117572.0, 444343.0, 78603.0, 21695.0, 8124.0, 3474.0, 1684.0, 856.0, 456.0, 269.0, 166.0, 135.0, 93.0, 60.0, 49.0, 40.0, 22.0, 20.0, 14.0, 15.0, 8.0, 5.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 4.0], "bins": [-1.9287109375, -1.872344970703125, -1.81597900390625, -1.759613037109375, -1.7032470703125, -1.646881103515625, -1.59051513671875, -1.534149169921875, -1.477783203125, -1.421417236328125, -1.36505126953125, -1.308685302734375, -1.2523193359375, -1.195953369140625, -1.13958740234375, -1.083221435546875, -1.02685546875, -0.970489501953125, -0.91412353515625, -0.857757568359375, -0.8013916015625, -0.745025634765625, -0.68865966796875, -0.632293701171875, -0.575927734375, -0.519561767578125, -0.46319580078125, -0.406829833984375, -0.3504638671875, -0.294097900390625, -0.23773193359375, -0.181365966796875, -0.125, -0.068634033203125, -0.01226806640625, 0.044097900390625, 0.1004638671875, 0.156829833984375, 0.21319580078125, 0.269561767578125, 0.325927734375, 0.382293701171875, 0.43865966796875, 0.495025634765625, 0.5513916015625, 0.607757568359375, 0.66412353515625, 0.720489501953125, 0.77685546875, 0.833221435546875, 0.88958740234375, 0.945953369140625, 1.0023193359375, 1.058685302734375, 1.11505126953125, 1.171417236328125, 1.227783203125, 1.284149169921875, 1.34051513671875, 1.396881103515625, 1.4532470703125, 1.509613037109375, 1.56597900390625, 1.622344970703125, 1.6787109375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 8.0, 8.0, 8.0, 4.0, 8.0, 11.0, 13.0, 13.0, 20.0, 22.0, 27.0, 22.0, 29.0, 43.0, 26.0, 34.0, 28.0, 44.0, 41.0, 40.0, 33.0, 46.0, 31.0, 46.0, 39.0, 32.0, 35.0, 36.0, 39.0, 22.0, 20.0, 20.0, 26.0, 21.0, 22.0, 15.0, 11.0, 11.0, 12.0, 4.0, 7.0, 9.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.0712890625, -1.0369873046875, -1.002685546875, -0.9683837890625, -0.93408203125, -0.8997802734375, -0.865478515625, -0.8311767578125, -0.796875, -0.7625732421875, -0.728271484375, -0.6939697265625, -0.65966796875, -0.6253662109375, -0.591064453125, -0.5567626953125, -0.5224609375, -0.4881591796875, -0.453857421875, -0.4195556640625, -0.38525390625, -0.3509521484375, -0.316650390625, -0.2823486328125, -0.248046875, -0.2137451171875, -0.179443359375, -0.1451416015625, -0.11083984375, -0.0765380859375, -0.042236328125, -0.0079345703125, 0.0263671875, 0.0606689453125, 0.094970703125, 0.1292724609375, 0.16357421875, 0.1978759765625, 0.232177734375, 0.2664794921875, 0.30078125, 0.3350830078125, 0.369384765625, 0.4036865234375, 0.43798828125, 0.4722900390625, 0.506591796875, 0.5408935546875, 0.5751953125, 0.6094970703125, 0.643798828125, 0.6781005859375, 0.71240234375, 0.7467041015625, 0.781005859375, 0.8153076171875, 0.849609375, 0.8839111328125, 0.918212890625, 0.9525146484375, 0.98681640625, 1.0211181640625, 1.055419921875, 1.0897216796875, 1.1240234375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 10.0, 18.0, 23.0, 38.0, 82.0, 142.0, 238.0, 479.0, 1599.0, 16002.0, 3722739.0, 445444.0, 5833.0, 970.0, 343.0, 149.0, 86.0, 51.0, 18.0, 11.0, 9.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.7620849609375, -7.461669921875, -7.1612548828125, -6.86083984375, -6.5604248046875, -6.260009765625, -5.9595947265625, -5.6591796875, -5.3587646484375, -5.058349609375, -4.7579345703125, -4.45751953125, -4.1571044921875, -3.856689453125, -3.5562744140625, -3.255859375, -2.9554443359375, -2.655029296875, -2.3546142578125, -2.05419921875, -1.7537841796875, -1.453369140625, -1.1529541015625, -0.8525390625, -0.5521240234375, -0.251708984375, 0.0487060546875, 0.34912109375, 0.6495361328125, 0.949951171875, 1.2503662109375, 1.55078125, 1.8511962890625, 2.151611328125, 2.4520263671875, 2.75244140625, 3.0528564453125, 3.353271484375, 3.6536865234375, 3.9541015625, 4.2545166015625, 4.554931640625, 4.8553466796875, 5.15576171875, 5.4561767578125, 5.756591796875, 6.0570068359375, 6.357421875, 6.6578369140625, 6.958251953125, 7.2586669921875, 7.55908203125, 7.8594970703125, 8.159912109375, 8.4603271484375, 8.7607421875, 9.0611572265625, 9.361572265625, 9.6619873046875, 9.96240234375, 10.2628173828125, 10.563232421875, 10.8636474609375, 11.1640625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 4.0, 5.0, 18.0, 28.0, 29.0, 112.0, 222.0, 539.0, 1300.0, 1075.0, 397.0, 178.0, 79.0, 36.0, 26.0, 20.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.6427001953125, -8.426025390625, -8.2093505859375, -7.99267578125, -7.7760009765625, -7.559326171875, -7.3426513671875, -7.1259765625, -6.9093017578125, -6.692626953125, -6.4759521484375, -6.25927734375, -6.0426025390625, -5.825927734375, -5.6092529296875, -5.392578125, -5.1759033203125, -4.959228515625, -4.7425537109375, -4.52587890625, -4.3092041015625, -4.092529296875, -3.8758544921875, -3.6591796875, -3.4425048828125, -3.225830078125, -3.0091552734375, -2.79248046875, -2.5758056640625, -2.359130859375, -2.1424560546875, -1.92578125, -1.7091064453125, -1.492431640625, -1.2757568359375, -1.05908203125, -0.8424072265625, -0.625732421875, -0.4090576171875, -0.1923828125, 0.0242919921875, 0.240966796875, 0.4576416015625, 0.67431640625, 0.8909912109375, 1.107666015625, 1.3243408203125, 1.541015625, 1.7576904296875, 1.974365234375, 2.1910400390625, 2.40771484375, 2.6243896484375, 2.841064453125, 3.0577392578125, 3.2744140625, 3.4910888671875, 3.707763671875, 3.9244384765625, 4.14111328125, 4.3577880859375, 4.574462890625, 4.7911376953125, 5.0078125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 1.0, 6.0, 26.0, 60.0, 169.0, 311.0, 220.0, 116.0, 48.0, 16.0, 7.0, 8.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-73.69612121582031, -71.79644012451172, -69.8967514038086, -67.9970703125, -66.09738159179688, -64.19770050048828, -62.29801940917969, -60.39833450317383, -58.49864959716797, -56.59896469116211, -54.69927978515625, -52.799598693847656, -50.8999137878418, -49.00022888183594, -47.100547790527344, -45.200862884521484, -43.301177978515625, -41.401493072509766, -39.501808166503906, -37.60212707519531, -35.70244216918945, -33.802757263183594, -31.903074264526367, -30.00339126586914, -28.10370635986328, -26.204021453857422, -24.304338455200195, -22.40465545654297, -20.50497055053711, -18.60528564453125, -16.705602645874023, -14.80591869354248, -12.906230926513672, -11.006546974182129, -9.106863021850586, -7.207179069519043, -5.3074951171875, -3.407811164855957, -1.508127212524414, 0.3915567398071289, 2.291240692138672, 4.190924644470215, 6.090608596801758, 7.990292549133301, 9.889976501464844, 11.789660453796387, 13.68934440612793, 15.589028358459473, 17.488712310791016, 19.388397216796875, 21.2880802154541, 23.187763214111328, 25.087448120117188, 26.987133026123047, 28.886816024780273, 30.7864990234375, 32.68618392944336, 34.58586883544922, 36.48554992675781, 38.38523483276367, 40.28491973876953, 42.18460464477539, 44.08428955078125, 45.983970642089844, 47.8836555480957]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 11.0, 10.0, 18.0, 16.0, 19.0, 17.0, 30.0, 42.0, 36.0, 39.0, 52.0, 37.0, 47.0, 46.0, 56.0, 48.0, 61.0, 60.0, 69.0, 33.0, 42.0, 28.0, 29.0, 34.0, 25.0, 17.0, 15.0, 17.0, 9.0, 16.0, 5.0, 3.0, 3.0, 6.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.568950653076172, -20.937515258789062, -20.306079864501953, -19.674646377563477, -19.043210983276367, -18.411775588989258, -17.78034210205078, -17.148906707763672, -16.517471313476562, -15.886035919189453, -15.25460147857666, -14.623167037963867, -13.991731643676758, -13.360296249389648, -12.728861808776855, -12.097427368164062, -11.465991973876953, -10.834556579589844, -10.20312213897705, -9.571687698364258, -8.940252304077148, -8.308816909790039, -7.677382469177246, -7.045947551727295, -6.414512634277344, -5.783077716827393, -5.151642799377441, -4.52020788192749, -3.888772964477539, -3.257338047027588, -2.6259031295776367, -1.9944682121276855, -1.3630332946777344, -0.7315983772277832, -0.10016345977783203, 0.5312714576721191, 1.1627063751220703, 1.7941412925720215, 2.4255762100219727, 3.057011127471924, 3.688446044921875, 4.319880962371826, 4.951315879821777, 5.5827507972717285, 6.21418571472168, 6.845620632171631, 7.477055549621582, 8.108489990234375, 8.739925384521484, 9.371360778808594, 10.002795219421387, 10.63422966003418, 11.265665054321289, 11.897100448608398, 12.528534889221191, 13.159969329833984, 13.791404724121094, 14.422840118408203, 15.054274559020996, 15.685708999633789, 16.3171443939209, 16.948579788208008, 17.580013275146484, 18.211448669433594, 18.842884063720703]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 6.0, 13.0, 8.0, 11.0, 23.0, 31.0, 43.0, 67.0, 97.0, 132.0, 203.0, 310.0, 487.0, 714.0, 1128.0, 1837.0, 2976.0, 5087.0, 8519.0, 14724.0, 26444.0, 47406.0, 84477.0, 143573.0, 206170.0, 197192.0, 131159.0, 76332.0, 42484.0, 23542.0, 13618.0, 7822.0, 4543.0, 2755.0, 1631.0, 1037.0, 674.0, 453.0, 283.0, 167.0, 125.0, 84.0, 52.0, 38.0, 31.0, 15.0, 13.0, 9.0, 8.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-1.6455078125, -1.5955047607421875, -1.545501708984375, -1.4954986572265625, -1.44549560546875, -1.3954925537109375, -1.345489501953125, -1.2954864501953125, -1.2454833984375, -1.1954803466796875, -1.145477294921875, -1.0954742431640625, -1.04547119140625, -0.9954681396484375, -0.945465087890625, -0.8954620361328125, -0.845458984375, -0.7954559326171875, -0.745452880859375, -0.6954498291015625, -0.64544677734375, -0.5954437255859375, -0.545440673828125, -0.4954376220703125, -0.4454345703125, -0.3954315185546875, -0.345428466796875, -0.2954254150390625, -0.24542236328125, -0.1954193115234375, -0.145416259765625, -0.0954132080078125, -0.04541015625, 0.0045928955078125, 0.054595947265625, 0.1045989990234375, 0.15460205078125, 0.2046051025390625, 0.254608154296875, 0.3046112060546875, 0.3546142578125, 0.4046173095703125, 0.454620361328125, 0.5046234130859375, 0.55462646484375, 0.6046295166015625, 0.654632568359375, 0.7046356201171875, 0.754638671875, 0.8046417236328125, 0.854644775390625, 0.9046478271484375, 0.95465087890625, 1.0046539306640625, 1.054656982421875, 1.1046600341796875, 1.1546630859375, 1.2046661376953125, 1.254669189453125, 1.3046722412109375, 1.35467529296875, 1.4046783447265625, 1.454681396484375, 1.5046844482421875, 1.5546875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 12.0, 7.0, 16.0, 8.0, 14.0, 18.0, 24.0, 30.0, 34.0, 36.0, 37.0, 39.0, 69.0, 74.0, 44.0, 47.0, 46.0, 60.0, 57.0, 40.0, 53.0, 37.0, 26.0, 31.0, 19.0, 30.0, 24.0, 9.0, 17.0, 10.0, 10.0, 7.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-2.060546875, -2.0087890625, -1.95703125, -1.9052734375, -1.853515625, -1.8017578125, -1.75, -1.6982421875, -1.646484375, -1.5947265625, -1.54296875, -1.4912109375, -1.439453125, -1.3876953125, -1.3359375, -1.2841796875, -1.232421875, -1.1806640625, -1.12890625, -1.0771484375, -1.025390625, -0.9736328125, -0.921875, -0.8701171875, -0.818359375, -0.7666015625, -0.71484375, -0.6630859375, -0.611328125, -0.5595703125, -0.5078125, -0.4560546875, -0.404296875, -0.3525390625, -0.30078125, -0.2490234375, -0.197265625, -0.1455078125, -0.09375, -0.0419921875, 0.009765625, 0.0615234375, 0.11328125, 0.1650390625, 0.216796875, 0.2685546875, 0.3203125, 0.3720703125, 0.423828125, 0.4755859375, 0.52734375, 0.5791015625, 0.630859375, 0.6826171875, 0.734375, 0.7861328125, 0.837890625, 0.8896484375, 0.94140625, 0.9931640625, 1.044921875, 1.0966796875, 1.1484375, 1.2001953125, 1.251953125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 7.0, 10.0, 17.0, 24.0, 24.0, 57.0, 93.0, 154.0, 318.0, 861.0, 2260.0, 7833.0, 34557.0, 214749.0, 666994.0, 95469.0, 17669.0, 4776.0, 1463.0, 580.0, 253.0, 135.0, 66.0, 51.0, 35.0, 24.0, 17.0, 18.0, 9.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.61328125, -5.4495849609375, -5.285888671875, -5.1221923828125, -4.95849609375, -4.7947998046875, -4.631103515625, -4.4674072265625, -4.3037109375, -4.1400146484375, -3.976318359375, -3.8126220703125, -3.64892578125, -3.4852294921875, -3.321533203125, -3.1578369140625, -2.994140625, -2.8304443359375, -2.666748046875, -2.5030517578125, -2.33935546875, -2.1756591796875, -2.011962890625, -1.8482666015625, -1.6845703125, -1.5208740234375, -1.357177734375, -1.1934814453125, -1.02978515625, -0.8660888671875, -0.702392578125, -0.5386962890625, -0.375, -0.2113037109375, -0.047607421875, 0.1160888671875, 0.27978515625, 0.4434814453125, 0.607177734375, 0.7708740234375, 0.9345703125, 1.0982666015625, 1.261962890625, 1.4256591796875, 1.58935546875, 1.7530517578125, 1.916748046875, 2.0804443359375, 2.244140625, 2.4078369140625, 2.571533203125, 2.7352294921875, 2.89892578125, 3.0626220703125, 3.226318359375, 3.3900146484375, 3.5537109375, 3.7174072265625, 3.881103515625, 4.0447998046875, 4.20849609375, 4.3721923828125, 4.535888671875, 4.6995849609375, 4.86328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 5.0, 11.0, 19.0, 16.0, 38.0, 36.0, 56.0, 52.0, 68.0, 74.0, 80.0, 78.0, 85.0, 62.0, 71.0, 61.0, 32.0, 47.0, 33.0, 11.0, 14.0, 15.0, 4.0, 11.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.59375, -8.326416015625, -8.05908203125, -7.791748046875, -7.5244140625, -7.257080078125, -6.98974609375, -6.722412109375, -6.455078125, -6.187744140625, -5.92041015625, -5.653076171875, -5.3857421875, -5.118408203125, -4.85107421875, -4.583740234375, -4.31640625, -4.049072265625, -3.78173828125, -3.514404296875, -3.2470703125, -2.979736328125, -2.71240234375, -2.445068359375, -2.177734375, -1.910400390625, -1.64306640625, -1.375732421875, -1.1083984375, -0.841064453125, -0.57373046875, -0.306396484375, -0.0390625, 0.228271484375, 0.49560546875, 0.762939453125, 1.0302734375, 1.297607421875, 1.56494140625, 1.832275390625, 2.099609375, 2.366943359375, 2.63427734375, 2.901611328125, 3.1689453125, 3.436279296875, 3.70361328125, 3.970947265625, 4.23828125, 4.505615234375, 4.77294921875, 5.040283203125, 5.3076171875, 5.574951171875, 5.84228515625, 6.109619140625, 6.376953125, 6.644287109375, 6.91162109375, 7.178955078125, 7.4462890625, 7.713623046875, 7.98095703125, 8.248291015625, 8.515625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 13.0, 17.0, 13.0, 22.0, 29.0, 41.0, 55.0, 69.0, 83.0, 125.0, 208.0, 289.0, 420.0, 635.0, 949.0, 1487.0, 2534.0, 4827.0, 9578.0, 24252.0, 87267.0, 619969.0, 218979.0, 45352.0, 15501.0, 6755.0, 3420.0, 1979.0, 1250.0, 785.0, 504.0, 336.0, 215.0, 172.0, 112.0, 92.0, 56.0, 40.0, 31.0, 22.0, 28.0, 10.0, 4.0, 8.0, 8.0, 5.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0], "bins": [-2.072265625, -2.010894775390625, -1.94952392578125, -1.888153076171875, -1.8267822265625, -1.765411376953125, -1.70404052734375, -1.642669677734375, -1.581298828125, -1.519927978515625, -1.45855712890625, -1.397186279296875, -1.3358154296875, -1.274444580078125, -1.21307373046875, -1.151702880859375, -1.09033203125, -1.028961181640625, -0.96759033203125, -0.906219482421875, -0.8448486328125, -0.783477783203125, -0.72210693359375, -0.660736083984375, -0.599365234375, -0.537994384765625, -0.47662353515625, -0.415252685546875, -0.3538818359375, -0.292510986328125, -0.23114013671875, -0.169769287109375, -0.1083984375, -0.047027587890625, 0.01434326171875, 0.075714111328125, 0.1370849609375, 0.198455810546875, 0.25982666015625, 0.321197509765625, 0.382568359375, 0.443939208984375, 0.50531005859375, 0.566680908203125, 0.6280517578125, 0.689422607421875, 0.75079345703125, 0.812164306640625, 0.87353515625, 0.934906005859375, 0.99627685546875, 1.057647705078125, 1.1190185546875, 1.180389404296875, 1.24176025390625, 1.303131103515625, 1.364501953125, 1.425872802734375, 1.48724365234375, 1.548614501953125, 1.6099853515625, 1.671356201171875, 1.73272705078125, 1.794097900390625, 1.85546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 11.0, 16.0, 32.0, 71.0, 187.0, 340.0, 185.0, 73.0, 26.0, 13.0, 9.0, 6.0, 9.0, 4.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0018281936645507812, -0.0017701387405395508, -0.0017120838165283203, -0.0016540288925170898, -0.0015959739685058594, -0.001537919044494629, -0.0014798641204833984, -0.001421809196472168, -0.0013637542724609375, -0.001305699348449707, -0.0012476444244384766, -0.001189589500427246, -0.0011315345764160156, -0.0010734796524047852, -0.0010154247283935547, -0.0009573698043823242, -0.0008993148803710938, -0.0008412599563598633, -0.0007832050323486328, -0.0007251501083374023, -0.0006670951843261719, -0.0006090402603149414, -0.0005509853363037109, -0.0004929304122924805, -0.00043487548828125, -0.00037682056427001953, -0.00031876564025878906, -0.0002607107162475586, -0.00020265579223632812, -0.00014460086822509766, -8.654594421386719e-05, -2.849102020263672e-05, 2.956390380859375e-05, 8.761882781982422e-05, 0.0001456737518310547, 0.00020372867584228516, 0.0002617835998535156, 0.0003198385238647461, 0.00037789344787597656, 0.00043594837188720703, 0.0004940032958984375, 0.000552058219909668, 0.0006101131439208984, 0.0006681680679321289, 0.0007262229919433594, 0.0007842779159545898, 0.0008423328399658203, 0.0009003877639770508, 0.0009584426879882812, 0.0010164976119995117, 0.0010745525360107422, 0.0011326074600219727, 0.0011906623840332031, 0.0012487173080444336, 0.001306772232055664, 0.0013648271560668945, 0.001422882080078125, 0.0014809370040893555, 0.001538991928100586, 0.0015970468521118164, 0.0016551017761230469, 0.0017131567001342773, 0.0017712116241455078, 0.0018292665481567383, 0.0018873214721679688]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 6.0, 10.0, 13.0, 20.0, 35.0, 72.0, 100.0, 199.0, 333.0, 628.0, 1060.0, 2162.0, 4876.0, 12210.0, 40317.0, 207767.0, 641078.0, 99259.0, 23456.0, 8081.0, 3436.0, 1572.0, 813.0, 425.0, 251.0, 127.0, 84.0, 68.0, 27.0, 23.0, 7.0, 12.0, 9.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.23046875, -2.167266845703125, -2.10406494140625, -2.040863037109375, -1.9776611328125, -1.914459228515625, -1.85125732421875, -1.788055419921875, -1.724853515625, -1.661651611328125, -1.59844970703125, -1.535247802734375, -1.4720458984375, -1.408843994140625, -1.34564208984375, -1.282440185546875, -1.21923828125, -1.156036376953125, -1.09283447265625, -1.029632568359375, -0.9664306640625, -0.903228759765625, -0.84002685546875, -0.776824951171875, -0.713623046875, -0.650421142578125, -0.58721923828125, -0.524017333984375, -0.4608154296875, -0.397613525390625, -0.33441162109375, -0.271209716796875, -0.2080078125, -0.144805908203125, -0.08160400390625, -0.018402099609375, 0.0447998046875, 0.108001708984375, 0.17120361328125, 0.234405517578125, 0.297607421875, 0.360809326171875, 0.42401123046875, 0.487213134765625, 0.5504150390625, 0.613616943359375, 0.67681884765625, 0.740020751953125, 0.80322265625, 0.866424560546875, 0.92962646484375, 0.992828369140625, 1.0560302734375, 1.119232177734375, 1.18243408203125, 1.245635986328125, 1.308837890625, 1.372039794921875, 1.43524169921875, 1.498443603515625, 1.5616455078125, 1.624847412109375, 1.68804931640625, 1.751251220703125, 1.814453125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 2.0, 10.0, 10.0, 12.0, 19.0, 14.0, 26.0, 36.0, 45.0, 37.0, 65.0, 67.0, 70.0, 92.0, 107.0, 80.0, 74.0, 56.0, 35.0, 25.0, 33.0, 15.0, 10.0, 10.0, 12.0, 5.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.90234375, -1.840545654296875, -1.77874755859375, -1.716949462890625, -1.6551513671875, -1.593353271484375, -1.53155517578125, -1.469757080078125, -1.407958984375, -1.346160888671875, -1.28436279296875, -1.222564697265625, -1.1607666015625, -1.098968505859375, -1.03717041015625, -0.975372314453125, -0.91357421875, -0.851776123046875, -0.78997802734375, -0.728179931640625, -0.6663818359375, -0.604583740234375, -0.54278564453125, -0.480987548828125, -0.419189453125, -0.357391357421875, -0.29559326171875, -0.233795166015625, -0.1719970703125, -0.110198974609375, -0.04840087890625, 0.013397216796875, 0.0751953125, 0.136993408203125, 0.19879150390625, 0.260589599609375, 0.3223876953125, 0.384185791015625, 0.44598388671875, 0.507781982421875, 0.569580078125, 0.631378173828125, 0.69317626953125, 0.754974365234375, 0.8167724609375, 0.878570556640625, 0.94036865234375, 1.002166748046875, 1.06396484375, 1.125762939453125, 1.18756103515625, 1.249359130859375, 1.3111572265625, 1.372955322265625, 1.43475341796875, 1.496551513671875, 1.558349609375, 1.620147705078125, 1.68194580078125, 1.743743896484375, 1.8055419921875, 1.867340087890625, 1.92913818359375, 1.990936279296875, 2.052734375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 6.0, 13.0, 19.0, 48.0, 73.0, 107.0, 231.0, 170.0, 114.0, 76.0, 54.0, 26.0, 20.0, 9.0, 4.0, 11.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.167694091796875, -38.906982421875, -37.646270751953125, -36.385562896728516, -35.12485122680664, -33.864139556884766, -32.60342788696289, -31.342716217041016, -30.082006454467773, -28.8212947845459, -27.560585021972656, -26.29987335205078, -25.039161682128906, -23.778451919555664, -22.51774024963379, -21.257030487060547, -19.996318817138672, -18.735607147216797, -17.474897384643555, -16.21418571472168, -14.953474998474121, -13.692764282226562, -12.432052612304688, -11.171341896057129, -9.91063117980957, -8.649920463562012, -7.389209270477295, -6.128498077392578, -4.8677873611450195, -3.607076644897461, -2.346365451812744, -1.0856542587280273, 0.17505645751953125, 1.435767412185669, 2.6964783668518066, 3.9571893215179443, 5.217900276184082, 6.478610992431641, 7.739322185516357, 9.000033378601074, 10.260744094848633, 11.521454811096191, 12.78216552734375, 14.042877197265625, 15.303587913513184, 16.564298629760742, 17.825010299682617, 19.08572006225586, 20.346431732177734, 21.60714340209961, 22.86785316467285, 24.128564834594727, 25.38927459716797, 26.649986267089844, 27.91069793701172, 29.171409606933594, 30.432119369506836, 31.69283103942871, 32.95354080200195, 34.21425247192383, 35.4749641418457, 36.73567199707031, 37.99638366699219, 39.25709533691406, 40.51780700683594]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 11.0, 4.0, 8.0, 10.0, 10.0, 11.0, 22.0, 18.0, 21.0, 24.0, 29.0, 15.0, 19.0, 37.0, 24.0, 35.0, 60.0, 60.0, 80.0, 85.0, 55.0, 38.0, 39.0, 31.0, 32.0, 41.0, 25.0, 25.0, 20.0, 21.0, 14.0, 14.0, 16.0, 12.0, 9.0, 9.0, 5.0, 3.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.353973388671875, -22.64341926574707, -21.9328670501709, -21.222312927246094, -20.51175880432129, -19.801206588745117, -19.090652465820312, -18.38010025024414, -17.669546127319336, -16.95899200439453, -16.24843978881836, -15.537885665893555, -14.827332496643066, -14.116779327392578, -13.406225204467773, -12.695672035217285, -11.98511791229248, -11.274564743041992, -10.564010620117188, -9.8534574508667, -9.142904281616211, -8.432350158691406, -7.721796989440918, -7.01124382019043, -6.300690174102783, -5.590136528015137, -4.879583358764648, -4.169029712677002, -3.4584763050079346, -2.747922897338867, -2.0373692512512207, -1.3268160820007324, -0.6162624359130859, 0.09429103136062622, 0.8048444986343384, 1.5153980255126953, 2.2259514331817627, 2.93650484085083, 3.6470584869384766, 4.357611656188965, 5.068165302276611, 5.778718948364258, 6.489272117614746, 7.199825763702393, 7.910379409790039, 8.620932579040527, 9.331485748291016, 10.04203987121582, 10.752593040466309, 11.463146209716797, 12.173700332641602, 12.88425350189209, 13.594806671142578, 14.305360794067383, 15.015913963317871, 15.72646713256836, 16.437021255493164, 17.14757537841797, 17.85812759399414, 18.568681716918945, 19.27923583984375, 19.989788055419922, 20.700342178344727, 21.41089630126953, 22.121448516845703]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 5.0, 9.0, 16.0, 8.0, 26.0, 36.0, 46.0, 45.0, 52.0, 89.0, 113.0, 196.0, 240.0, 442.0, 725.0, 1348.0, 2797.0, 7376.0, 24834.0, 150056.0, 1560494.0, 2162193.0, 232220.0, 34630.0, 9218.0, 3352.0, 1549.0, 782.0, 461.0, 292.0, 192.0, 116.0, 77.0, 71.0, 48.0, 30.0, 33.0, 21.0, 17.0, 10.0, 6.0, 4.0, 1.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.255859375, -2.175567626953125, -2.09527587890625, -2.014984130859375, -1.9346923828125, -1.854400634765625, -1.77410888671875, -1.693817138671875, -1.613525390625, -1.533233642578125, -1.45294189453125, -1.372650146484375, -1.2923583984375, -1.212066650390625, -1.13177490234375, -1.051483154296875, -0.97119140625, -0.890899658203125, -0.81060791015625, -0.730316162109375, -0.6500244140625, -0.569732666015625, -0.48944091796875, -0.409149169921875, -0.328857421875, -0.248565673828125, -0.16827392578125, -0.087982177734375, -0.0076904296875, 0.072601318359375, 0.15289306640625, 0.233184814453125, 0.3134765625, 0.393768310546875, 0.47406005859375, 0.554351806640625, 0.6346435546875, 0.714935302734375, 0.79522705078125, 0.875518798828125, 0.955810546875, 1.036102294921875, 1.11639404296875, 1.196685791015625, 1.2769775390625, 1.357269287109375, 1.43756103515625, 1.517852783203125, 1.59814453125, 1.678436279296875, 1.75872802734375, 1.839019775390625, 1.9193115234375, 1.999603271484375, 2.07989501953125, 2.160186767578125, 2.240478515625, 2.320770263671875, 2.40106201171875, 2.481353759765625, 2.5616455078125, 2.641937255859375, 2.72222900390625, 2.802520751953125, 2.8828125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 12.0, 5.0, 15.0, 17.0, 14.0, 22.0, 21.0, 23.0, 28.0, 38.0, 54.0, 59.0, 54.0, 56.0, 74.0, 74.0, 53.0, 48.0, 62.0, 52.0, 45.0, 42.0, 32.0, 25.0, 18.0, 11.0, 11.0, 18.0, 4.0, 7.0, 6.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.04296875, -1.983123779296875, -1.92327880859375, -1.863433837890625, -1.8035888671875, -1.743743896484375, -1.68389892578125, -1.624053955078125, -1.564208984375, -1.504364013671875, -1.44451904296875, -1.384674072265625, -1.3248291015625, -1.264984130859375, -1.20513916015625, -1.145294189453125, -1.08544921875, -1.025604248046875, -0.96575927734375, -0.905914306640625, -0.8460693359375, -0.786224365234375, -0.72637939453125, -0.666534423828125, -0.606689453125, -0.546844482421875, -0.48699951171875, -0.427154541015625, -0.3673095703125, -0.307464599609375, -0.24761962890625, -0.187774658203125, -0.1279296875, -0.068084716796875, -0.00823974609375, 0.051605224609375, 0.1114501953125, 0.171295166015625, 0.23114013671875, 0.290985107421875, 0.350830078125, 0.410675048828125, 0.47052001953125, 0.530364990234375, 0.5902099609375, 0.650054931640625, 0.70989990234375, 0.769744873046875, 0.82958984375, 0.889434814453125, 0.94927978515625, 1.009124755859375, 1.0689697265625, 1.128814697265625, 1.18865966796875, 1.248504638671875, 1.308349609375, 1.368194580078125, 1.42803955078125, 1.487884521484375, 1.5477294921875, 1.607574462890625, 1.66741943359375, 1.727264404296875, 1.787109375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 8.0, 12.0, 28.0, 41.0, 76.0, 144.0, 325.0, 1017.0, 5546.0, 168701.0, 3982934.0, 31923.0, 2436.0, 587.0, 219.0, 118.0, 67.0, 36.0, 27.0, 18.0, 12.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0], "bins": [-15.359375, -15.03472900390625, -14.7100830078125, -14.38543701171875, -14.060791015625, -13.73614501953125, -13.4114990234375, -13.08685302734375, -12.76220703125, -12.43756103515625, -12.1129150390625, -11.78826904296875, -11.463623046875, -11.13897705078125, -10.8143310546875, -10.48968505859375, -10.1650390625, -9.84039306640625, -9.5157470703125, -9.19110107421875, -8.866455078125, -8.54180908203125, -8.2171630859375, -7.89251708984375, -7.56787109375, -7.24322509765625, -6.9185791015625, -6.59393310546875, -6.269287109375, -5.94464111328125, -5.6199951171875, -5.29534912109375, -4.970703125, -4.64605712890625, -4.3214111328125, -3.99676513671875, -3.672119140625, -3.34747314453125, -3.0228271484375, -2.69818115234375, -2.37353515625, -2.04888916015625, -1.7242431640625, -1.39959716796875, -1.074951171875, -0.75030517578125, -0.4256591796875, -0.10101318359375, 0.2236328125, 0.54827880859375, 0.8729248046875, 1.19757080078125, 1.522216796875, 1.84686279296875, 2.1715087890625, 2.49615478515625, 2.82080078125, 3.14544677734375, 3.4700927734375, 3.79473876953125, 4.119384765625, 4.44403076171875, 4.7686767578125, 5.09332275390625, 5.41796875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 9.0, 20.0, 26.0, 41.0, 91.0, 162.0, 525.0, 1246.0, 1176.0, 454.0, 168.0, 70.0, 39.0, 21.0, 15.0, 9.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7421875, -6.4921875, -6.2421875, -5.9921875, -5.7421875, -5.4921875, -5.2421875, -4.9921875, -4.7421875, -4.4921875, -4.2421875, -3.9921875, -3.7421875, -3.4921875, -3.2421875, -2.9921875, -2.7421875, -2.4921875, -2.2421875, -1.9921875, -1.7421875, -1.4921875, -1.2421875, -0.9921875, -0.7421875, -0.4921875, -0.2421875, 0.0078125, 0.2578125, 0.5078125, 0.7578125, 1.0078125, 1.2578125, 1.5078125, 1.7578125, 2.0078125, 2.2578125, 2.5078125, 2.7578125, 3.0078125, 3.2578125, 3.5078125, 3.7578125, 4.0078125, 4.2578125, 4.5078125, 4.7578125, 5.0078125, 5.2578125, 5.5078125, 5.7578125, 6.0078125, 6.2578125, 6.5078125, 6.7578125, 7.0078125, 7.2578125, 7.5078125, 7.7578125, 8.0078125, 8.2578125, 8.5078125, 8.7578125, 9.0078125, 9.2578125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 12.0, 15.0, 23.0, 38.0, 88.0, 128.0, 148.0, 153.0, 135.0, 95.0, 61.0, 41.0, 22.0, 13.0, 10.0, 12.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-43.452430725097656, -42.40061950683594, -41.34880447387695, -40.296993255615234, -39.245182037353516, -38.19336700439453, -37.14155578613281, -36.089744567871094, -35.03792953491211, -33.98611831665039, -32.934303283691406, -31.882492065429688, -30.830678939819336, -29.778865814208984, -28.727054595947266, -27.675241470336914, -26.623430252075195, -25.571617126464844, -24.519805908203125, -23.467992782592773, -22.416179656982422, -21.364368438720703, -20.31255531311035, -19.2607421875, -18.20893096923828, -17.15711784362793, -16.10530662536621, -15.05349349975586, -14.001680374145508, -12.949868202209473, -11.898056030273438, -10.846242904663086, -9.794429779052734, -8.7426176071167, -7.690804481506348, -6.6389923095703125, -5.587179660797119, -4.535367012023926, -3.4835548400878906, -2.4317421913146973, -1.379929542541504, -0.3281170129776001, 0.7236955165863037, 1.775507926940918, 2.8273205757141113, 3.8791332244873047, 4.93094539642334, 5.982758045196533, 7.034570693969727, 8.086382865905762, 9.138195991516113, 10.190008163452148, 11.2418212890625, 12.293633460998535, 13.34544563293457, 14.397258758544922, 15.449070930480957, 16.500883102416992, 17.552696228027344, 18.604507446289062, 19.656320571899414, 20.708133697509766, 21.759944915771484, 22.811758041381836, 23.863571166992188]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 5.0, 8.0, 4.0, 12.0, 9.0, 6.0, 10.0, 17.0, 14.0, 29.0, 32.0, 41.0, 34.0, 29.0, 25.0, 38.0, 58.0, 53.0, 48.0, 62.0, 66.0, 50.0, 39.0, 48.0, 35.0, 43.0, 29.0, 32.0, 19.0, 15.0, 18.0, 18.0, 12.0, 9.0, 7.0, 9.0, 10.0, 5.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.932329177856445, -19.31830596923828, -18.70428466796875, -18.090261459350586, -17.476240158081055, -16.86221694946289, -16.24819564819336, -15.634172439575195, -15.020150184631348, -14.4061279296875, -13.792105674743652, -13.178083419799805, -12.56406021118164, -11.95003890991211, -11.336015701293945, -10.721993446350098, -10.10797119140625, -9.493948936462402, -8.879926681518555, -8.265904426574707, -7.651881694793701, -7.0378594398498535, -6.423836708068848, -5.809814453125, -5.195792198181152, -4.581769943237305, -3.967747449874878, -3.353724956512451, -2.7397027015686035, -2.125680446624756, -1.511657953262329, -0.8976354598999023, -0.2836151123046875, 0.3304072618484497, 0.9444296360015869, 1.5584520101547241, 2.1724743843078613, 2.786496639251709, 3.4005191326141357, 4.0145416259765625, 4.62856388092041, 5.242586135864258, 5.8566083908081055, 6.470631122589111, 7.084653377532959, 7.698675632476807, 8.312698364257812, 8.92672061920166, 9.540742874145508, 10.154765129089355, 10.768787384033203, 11.38280963897705, 11.996831893920898, 12.610855102539062, 13.22487735748291, 13.838899612426758, 14.452921867370605, 15.066944122314453, 15.6809663772583, 16.29498863220215, 16.909011840820312, 17.523033142089844, 18.137056350708008, 18.751079559326172, 19.365100860595703]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 4.0, 9.0, 8.0, 17.0, 30.0, 26.0, 64.0, 72.0, 130.0, 206.0, 307.0, 462.0, 861.0, 1449.0, 2480.0, 4490.0, 8085.0, 15235.0, 29738.0, 59293.0, 122368.0, 239031.0, 268628.0, 147982.0, 71685.0, 35760.0, 18137.0, 9620.0, 5235.0, 2889.0, 1670.0, 992.0, 597.0, 380.0, 207.0, 138.0, 90.0, 54.0, 41.0, 27.0, 28.0, 15.0, 7.0, 10.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.134765625, -2.074005126953125, -2.01324462890625, -1.952484130859375, -1.8917236328125, -1.830963134765625, -1.77020263671875, -1.709442138671875, -1.648681640625, -1.587921142578125, -1.52716064453125, -1.466400146484375, -1.4056396484375, -1.344879150390625, -1.28411865234375, -1.223358154296875, -1.16259765625, -1.101837158203125, -1.04107666015625, -0.980316162109375, -0.9195556640625, -0.858795166015625, -0.79803466796875, -0.737274169921875, -0.676513671875, -0.615753173828125, -0.55499267578125, -0.494232177734375, -0.4334716796875, -0.372711181640625, -0.31195068359375, -0.251190185546875, -0.1904296875, -0.129669189453125, -0.06890869140625, -0.008148193359375, 0.0526123046875, 0.113372802734375, 0.17413330078125, 0.234893798828125, 0.295654296875, 0.356414794921875, 0.41717529296875, 0.477935791015625, 0.5386962890625, 0.599456787109375, 0.66021728515625, 0.720977783203125, 0.78173828125, 0.842498779296875, 0.90325927734375, 0.964019775390625, 1.0247802734375, 1.085540771484375, 1.14630126953125, 1.207061767578125, 1.267822265625, 1.328582763671875, 1.38934326171875, 1.450103759765625, 1.5108642578125, 1.571624755859375, 1.63238525390625, 1.693145751953125, 1.75390625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 8.0, 6.0, 10.0, 9.0, 13.0, 17.0, 21.0, 22.0, 24.0, 36.0, 40.0, 40.0, 45.0, 47.0, 44.0, 55.0, 62.0, 65.0, 55.0, 46.0, 59.0, 48.0, 37.0, 35.0, 38.0, 25.0, 18.0, 10.0, 14.0, 12.0, 11.0, 8.0, 11.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.869140625, -1.8087158203125, -1.748291015625, -1.6878662109375, -1.62744140625, -1.5670166015625, -1.506591796875, -1.4461669921875, -1.3857421875, -1.3253173828125, -1.264892578125, -1.2044677734375, -1.14404296875, -1.0836181640625, -1.023193359375, -0.9627685546875, -0.90234375, -0.8419189453125, -0.781494140625, -0.7210693359375, -0.66064453125, -0.6002197265625, -0.539794921875, -0.4793701171875, -0.4189453125, -0.3585205078125, -0.298095703125, -0.2376708984375, -0.17724609375, -0.1168212890625, -0.056396484375, 0.0040283203125, 0.064453125, 0.1248779296875, 0.185302734375, 0.2457275390625, 0.30615234375, 0.3665771484375, 0.427001953125, 0.4874267578125, 0.5478515625, 0.6082763671875, 0.668701171875, 0.7291259765625, 0.78955078125, 0.8499755859375, 0.910400390625, 0.9708251953125, 1.03125, 1.0916748046875, 1.152099609375, 1.2125244140625, 1.27294921875, 1.3333740234375, 1.393798828125, 1.4542236328125, 1.5146484375, 1.5750732421875, 1.635498046875, 1.6959228515625, 1.75634765625, 1.8167724609375, 1.877197265625, 1.9376220703125, 1.998046875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 6.0, 6.0, 16.0, 15.0, 25.0, 38.0, 57.0, 63.0, 121.0, 144.0, 287.0, 485.0, 937.0, 2168.0, 5687.0, 21902.0, 123918.0, 726411.0, 132715.0, 22840.0, 6106.0, 2192.0, 1027.0, 471.0, 315.0, 173.0, 129.0, 87.0, 41.0, 51.0, 26.0, 14.0, 14.0, 12.0, 8.0, 5.0, 7.0, 4.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.65234375, -5.48370361328125, -5.3150634765625, -5.14642333984375, -4.977783203125, -4.80914306640625, -4.6405029296875, -4.47186279296875, -4.30322265625, -4.13458251953125, -3.9659423828125, -3.79730224609375, -3.628662109375, -3.46002197265625, -3.2913818359375, -3.12274169921875, -2.9541015625, -2.78546142578125, -2.6168212890625, -2.44818115234375, -2.279541015625, -2.11090087890625, -1.9422607421875, -1.77362060546875, -1.60498046875, -1.43634033203125, -1.2677001953125, -1.09906005859375, -0.930419921875, -0.76177978515625, -0.5931396484375, -0.42449951171875, -0.255859375, -0.08721923828125, 0.0814208984375, 0.25006103515625, 0.418701171875, 0.58734130859375, 0.7559814453125, 0.92462158203125, 1.09326171875, 1.26190185546875, 1.4305419921875, 1.59918212890625, 1.767822265625, 1.93646240234375, 2.1051025390625, 2.27374267578125, 2.4423828125, 2.61102294921875, 2.7796630859375, 2.94830322265625, 3.116943359375, 3.28558349609375, 3.4542236328125, 3.62286376953125, 3.79150390625, 3.96014404296875, 4.1287841796875, 4.29742431640625, 4.466064453125, 4.63470458984375, 4.8033447265625, 4.97198486328125, 5.140625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 4.0, 5.0, 8.0, 17.0, 19.0, 19.0, 19.0, 42.0, 36.0, 48.0, 48.0, 55.0, 85.0, 80.0, 51.0, 71.0, 72.0, 57.0, 29.0, 66.0, 42.0, 22.0, 22.0, 21.0, 14.0, 8.0, 8.0, 5.0, 4.0, 2.0, 3.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.086669921875, -7.80615234375, -7.525634765625, -7.2451171875, -6.964599609375, -6.68408203125, -6.403564453125, -6.123046875, -5.842529296875, -5.56201171875, -5.281494140625, -5.0009765625, -4.720458984375, -4.43994140625, -4.159423828125, -3.87890625, -3.598388671875, -3.31787109375, -3.037353515625, -2.7568359375, -2.476318359375, -2.19580078125, -1.915283203125, -1.634765625, -1.354248046875, -1.07373046875, -0.793212890625, -0.5126953125, -0.232177734375, 0.04833984375, 0.328857421875, 0.609375, 0.889892578125, 1.17041015625, 1.450927734375, 1.7314453125, 2.011962890625, 2.29248046875, 2.572998046875, 2.853515625, 3.134033203125, 3.41455078125, 3.695068359375, 3.9755859375, 4.256103515625, 4.53662109375, 4.817138671875, 5.09765625, 5.378173828125, 5.65869140625, 5.939208984375, 6.2197265625, 6.500244140625, 6.78076171875, 7.061279296875, 7.341796875, 7.622314453125, 7.90283203125, 8.183349609375, 8.4638671875, 8.744384765625, 9.02490234375, 9.305419921875, 9.5859375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 10.0, 4.0, 6.0, 7.0, 9.0, 8.0, 22.0, 22.0, 40.0, 70.0, 107.0, 199.0, 364.0, 775.0, 1733.0, 4510.0, 14810.0, 70309.0, 711633.0, 199479.0, 31303.0, 8079.0, 2723.0, 1138.0, 536.0, 294.0, 118.0, 81.0, 43.0, 29.0, 29.0, 19.0, 11.0, 12.0, 12.0, 1.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.890625, -1.8362274169921875, -1.781829833984375, -1.7274322509765625, -1.67303466796875, -1.6186370849609375, -1.564239501953125, -1.5098419189453125, -1.4554443359375, -1.4010467529296875, -1.346649169921875, -1.2922515869140625, -1.23785400390625, -1.1834564208984375, -1.129058837890625, -1.0746612548828125, -1.020263671875, -0.9658660888671875, -0.911468505859375, -0.8570709228515625, -0.80267333984375, -0.7482757568359375, -0.693878173828125, -0.6394805908203125, -0.5850830078125, -0.5306854248046875, -0.476287841796875, -0.4218902587890625, -0.36749267578125, -0.3130950927734375, -0.258697509765625, -0.2042999267578125, -0.14990234375, -0.0955047607421875, -0.041107177734375, 0.0132904052734375, 0.06768798828125, 0.1220855712890625, 0.176483154296875, 0.2308807373046875, 0.2852783203125, 0.3396759033203125, 0.394073486328125, 0.4484710693359375, 0.50286865234375, 0.5572662353515625, 0.611663818359375, 0.6660614013671875, 0.720458984375, 0.7748565673828125, 0.829254150390625, 0.8836517333984375, 0.93804931640625, 0.9924468994140625, 1.046844482421875, 1.1012420654296875, 1.1556396484375, 1.2100372314453125, 1.264434814453125, 1.3188323974609375, 1.37322998046875, 1.4276275634765625, 1.482025146484375, 1.5364227294921875, 1.5908203125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 7.0, 4.0, 7.0, 7.0, 14.0, 15.0, 18.0, 16.0, 23.0, 30.0, 38.0, 42.0, 61.0, 89.0, 109.0, 116.0, 58.0, 62.0, 51.0, 45.0, 30.0, 27.0, 26.0, 20.0, 15.0, 12.0, 9.0, 8.0, 10.0, 2.0, 7.0, 1.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.000377655029296875, -0.0003658384084701538, -0.0003540217876434326, -0.0003422051668167114, -0.00033038854598999023, -0.00031857192516326904, -0.00030675530433654785, -0.00029493868350982666, -0.00028312206268310547, -0.0002713054418563843, -0.0002594888210296631, -0.0002476722002029419, -0.0002358555793762207, -0.0002240389585494995, -0.00021222233772277832, -0.00020040571689605713, -0.00018858909606933594, -0.00017677247524261475, -0.00016495585441589355, -0.00015313923358917236, -0.00014132261276245117, -0.00012950599193572998, -0.00011768937110900879, -0.0001058727502822876, -9.40561294555664e-05, -8.223950862884521e-05, -7.042288780212402e-05, -5.860626697540283e-05, -4.678964614868164e-05, -3.497302532196045e-05, -2.3156404495239258e-05, -1.1339783668518066e-05, 4.76837158203125e-07, 1.2293457984924316e-05, 2.4110078811645508e-05, 3.59266996383667e-05, 4.774332046508789e-05, 5.955994129180908e-05, 7.137656211853027e-05, 8.319318294525146e-05, 9.500980377197266e-05, 0.00010682642459869385, 0.00011864304542541504, 0.00013045966625213623, 0.00014227628707885742, 0.0001540929079055786, 0.0001659095287322998, 0.000177726149559021, 0.0001895427703857422, 0.00020135939121246338, 0.00021317601203918457, 0.00022499263286590576, 0.00023680925369262695, 0.00024862587451934814, 0.00026044249534606934, 0.00027225911617279053, 0.0002840757369995117, 0.0002958923578262329, 0.0003077089786529541, 0.0003195255994796753, 0.0003313422203063965, 0.0003431588411331177, 0.00035497546195983887, 0.00036679208278656006, 0.00037860870361328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 12.0, 19.0, 20.0, 45.0, 83.0, 167.0, 369.0, 926.0, 2391.0, 9547.0, 65838.0, 820394.0, 128067.0, 15056.0, 3490.0, 1136.0, 491.0, 236.0, 112.0, 53.0, 42.0, 15.0, 11.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.515625, -2.43853759765625, -2.3614501953125, -2.28436279296875, -2.207275390625, -2.13018798828125, -2.0531005859375, -1.97601318359375, -1.89892578125, -1.82183837890625, -1.7447509765625, -1.66766357421875, -1.590576171875, -1.51348876953125, -1.4364013671875, -1.35931396484375, -1.2822265625, -1.20513916015625, -1.1280517578125, -1.05096435546875, -0.973876953125, -0.89678955078125, -0.8197021484375, -0.74261474609375, -0.66552734375, -0.58843994140625, -0.5113525390625, -0.43426513671875, -0.357177734375, -0.28009033203125, -0.2030029296875, -0.12591552734375, -0.048828125, 0.02825927734375, 0.1053466796875, 0.18243408203125, 0.259521484375, 0.33660888671875, 0.4136962890625, 0.49078369140625, 0.56787109375, 0.64495849609375, 0.7220458984375, 0.79913330078125, 0.876220703125, 0.95330810546875, 1.0303955078125, 1.10748291015625, 1.1845703125, 1.26165771484375, 1.3387451171875, 1.41583251953125, 1.492919921875, 1.57000732421875, 1.6470947265625, 1.72418212890625, 1.80126953125, 1.87835693359375, 1.9554443359375, 2.03253173828125, 2.109619140625, 2.18670654296875, 2.2637939453125, 2.34088134765625, 2.41796875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 5.0, 5.0, 2.0, 2.0, 4.0, 9.0, 8.0, 9.0, 9.0, 14.0, 19.0, 14.0, 22.0, 21.0, 35.0, 47.0, 73.0, 83.0, 89.0, 84.0, 90.0, 77.0, 61.0, 47.0, 38.0, 26.0, 18.0, 11.0, 14.0, 11.0, 11.0, 5.0, 5.0, 3.0, 6.0, 9.0, 2.0, 6.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0927734375, -1.049530029296875, -1.00628662109375, -0.963043212890625, -0.9197998046875, -0.876556396484375, -0.83331298828125, -0.790069580078125, -0.746826171875, -0.703582763671875, -0.66033935546875, -0.617095947265625, -0.5738525390625, -0.530609130859375, -0.48736572265625, -0.444122314453125, -0.40087890625, -0.357635498046875, -0.31439208984375, -0.271148681640625, -0.2279052734375, -0.184661865234375, -0.14141845703125, -0.098175048828125, -0.054931640625, -0.011688232421875, 0.03155517578125, 0.074798583984375, 0.1180419921875, 0.161285400390625, 0.20452880859375, 0.247772216796875, 0.291015625, 0.334259033203125, 0.37750244140625, 0.420745849609375, 0.4639892578125, 0.507232666015625, 0.55047607421875, 0.593719482421875, 0.636962890625, 0.680206298828125, 0.72344970703125, 0.766693115234375, 0.8099365234375, 0.853179931640625, 0.89642333984375, 0.939666748046875, 0.98291015625, 1.026153564453125, 1.06939697265625, 1.112640380859375, 1.1558837890625, 1.199127197265625, 1.24237060546875, 1.285614013671875, 1.328857421875, 1.372100830078125, 1.41534423828125, 1.458587646484375, 1.5018310546875, 1.545074462890625, 1.58831787109375, 1.631561279296875, 1.6748046875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 2.0, 6.0, 3.0, 26.0, 39.0, 99.0, 209.0, 354.0, 130.0, 67.0, 39.0, 18.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-86.04781341552734, -84.3418197631836, -82.63583374023438, -80.92984008789062, -79.2238540649414, -77.51786041259766, -75.81187438964844, -74.10588073730469, -72.39988708496094, -70.69389343261719, -68.98790740966797, -67.28191375732422, -65.575927734375, -63.86993408203125, -62.163944244384766, -60.45795440673828, -58.75196838378906, -57.04597854614258, -55.339988708496094, -53.63399887084961, -51.928009033203125, -50.222015380859375, -48.51602554321289, -46.810035705566406, -45.10404586791992, -43.39805603027344, -41.69206619262695, -39.98607635498047, -38.28008270263672, -36.5740966796875, -34.86810302734375, -33.162113189697266, -31.45612335205078, -29.750133514404297, -28.044143676757812, -26.338151931762695, -24.63216209411621, -22.926172256469727, -21.22018051147461, -19.514190673828125, -17.80820083618164, -16.102210998535156, -14.396220207214355, -12.690229415893555, -10.98423957824707, -9.278249740600586, -7.572258949279785, -5.866268157958984, -4.1602783203125, -2.4542880058288574, -0.7482976913452148, 0.9576926231384277, 2.6636829376220703, 4.369672775268555, 6.0756635665893555, 7.781654357910156, 9.48764419555664, 11.193634033203125, 12.899624824523926, 14.605615615844727, 16.31160545349121, 18.017595291137695, 19.723587036132812, 21.429576873779297, 23.13556671142578]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 2.0, 7.0, 3.0, 3.0, 5.0, 8.0, 11.0, 11.0, 10.0, 7.0, 16.0, 15.0, 22.0, 16.0, 23.0, 15.0, 28.0, 20.0, 28.0, 33.0, 62.0, 66.0, 89.0, 99.0, 58.0, 43.0, 38.0, 31.0, 35.0, 24.0, 19.0, 19.0, 18.0, 15.0, 13.0, 9.0, 14.0, 17.0, 8.0, 4.0, 3.0, 8.0, 6.0, 5.0, 6.0, 2.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-28.702878952026367, -27.878311157226562, -27.053741455078125, -26.22917366027832, -25.404605865478516, -24.580036163330078, -23.755468368530273, -22.93090057373047, -22.10633087158203, -21.281763076782227, -20.45719337463379, -19.632625579833984, -18.80805778503418, -17.983489990234375, -17.158920288085938, -16.334352493286133, -15.509784698486328, -14.685215950012207, -13.860648155212402, -13.036079406738281, -12.211511611938477, -11.386942863464355, -10.562374114990234, -9.73780632019043, -8.913237571716309, -8.088668823242188, -7.264101028442383, -6.439532279968262, -5.614964008331299, -4.790395736694336, -3.965826988220215, -3.141258716583252, -2.3166885375976562, -1.4921201467514038, -0.6675517559051514, 0.15701675415039062, 0.9815850257873535, 1.8061532974243164, 2.6307220458984375, 3.4552903175354004, 4.279858589172363, 5.104426860809326, 5.928995132446289, 6.75356388092041, 7.578132152557373, 8.402700424194336, 9.227269172668457, 10.051837921142578, 10.876405715942383, 11.700974464416504, 12.525542259216309, 13.35011100769043, 14.174678802490234, 14.999247550964355, 15.823816299438477, 16.64838409423828, 17.47295379638672, 18.297521591186523, 19.12209129333496, 19.946659088134766, 20.77122688293457, 21.595794677734375, 22.420364379882812, 23.244932174682617, 24.069499969482422]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 10.0, 13.0, 12.0, 26.0, 35.0, 62.0, 77.0, 135.0, 222.0, 468.0, 858.0, 1758.0, 4219.0, 11740.0, 48943.0, 363203.0, 2542417.0, 1073336.0, 112902.0, 21972.0, 6603.0, 2653.0, 1226.0, 594.0, 305.0, 169.0, 121.0, 70.0, 48.0, 36.0, 15.0, 10.0, 5.0, 7.0, 6.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.076171875, -2.98760986328125, -2.8990478515625, -2.81048583984375, -2.721923828125, -2.63336181640625, -2.5447998046875, -2.45623779296875, -2.36767578125, -2.27911376953125, -2.1905517578125, -2.10198974609375, -2.013427734375, -1.92486572265625, -1.8363037109375, -1.74774169921875, -1.6591796875, -1.57061767578125, -1.4820556640625, -1.39349365234375, -1.304931640625, -1.21636962890625, -1.1278076171875, -1.03924560546875, -0.95068359375, -0.86212158203125, -0.7735595703125, -0.68499755859375, -0.596435546875, -0.50787353515625, -0.4193115234375, -0.33074951171875, -0.2421875, -0.15362548828125, -0.0650634765625, 0.02349853515625, 0.112060546875, 0.20062255859375, 0.2891845703125, 0.37774658203125, 0.46630859375, 0.55487060546875, 0.6434326171875, 0.73199462890625, 0.820556640625, 0.90911865234375, 0.9976806640625, 1.08624267578125, 1.1748046875, 1.26336669921875, 1.3519287109375, 1.44049072265625, 1.529052734375, 1.61761474609375, 1.7061767578125, 1.79473876953125, 1.88330078125, 1.97186279296875, 2.0604248046875, 2.14898681640625, 2.237548828125, 2.32611083984375, 2.4146728515625, 2.50323486328125, 2.591796875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 0.0, 4.0, 7.0, 9.0, 9.0, 12.0, 15.0, 22.0, 27.0, 32.0, 33.0, 35.0, 45.0, 42.0, 46.0, 45.0, 57.0, 57.0, 49.0, 56.0, 44.0, 57.0, 47.0, 46.0, 33.0, 28.0, 19.0, 33.0, 16.0, 11.0, 16.0, 8.0, 6.0, 13.0, 7.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8955078125, -1.83807373046875, -1.7806396484375, -1.72320556640625, -1.665771484375, -1.60833740234375, -1.5509033203125, -1.49346923828125, -1.43603515625, -1.37860107421875, -1.3211669921875, -1.26373291015625, -1.206298828125, -1.14886474609375, -1.0914306640625, -1.03399658203125, -0.9765625, -0.91912841796875, -0.8616943359375, -0.80426025390625, -0.746826171875, -0.68939208984375, -0.6319580078125, -0.57452392578125, -0.51708984375, -0.45965576171875, -0.4022216796875, -0.34478759765625, -0.287353515625, -0.22991943359375, -0.1724853515625, -0.11505126953125, -0.0576171875, -0.00018310546875, 0.0572509765625, 0.11468505859375, 0.172119140625, 0.22955322265625, 0.2869873046875, 0.34442138671875, 0.40185546875, 0.45928955078125, 0.5167236328125, 0.57415771484375, 0.631591796875, 0.68902587890625, 0.7464599609375, 0.80389404296875, 0.861328125, 0.91876220703125, 0.9761962890625, 1.03363037109375, 1.091064453125, 1.14849853515625, 1.2059326171875, 1.26336669921875, 1.32080078125, 1.37823486328125, 1.4356689453125, 1.49310302734375, 1.550537109375, 1.60797119140625, 1.6654052734375, 1.72283935546875, 1.7802734375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 10.0, 11.0, 15.0, 16.0, 30.0, 56.0, 107.0, 146.0, 245.0, 672.0, 2636.0, 17986.0, 1899723.0, 2249579.0, 19193.0, 2559.0, 696.0, 264.0, 132.0, 72.0, 62.0, 28.0, 15.0, 9.0, 7.0, 8.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4921875, -7.192626953125, -6.89306640625, -6.593505859375, -6.2939453125, -5.994384765625, -5.69482421875, -5.395263671875, -5.095703125, -4.796142578125, -4.49658203125, -4.197021484375, -3.8974609375, -3.597900390625, -3.29833984375, -2.998779296875, -2.69921875, -2.399658203125, -2.10009765625, -1.800537109375, -1.5009765625, -1.201416015625, -0.90185546875, -0.602294921875, -0.302734375, -0.003173828125, 0.29638671875, 0.595947265625, 0.8955078125, 1.195068359375, 1.49462890625, 1.794189453125, 2.09375, 2.393310546875, 2.69287109375, 2.992431640625, 3.2919921875, 3.591552734375, 3.89111328125, 4.190673828125, 4.490234375, 4.789794921875, 5.08935546875, 5.388916015625, 5.6884765625, 5.988037109375, 6.28759765625, 6.587158203125, 6.88671875, 7.186279296875, 7.48583984375, 7.785400390625, 8.0849609375, 8.384521484375, 8.68408203125, 8.983642578125, 9.283203125, 9.582763671875, 9.88232421875, 10.181884765625, 10.4814453125, 10.781005859375, 11.08056640625, 11.380126953125, 11.6796875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 14.0, 20.0, 43.0, 58.0, 158.0, 452.0, 1371.0, 1210.0, 438.0, 168.0, 69.0, 30.0, 16.0, 9.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2734375, -13.95599365234375, -13.6385498046875, -13.32110595703125, -13.003662109375, -12.68621826171875, -12.3687744140625, -12.05133056640625, -11.73388671875, -11.41644287109375, -11.0989990234375, -10.78155517578125, -10.464111328125, -10.14666748046875, -9.8292236328125, -9.51177978515625, -9.1943359375, -8.87689208984375, -8.5594482421875, -8.24200439453125, -7.924560546875, -7.60711669921875, -7.2896728515625, -6.97222900390625, -6.65478515625, -6.33734130859375, -6.0198974609375, -5.70245361328125, -5.385009765625, -5.06756591796875, -4.7501220703125, -4.43267822265625, -4.115234375, -3.79779052734375, -3.4803466796875, -3.16290283203125, -2.845458984375, -2.52801513671875, -2.2105712890625, -1.89312744140625, -1.57568359375, -1.25823974609375, -0.9407958984375, -0.62335205078125, -0.305908203125, 0.01153564453125, 0.3289794921875, 0.64642333984375, 0.9638671875, 1.28131103515625, 1.5987548828125, 1.91619873046875, 2.233642578125, 2.55108642578125, 2.8685302734375, 3.18597412109375, 3.50341796875, 3.82086181640625, 4.1383056640625, 4.45574951171875, 4.773193359375, 5.09063720703125, 5.4080810546875, 5.72552490234375, 6.04296875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 10.0, 9.0, 12.0, 37.0, 69.0, 128.0, 166.0, 227.0, 150.0, 88.0, 45.0, 21.0, 20.0, 16.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.141845703125, -32.614219665527344, -31.086591720581055, -29.558963775634766, -28.03133773803711, -26.50370979309082, -24.97608184814453, -23.448455810546875, -21.920827865600586, -20.393199920654297, -18.86557388305664, -17.33794593811035, -15.810318946838379, -14.282691955566406, -12.755064010620117, -11.227437019348145, -9.699810028076172, -8.1721830368042, -6.644555568695068, -5.1169281005859375, -3.589301109313965, -2.061674118041992, -0.5340461730957031, 0.9935808181762695, 2.521207809448242, 4.048834800720215, 5.576462268829346, 7.104089736938477, 8.63171672821045, 10.159343719482422, 11.686971664428711, 13.214598655700684, 14.742225646972656, 16.269853591918945, 17.7974796295166, 19.32510757446289, 20.852733612060547, 22.380361557006836, 23.907989501953125, 25.43561553955078, 26.96324348449707, 28.49087142944336, 30.018497467041016, 31.546125411987305, 33.073753356933594, 34.60137939453125, 36.129005432128906, 37.65663528442383, 39.184261322021484, 40.71188735961914, 42.23951721191406, 43.76714324951172, 45.294769287109375, 46.82239532470703, 48.35002517700195, 49.87765121459961, 51.40528106689453, 52.93290710449219, 54.46053695678711, 55.988162994384766, 57.51578903198242, 59.043418884277344, 60.571044921875, 62.098670959472656, 63.62629699707031]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 8.0, 9.0, 4.0, 9.0, 18.0, 12.0, 14.0, 35.0, 39.0, 32.0, 49.0, 57.0, 52.0, 54.0, 52.0, 66.0, 60.0, 48.0, 55.0, 53.0, 49.0, 42.0, 36.0, 27.0, 28.0, 17.0, 25.0, 13.0, 9.0, 2.0, 13.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.66283416748047, -28.812519073486328, -27.96220588684082, -27.11189079284668, -26.261577606201172, -25.41126251220703, -24.56094741821289, -23.71063232421875, -22.860319137573242, -22.0100040435791, -21.159690856933594, -20.309375762939453, -19.459060668945312, -18.608747482299805, -17.758432388305664, -16.908119201660156, -16.057804107666016, -15.207489967346191, -14.357175827026367, -13.506860733032227, -12.656546592712402, -11.806232452392578, -10.955917358398438, -10.105603218078613, -9.255289077758789, -8.404974937438965, -7.554660320281982, -6.704345703125, -5.854031562805176, -5.003717422485352, -4.153402805328369, -3.3030881881713867, -2.4527721405029297, -1.6024577617645264, -0.752143383026123, 0.09817099571228027, 0.9484853744506836, 1.7987995147705078, 2.6491141319274902, 3.4994287490844727, 4.349742889404297, 5.200057029724121, 6.0503716468811035, 6.900686264038086, 7.75100040435791, 8.601314544677734, 9.451629638671875, 10.3019437789917, 11.152257919311523, 12.002572059631348, 12.852886199951172, 13.703201293945312, 14.553515434265137, 15.403829574584961, 16.2541446685791, 17.10445785522461, 17.95477294921875, 18.80508804321289, 19.6554012298584, 20.50571632385254, 21.356029510498047, 22.206344604492188, 23.056659698486328, 23.90697479248047, 24.757287979125977]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 4.0, 3.0, 8.0, 8.0, 11.0, 14.0, 22.0, 33.0, 40.0, 50.0, 71.0, 108.0, 149.0, 249.0, 386.0, 662.0, 1126.0, 1887.0, 3181.0, 5960.0, 11727.0, 25123.0, 59925.0, 160916.0, 385981.0, 239062.0, 84880.0, 34124.0, 15499.0, 7502.0, 4080.0, 2283.0, 1306.0, 789.0, 454.0, 308.0, 195.0, 118.0, 93.0, 59.0, 50.0, 31.0, 18.0, 17.0, 16.0, 6.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-3.048828125, -2.952606201171875, -2.85638427734375, -2.760162353515625, -2.6639404296875, -2.567718505859375, -2.47149658203125, -2.375274658203125, -2.279052734375, -2.182830810546875, -2.08660888671875, -1.990386962890625, -1.8941650390625, -1.797943115234375, -1.70172119140625, -1.605499267578125, -1.50927734375, -1.413055419921875, -1.31683349609375, -1.220611572265625, -1.1243896484375, -1.028167724609375, -0.93194580078125, -0.835723876953125, -0.739501953125, -0.643280029296875, -0.54705810546875, -0.450836181640625, -0.3546142578125, -0.258392333984375, -0.16217041015625, -0.065948486328125, 0.0302734375, 0.126495361328125, 0.22271728515625, 0.318939208984375, 0.4151611328125, 0.511383056640625, 0.60760498046875, 0.703826904296875, 0.800048828125, 0.896270751953125, 0.99249267578125, 1.088714599609375, 1.1849365234375, 1.281158447265625, 1.37738037109375, 1.473602294921875, 1.56982421875, 1.666046142578125, 1.76226806640625, 1.858489990234375, 1.9547119140625, 2.050933837890625, 2.14715576171875, 2.243377685546875, 2.339599609375, 2.435821533203125, 2.53204345703125, 2.628265380859375, 2.7244873046875, 2.820709228515625, 2.91693115234375, 3.013153076171875, 3.109375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 7.0, 4.0, 2.0, 8.0, 14.0, 7.0, 12.0, 11.0, 16.0, 13.0, 23.0, 16.0, 24.0, 31.0, 27.0, 25.0, 42.0, 47.0, 40.0, 49.0, 49.0, 41.0, 46.0, 38.0, 43.0, 42.0, 44.0, 37.0, 30.0, 27.0, 32.0, 23.0, 22.0, 25.0, 12.0, 12.0, 10.0, 15.0, 6.0, 6.0, 3.0, 4.0, 8.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-1.6181640625, -1.5685882568359375, -1.519012451171875, -1.4694366455078125, -1.41986083984375, -1.3702850341796875, -1.320709228515625, -1.2711334228515625, -1.2215576171875, -1.1719818115234375, -1.122406005859375, -1.0728302001953125, -1.02325439453125, -0.9736785888671875, -0.924102783203125, -0.8745269775390625, -0.824951171875, -0.7753753662109375, -0.725799560546875, -0.6762237548828125, -0.62664794921875, -0.5770721435546875, -0.527496337890625, -0.4779205322265625, -0.4283447265625, -0.3787689208984375, -0.329193115234375, -0.2796173095703125, -0.23004150390625, -0.1804656982421875, -0.130889892578125, -0.0813140869140625, -0.03173828125, 0.0178375244140625, 0.067413330078125, 0.1169891357421875, 0.16656494140625, 0.2161407470703125, 0.265716552734375, 0.3152923583984375, 0.3648681640625, 0.4144439697265625, 0.464019775390625, 0.5135955810546875, 0.56317138671875, 0.6127471923828125, 0.662322998046875, 0.7118988037109375, 0.761474609375, 0.8110504150390625, 0.860626220703125, 0.9102020263671875, 0.95977783203125, 1.0093536376953125, 1.058929443359375, 1.1085052490234375, 1.1580810546875, 1.2076568603515625, 1.257232666015625, 1.3068084716796875, 1.35638427734375, 1.4059600830078125, 1.455535888671875, 1.5051116943359375, 1.5546875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 8.0, 3.0, 6.0, 12.0, 14.0, 13.0, 24.0, 30.0, 42.0, 69.0, 98.0, 125.0, 207.0, 262.0, 514.0, 888.0, 1780.0, 4362.0, 17872.0, 116665.0, 792279.0, 90723.0, 14556.0, 4045.0, 1635.0, 871.0, 469.0, 321.0, 214.0, 143.0, 75.0, 72.0, 46.0, 27.0, 28.0, 12.0, 20.0, 9.0, 2.0, 2.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.0078125, -5.8226318359375, -5.637451171875, -5.4522705078125, -5.26708984375, -5.0819091796875, -4.896728515625, -4.7115478515625, -4.5263671875, -4.3411865234375, -4.156005859375, -3.9708251953125, -3.78564453125, -3.6004638671875, -3.415283203125, -3.2301025390625, -3.044921875, -2.8597412109375, -2.674560546875, -2.4893798828125, -2.30419921875, -2.1190185546875, -1.933837890625, -1.7486572265625, -1.5634765625, -1.3782958984375, -1.193115234375, -1.0079345703125, -0.82275390625, -0.6375732421875, -0.452392578125, -0.2672119140625, -0.08203125, 0.1031494140625, 0.288330078125, 0.4735107421875, 0.65869140625, 0.8438720703125, 1.029052734375, 1.2142333984375, 1.3994140625, 1.5845947265625, 1.769775390625, 1.9549560546875, 2.14013671875, 2.3253173828125, 2.510498046875, 2.6956787109375, 2.880859375, 3.0660400390625, 3.251220703125, 3.4364013671875, 3.62158203125, 3.8067626953125, 3.991943359375, 4.1771240234375, 4.3623046875, 4.5474853515625, 4.732666015625, 4.9178466796875, 5.10302734375, 5.2882080078125, 5.473388671875, 5.6585693359375, 5.84375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 5.0, 5.0, 6.0, 8.0, 7.0, 15.0, 18.0, 12.0, 27.0, 32.0, 30.0, 35.0, 43.0, 61.0, 59.0, 79.0, 61.0, 63.0, 60.0, 53.0, 53.0, 48.0, 42.0, 30.0, 31.0, 25.0, 22.0, 21.0, 12.0, 5.0, 12.0, 5.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-8.3203125, -8.088134765625, -7.85595703125, -7.623779296875, -7.3916015625, -7.159423828125, -6.92724609375, -6.695068359375, -6.462890625, -6.230712890625, -5.99853515625, -5.766357421875, -5.5341796875, -5.302001953125, -5.06982421875, -4.837646484375, -4.60546875, -4.373291015625, -4.14111328125, -3.908935546875, -3.6767578125, -3.444580078125, -3.21240234375, -2.980224609375, -2.748046875, -2.515869140625, -2.28369140625, -2.051513671875, -1.8193359375, -1.587158203125, -1.35498046875, -1.122802734375, -0.890625, -0.658447265625, -0.42626953125, -0.194091796875, 0.0380859375, 0.270263671875, 0.50244140625, 0.734619140625, 0.966796875, 1.198974609375, 1.43115234375, 1.663330078125, 1.8955078125, 2.127685546875, 2.35986328125, 2.592041015625, 2.82421875, 3.056396484375, 3.28857421875, 3.520751953125, 3.7529296875, 3.985107421875, 4.21728515625, 4.449462890625, 4.681640625, 4.913818359375, 5.14599609375, 5.378173828125, 5.6103515625, 5.842529296875, 6.07470703125, 6.306884765625, 6.5390625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 8.0, 12.0, 14.0, 14.0, 18.0, 19.0, 23.0, 46.0, 60.0, 102.0, 119.0, 170.0, 301.0, 497.0, 782.0, 1532.0, 3062.0, 7242.0, 19952.0, 67257.0, 522795.0, 325879.0, 65581.0, 19464.0, 7148.0, 2928.0, 1430.0, 793.0, 443.0, 268.0, 183.0, 117.0, 84.0, 53.0, 41.0, 37.0, 18.0, 9.0, 13.0, 14.0, 7.0, 4.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.013671875, -0.9838485717773438, -0.9540252685546875, -0.9242019653320312, -0.894378662109375, -0.8645553588867188, -0.8347320556640625, -0.8049087524414062, -0.77508544921875, -0.7452621459960938, -0.7154388427734375, -0.6856155395507812, -0.655792236328125, -0.6259689331054688, -0.5961456298828125, -0.5663223266601562, -0.5364990234375, -0.5066757202148438, -0.4768524169921875, -0.44702911376953125, -0.417205810546875, -0.38738250732421875, -0.3575592041015625, -0.32773590087890625, -0.29791259765625, -0.26808929443359375, -0.2382659912109375, -0.20844268798828125, -0.178619384765625, -0.14879608154296875, -0.1189727783203125, -0.08914947509765625, -0.059326171875, -0.02950286865234375, 0.0003204345703125, 0.03014373779296875, 0.059967041015625, 0.08979034423828125, 0.1196136474609375, 0.14943695068359375, 0.17926025390625, 0.20908355712890625, 0.2389068603515625, 0.26873016357421875, 0.298553466796875, 0.32837677001953125, 0.3582000732421875, 0.38802337646484375, 0.4178466796875, 0.44766998291015625, 0.4774932861328125, 0.5073165893554688, 0.537139892578125, 0.5669631958007812, 0.5967864990234375, 0.6266098022460938, 0.65643310546875, 0.6862564086914062, 0.7160797119140625, 0.7459030151367188, 0.775726318359375, 0.8055496215820312, 0.8353729248046875, 0.8651962280273438, 0.89501953125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 3.0, 7.0, 4.0, 10.0, 14.0, 14.0, 22.0, 27.0, 37.0, 46.0, 80.0, 94.0, 125.0, 137.0, 103.0, 77.0, 51.0, 39.0, 35.0, 25.0, 17.0, 10.0, 6.0, 8.0, 5.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00064849853515625, -0.0006305426359176636, -0.0006125867366790771, -0.0005946308374404907, -0.0005766749382019043, -0.0005587190389633179, -0.0005407631397247314, -0.000522807240486145, -0.0005048513412475586, -0.00048689544200897217, -0.00046893954277038574, -0.0004509836435317993, -0.0004330277442932129, -0.00041507184505462646, -0.00039711594581604004, -0.0003791600465774536, -0.0003612041473388672, -0.00034324824810028076, -0.00032529234886169434, -0.0003073364496231079, -0.0002893805503845215, -0.00027142465114593506, -0.00025346875190734863, -0.0002355128526687622, -0.00021755695343017578, -0.00019960105419158936, -0.00018164515495300293, -0.0001636892557144165, -0.00014573335647583008, -0.00012777745723724365, -0.00010982155799865723, -9.18656587600708e-05, -7.390975952148438e-05, -5.595386028289795e-05, -3.7997961044311523e-05, -2.0042061805725098e-05, -2.086162567138672e-06, 1.5869736671447754e-05, 3.382563591003418e-05, 5.1781535148620605e-05, 6.973743438720703e-05, 8.769333362579346e-05, 0.00010564923286437988, 0.0001236051321029663, 0.00014156103134155273, 0.00015951693058013916, 0.00017747282981872559, 0.000195428729057312, 0.00021338462829589844, 0.00023134052753448486, 0.0002492964267730713, 0.0002672523260116577, 0.00028520822525024414, 0.00030316412448883057, 0.000321120023727417, 0.0003390759229660034, 0.00035703182220458984, 0.00037498772144317627, 0.0003929436206817627, 0.0004108995199203491, 0.00042885541915893555, 0.00044681131839752197, 0.0004647672176361084, 0.0004827231168746948, 0.0005006790161132812]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 7.0, 4.0, 9.0, 6.0, 5.0, 15.0, 21.0, 30.0, 27.0, 40.0, 46.0, 65.0, 97.0, 129.0, 185.0, 289.0, 451.0, 835.0, 1533.0, 3181.0, 7632.0, 21764.0, 75868.0, 588657.0, 257575.0, 59543.0, 17666.0, 6487.0, 2785.0, 1433.0, 775.0, 463.0, 273.0, 184.0, 117.0, 78.0, 88.0, 44.0, 38.0, 23.0, 15.0, 14.0, 9.0, 17.0, 8.0, 11.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0], "bins": [-1.0322265625, -1.0008621215820312, -0.9694976806640625, -0.9381332397460938, -0.906768798828125, -0.8754043579101562, -0.8440399169921875, -0.8126754760742188, -0.78131103515625, -0.7499465942382812, -0.7185821533203125, -0.6872177124023438, -0.655853271484375, -0.6244888305664062, -0.5931243896484375, -0.5617599487304688, -0.5303955078125, -0.49903106689453125, -0.4676666259765625, -0.43630218505859375, -0.404937744140625, -0.37357330322265625, -0.3422088623046875, -0.31084442138671875, -0.27947998046875, -0.24811553955078125, -0.2167510986328125, -0.18538665771484375, -0.154022216796875, -0.12265777587890625, -0.0912933349609375, -0.05992889404296875, -0.028564453125, 0.00279998779296875, 0.0341644287109375, 0.06552886962890625, 0.096893310546875, 0.12825775146484375, 0.1596221923828125, 0.19098663330078125, 0.22235107421875, 0.25371551513671875, 0.2850799560546875, 0.31644439697265625, 0.347808837890625, 0.37917327880859375, 0.4105377197265625, 0.44190216064453125, 0.4732666015625, 0.5046310424804688, 0.5359954833984375, 0.5673599243164062, 0.598724365234375, 0.6300888061523438, 0.6614532470703125, 0.6928176879882812, 0.72418212890625, 0.7555465698242188, 0.7869110107421875, 0.8182754516601562, 0.849639892578125, 0.8810043334960938, 0.9123687744140625, 0.9437332153320312, 0.97509765625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 10.0, 17.0, 20.0, 19.0, 36.0, 40.0, 51.0, 84.0, 90.0, 116.0, 120.0, 91.0, 75.0, 55.0, 46.0, 33.0, 15.0, 13.0, 11.0, 16.0, 7.0, 9.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.5927734375, -1.5519256591796875, -1.511077880859375, -1.4702301025390625, -1.42938232421875, -1.3885345458984375, -1.347686767578125, -1.3068389892578125, -1.2659912109375, -1.2251434326171875, -1.184295654296875, -1.1434478759765625, -1.10260009765625, -1.0617523193359375, -1.020904541015625, -0.9800567626953125, -0.939208984375, -0.8983612060546875, -0.857513427734375, -0.8166656494140625, -0.77581787109375, -0.7349700927734375, -0.694122314453125, -0.6532745361328125, -0.6124267578125, -0.5715789794921875, -0.530731201171875, -0.4898834228515625, -0.44903564453125, -0.4081878662109375, -0.367340087890625, -0.3264923095703125, -0.28564453125, -0.2447967529296875, -0.203948974609375, -0.1631011962890625, -0.12225341796875, -0.0814056396484375, -0.040557861328125, 0.0002899169921875, 0.0411376953125, 0.0819854736328125, 0.122833251953125, 0.1636810302734375, 0.20452880859375, 0.2453765869140625, 0.286224365234375, 0.3270721435546875, 0.367919921875, 0.4087677001953125, 0.449615478515625, 0.4904632568359375, 0.53131103515625, 0.5721588134765625, 0.613006591796875, 0.6538543701171875, 0.6947021484375, 0.7355499267578125, 0.776397705078125, 0.8172454833984375, 0.85809326171875, 0.8989410400390625, 0.939788818359375, 0.9806365966796875, 1.021484375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 2.0, 7.0, 11.0, 28.0, 29.0, 57.0, 80.0, 108.0, 344.0, 147.0, 74.0, 54.0, 27.0, 10.0, 7.0, 4.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-51.98194122314453, -50.912879943847656, -49.84382247924805, -48.77476501464844, -47.70570373535156, -46.63664245605469, -45.56758499145508, -44.49852752685547, -43.429466247558594, -42.36040496826172, -41.29134750366211, -40.2222900390625, -39.153228759765625, -38.08416748046875, -37.01511001586914, -35.94605255126953, -34.876991271972656, -33.80792999267578, -32.73887252807617, -31.66981315612793, -30.600753784179688, -29.531694412231445, -28.462635040283203, -27.39357566833496, -26.32451629638672, -25.255456924438477, -24.186397552490234, -23.117338180541992, -22.04827880859375, -20.979219436645508, -19.910160064697266, -18.841100692749023, -17.772045135498047, -16.702985763549805, -15.633926391601562, -14.56486701965332, -13.495807647705078, -12.426748275756836, -11.357688903808594, -10.288629531860352, -9.21957015991211, -8.150510787963867, -7.081451416015625, -6.012392044067383, -4.943332672119141, -3.8742733001708984, -2.8052139282226562, -1.736154556274414, -0.6670951843261719, 0.4019641876220703, 1.4710235595703125, 2.5400829315185547, 3.609142303466797, 4.678201675415039, 5.747261047363281, 6.816320419311523, 7.885379791259766, 8.954439163208008, 10.02349853515625, 11.092557907104492, 12.161617279052734, 13.230676651000977, 14.299736022949219, 15.368795394897461, 16.437854766845703]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 6.0, 6.0, 9.0, 21.0, 22.0, 13.0, 25.0, 20.0, 23.0, 34.0, 32.0, 36.0, 32.0, 50.0, 154.0, 135.0, 69.0, 51.0, 38.0, 26.0, 39.0, 23.0, 18.0, 23.0, 14.0, 16.0, 14.0, 8.0, 8.0, 4.0, 5.0, 2.0, 5.0, 1.0, 2.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-28.863197326660156, -27.990028381347656, -27.116857528686523, -26.243688583374023, -25.370519638061523, -24.49734878540039, -23.62417984008789, -22.75101089477539, -21.87784194946289, -21.00467300415039, -20.131502151489258, -19.258333206176758, -18.385164260864258, -17.511993408203125, -16.638824462890625, -15.765655517578125, -14.892485618591309, -14.019315719604492, -13.146146774291992, -12.272976875305176, -11.399807929992676, -10.52663803100586, -9.65346908569336, -8.780299186706543, -7.907129764556885, -7.033960342407227, -6.160790920257568, -5.28762149810791, -4.414451599121094, -3.5412821769714355, -2.6681127548217773, -1.7949433326721191, -0.9217739105224609, -0.04860442876815796, 0.824565052986145, 1.6977345943450928, 2.570904016494751, 3.4440736770629883, 4.3172430992126465, 5.190412521362305, 6.063581943511963, 6.936751365661621, 7.809920787811279, 8.683090209960938, 9.556260108947754, 10.42943000793457, 11.30259895324707, 12.17576789855957, 13.048937797546387, 13.922107696533203, 14.795276641845703, 15.66844654083252, 16.541616439819336, 17.414785385131836, 18.287954330444336, 19.16112518310547, 20.03429412841797, 20.90746307373047, 21.7806339263916, 22.6538028717041, 23.5269718170166, 24.400142669677734, 25.273311614990234, 26.146480560302734, 27.019649505615234]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 7.0, 10.0, 10.0, 17.0, 30.0, 37.0, 50.0, 72.0, 102.0, 165.0, 268.0, 408.0, 729.0, 1249.0, 2633.0, 6082.0, 16081.0, 58357.0, 324506.0, 1767618.0, 1630013.0, 304128.0, 55011.0, 15319.0, 5889.0, 2458.0, 1266.0, 682.0, 397.0, 247.0, 125.0, 110.0, 61.0, 41.0, 34.0, 26.0, 15.0, 5.0, 3.0, 6.0, 6.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0], "bins": [-3.322265625, -3.22991943359375, -3.1375732421875, -3.04522705078125, -2.952880859375, -2.86053466796875, -2.7681884765625, -2.67584228515625, -2.58349609375, -2.49114990234375, -2.3988037109375, -2.30645751953125, -2.214111328125, -2.12176513671875, -2.0294189453125, -1.93707275390625, -1.8447265625, -1.75238037109375, -1.6600341796875, -1.56768798828125, -1.475341796875, -1.38299560546875, -1.2906494140625, -1.19830322265625, -1.10595703125, -1.01361083984375, -0.9212646484375, -0.82891845703125, -0.736572265625, -0.64422607421875, -0.5518798828125, -0.45953369140625, -0.3671875, -0.27484130859375, -0.1824951171875, -0.09014892578125, 0.002197265625, 0.09454345703125, 0.1868896484375, 0.27923583984375, 0.37158203125, 0.46392822265625, 0.5562744140625, 0.64862060546875, 0.740966796875, 0.83331298828125, 0.9256591796875, 1.01800537109375, 1.1103515625, 1.20269775390625, 1.2950439453125, 1.38739013671875, 1.479736328125, 1.57208251953125, 1.6644287109375, 1.75677490234375, 1.84912109375, 1.94146728515625, 2.0338134765625, 2.12615966796875, 2.218505859375, 2.31085205078125, 2.4031982421875, 2.49554443359375, 2.587890625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 8.0, 7.0, 7.0, 14.0, 6.0, 9.0, 8.0, 16.0, 15.0, 22.0, 27.0, 29.0, 31.0, 34.0, 39.0, 51.0, 31.0, 38.0, 42.0, 49.0, 54.0, 46.0, 38.0, 47.0, 43.0, 35.0, 44.0, 28.0, 34.0, 27.0, 20.0, 21.0, 16.0, 11.0, 12.0, 10.0, 8.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.619140625, -1.5712432861328125, -1.523345947265625, -1.4754486083984375, -1.42755126953125, -1.3796539306640625, -1.331756591796875, -1.2838592529296875, -1.2359619140625, -1.1880645751953125, -1.140167236328125, -1.0922698974609375, -1.04437255859375, -0.9964752197265625, -0.948577880859375, -0.9006805419921875, -0.852783203125, -0.8048858642578125, -0.756988525390625, -0.7090911865234375, -0.66119384765625, -0.6132965087890625, -0.565399169921875, -0.5175018310546875, -0.4696044921875, -0.4217071533203125, -0.373809814453125, -0.3259124755859375, -0.27801513671875, -0.2301177978515625, -0.182220458984375, -0.1343231201171875, -0.08642578125, -0.0385284423828125, 0.009368896484375, 0.0572662353515625, 0.10516357421875, 0.1530609130859375, 0.200958251953125, 0.2488555908203125, 0.2967529296875, 0.3446502685546875, 0.392547607421875, 0.4404449462890625, 0.48834228515625, 0.5362396240234375, 0.584136962890625, 0.6320343017578125, 0.679931640625, 0.7278289794921875, 0.775726318359375, 0.8236236572265625, 0.87152099609375, 0.9194183349609375, 0.967315673828125, 1.0152130126953125, 1.0631103515625, 1.1110076904296875, 1.158905029296875, 1.2068023681640625, 1.25469970703125, 1.3025970458984375, 1.350494384765625, 1.3983917236328125, 1.4462890625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 7.0, 15.0, 10.0, 16.0, 18.0, 35.0, 45.0, 66.0, 91.0, 150.0, 231.0, 435.0, 808.0, 2058.0, 7952.0, 107289.0, 3915804.0, 144992.0, 9775.0, 2292.0, 952.0, 479.0, 270.0, 167.0, 105.0, 52.0, 46.0, 28.0, 15.0, 24.0, 10.0, 9.0, 8.0, 4.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-10.7578125, -10.46337890625, -10.1689453125, -9.87451171875, -9.580078125, -9.28564453125, -8.9912109375, -8.69677734375, -8.40234375, -8.10791015625, -7.8134765625, -7.51904296875, -7.224609375, -6.93017578125, -6.6357421875, -6.34130859375, -6.046875, -5.75244140625, -5.4580078125, -5.16357421875, -4.869140625, -4.57470703125, -4.2802734375, -3.98583984375, -3.69140625, -3.39697265625, -3.1025390625, -2.80810546875, -2.513671875, -2.21923828125, -1.9248046875, -1.63037109375, -1.3359375, -1.04150390625, -0.7470703125, -0.45263671875, -0.158203125, 0.13623046875, 0.4306640625, 0.72509765625, 1.01953125, 1.31396484375, 1.6083984375, 1.90283203125, 2.197265625, 2.49169921875, 2.7861328125, 3.08056640625, 3.375, 3.66943359375, 3.9638671875, 4.25830078125, 4.552734375, 4.84716796875, 5.1416015625, 5.43603515625, 5.73046875, 6.02490234375, 6.3193359375, 6.61376953125, 6.908203125, 7.20263671875, 7.4970703125, 7.79150390625, 8.0859375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 4.0, 15.0, 18.0, 24.0, 34.0, 43.0, 66.0, 88.0, 121.0, 182.0, 245.0, 334.0, 465.0, 602.0, 495.0, 369.0, 263.0, 182.0, 150.0, 92.0, 67.0, 56.0, 39.0, 33.0, 15.0, 16.0, 12.0, 12.0, 4.0, 10.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.36328125, -3.20770263671875, -3.0521240234375, -2.89654541015625, -2.740966796875, -2.58538818359375, -2.4298095703125, -2.27423095703125, -2.11865234375, -1.96307373046875, -1.8074951171875, -1.65191650390625, -1.496337890625, -1.34075927734375, -1.1851806640625, -1.02960205078125, -0.8740234375, -0.71844482421875, -0.5628662109375, -0.40728759765625, -0.251708984375, -0.09613037109375, 0.0594482421875, 0.21502685546875, 0.37060546875, 0.52618408203125, 0.6817626953125, 0.83734130859375, 0.992919921875, 1.14849853515625, 1.3040771484375, 1.45965576171875, 1.615234375, 1.77081298828125, 1.9263916015625, 2.08197021484375, 2.237548828125, 2.39312744140625, 2.5487060546875, 2.70428466796875, 2.85986328125, 3.01544189453125, 3.1710205078125, 3.32659912109375, 3.482177734375, 3.63775634765625, 3.7933349609375, 3.94891357421875, 4.1044921875, 4.26007080078125, 4.4156494140625, 4.57122802734375, 4.726806640625, 4.88238525390625, 5.0379638671875, 5.19354248046875, 5.34912109375, 5.50469970703125, 5.6602783203125, 5.81585693359375, 5.971435546875, 6.12701416015625, 6.2825927734375, 6.43817138671875, 6.59375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 9.0, 8.0, 15.0, 27.0, 15.0, 32.0, 65.0, 92.0, 133.0, 163.0, 115.0, 66.0, 89.0, 51.0, 29.0, 22.0, 19.0, 13.0, 5.0, 4.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-40.690914154052734, -39.20191955566406, -37.712921142578125, -36.22392654418945, -34.73493194580078, -33.245933532714844, -31.756938934326172, -30.267942428588867, -28.778945922851562, -27.289949417114258, -25.800952911376953, -24.31195831298828, -22.822961807250977, -21.333965301513672, -19.844970703125, -18.355974197387695, -16.86697769165039, -15.377981185913086, -13.888985633850098, -12.39999008178711, -10.910993576049805, -9.4219970703125, -7.933001518249512, -6.444005966186523, -4.955009460449219, -3.4660134315490723, -1.9770174026489258, -0.4880213737487793, 1.0009746551513672, 2.4899706840515137, 3.97896671295166, 5.467962265014648, 6.9569549560546875, 8.445951461791992, 9.93494701385498, 11.423942565917969, 12.912939071655273, 14.401935577392578, 15.890931129455566, 17.379926681518555, 18.86892318725586, 20.357919692993164, 21.84691619873047, 23.33591079711914, 24.824907302856445, 26.31390380859375, 27.802898406982422, 29.291894912719727, 30.78089141845703, 32.2698860168457, 33.75888442993164, 35.24787902832031, 36.73687744140625, 38.22587203979492, 39.714866638183594, 41.20386505126953, 42.6928596496582, 44.181854248046875, 45.67085266113281, 47.159847259521484, 48.648841857910156, 50.137840270996094, 51.626834869384766, 53.11582946777344, 54.604827880859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 5.0, 6.0, 7.0, 6.0, 11.0, 14.0, 18.0, 26.0, 22.0, 20.0, 26.0, 37.0, 33.0, 40.0, 47.0, 31.0, 55.0, 49.0, 55.0, 56.0, 55.0, 54.0, 48.0, 64.0, 35.0, 30.0, 29.0, 19.0, 24.0, 20.0, 12.0, 13.0, 8.0, 10.0, 8.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.169715881347656, -29.26593589782715, -28.36215591430664, -27.458375930786133, -26.554595947265625, -25.650814056396484, -24.747034072875977, -23.84325408935547, -22.93947410583496, -22.035694122314453, -21.131914138793945, -20.228134155273438, -19.324352264404297, -18.420574188232422, -17.51679229736328, -16.613012313842773, -15.709232330322266, -14.805452346801758, -13.90167236328125, -12.997891426086426, -12.094111442565918, -11.19033145904541, -10.286550521850586, -9.382770538330078, -8.47899055480957, -7.5752105712890625, -6.6714301109313965, -5.7676496505737305, -4.863869667053223, -3.960089683532715, -3.056309223175049, -2.152528762817383, -1.2487468719482422, -0.3449666500091553, 0.5588135719299316, 1.4625937938690186, 2.3663740158081055, 3.2701539993286133, 4.173934459686279, 5.077714920043945, 5.981494903564453, 6.885274887084961, 7.789055347442627, 8.692835807800293, 9.5966157913208, 10.500395774841309, 11.404176712036133, 12.30795669555664, 13.211736679077148, 14.115516662597656, 15.019296646118164, 15.923077583312988, 16.826858520507812, 17.730636596679688, 18.634418487548828, 19.538198471069336, 20.441978454589844, 21.34575843811035, 22.24953842163086, 23.153318405151367, 24.057098388671875, 24.960880279541016, 25.864660263061523, 26.76844024658203, 27.67222023010254]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 8.0, 5.0, 12.0, 10.0, 17.0, 22.0, 26.0, 42.0, 61.0, 74.0, 156.0, 201.0, 369.0, 549.0, 855.0, 1545.0, 2747.0, 5676.0, 13826.0, 41336.0, 174249.0, 621707.0, 128921.0, 33606.0, 11598.0, 4947.0, 2424.0, 1410.0, 791.0, 484.0, 284.0, 208.0, 149.0, 76.0, 55.0, 46.0, 18.0, 16.0, 12.0, 8.0, 3.0, 3.0, 7.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.6875, -3.570098876953125, -3.45269775390625, -3.335296630859375, -3.2178955078125, -3.100494384765625, -2.98309326171875, -2.865692138671875, -2.748291015625, -2.630889892578125, -2.51348876953125, -2.396087646484375, -2.2786865234375, -2.161285400390625, -2.04388427734375, -1.926483154296875, -1.80908203125, -1.691680908203125, -1.57427978515625, -1.456878662109375, -1.3394775390625, -1.222076416015625, -1.10467529296875, -0.987274169921875, -0.869873046875, -0.752471923828125, -0.63507080078125, -0.517669677734375, -0.4002685546875, -0.282867431640625, -0.16546630859375, -0.048065185546875, 0.0693359375, 0.186737060546875, 0.30413818359375, 0.421539306640625, 0.5389404296875, 0.656341552734375, 0.77374267578125, 0.891143798828125, 1.008544921875, 1.125946044921875, 1.24334716796875, 1.360748291015625, 1.4781494140625, 1.595550537109375, 1.71295166015625, 1.830352783203125, 1.94775390625, 2.065155029296875, 2.18255615234375, 2.299957275390625, 2.4173583984375, 2.534759521484375, 2.65216064453125, 2.769561767578125, 2.886962890625, 3.004364013671875, 3.12176513671875, 3.239166259765625, 3.3565673828125, 3.473968505859375, 3.59136962890625, 3.708770751953125, 3.826171875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 4.0, 8.0, 10.0, 9.0, 17.0, 15.0, 25.0, 28.0, 26.0, 28.0, 37.0, 44.0, 33.0, 56.0, 47.0, 74.0, 50.0, 52.0, 65.0, 54.0, 49.0, 46.0, 39.0, 28.0, 32.0, 27.0, 17.0, 17.0, 9.0, 13.0, 7.0, 7.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.716796875, -1.651885986328125, -1.58697509765625, -1.522064208984375, -1.4571533203125, -1.392242431640625, -1.32733154296875, -1.262420654296875, -1.197509765625, -1.132598876953125, -1.06768798828125, -1.002777099609375, -0.9378662109375, -0.872955322265625, -0.80804443359375, -0.743133544921875, -0.67822265625, -0.613311767578125, -0.54840087890625, -0.483489990234375, -0.4185791015625, -0.353668212890625, -0.28875732421875, -0.223846435546875, -0.158935546875, -0.094024658203125, -0.02911376953125, 0.035797119140625, 0.1007080078125, 0.165618896484375, 0.23052978515625, 0.295440673828125, 0.3603515625, 0.425262451171875, 0.49017333984375, 0.555084228515625, 0.6199951171875, 0.684906005859375, 0.74981689453125, 0.814727783203125, 0.879638671875, 0.944549560546875, 1.00946044921875, 1.074371337890625, 1.1392822265625, 1.204193115234375, 1.26910400390625, 1.334014892578125, 1.39892578125, 1.463836669921875, 1.52874755859375, 1.593658447265625, 1.6585693359375, 1.723480224609375, 1.78839111328125, 1.853302001953125, 1.918212890625, 1.983123779296875, 2.04803466796875, 2.112945556640625, 2.1778564453125, 2.242767333984375, 2.30767822265625, 2.372589111328125, 2.4375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 7.0, 5.0, 7.0, 6.0, 6.0, 11.0, 13.0, 28.0, 36.0, 38.0, 39.0, 55.0, 79.0, 116.0, 161.0, 237.0, 373.0, 683.0, 1153.0, 2279.0, 5136.0, 14849.0, 55593.0, 798529.0, 126712.0, 26589.0, 8434.0, 3408.0, 1558.0, 852.0, 502.0, 316.0, 218.0, 146.0, 106.0, 92.0, 52.0, 33.0, 22.0, 20.0, 11.0, 15.0, 10.0, 6.0, 5.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.53515625, -3.42376708984375, -3.3123779296875, -3.20098876953125, -3.089599609375, -2.97821044921875, -2.8668212890625, -2.75543212890625, -2.64404296875, -2.53265380859375, -2.4212646484375, -2.30987548828125, -2.198486328125, -2.08709716796875, -1.9757080078125, -1.86431884765625, -1.7529296875, -1.64154052734375, -1.5301513671875, -1.41876220703125, -1.307373046875, -1.19598388671875, -1.0845947265625, -0.97320556640625, -0.86181640625, -0.75042724609375, -0.6390380859375, -0.52764892578125, -0.416259765625, -0.30487060546875, -0.1934814453125, -0.08209228515625, 0.029296875, 0.14068603515625, 0.2520751953125, 0.36346435546875, 0.474853515625, 0.58624267578125, 0.6976318359375, 0.80902099609375, 0.92041015625, 1.03179931640625, 1.1431884765625, 1.25457763671875, 1.365966796875, 1.47735595703125, 1.5887451171875, 1.70013427734375, 1.8115234375, 1.92291259765625, 2.0343017578125, 2.14569091796875, 2.257080078125, 2.36846923828125, 2.4798583984375, 2.59124755859375, 2.70263671875, 2.81402587890625, 2.9254150390625, 3.03680419921875, 3.148193359375, 3.25958251953125, 3.3709716796875, 3.48236083984375, 3.59375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 6.0, 8.0, 5.0, 4.0, 8.0, 13.0, 5.0, 11.0, 12.0, 20.0, 18.0, 25.0, 16.0, 37.0, 35.0, 44.0, 57.0, 63.0, 86.0, 69.0, 61.0, 55.0, 63.0, 41.0, 32.0, 26.0, 19.0, 21.0, 18.0, 19.0, 15.0, 7.0, 21.0, 10.0, 13.0, 5.0, 4.0, 6.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.93359375, -7.70086669921875, -7.4681396484375, -7.23541259765625, -7.002685546875, -6.76995849609375, -6.5372314453125, -6.30450439453125, -6.07177734375, -5.83905029296875, -5.6063232421875, -5.37359619140625, -5.140869140625, -4.90814208984375, -4.6754150390625, -4.44268798828125, -4.2099609375, -3.97723388671875, -3.7445068359375, -3.51177978515625, -3.279052734375, -3.04632568359375, -2.8135986328125, -2.58087158203125, -2.34814453125, -2.11541748046875, -1.8826904296875, -1.64996337890625, -1.417236328125, -1.18450927734375, -0.9517822265625, -0.71905517578125, -0.486328125, -0.25360107421875, -0.0208740234375, 0.21185302734375, 0.444580078125, 0.67730712890625, 0.9100341796875, 1.14276123046875, 1.37548828125, 1.60821533203125, 1.8409423828125, 2.07366943359375, 2.306396484375, 2.53912353515625, 2.7718505859375, 3.00457763671875, 3.2373046875, 3.47003173828125, 3.7027587890625, 3.93548583984375, 4.168212890625, 4.40093994140625, 4.6336669921875, 4.86639404296875, 5.09912109375, 5.33184814453125, 5.5645751953125, 5.79730224609375, 6.030029296875, 6.26275634765625, 6.4954833984375, 6.72821044921875, 6.9609375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 4.0, 7.0, 8.0, 10.0, 14.0, 25.0, 20.0, 36.0, 48.0, 72.0, 107.0, 166.0, 249.0, 412.0, 613.0, 1076.0, 1879.0, 3783.0, 8249.0, 19869.0, 63903.0, 766145.0, 127584.0, 31431.0, 11667.0, 5056.0, 2620.0, 1321.0, 768.0, 466.0, 305.0, 207.0, 143.0, 80.0, 53.0, 38.0, 21.0, 26.0, 17.0, 8.0, 5.0, 6.0, 2.0, 5.0, 8.0, 5.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.7890625, -0.765655517578125, -0.74224853515625, -0.718841552734375, -0.6954345703125, -0.672027587890625, -0.64862060546875, -0.625213623046875, -0.601806640625, -0.578399658203125, -0.55499267578125, -0.531585693359375, -0.5081787109375, -0.484771728515625, -0.46136474609375, -0.437957763671875, -0.41455078125, -0.391143798828125, -0.36773681640625, -0.344329833984375, -0.3209228515625, -0.297515869140625, -0.27410888671875, -0.250701904296875, -0.227294921875, -0.203887939453125, -0.18048095703125, -0.157073974609375, -0.1336669921875, -0.110260009765625, -0.08685302734375, -0.063446044921875, -0.0400390625, -0.016632080078125, 0.00677490234375, 0.030181884765625, 0.0535888671875, 0.076995849609375, 0.10040283203125, 0.123809814453125, 0.147216796875, 0.170623779296875, 0.19403076171875, 0.217437744140625, 0.2408447265625, 0.264251708984375, 0.28765869140625, 0.311065673828125, 0.33447265625, 0.357879638671875, 0.38128662109375, 0.404693603515625, 0.4281005859375, 0.451507568359375, 0.47491455078125, 0.498321533203125, 0.521728515625, 0.545135498046875, 0.56854248046875, 0.591949462890625, 0.6153564453125, 0.638763427734375, 0.66217041015625, 0.685577392578125, 0.708984375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 4.0, 3.0, 6.0, 4.0, 7.0, 8.0, 12.0, 16.0, 25.0, 32.0, 37.0, 39.0, 73.0, 117.0, 144.0, 149.0, 89.0, 66.0, 49.0, 28.0, 17.0, 14.0, 10.0, 5.0, 15.0, 7.0, 4.0, 8.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0005812644958496094, -0.0005655102431774139, -0.0005497559905052185, -0.0005340017378330231, -0.0005182474851608276, -0.0005024932324886322, -0.00048673897981643677, -0.00047098472714424133, -0.0004552304744720459, -0.00043947622179985046, -0.00042372196912765503, -0.0004079677164554596, -0.00039221346378326416, -0.0003764592111110687, -0.0003607049584388733, -0.00034495070576667786, -0.0003291964530944824, -0.000313442200422287, -0.00029768794775009155, -0.0002819336950778961, -0.0002661794424057007, -0.00025042518973350525, -0.00023467093706130981, -0.00021891668438911438, -0.00020316243171691895, -0.0001874081790447235, -0.00017165392637252808, -0.00015589967370033264, -0.0001401454210281372, -0.00012439116835594177, -0.00010863691568374634, -9.28826630115509e-05, -7.712841033935547e-05, -6.137415766716003e-05, -4.56199049949646e-05, -2.9865652322769165e-05, -1.411139965057373e-05, 1.642853021621704e-06, 1.739710569381714e-05, 3.315135836601257e-05, 4.890561103820801e-05, 6.465986371040344e-05, 8.041411638259888e-05, 9.616836905479431e-05, 0.00011192262172698975, 0.00012767687439918518, 0.00014343112707138062, 0.00015918537974357605, 0.00017493963241577148, 0.00019069388508796692, 0.00020644813776016235, 0.0002222023904323578, 0.00023795664310455322, 0.00025371089577674866, 0.0002694651484489441, 0.0002852194011211395, 0.00030097365379333496, 0.0003167279064655304, 0.00033248215913772583, 0.00034823641180992126, 0.0003639906644821167, 0.00037974491715431213, 0.00039549916982650757, 0.000411253422498703, 0.00042700767517089844]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 9.0, 10.0, 22.0, 29.0, 27.0, 48.0, 66.0, 92.0, 122.0, 213.0, 298.0, 484.0, 854.0, 1390.0, 2425.0, 4693.0, 9456.0, 22133.0, 64514.0, 711733.0, 158434.0, 40134.0, 15851.0, 7034.0, 3564.0, 1941.0, 1069.0, 688.0, 395.0, 269.0, 145.0, 122.0, 80.0, 50.0, 47.0, 24.0, 27.0, 21.0, 7.0, 6.0, 10.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.62841796875, -0.6092605590820312, -0.5901031494140625, -0.5709457397460938, -0.551788330078125, -0.5326309204101562, -0.5134735107421875, -0.49431610107421875, -0.47515869140625, -0.45600128173828125, -0.4368438720703125, -0.41768646240234375, -0.398529052734375, -0.37937164306640625, -0.3602142333984375, -0.34105682373046875, -0.3218994140625, -0.30274200439453125, -0.2835845947265625, -0.26442718505859375, -0.245269775390625, -0.22611236572265625, -0.2069549560546875, -0.18779754638671875, -0.16864013671875, -0.14948272705078125, -0.1303253173828125, -0.11116790771484375, -0.092010498046875, -0.07285308837890625, -0.0536956787109375, -0.03453826904296875, -0.015380859375, 0.00377655029296875, 0.0229339599609375, 0.04209136962890625, 0.061248779296875, 0.08040618896484375, 0.0995635986328125, 0.11872100830078125, 0.13787841796875, 0.15703582763671875, 0.1761932373046875, 0.19535064697265625, 0.214508056640625, 0.23366546630859375, 0.2528228759765625, 0.27198028564453125, 0.2911376953125, 0.31029510498046875, 0.3294525146484375, 0.34860992431640625, 0.367767333984375, 0.38692474365234375, 0.4060821533203125, 0.42523956298828125, 0.44439697265625, 0.46355438232421875, 0.4827117919921875, 0.5018692016601562, 0.521026611328125, 0.5401840209960938, 0.5593414306640625, 0.5784988403320312, 0.59765625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 5.0, 4.0, 7.0, 9.0, 15.0, 12.0, 20.0, 20.0, 33.0, 44.0, 73.0, 82.0, 127.0, 149.0, 95.0, 82.0, 67.0, 43.0, 28.0, 10.0, 12.0, 15.0, 12.0, 6.0, 11.0, 4.0, 6.0, 1.0, 6.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8466796875, -0.8117523193359375, -0.776824951171875, -0.7418975830078125, -0.70697021484375, -0.6720428466796875, -0.637115478515625, -0.6021881103515625, -0.5672607421875, -0.5323333740234375, -0.497406005859375, -0.4624786376953125, -0.42755126953125, -0.3926239013671875, -0.357696533203125, -0.3227691650390625, -0.287841796875, -0.2529144287109375, -0.217987060546875, -0.1830596923828125, -0.14813232421875, -0.1132049560546875, -0.078277587890625, -0.0433502197265625, -0.0084228515625, 0.0265045166015625, 0.061431884765625, 0.0963592529296875, 0.13128662109375, 0.1662139892578125, 0.201141357421875, 0.2360687255859375, 0.27099609375, 0.3059234619140625, 0.340850830078125, 0.3757781982421875, 0.41070556640625, 0.4456329345703125, 0.480560302734375, 0.5154876708984375, 0.5504150390625, 0.5853424072265625, 0.620269775390625, 0.6551971435546875, 0.69012451171875, 0.7250518798828125, 0.759979248046875, 0.7949066162109375, 0.829833984375, 0.8647613525390625, 0.899688720703125, 0.9346160888671875, 0.96954345703125, 1.0044708251953125, 1.039398193359375, 1.0743255615234375, 1.1092529296875, 1.1441802978515625, 1.179107666015625, 1.2140350341796875, 1.24896240234375, 1.2838897705078125, 1.318817138671875, 1.3537445068359375, 1.388671875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 13.0, 13.0, 53.0, 65.0, 155.0, 471.0, 86.0, 69.0, 26.0, 18.0, 11.0, 4.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.42418670654297, -48.224525451660156, -47.024864196777344, -45.825199127197266, -44.62553787231445, -43.42587661743164, -42.22621536254883, -41.026554107666016, -39.82688903808594, -38.627227783203125, -37.42756652832031, -36.227901458740234, -35.02824020385742, -33.82857894897461, -32.6289176940918, -31.429256439208984, -30.229595184326172, -29.02993392944336, -27.830270767211914, -26.6306095123291, -25.430946350097656, -24.231285095214844, -23.03162384033203, -21.83196258544922, -20.632299423217773, -19.43263816833496, -18.232975006103516, -17.033313751220703, -15.833651542663574, -14.633989334106445, -13.434328079223633, -12.234665870666504, -11.03500747680664, -9.835345268249512, -8.635683059692383, -7.43602180480957, -6.236359596252441, -5.0366973876953125, -3.837035655975342, -2.637373924255371, -1.4377117156982422, -0.23804974555969238, 0.9616122245788574, 2.1612741947174072, 3.360936164855957, 4.560598373413086, 5.760260105133057, 6.959921836853027, 8.159584045410156, 9.359246253967285, 10.558908462524414, 11.758569717407227, 12.958231925964355, 14.157894134521484, 15.357555389404297, 16.55721664428711, 17.756879806518555, 18.956541061401367, 20.156204223632812, 21.355865478515625, 22.555526733398438, 23.755189895629883, 24.954851150512695, 26.15451431274414, 27.354175567626953]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 6.0, 11.0, 12.0, 13.0, 9.0, 8.0, 13.0, 17.0, 21.0, 25.0, 31.0, 34.0, 33.0, 64.0, 259.0, 213.0, 29.0, 30.0, 24.0, 20.0, 16.0, 18.0, 15.0, 15.0, 7.0, 9.0, 5.0, 10.0, 7.0, 4.0, 3.0, 5.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-26.99744415283203, -26.265052795410156, -25.532663345336914, -24.80027198791504, -24.067880630493164, -23.335491180419922, -22.603099822998047, -21.870708465576172, -21.13831901550293, -20.405927658081055, -19.673538208007812, -18.941146850585938, -18.208755493164062, -17.47636604309082, -16.743974685668945, -16.011585235595703, -15.279192924499512, -14.546802520751953, -13.814411163330078, -13.08202075958252, -12.349630355834961, -11.617238998413086, -10.884848594665527, -10.152458190917969, -9.420066833496094, -8.687676429748535, -7.955285549163818, -7.222894668579102, -6.490504264831543, -5.758113384246826, -5.025722503662109, -4.293332099914551, -3.560941696166992, -2.8285510540008545, -2.096160411834717, -1.36376953125, -0.6313788890838623, 0.10101175308227539, 0.8334026336669922, 1.5657930374145508, 2.2981839179992676, 3.0305745601654053, 3.762965202331543, 4.49535608291626, 5.227746963500977, 5.960137367248535, 6.692528247833252, 7.4249186515808105, 8.157309532165527, 8.889699935913086, 9.622091293334961, 10.35448169708252, 11.086872100830078, 11.819263458251953, 12.551653861999512, 13.28404426574707, 14.016435623168945, 14.748826026916504, 15.481217384338379, 16.213607788085938, 16.945999145507812, 17.678388595581055, 18.41077995300293, 19.143169403076172, 19.875560760498047]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 9.0, 13.0, 8.0, 21.0, 32.0, 36.0, 29.0, 45.0, 57.0, 110.0, 327.0, 92.0, 59.0, 49.0, 32.0, 22.0, 22.0, 14.0, 11.0, 5.0, 9.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.75, -1.6552734375, -1.560546875, -1.4658203125, -1.37109375, -1.2763671875, -1.181640625, -1.0869140625, -0.9921875, -0.8974609375, -0.802734375, -0.7080078125, -0.61328125, -0.5185546875, -0.423828125, -0.3291015625, -0.234375, -0.1396484375, -0.044921875, 0.0498046875, 0.14453125, 0.2392578125, 0.333984375, 0.4287109375, 0.5234375, 0.6181640625, 0.712890625, 0.8076171875, 0.90234375, 0.9970703125, 1.091796875, 1.1865234375, 1.28125, 1.3759765625, 1.470703125, 1.5654296875, 1.66015625, 1.7548828125, 1.849609375, 1.9443359375, 2.0390625, 2.1337890625, 2.228515625, 2.3232421875, 2.41796875, 2.5126953125, 2.607421875, 2.7021484375, 2.796875, 2.8916015625, 2.986328125, 3.0810546875, 3.17578125, 3.2705078125, 3.365234375, 3.4599609375, 3.5546875, 3.6494140625, 3.744140625, 3.8388671875, 3.93359375, 4.0283203125, 4.123046875, 4.2177734375, 4.3125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 2.0, 12.0, 18.0, 28.0, 41.0, 76.0, 122.0, 234.0, 699.0, 2994.0, 33137.0, 8342211.0, 6921.0, 1308.0, 395.0, 142.0, 96.0, 41.0, 20.0, 9.0, 27.0, 7.0, 11.0, 3.0, 2.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-24.358963012695312, -23.525684356689453, -22.692405700683594, -21.859127044677734, -21.025850296020508, -20.19257164001465, -19.35929298400879, -18.52601432800293, -17.692737579345703, -16.859458923339844, -16.026180267333984, -15.192902565002441, -14.359624862670898, -13.526346206665039, -12.69306755065918, -11.85978889465332, -11.026510238647461, -10.193231582641602, -9.359953880310059, -8.5266752243042, -7.693397045135498, -6.860118865966797, -6.0268402099609375, -5.193562030792236, -4.360283851623535, -3.527005672454834, -2.6937272548675537, -1.8604488372802734, -1.0271706581115723, -0.1938924789428711, 0.6393861770629883, 1.4726643562316895, 2.3059444427490234, 3.1392226219177246, 3.972501039505005, 4.805779457092285, 5.639057636260986, 6.4723358154296875, 7.305614471435547, 8.138893127441406, 8.97217082977295, 9.805449485778809, 10.638727188110352, 11.472005844116211, 12.30528450012207, 13.138562202453613, 13.971840858459473, 14.805118560791016, 15.638397216796875, 16.471675872802734, 17.304954528808594, 18.138233184814453, 18.97150993347168, 19.80478858947754, 20.6380672454834, 21.471345901489258, 22.304622650146484, 23.137901306152344, 23.971179962158203, 24.804458618164062, 25.63773536682129, 26.47101402282715, 27.304292678833008, 28.137571334838867, 28.970849990844727]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 5.0, 3.0, 2.0, 4.0, 8.0, 9.0, 3.0, 8.0, 8.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 6.0, 3.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.946720123291016, -18.426326751708984, -17.905933380126953, -17.385540008544922, -16.865144729614258, -16.344751358032227, -15.824357986450195, -15.303964614868164, -14.783571243286133, -14.263177871704102, -13.742783546447754, -13.222390174865723, -12.701996803283691, -12.181602478027344, -11.661209106445312, -11.140815734863281, -10.620421409606934, -10.100028038024902, -9.579633712768555, -9.059240341186523, -8.538846969604492, -8.018453598022461, -7.498059272766113, -6.977665901184082, -6.457272052764893, -5.936878204345703, -5.416484832763672, -4.896090984344482, -4.375697135925293, -3.8553037643432617, -3.3349099159240723, -2.814516305923462, -2.294123649597168, -1.7737300395965576, -1.2533363103866577, -0.7329425811767578, -0.21254897117614746, 0.3078446388244629, 0.8282384872436523, 1.3486320972442627, 1.869025707244873, 2.3894193172454834, 2.9098129272460938, 3.430206775665283, 3.9506003856658936, 4.470993995666504, 4.991387844085693, 5.511781692504883, 6.032175064086914, 6.5525689125061035, 7.072962284088135, 7.593356132507324, 8.113749504089355, 8.634143829345703, 9.154537200927734, 9.674930572509766, 10.195323944091797, 10.715717315673828, 11.236111640930176, 11.756505012512207, 12.276898384094238, 12.797292709350586, 13.317686080932617, 13.838079452514648, 14.358473777770996]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 7.0, 7.0, 6.0, 3.0, 24.0, 15.0, 24.0, 34.0, 39.0, 60.0, 95.0, 118.0, 186.0, 254.0, 373.0, 651.0, 1151.0, 2159.0, 4522.0, 10551.0, 26168.0, 69598.0, 168245.0, 145751.0, 56046.0, 21266.0, 8761.0, 3839.0, 1956.0, 923.0, 479.0, 298.0, 199.0, 142.0, 83.0, 57.0, 42.0, 34.0, 19.0, 16.0, 14.0, 11.0, 14.0, 6.0, 11.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.140625, -11.689208984375, -11.23779296875, -10.786376953125, -10.3349609375, -9.883544921875, -9.43212890625, -8.980712890625, -8.529296875, -8.077880859375, -7.62646484375, -7.175048828125, -6.7236328125, -6.272216796875, -5.82080078125, -5.369384765625, -4.91796875, -4.466552734375, -4.01513671875, -3.563720703125, -3.1123046875, -2.660888671875, -2.20947265625, -1.758056640625, -1.306640625, -0.855224609375, -0.40380859375, 0.047607421875, 0.4990234375, 0.950439453125, 1.40185546875, 1.853271484375, 2.3046875, 2.756103515625, 3.20751953125, 3.658935546875, 4.1103515625, 4.561767578125, 5.01318359375, 5.464599609375, 5.916015625, 6.367431640625, 6.81884765625, 7.270263671875, 7.7216796875, 8.173095703125, 8.62451171875, 9.075927734375, 9.52734375, 9.978759765625, 10.43017578125, 10.881591796875, 11.3330078125, 11.784423828125, 12.23583984375, 12.687255859375, 13.138671875, 13.590087890625, 14.04150390625, 14.492919921875, 14.9443359375, 15.395751953125, 15.84716796875, 16.298583984375, 16.75]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 4.0, 2.0, 8.0, 6.0, 4.0, 11.0, 10.0, 8.0, 20.0, 17.0, 35.0, 29.0, 34.0, 33.0, 44.0, 65.0, 65.0, 58.0, 61.0, 84.0, 61.0, 52.0, 53.0, 46.0, 41.0, 43.0, 20.0, 12.0, 15.0, 12.0, 10.0, 6.0, 6.0, 2.0, 8.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.779296875, -1.715301513671875, -1.65130615234375, -1.587310791015625, -1.5233154296875, -1.459320068359375, -1.39532470703125, -1.331329345703125, -1.267333984375, -1.203338623046875, -1.13934326171875, -1.075347900390625, -1.0113525390625, -0.947357177734375, -0.88336181640625, -0.819366455078125, -0.75537109375, -0.691375732421875, -0.62738037109375, -0.563385009765625, -0.4993896484375, -0.435394287109375, -0.37139892578125, -0.307403564453125, -0.243408203125, -0.179412841796875, -0.11541748046875, -0.051422119140625, 0.0125732421875, 0.076568603515625, 0.14056396484375, 0.204559326171875, 0.2685546875, 0.332550048828125, 0.39654541015625, 0.460540771484375, 0.5245361328125, 0.588531494140625, 0.65252685546875, 0.716522216796875, 0.780517578125, 0.844512939453125, 0.90850830078125, 0.972503662109375, 1.0364990234375, 1.100494384765625, 1.16448974609375, 1.228485107421875, 1.29248046875, 1.356475830078125, 1.42047119140625, 1.484466552734375, 1.5484619140625, 1.612457275390625, 1.67645263671875, 1.740447998046875, 1.804443359375, 1.868438720703125, 1.93243408203125, 1.996429443359375, 2.0604248046875, 2.124420166015625, 2.18841552734375, 2.252410888671875, 2.31640625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 5.0, 5.0, 17.0, 21.0, 32.0, 85.0, 159.0, 101.0, 32.0, 16.0, 7.0, 6.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.23423767089844, -42.13417434692383, -41.034114837646484, -39.934051513671875, -38.833988189697266, -37.733924865722656, -36.63386535644531, -35.5338020324707, -34.433738708496094, -33.333675384521484, -32.23361587524414, -31.13355255126953, -30.033489227294922, -28.933427810668945, -27.83336639404297, -26.73330307006836, -25.633243560791016, -24.53318214416504, -23.43311882019043, -22.333057403564453, -21.232994079589844, -20.132932662963867, -19.03287124633789, -17.93280792236328, -16.832746505737305, -15.732684135437012, -14.632621765136719, -13.532560348510742, -12.43249797821045, -11.332435607910156, -10.23237419128418, -9.132311820983887, -8.032247543334961, -6.932185173034668, -5.832123279571533, -4.732061386108398, -3.6319990158081055, -2.5319366455078125, -1.4318747520446777, -0.33181285858154297, 0.76824951171875, 1.8683116436004639, 2.9683737754821777, 4.0684356689453125, 5.1684980392456055, 6.268560409545898, 7.368622303009033, 8.468684196472168, 9.568746566772461, 10.668808937072754, 11.768871307373047, 12.868932723999023, 13.968995094299316, 15.06905746459961, 16.169118881225586, 17.269180297851562, 18.369243621826172, 19.46930503845215, 20.569368362426758, 21.669429779052734, 22.769493103027344, 23.86955451965332, 24.969615936279297, 26.069679260253906, 27.169740676879883]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 3.0, 6.0, 10.0, 7.0, 11.0, 15.0, 23.0, 35.0, 67.0, 85.0, 79.0, 44.0, 23.0, 14.0, 2.0, 8.0, 9.0, 9.0, 4.0, 0.0, 0.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.868427276611328, -9.561698913574219, -9.254969596862793, -8.948241233825684, -8.641511917114258, -8.334783554077148, -8.028054237365723, -7.721325874328613, -7.414597034454346, -7.107868194580078, -6.8011393547058105, -6.494410514831543, -6.187682151794434, -5.880952835083008, -5.574224472045898, -5.267495632171631, -4.960766792297363, -4.654037952423096, -4.347309112548828, -4.0405802726745605, -3.733851671218872, -3.4271228313446045, -3.120394229888916, -2.8136653900146484, -2.506936550140381, -2.2002077102661133, -1.8934789896011353, -1.5867502689361572, -1.2800214290618896, -0.9732925891876221, -0.666563868522644, -0.359835147857666, -0.05310630798339844, 0.25362247228622437, 0.5603512525558472, 0.86708003282547, 1.1738088130950928, 1.4805376529693604, 1.7872663736343384, 2.0939950942993164, 2.400723934173584, 2.7074527740478516, 3.014181613922119, 3.3209102153778076, 3.627639055252075, 3.9343678951263428, 4.241096496582031, 4.547825336456299, 4.854554176330566, 5.161283016204834, 5.468011856079102, 5.774740695953369, 6.081469535827637, 6.388197898864746, 6.694926738739014, 7.001655578613281, 7.308384418487549, 7.615113258361816, 7.921842098236084, 8.228570938110352, 8.535299301147461, 8.842028617858887, 9.148756980895996, 9.455486297607422, 9.762214660644531]}, "eval/loss": 4.249406337738037, "eval/wer": 1.931356604522015, "eval/runtime": 954.2128, "eval/samples_per_second": 2.769, "eval/steps_per_second": 0.347} \ No newline at end of file