diff --git "a/wandb/run-20220303_033953-1eigbhyo/files/wandb-summary.json" "b/wandb/run-20220303_033953-1eigbhyo/files/wandb-summary.json" --- "a/wandb/run-20220303_033953-1eigbhyo/files/wandb-summary.json" +++ "b/wandb/run-20220303_033953-1eigbhyo/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.7246, "train/learning_rate": 0.000996, "train/epoch": 0.56, "train/global_step": 500, "_runtime": 3880, "_timestamp": 1646282673, "_step": 500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [4.0, 237.0, 759.0, 14.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-65.58610534667969, -35.810096740722656, -6.034088134765625, 23.741920471191406, 53.51792907714844, 83.29393005371094, 113.0699462890625, 142.84596252441406, 172.62196350097656, 202.39797973632812, 232.17398071289062, 261.9499816894531, 291.72601318359375, 321.50201416015625, 351.27801513671875, 381.05401611328125, 410.83001708984375, 440.60601806640625, 470.38201904296875, 500.1580505371094, 529.93408203125, 559.7100830078125, 589.486083984375, 619.2620849609375, 649.0380859375, 678.8140869140625, 708.590087890625, 738.3660888671875, 768.14208984375, 797.9180908203125, 827.6941528320312, 857.4701538085938, 887.2462158203125, 917.022216796875, 946.7982177734375, 976.57421875, 1006.3502197265625, 1036.126220703125, 1065.9022216796875, 1095.67822265625, 1125.454345703125, 1155.2303466796875, 1185.00634765625, 1214.7823486328125, 1244.558349609375, 1274.3343505859375, 1304.1103515625, 1333.886474609375, 1363.662353515625, 1393.4383544921875, 1423.21435546875, 1452.9903564453125, 1482.766357421875, 1512.5423583984375, 1542.318359375, 1572.094482421875, 1601.870361328125, 1631.6463623046875, 1661.42236328125, 1691.1983642578125, 1720.974365234375, 1750.7503662109375, 1780.5263671875, 1810.302490234375, 1840.0784912109375]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 5.0, 12.0, 16.0, 23.0, 21.0, 24.0, 28.0, 39.0, 36.0, 71.0, 71.0, 70.0, 70.0, 58.0, 74.0, 56.0, 53.0, 53.0, 29.0, 44.0, 30.0, 25.0, 24.0, 6.0, 11.0, 12.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-252.4993133544922, -243.7826385498047, -235.06597900390625, -226.34930419921875, -217.63262939453125, -208.91595458984375, -200.1992950439453, -191.4826202392578, -182.76596069335938, -174.04928588867188, -165.33262634277344, -156.61595153808594, -147.89927673339844, -139.1826171875, -130.4659423828125, -121.749267578125, -113.0325927734375, -104.31592559814453, -95.59925079345703, -86.88258361816406, -78.16590881347656, -69.4492416381836, -60.732574462890625, -52.01590347290039, -43.299232482910156, -34.58256149291992, -25.86589241027832, -17.14922332763672, -8.432552337646484, 0.28411865234375, 9.000785827636719, 17.717456817626953, 26.43414306640625, 35.150814056396484, 43.86748504638672, 52.58415222167969, 61.30082321166992, 70.01749420166016, 78.73416137695312, 87.45083618164062, 96.1675033569336, 104.88417053222656, 113.60084533691406, 122.31751251220703, 131.0341796875, 139.7508544921875, 148.467529296875, 157.18418884277344, 165.90086364746094, 174.61753845214844, 183.33419799804688, 192.05087280273438, 200.76754760742188, 209.48422241210938, 218.2008819580078, 226.9175567626953, 235.63421630859375, 244.35089111328125, 253.0675506591797, 261.78424072265625, 270.5008850097656, 279.2175598144531, 287.9342346191406, 296.6509094238281, 305.3675842285156]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 6.0, 4.0, 13.0, 25.0, 20.0, 26.0, 30.0, 35.0, 44.0, 64.0, 76.0, 69.0, 61.0, 65.0, 65.0, 70.0, 38.0, 52.0, 34.0, 53.0, 42.0, 20.0, 15.0, 14.0, 10.0, 12.0, 8.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.68359375, -3.55340576171875, -3.4232177734375, -3.29302978515625, -3.162841796875, -3.03265380859375, -2.9024658203125, -2.77227783203125, -2.64208984375, -2.51190185546875, -2.3817138671875, -2.25152587890625, -2.121337890625, -1.99114990234375, -1.8609619140625, -1.73077392578125, -1.6005859375, -1.47039794921875, -1.3402099609375, -1.21002197265625, -1.079833984375, -0.94964599609375, -0.8194580078125, -0.68927001953125, -0.55908203125, -0.42889404296875, -0.2987060546875, -0.16851806640625, -0.038330078125, 0.09185791015625, 0.2220458984375, 0.35223388671875, 0.482421875, 0.61260986328125, 0.7427978515625, 0.87298583984375, 1.003173828125, 1.13336181640625, 1.2635498046875, 1.39373779296875, 1.52392578125, 1.65411376953125, 1.7843017578125, 1.91448974609375, 2.044677734375, 2.17486572265625, 2.3050537109375, 2.43524169921875, 2.5654296875, 2.69561767578125, 2.8258056640625, 2.95599365234375, 3.086181640625, 3.21636962890625, 3.3465576171875, 3.47674560546875, 3.60693359375, 3.73712158203125, 3.8673095703125, 3.99749755859375, 4.127685546875, 4.25787353515625, 4.3880615234375, 4.51824951171875, 4.6484375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 7.0, 14.0, 16.0, 17.0, 36.0, 35.0, 43.0, 90.0, 106.0, 153.0, 232.0, 348.0, 522.0, 967.0, 1656.0, 3255.0, 8921.0, 53525.0, 4012053.0, 93158.0, 10593.0, 3822.0, 1825.0, 1045.0, 641.0, 379.0, 265.0, 150.0, 112.0, 80.0, 55.0, 38.0, 29.0, 22.0, 17.0, 12.0, 9.0, 9.0, 2.0, 8.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.03125, -26.9765625, -25.921875, -24.8671875, -23.8125, -22.7578125, -21.703125, -20.6484375, -19.59375, -18.5390625, -17.484375, -16.4296875, -15.375, -14.3203125, -13.265625, -12.2109375, -11.15625, -10.1015625, -9.046875, -7.9921875, -6.9375, -5.8828125, -4.828125, -3.7734375, -2.71875, -1.6640625, -0.609375, 0.4453125, 1.5, 2.5546875, 3.609375, 4.6640625, 5.71875, 6.7734375, 7.828125, 8.8828125, 9.9375, 10.9921875, 12.046875, 13.1015625, 14.15625, 15.2109375, 16.265625, 17.3203125, 18.375, 19.4296875, 20.484375, 21.5390625, 22.59375, 23.6484375, 24.703125, 25.7578125, 26.8125, 27.8671875, 28.921875, 29.9765625, 31.03125, 32.0859375, 33.140625, 34.1953125, 35.25, 36.3046875, 37.359375, 38.4140625, 39.46875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 5.0, 8.0, 13.0, 16.0, 17.0, 30.0, 57.0, 65.0, 126.0, 246.0, 411.0, 905.0, 974.0, 520.0, 258.0, 158.0, 93.0, 62.0, 44.0, 22.0, 19.0, 6.0, 9.0, 4.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.4375, -18.88330078125, -18.3291015625, -17.77490234375, -17.220703125, -16.66650390625, -16.1123046875, -15.55810546875, -15.00390625, -14.44970703125, -13.8955078125, -13.34130859375, -12.787109375, -12.23291015625, -11.6787109375, -11.12451171875, -10.5703125, -10.01611328125, -9.4619140625, -8.90771484375, -8.353515625, -7.79931640625, -7.2451171875, -6.69091796875, -6.13671875, -5.58251953125, -5.0283203125, -4.47412109375, -3.919921875, -3.36572265625, -2.8115234375, -2.25732421875, -1.703125, -1.14892578125, -0.5947265625, -0.04052734375, 0.513671875, 1.06787109375, 1.6220703125, 2.17626953125, 2.73046875, 3.28466796875, 3.8388671875, 4.39306640625, 4.947265625, 5.50146484375, 6.0556640625, 6.60986328125, 7.1640625, 7.71826171875, 8.2724609375, 8.82666015625, 9.380859375, 9.93505859375, 10.4892578125, 11.04345703125, 11.59765625, 12.15185546875, 12.7060546875, 13.26025390625, 13.814453125, 14.36865234375, 14.9228515625, 15.47705078125, 16.03125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 8.0, 16.0, 18.0, 32.0, 70.0, 103.0, 139.0, 277.0, 607.0, 2123.0, 69665.0, 4099668.0, 19058.0, 1436.0, 466.0, 251.0, 128.0, 78.0, 49.0, 23.0, 18.0, 12.0, 9.0, 7.0, 9.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.875, -49.08203125, -47.2890625, -45.49609375, -43.703125, -41.91015625, -40.1171875, -38.32421875, -36.53125, -34.73828125, -32.9453125, -31.15234375, -29.359375, -27.56640625, -25.7734375, -23.98046875, -22.1875, -20.39453125, -18.6015625, -16.80859375, -15.015625, -13.22265625, -11.4296875, -9.63671875, -7.84375, -6.05078125, -4.2578125, -2.46484375, -0.671875, 1.12109375, 2.9140625, 4.70703125, 6.5, 8.29296875, 10.0859375, 11.87890625, 13.671875, 15.46484375, 17.2578125, 19.05078125, 20.84375, 22.63671875, 24.4296875, 26.22265625, 28.015625, 29.80859375, 31.6015625, 33.39453125, 35.1875, 36.98046875, 38.7734375, 40.56640625, 42.359375, 44.15234375, 45.9453125, 47.73828125, 49.53125, 51.32421875, 53.1171875, 54.91015625, 56.703125, 58.49609375, 60.2890625, 62.08203125, 63.875]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 78.0, 747.0, 182.0, 8.0, 0.0, 0.0, 1.0], "bins": [-363.37139892578125, -357.1737365722656, -350.97607421875, -344.7784423828125, -338.5807800292969, -332.38311767578125, -326.18548583984375, -319.9878234863281, -313.7901611328125, -307.5924987792969, -301.39483642578125, -295.19720458984375, -288.9995422363281, -282.8018798828125, -276.604248046875, -270.4065856933594, -264.20892333984375, -258.0112609863281, -251.81361389160156, -245.615966796875, -239.41830444335938, -233.22064208984375, -227.0229949951172, -220.82534790039062, -214.627685546875, -208.43002319335938, -202.2323760986328, -196.03472900390625, -189.83706665039062, -183.639404296875, -177.44175720214844, -171.24411010742188, -165.04644775390625, -158.84878540039062, -152.65113830566406, -146.4534912109375, -140.25582885742188, -134.05816650390625, -127.86051940917969, -121.6628646850586, -115.4652099609375, -109.2675552368164, -103.06990051269531, -96.87224578857422, -90.67459106445312, -84.47693634033203, -78.27928161621094, -72.08162689208984, -65.88397216796875, -59.686317443847656, -53.48866271972656, -47.29100799560547, -41.093353271484375, -34.89569854736328, -28.698043823242188, -22.500389099121094, -16.302730560302734, -10.10507583618164, -3.907421112060547, 2.290233612060547, 8.48788833618164, 14.685543060302734, 20.883197784423828, 27.080852508544922, 33.278507232666016]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 2.0, 1.0, 9.0, 9.0, 12.0, 19.0, 11.0, 19.0, 19.0, 19.0, 17.0, 44.0, 30.0, 37.0, 29.0, 29.0, 39.0, 32.0, 30.0, 41.0, 41.0, 40.0, 37.0, 38.0, 47.0, 45.0, 25.0, 39.0, 33.0, 28.0, 31.0, 23.0, 15.0, 11.0, 20.0, 19.0, 5.0, 17.0, 8.0, 7.0, 3.0, 9.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.180938720703125, -34.971675872802734, -33.762413024902344, -32.55315017700195, -31.343887329101562, -30.134624481201172, -28.92536163330078, -27.71609878540039, -26.5068359375, -25.29757308959961, -24.08831024169922, -22.879047393798828, -21.669784545898438, -20.460521697998047, -19.251258850097656, -18.041996002197266, -16.832733154296875, -15.623470306396484, -14.414207458496094, -13.204944610595703, -11.995681762695312, -10.786418914794922, -9.577156066894531, -8.36789321899414, -7.15863037109375, -5.949367523193359, -4.740104675292969, -3.530841827392578, -2.3215789794921875, -1.1123161315917969, 0.09694671630859375, 1.3062095642089844, 2.515472412109375, 3.7247352600097656, 4.933998107910156, 6.143260955810547, 7.3525238037109375, 8.561786651611328, 9.771049499511719, 10.98031234741211, 12.1895751953125, 13.39883804321289, 14.608100891113281, 15.817363739013672, 17.026626586914062, 18.235889434814453, 19.445152282714844, 20.654415130615234, 21.863677978515625, 23.072940826416016, 24.282203674316406, 25.491466522216797, 26.700729370117188, 27.909992218017578, 29.11925506591797, 30.32851791381836, 31.53778076171875, 32.74704360961914, 33.95630645751953, 35.16556930541992, 36.37483215332031, 37.5840950012207, 38.793357849121094, 40.002620697021484, 41.211883544921875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 3.0, 5.0, 8.0, 12.0, 22.0, 22.0, 24.0, 27.0, 33.0, 47.0, 55.0, 62.0, 71.0, 62.0, 60.0, 59.0, 63.0, 50.0, 52.0, 41.0, 40.0, 43.0, 42.0, 17.0, 11.0, 13.0, 14.0, 7.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7421875, -3.615966796875, -3.48974609375, -3.363525390625, -3.2373046875, -3.111083984375, -2.98486328125, -2.858642578125, -2.732421875, -2.606201171875, -2.47998046875, -2.353759765625, -2.2275390625, -2.101318359375, -1.97509765625, -1.848876953125, -1.72265625, -1.596435546875, -1.47021484375, -1.343994140625, -1.2177734375, -1.091552734375, -0.96533203125, -0.839111328125, -0.712890625, -0.586669921875, -0.46044921875, -0.334228515625, -0.2080078125, -0.081787109375, 0.04443359375, 0.170654296875, 0.296875, 0.423095703125, 0.54931640625, 0.675537109375, 0.8017578125, 0.927978515625, 1.05419921875, 1.180419921875, 1.306640625, 1.432861328125, 1.55908203125, 1.685302734375, 1.8115234375, 1.937744140625, 2.06396484375, 2.190185546875, 2.31640625, 2.442626953125, 2.56884765625, 2.695068359375, 2.8212890625, 2.947509765625, 3.07373046875, 3.199951171875, 3.326171875, 3.452392578125, 3.57861328125, 3.704833984375, 3.8310546875, 3.957275390625, 4.08349609375, 4.209716796875, 4.3359375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 5.0, 10.0, 13.0, 20.0, 28.0, 39.0, 44.0, 64.0, 72.0, 108.0, 186.0, 255.0, 332.0, 499.0, 831.0, 1275.0, 1952.0, 3235.0, 5302.0, 9157.0, 16816.0, 30462.0, 60081.0, 134801.0, 374003.0, 227760.0, 86716.0, 42041.0, 22027.0, 12174.0, 7066.0, 4086.0, 2419.0, 1539.0, 1039.0, 639.0, 450.0, 334.0, 203.0, 129.0, 110.0, 73.0, 47.0, 31.0, 22.0, 23.0, 14.0, 9.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.189208984375, -0.18324851989746094, -0.17728805541992188, -0.1713275909423828, -0.16536712646484375, -0.1594066619873047, -0.15344619750976562, -0.14748573303222656, -0.1415252685546875, -0.13556480407714844, -0.12960433959960938, -0.12364387512207031, -0.11768341064453125, -0.11172294616699219, -0.10576248168945312, -0.09980201721191406, -0.093841552734375, -0.08788108825683594, -0.08192062377929688, -0.07596015930175781, -0.06999969482421875, -0.06403923034667969, -0.058078765869140625, -0.05211830139160156, -0.0461578369140625, -0.04019737243652344, -0.034236907958984375, -0.028276443481445312, -0.02231597900390625, -0.016355514526367188, -0.010395050048828125, -0.0044345855712890625, 0.00152587890625, 0.0074863433837890625, 0.013446807861328125, 0.019407272338867188, 0.02536773681640625, 0.03132820129394531, 0.037288665771484375, 0.04324913024902344, 0.0492095947265625, 0.05517005920410156, 0.061130523681640625, 0.06709098815917969, 0.07305145263671875, 0.07901191711425781, 0.08497238159179688, 0.09093284606933594, 0.096893310546875, 0.10285377502441406, 0.10881423950195312, 0.11477470397949219, 0.12073516845703125, 0.1266956329345703, 0.13265609741210938, 0.13861656188964844, 0.1445770263671875, 0.15053749084472656, 0.15649795532226562, 0.1624584197998047, 0.16841888427734375, 0.1743793487548828, 0.18033981323242188, 0.18630027770996094, 0.1922607421875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 7.0, 2.0, 12.0, 5.0, 13.0, 6.0, 12.0, 23.0, 19.0, 22.0, 23.0, 24.0, 36.0, 38.0, 26.0, 38.0, 32.0, 48.0, 49.0, 47.0, 1077.0, 32.0, 50.0, 31.0, 45.0, 33.0, 41.0, 36.0, 27.0, 31.0, 27.0, 24.0, 19.0, 11.0, 16.0, 11.0, 5.0, 15.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.463836669921875, -2.38470458984375, -2.305572509765625, -2.2264404296875, -2.147308349609375, -2.06817626953125, -1.989044189453125, -1.909912109375, -1.830780029296875, -1.75164794921875, -1.672515869140625, -1.5933837890625, -1.514251708984375, -1.43511962890625, -1.355987548828125, -1.27685546875, -1.197723388671875, -1.11859130859375, -1.039459228515625, -0.9603271484375, -0.881195068359375, -0.80206298828125, -0.722930908203125, -0.643798828125, -0.564666748046875, -0.48553466796875, -0.406402587890625, -0.3272705078125, -0.248138427734375, -0.16900634765625, -0.089874267578125, -0.0107421875, 0.068389892578125, 0.14752197265625, 0.226654052734375, 0.3057861328125, 0.384918212890625, 0.46405029296875, 0.543182373046875, 0.622314453125, 0.701446533203125, 0.78057861328125, 0.859710693359375, 0.9388427734375, 1.017974853515625, 1.09710693359375, 1.176239013671875, 1.25537109375, 1.334503173828125, 1.41363525390625, 1.492767333984375, 1.5718994140625, 1.651031494140625, 1.73016357421875, 1.809295654296875, 1.888427734375, 1.967559814453125, 2.04669189453125, 2.125823974609375, 2.2049560546875, 2.284088134765625, 2.36322021484375, 2.442352294921875, 2.521484375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 3.0, 13.0, 17.0, 21.0, 33.0, 53.0, 76.0, 139.0, 222.0, 367.0, 577.0, 957.0, 1549.0, 2567.0, 4386.0, 7353.0, 12684.0, 21799.0, 38586.0, 70465.0, 145112.0, 1387471.0, 201591.0, 89195.0, 47447.0, 26909.0, 15378.0, 8929.0, 5263.0, 3119.0, 1882.0, 1136.0, 691.0, 435.0, 284.0, 140.0, 113.0, 59.0, 43.0, 25.0, 15.0, 6.0, 11.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.094482421875, -0.09159088134765625, -0.0886993408203125, -0.08580780029296875, -0.082916259765625, -0.08002471923828125, -0.0771331787109375, -0.07424163818359375, -0.07135009765625, -0.06845855712890625, -0.0655670166015625, -0.06267547607421875, -0.059783935546875, -0.05689239501953125, -0.0540008544921875, -0.05110931396484375, -0.0482177734375, -0.04532623291015625, -0.0424346923828125, -0.03954315185546875, -0.036651611328125, -0.03376007080078125, -0.0308685302734375, -0.02797698974609375, -0.02508544921875, -0.02219390869140625, -0.0193023681640625, -0.01641082763671875, -0.013519287109375, -0.01062774658203125, -0.0077362060546875, -0.00484466552734375, -0.001953125, 0.00093841552734375, 0.0038299560546875, 0.00672149658203125, 0.009613037109375, 0.01250457763671875, 0.0153961181640625, 0.01828765869140625, 0.02117919921875, 0.02407073974609375, 0.0269622802734375, 0.02985382080078125, 0.032745361328125, 0.03563690185546875, 0.0385284423828125, 0.04141998291015625, 0.0443115234375, 0.04720306396484375, 0.0500946044921875, 0.05298614501953125, 0.055877685546875, 0.05876922607421875, 0.0616607666015625, 0.06455230712890625, 0.06744384765625, 0.07033538818359375, 0.0732269287109375, 0.07611846923828125, 0.079010009765625, 0.08190155029296875, 0.0847930908203125, 0.08768463134765625, 0.090576171875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 9.0, 6.0, 9.0, 7.0, 9.0, 16.0, 25.0, 13.0, 13.0, 21.0, 15.0, 25.0, 54.0, 39.0, 39.0, 28.0, 43.0, 48.0, 50.0, 42.0, 46.0, 41.0, 52.0, 47.0, 33.0, 33.0, 36.0, 28.0, 18.0, 14.0, 22.0, 14.0, 15.0, 18.0, 12.0, 11.0, 10.0, 16.0, 6.0, 9.0, 3.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.355741500854492e-05, -3.243889659643173e-05, -3.132037818431854e-05, -3.0201859772205353e-05, -2.9083341360092163e-05, -2.7964822947978973e-05, -2.6846304535865784e-05, -2.5727786123752594e-05, -2.4609267711639404e-05, -2.3490749299526215e-05, -2.2372230887413025e-05, -2.1253712475299835e-05, -2.0135194063186646e-05, -1.9016675651073456e-05, -1.7898157238960266e-05, -1.6779638826847076e-05, -1.5661120414733887e-05, -1.4542602002620697e-05, -1.3424083590507507e-05, -1.2305565178394318e-05, -1.1187046766281128e-05, -1.0068528354167938e-05, -8.950009942054749e-06, -7.831491529941559e-06, -6.712973117828369e-06, -5.5944547057151794e-06, -4.47593629360199e-06, -3.3574178814888e-06, -2.2388994693756104e-06, -1.1203810572624207e-06, -1.862645149230957e-09, 1.1166557669639587e-06, 2.2351741790771484e-06, 3.353692591190338e-06, 4.472211003303528e-06, 5.5907294154167175e-06, 6.709247827529907e-06, 7.827766239643097e-06, 8.946284651756287e-06, 1.0064803063869476e-05, 1.1183321475982666e-05, 1.2301839888095856e-05, 1.3420358300209045e-05, 1.4538876712322235e-05, 1.5657395124435425e-05, 1.6775913536548615e-05, 1.7894431948661804e-05, 1.9012950360774994e-05, 2.0131468772888184e-05, 2.1249987185001373e-05, 2.2368505597114563e-05, 2.3487024009227753e-05, 2.4605542421340942e-05, 2.5724060833454132e-05, 2.6842579245567322e-05, 2.796109765768051e-05, 2.90796160697937e-05, 3.019813448190689e-05, 3.131665289402008e-05, 3.243517130613327e-05, 3.355368971824646e-05, 3.467220813035965e-05, 3.579072654247284e-05, 3.690924495458603e-05, 3.802776336669922e-05]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 8.0, 15.0, 11.0, 15.0, 15.0, 25.0, 30.0, 38.0, 30.0, 41.0, 58.0, 54.0, 89.0, 98.0, 148.0, 175.0, 168.0, 263.0, 319.0, 1035.0, 1036230.0, 7877.0, 415.0, 259.0, 217.0, 155.0, 145.0, 106.0, 92.0, 70.0, 66.0, 66.0, 45.0, 26.0, 19.0, 40.0, 26.0, 13.0, 10.0, 16.0, 10.0, 2.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.0007548332214355469, -0.0007317513227462769, -0.0007086694240570068, -0.0006855875253677368, -0.0006625056266784668, -0.0006394237279891968, -0.0006163418292999268, -0.0005932599306106567, -0.0005701780319213867, -0.0005470961332321167, -0.0005240142345428467, -0.0005009323358535767, -0.00047785043716430664, -0.0004547685384750366, -0.0004316866397857666, -0.0004086047410964966, -0.00038552284240722656, -0.00036244094371795654, -0.0003393590450286865, -0.0003162771463394165, -0.0002931952476501465, -0.00027011334896087646, -0.00024703145027160645, -0.00022394955158233643, -0.0002008676528930664, -0.0001777857542037964, -0.00015470385551452637, -0.00013162195682525635, -0.00010854005813598633, -8.545815944671631e-05, -6.237626075744629e-05, -3.929436206817627e-05, -1.621246337890625e-05, 6.8694353103637695e-06, 2.995133399963379e-05, 5.303323268890381e-05, 7.611513137817383e-05, 9.919703006744385e-05, 0.00012227892875671387, 0.0001453608274459839, 0.0001684427261352539, 0.00019152462482452393, 0.00021460652351379395, 0.00023768842220306396, 0.000260770320892334, 0.000283852219581604, 0.000306934118270874, 0.00033001601696014404, 0.00035309791564941406, 0.0003761798143386841, 0.0003992617130279541, 0.0004223436117172241, 0.00044542551040649414, 0.00046850740909576416, 0.0004915893077850342, 0.0005146712064743042, 0.0005377531051635742, 0.0005608350038528442, 0.0005839169025421143, 0.0006069988012313843, 0.0006300806999206543, 0.0006531625986099243, 0.0006762444972991943, 0.0006993263959884644, 0.0007224082946777344]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 964.0, 54.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003014194662682712, -0.00029057663050480187, -0.000279733823845163, -0.00026889098808169365, -0.00025804818142205477, -0.00024720534565858543, -0.00023636252444703132, -0.0002255197032354772, -0.0002146768820239231, -0.000203834060812369, -0.00019299123960081488, -0.00018214841838926077, -0.00017130558262579143, -0.00016046277596615255, -0.0001496199402026832, -0.0001387771189911291, -0.000127934297779575, -0.00011709147656802088, -0.00010624865535646677, -9.540582686895505e-05, -8.456300565740094e-05, -7.372018444584683e-05, -6.28773559583351e-05, -5.203453474678099e-05, -4.119171353522688e-05, -3.0348890504683368e-05, -1.9506067474139854e-05, -8.663242624606937e-06, 2.179578586947173e-06, 1.3022399798501283e-05, 2.3865228286013007e-05, 3.470804949756712e-05, 4.555084160529077e-05, 5.639366281684488e-05, 6.723648402839899e-05, 7.807931251591071e-05, 8.892213372746482e-05, 9.976495493901893e-05, 0.00011060778342653066, 0.00012145060463808477, 0.00013229342584963888, 0.000143136247061193, 0.0001539790682727471, 0.0001648218894843012, 0.00017566472524777055, 0.00018650753190740943, 0.00019735036767087877, 0.00020819318888243288, 0.000219036010093987, 0.0002298788313055411, 0.0002407216525170952, 0.00025156448828056455, 0.00026240729494020343, 0.00027325013070367277, 0.0002840929664671421, 0.000294935773126781, 0.00030577857978641987, 0.0003166214155498892, 0.0003274642222095281, 0.0003383070579729974, 0.0003491498646326363, 0.00035999270039610565, 0.000370835536159575, 0.00038167834281921387, 0.0003925211785826832]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 12.0, 10.0, 9.0, 9.0, 15.0, 17.0, 29.0, 14.0, 29.0, 25.0, 26.0, 21.0, 28.0, 47.0, 32.0, 41.0, 40.0, 42.0, 52.0, 44.0, 33.0, 46.0, 30.0, 35.0, 42.0, 32.0, 31.0, 47.0, 20.0, 17.0, 16.0, 14.0, 16.0, 15.0, 10.0, 8.0, 6.0, 14.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4139881134033203e-05, -2.342555671930313e-05, -2.271123230457306e-05, -2.1996907889842987e-05, -2.1282583475112915e-05, -2.0568259060382843e-05, -1.985393464565277e-05, -1.91396102309227e-05, -1.8425285816192627e-05, -1.7710961401462555e-05, -1.6996636986732483e-05, -1.628231257200241e-05, -1.556798815727234e-05, -1.4853663742542267e-05, -1.4139339327812195e-05, -1.3425014913082123e-05, -1.271069049835205e-05, -1.1996366083621979e-05, -1.1282041668891907e-05, -1.0567717254161835e-05, -9.853392839431763e-06, -9.13906842470169e-06, -8.424744009971619e-06, -7.710419595241547e-06, -6.996095180511475e-06, -6.281770765781403e-06, -5.5674463510513306e-06, -4.8531219363212585e-06, -4.1387975215911865e-06, -3.4244731068611145e-06, -2.7101486921310425e-06, -1.9958242774009705e-06, -1.2814998626708984e-06, -5.671754479408264e-07, 1.471489667892456e-07, 8.614733815193176e-07, 1.5757977962493896e-06, 2.2901222109794617e-06, 3.0044466257095337e-06, 3.7187710404396057e-06, 4.433095455169678e-06, 5.14741986989975e-06, 5.861744284629822e-06, 6.576068699359894e-06, 7.290393114089966e-06, 8.004717528820038e-06, 8.71904194355011e-06, 9.433366358280182e-06, 1.0147690773010254e-05, 1.0862015187740326e-05, 1.1576339602470398e-05, 1.229066401720047e-05, 1.3004988431930542e-05, 1.3719312846660614e-05, 1.4433637261390686e-05, 1.5147961676120758e-05, 1.586228609085083e-05, 1.6576610505580902e-05, 1.7290934920310974e-05, 1.8005259335041046e-05, 1.8719583749771118e-05, 1.943390816450119e-05, 2.0148232579231262e-05, 2.0862556993961334e-05, 2.1576881408691406e-05]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 3.0, 5.0, 8.0, 12.0, 22.0, 22.0, 24.0, 27.0, 33.0, 47.0, 55.0, 62.0, 71.0, 62.0, 60.0, 59.0, 63.0, 50.0, 52.0, 41.0, 40.0, 43.0, 42.0, 17.0, 11.0, 13.0, 14.0, 7.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7421875, -3.615966796875, -3.48974609375, -3.363525390625, -3.2373046875, -3.111083984375, -2.98486328125, -2.858642578125, -2.732421875, -2.606201171875, -2.47998046875, -2.353759765625, -2.2275390625, -2.101318359375, -1.97509765625, -1.848876953125, -1.72265625, -1.596435546875, -1.47021484375, -1.343994140625, -1.2177734375, -1.091552734375, -0.96533203125, -0.839111328125, -0.712890625, -0.586669921875, -0.46044921875, -0.334228515625, -0.2080078125, -0.081787109375, 0.04443359375, 0.170654296875, 0.296875, 0.423095703125, 0.54931640625, 0.675537109375, 0.8017578125, 0.927978515625, 1.05419921875, 1.180419921875, 1.306640625, 1.432861328125, 1.55908203125, 1.685302734375, 1.8115234375, 1.937744140625, 2.06396484375, 2.190185546875, 2.31640625, 2.442626953125, 2.56884765625, 2.695068359375, 2.8212890625, 2.947509765625, 3.07373046875, 3.199951171875, 3.326171875, 3.452392578125, 3.57861328125, 3.704833984375, 3.8310546875, 3.957275390625, 4.08349609375, 4.209716796875, 4.3359375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 8.0, 9.0, 9.0, 16.0, 21.0, 31.0, 34.0, 53.0, 67.0, 89.0, 101.0, 159.0, 234.0, 310.0, 488.0, 752.0, 1322.0, 2216.0, 3753.0, 8146.0, 25050.0, 240498.0, 705189.0, 38173.0, 10542.0, 4543.0, 2540.0, 1499.0, 880.0, 552.0, 322.0, 252.0, 196.0, 119.0, 95.0, 75.0, 47.0, 42.0, 32.0, 17.0, 12.0, 15.0, 11.0, 8.0, 3.0, 7.0, 3.0, 6.0, 2.0, 1.0, 1.0, 4.0], "bins": [-30.46875, -29.576171875, -28.68359375, -27.791015625, -26.8984375, -26.005859375, -25.11328125, -24.220703125, -23.328125, -22.435546875, -21.54296875, -20.650390625, -19.7578125, -18.865234375, -17.97265625, -17.080078125, -16.1875, -15.294921875, -14.40234375, -13.509765625, -12.6171875, -11.724609375, -10.83203125, -9.939453125, -9.046875, -8.154296875, -7.26171875, -6.369140625, -5.4765625, -4.583984375, -3.69140625, -2.798828125, -1.90625, -1.013671875, -0.12109375, 0.771484375, 1.6640625, 2.556640625, 3.44921875, 4.341796875, 5.234375, 6.126953125, 7.01953125, 7.912109375, 8.8046875, 9.697265625, 10.58984375, 11.482421875, 12.375, 13.267578125, 14.16015625, 15.052734375, 15.9453125, 16.837890625, 17.73046875, 18.623046875, 19.515625, 20.408203125, 21.30078125, 22.193359375, 23.0859375, 23.978515625, 24.87109375, 25.763671875, 26.65625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 10.0, 8.0, 10.0, 8.0, 16.0, 10.0, 12.0, 33.0, 18.0, 21.0, 27.0, 42.0, 34.0, 43.0, 51.0, 46.0, 74.0, 131.0, 1632.0, 233.0, 85.0, 56.0, 53.0, 63.0, 37.0, 49.0, 38.0, 31.0, 28.0, 34.0, 18.0, 19.0, 15.0, 15.0, 9.0, 10.0, 9.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.65625, -9.331298828125, -9.00634765625, -8.681396484375, -8.3564453125, -8.031494140625, -7.70654296875, -7.381591796875, -7.056640625, -6.731689453125, -6.40673828125, -6.081787109375, -5.7568359375, -5.431884765625, -5.10693359375, -4.781982421875, -4.45703125, -4.132080078125, -3.80712890625, -3.482177734375, -3.1572265625, -2.832275390625, -2.50732421875, -2.182373046875, -1.857421875, -1.532470703125, -1.20751953125, -0.882568359375, -0.5576171875, -0.232666015625, 0.09228515625, 0.417236328125, 0.7421875, 1.067138671875, 1.39208984375, 1.717041015625, 2.0419921875, 2.366943359375, 2.69189453125, 3.016845703125, 3.341796875, 3.666748046875, 3.99169921875, 4.316650390625, 4.6416015625, 4.966552734375, 5.29150390625, 5.616455078125, 5.94140625, 6.266357421875, 6.59130859375, 6.916259765625, 7.2412109375, 7.566162109375, 7.89111328125, 8.216064453125, 8.541015625, 8.865966796875, 9.19091796875, 9.515869140625, 9.8408203125, 10.165771484375, 10.49072265625, 10.815673828125, 11.140625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 8.0, 6.0, 12.0, 18.0, 12.0, 21.0, 16.0, 20.0, 31.0, 35.0, 40.0, 77.0, 78.0, 111.0, 271.0, 743.0, 7270.0, 3013481.0, 120248.0, 2208.0, 397.0, 185.0, 98.0, 68.0, 48.0, 36.0, 33.0, 12.0, 20.0, 22.0, 9.0, 8.0, 15.0, 12.0, 8.0, 6.0, 6.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.78125, -48.30810546875, -46.8349609375, -45.36181640625, -43.888671875, -42.41552734375, -40.9423828125, -39.46923828125, -37.99609375, -36.52294921875, -35.0498046875, -33.57666015625, -32.103515625, -30.63037109375, -29.1572265625, -27.68408203125, -26.2109375, -24.73779296875, -23.2646484375, -21.79150390625, -20.318359375, -18.84521484375, -17.3720703125, -15.89892578125, -14.42578125, -12.95263671875, -11.4794921875, -10.00634765625, -8.533203125, -7.06005859375, -5.5869140625, -4.11376953125, -2.640625, -1.16748046875, 0.3056640625, 1.77880859375, 3.251953125, 4.72509765625, 6.1982421875, 7.67138671875, 9.14453125, 10.61767578125, 12.0908203125, 13.56396484375, 15.037109375, 16.51025390625, 17.9833984375, 19.45654296875, 20.9296875, 22.40283203125, 23.8759765625, 25.34912109375, 26.822265625, 28.29541015625, 29.7685546875, 31.24169921875, 32.71484375, 34.18798828125, 35.6611328125, 37.13427734375, 38.607421875, 40.08056640625, 41.5537109375, 43.02685546875, 44.5]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 81.0, 607.0, 287.0, 32.0, 6.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-183.40023803710938, -179.775146484375, -176.1500701904297, -172.5249786376953, -168.89988708496094, -165.27479553222656, -161.64971923828125, -158.02462768554688, -154.3995361328125, -150.77444458007812, -147.1493682861328, -143.52427673339844, -139.89918518066406, -136.2740936279297, -132.64901733398438, -129.02392578125, -125.39884185791016, -121.77375793457031, -118.14866638183594, -114.5235824584961, -110.89849090576172, -107.27340698242188, -103.6483154296875, -100.02323150634766, -96.39814758300781, -92.77306365966797, -89.1479721069336, -85.52288818359375, -81.89779663085938, -78.27271270751953, -74.64762878417969, -71.02253723144531, -67.3974380493164, -63.7723503112793, -60.14726257324219, -56.522178649902344, -52.89708709716797, -49.272003173828125, -45.646915435791016, -42.021827697753906, -38.3967399597168, -34.77165222167969, -31.146564483642578, -27.5214786529541, -23.896390914916992, -20.271303176879883, -16.646217346191406, -13.021129608154297, -9.396041870117188, -5.770954608917236, -2.145867347717285, 1.4792194366455078, 5.104307174682617, 8.729394912719727, 12.354480743408203, 15.979568481445312, 19.604656219482422, 23.22974395751953, 26.85483169555664, 30.479917526245117, 34.105003356933594, 37.73009490966797, 41.35517883300781, 44.98026657104492, 48.60535430908203]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 2.0, 10.0, 13.0, 13.0, 12.0, 21.0, 21.0, 21.0, 20.0, 27.0, 24.0, 33.0, 41.0, 45.0, 41.0, 44.0, 41.0, 33.0, 31.0, 38.0, 39.0, 40.0, 39.0, 44.0, 32.0, 37.0, 21.0, 28.0, 29.0, 26.0, 25.0, 19.0, 17.0, 17.0, 9.0, 7.0, 5.0, 14.0, 2.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0], "bins": [-46.847984313964844, -45.650413513183594, -44.452842712402344, -43.25527572631836, -42.05770492553711, -40.86013412475586, -39.66256332397461, -38.464996337890625, -37.267425537109375, -36.069854736328125, -34.872283935546875, -33.67471694946289, -32.47714614868164, -31.27957534790039, -30.08200454711914, -28.884435653686523, -27.686864852905273, -26.489294052124023, -25.291725158691406, -24.094154357910156, -22.89658546447754, -21.69901466369629, -20.501445770263672, -19.303874969482422, -18.106304168701172, -16.908733367919922, -15.711164474487305, -14.513593673706055, -13.316024780273438, -12.118453979492188, -10.920884132385254, -9.72331428527832, -8.525745391845703, -7.3281755447387695, -6.130605697631836, -4.933035373687744, -3.7354655265808105, -2.537895679473877, -1.3403253555297852, -0.14275550842285156, 1.054814338684082, 2.2523841857910156, 3.4499542713165283, 4.647524356842041, 5.845094203948975, 7.042664051055908, 8.240234375, 9.437804222106934, 10.635374069213867, 11.8329439163208, 13.030513763427734, 14.228084564208984, 15.425653457641602, 16.62322425842285, 17.82079315185547, 19.01836395263672, 20.21593475341797, 21.41350555419922, 22.611074447631836, 23.808645248413086, 25.006214141845703, 26.203784942626953, 27.401355743408203, 28.59892463684082, 29.796493530273438]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 1.0, 4.0, 10.0, 12.0, 18.0, 16.0, 32.0, 20.0, 42.0, 26.0, 60.0, 55.0, 69.0, 67.0, 61.0, 54.0, 59.0, 56.0, 61.0, 42.0, 38.0, 41.0, 44.0, 28.0, 15.0, 14.0, 9.0, 7.0, 9.0, 6.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.765625, -3.63592529296875, -3.5062255859375, -3.37652587890625, -3.246826171875, -3.11712646484375, -2.9874267578125, -2.85772705078125, -2.72802734375, -2.59832763671875, -2.4686279296875, -2.33892822265625, -2.209228515625, -2.07952880859375, -1.9498291015625, -1.82012939453125, -1.6904296875, -1.56072998046875, -1.4310302734375, -1.30133056640625, -1.171630859375, -1.04193115234375, -0.9122314453125, -0.78253173828125, -0.65283203125, -0.52313232421875, -0.3934326171875, -0.26373291015625, -0.134033203125, -0.00433349609375, 0.1253662109375, 0.25506591796875, 0.384765625, 0.51446533203125, 0.6441650390625, 0.77386474609375, 0.903564453125, 1.03326416015625, 1.1629638671875, 1.29266357421875, 1.42236328125, 1.55206298828125, 1.6817626953125, 1.81146240234375, 1.941162109375, 2.07086181640625, 2.2005615234375, 2.33026123046875, 2.4599609375, 2.58966064453125, 2.7193603515625, 2.84906005859375, 2.978759765625, 3.10845947265625, 3.2381591796875, 3.36785888671875, 3.49755859375, 3.62725830078125, 3.7569580078125, 3.88665771484375, 4.016357421875, 4.14605712890625, 4.2757568359375, 4.40545654296875, 4.53515625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 4.0, 1.0, 5.0, 3.0, 4.0, 8.0, 5.0, 21.0, 26.0, 43.0, 51.0, 85.0, 108.0, 178.0, 353.0, 657.0, 1463.0, 4000.0, 29359.0, 3998291.0, 148669.0, 7003.0, 2000.0, 876.0, 420.0, 244.0, 134.0, 87.0, 57.0, 28.0, 18.0, 22.0, 18.0, 9.0, 6.0, 3.0, 7.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.21875, -37.8515625, -36.484375, -35.1171875, -33.75, -32.3828125, -31.015625, -29.6484375, -28.28125, -26.9140625, -25.546875, -24.1796875, -22.8125, -21.4453125, -20.078125, -18.7109375, -17.34375, -15.9765625, -14.609375, -13.2421875, -11.875, -10.5078125, -9.140625, -7.7734375, -6.40625, -5.0390625, -3.671875, -2.3046875, -0.9375, 0.4296875, 1.796875, 3.1640625, 4.53125, 5.8984375, 7.265625, 8.6328125, 10.0, 11.3671875, 12.734375, 14.1015625, 15.46875, 16.8359375, 18.203125, 19.5703125, 20.9375, 22.3046875, 23.671875, 25.0390625, 26.40625, 27.7734375, 29.140625, 30.5078125, 31.875, 33.2421875, 34.609375, 35.9765625, 37.34375, 38.7109375, 40.078125, 41.4453125, 42.8125, 44.1796875, 45.546875, 46.9140625, 48.28125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 9.0, 13.0, 14.0, 23.0, 27.0, 54.0, 67.0, 133.0, 150.0, 251.0, 440.0, 702.0, 834.0, 495.0, 285.0, 201.0, 114.0, 87.0, 60.0, 33.0, 33.0, 16.0, 10.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.96875, -10.51318359375, -10.0576171875, -9.60205078125, -9.146484375, -8.69091796875, -8.2353515625, -7.77978515625, -7.32421875, -6.86865234375, -6.4130859375, -5.95751953125, -5.501953125, -5.04638671875, -4.5908203125, -4.13525390625, -3.6796875, -3.22412109375, -2.7685546875, -2.31298828125, -1.857421875, -1.40185546875, -0.9462890625, -0.49072265625, -0.03515625, 0.42041015625, 0.8759765625, 1.33154296875, 1.787109375, 2.24267578125, 2.6982421875, 3.15380859375, 3.609375, 4.06494140625, 4.5205078125, 4.97607421875, 5.431640625, 5.88720703125, 6.3427734375, 6.79833984375, 7.25390625, 7.70947265625, 8.1650390625, 8.62060546875, 9.076171875, 9.53173828125, 9.9873046875, 10.44287109375, 10.8984375, 11.35400390625, 11.8095703125, 12.26513671875, 12.720703125, 13.17626953125, 13.6318359375, 14.08740234375, 14.54296875, 14.99853515625, 15.4541015625, 15.90966796875, 16.365234375, 16.82080078125, 17.2763671875, 17.73193359375, 18.1875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 2.0, 11.0, 17.0, 49.0, 43.0, 91.0, 153.0, 270.0, 478.0, 1108.0, 2627.0, 8487.0, 34944.0, 285525.0, 3389806.0, 410570.0, 44501.0, 9911.0, 3166.0, 1303.0, 511.0, 305.0, 144.0, 103.0, 66.0, 31.0, 15.0, 18.0, 8.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.953125, -21.094482421875, -20.23583984375, -19.377197265625, -18.5185546875, -17.659912109375, -16.80126953125, -15.942626953125, -15.083984375, -14.225341796875, -13.36669921875, -12.508056640625, -11.6494140625, -10.790771484375, -9.93212890625, -9.073486328125, -8.21484375, -7.356201171875, -6.49755859375, -5.638916015625, -4.7802734375, -3.921630859375, -3.06298828125, -2.204345703125, -1.345703125, -0.487060546875, 0.37158203125, 1.230224609375, 2.0888671875, 2.947509765625, 3.80615234375, 4.664794921875, 5.5234375, 6.382080078125, 7.24072265625, 8.099365234375, 8.9580078125, 9.816650390625, 10.67529296875, 11.533935546875, 12.392578125, 13.251220703125, 14.10986328125, 14.968505859375, 15.8271484375, 16.685791015625, 17.54443359375, 18.403076171875, 19.26171875, 20.120361328125, 20.97900390625, 21.837646484375, 22.6962890625, 23.554931640625, 24.41357421875, 25.272216796875, 26.130859375, 26.989501953125, 27.84814453125, 28.706787109375, 29.5654296875, 30.424072265625, 31.28271484375, 32.141357421875, 33.0]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 11.0, 42.0, 166.0, 319.0, 329.0, 115.0, 20.0, 11.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.693973541259766, -32.02808380126953, -27.362192153930664, -22.696300506591797, -18.030410766601562, -13.364521026611328, -8.698629379272461, -4.032737731933594, 0.6331520080566406, 5.299042701721191, 9.964933395385742, 14.630824089050293, 19.296714782714844, 23.962604522705078, 28.628496170043945, 33.29438781738281, 37.96027755737305, 42.62616729736328, 47.29206085205078, 51.957950592041016, 56.62384033203125, 61.289730072021484, 65.95561981201172, 70.62151336669922, 75.28739929199219, 79.95329284667969, 84.61917877197266, 89.28507232666016, 93.95095825195312, 98.61685180664062, 103.28274536132812, 107.94863891601562, 112.61453247070312, 117.28042602539062, 121.9463119506836, 126.6122055053711, 131.27809143066406, 135.94398498535156, 140.60987854003906, 145.27577209472656, 149.941650390625, 154.6075439453125, 159.2734375, 163.93931579589844, 168.60520935058594, 173.27110290527344, 177.93699645996094, 182.60289001464844, 187.26878356933594, 191.93467712402344, 196.60057067871094, 201.26644897460938, 205.93234252929688, 210.59823608398438, 215.26412963867188, 219.93002319335938, 224.59591674804688, 229.26181030273438, 233.92770385742188, 238.5935821533203, 243.2594757080078, 247.9253692626953, 252.5912628173828, 257.25714111328125, 261.92303466796875]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 11.0, 5.0, 7.0, 24.0, 25.0, 20.0, 16.0, 36.0, 33.0, 30.0, 32.0, 32.0, 38.0, 48.0, 47.0, 39.0, 48.0, 37.0, 39.0, 39.0, 39.0, 45.0, 47.0, 36.0, 35.0, 35.0, 32.0, 26.0, 14.0, 20.0, 14.0, 10.0, 8.0, 9.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.860904693603516, -38.67665481567383, -37.492401123046875, -36.30815124511719, -35.1239013671875, -33.93965148925781, -32.75539779663086, -31.571147918701172, -30.38689613342285, -29.20264434814453, -28.018394470214844, -26.834142684936523, -25.649890899658203, -24.465641021728516, -23.281389236450195, -22.097137451171875, -20.912887573242188, -19.728635787963867, -18.54438591003418, -17.36013412475586, -16.175884246826172, -14.991632461547852, -13.807380676269531, -12.623129844665527, -11.438879013061523, -10.25462818145752, -9.070377349853516, -7.886125564575195, -6.701874732971191, -5.5176239013671875, -4.333372592926025, -3.1491212844848633, -1.9648666381835938, -0.7806155681610107, 0.40363550186157227, 1.5878865718841553, 2.7721376419067383, 3.956388473510742, 5.140639781951904, 6.324891090393066, 7.50914192199707, 8.693392753601074, 9.877643585205078, 11.061895370483398, 12.246146202087402, 13.430397033691406, 14.614648818969727, 15.79889965057373, 16.983150482177734, 18.167402267456055, 19.351652145385742, 20.535903930664062, 21.72015380859375, 22.90440559387207, 24.08865737915039, 25.272907257080078, 26.4571590423584, 27.64141082763672, 28.825660705566406, 30.009912490844727, 31.194164276123047, 32.378414154052734, 33.56266403198242, 34.746917724609375, 35.93116760253906]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 2.0, 3.0, 3.0, 4.0, 15.0, 19.0, 22.0, 22.0, 31.0, 37.0, 40.0, 40.0, 42.0, 54.0, 54.0, 51.0, 63.0, 59.0, 57.0, 48.0, 52.0, 59.0, 37.0, 35.0, 26.0, 29.0, 12.0, 19.0, 15.0, 10.0, 10.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.814453125, -3.690277099609375, -3.56610107421875, -3.441925048828125, -3.3177490234375, -3.193572998046875, -3.06939697265625, -2.945220947265625, -2.821044921875, -2.696868896484375, -2.57269287109375, -2.448516845703125, -2.3243408203125, -2.200164794921875, -2.07598876953125, -1.951812744140625, -1.82763671875, -1.703460693359375, -1.57928466796875, -1.455108642578125, -1.3309326171875, -1.206756591796875, -1.08258056640625, -0.958404541015625, -0.834228515625, -0.710052490234375, -0.58587646484375, -0.461700439453125, -0.3375244140625, -0.213348388671875, -0.08917236328125, 0.035003662109375, 0.1591796875, 0.283355712890625, 0.40753173828125, 0.531707763671875, 0.6558837890625, 0.780059814453125, 0.90423583984375, 1.028411865234375, 1.152587890625, 1.276763916015625, 1.40093994140625, 1.525115966796875, 1.6492919921875, 1.773468017578125, 1.89764404296875, 2.021820068359375, 2.14599609375, 2.270172119140625, 2.39434814453125, 2.518524169921875, 2.6427001953125, 2.766876220703125, 2.89105224609375, 3.015228271484375, 3.139404296875, 3.263580322265625, 3.38775634765625, 3.511932373046875, 3.6361083984375, 3.760284423828125, 3.88446044921875, 4.008636474609375, 4.1328125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 7.0, 9.0, 12.0, 21.0, 18.0, 37.0, 44.0, 76.0, 102.0, 145.0, 178.0, 259.0, 362.0, 516.0, 770.0, 1213.0, 1784.0, 2747.0, 4432.0, 7326.0, 12256.0, 21300.0, 38351.0, 73943.0, 167287.0, 381444.0, 167703.0, 74377.0, 38180.0, 21286.0, 12278.0, 7355.0, 4444.0, 2714.0, 1815.0, 1161.0, 759.0, 561.0, 377.0, 248.0, 194.0, 150.0, 78.0, 67.0, 45.0, 40.0, 24.0, 16.0, 12.0, 9.0, 7.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.17041015625, -0.16516685485839844, -0.15992355346679688, -0.1546802520751953, -0.14943695068359375, -0.1441936492919922, -0.13895034790039062, -0.13370704650878906, -0.1284637451171875, -0.12322044372558594, -0.11797714233398438, -0.11273384094238281, -0.10749053955078125, -0.10224723815917969, -0.09700393676757812, -0.09176063537597656, -0.086517333984375, -0.08127403259277344, -0.07603073120117188, -0.07078742980957031, -0.06554412841796875, -0.06030082702636719, -0.055057525634765625, -0.04981422424316406, -0.0445709228515625, -0.03932762145996094, -0.034084320068359375, -0.028841018676757812, -0.02359771728515625, -0.018354415893554688, -0.013111114501953125, -0.007867813110351562, -0.00262451171875, 0.0026187896728515625, 0.007862091064453125, 0.013105392456054688, 0.01834869384765625, 0.023591995239257812, 0.028835296630859375, 0.03407859802246094, 0.0393218994140625, 0.04456520080566406, 0.049808502197265625, 0.05505180358886719, 0.06029510498046875, 0.06553840637207031, 0.07078170776367188, 0.07602500915527344, 0.081268310546875, 0.08651161193847656, 0.09175491333007812, 0.09699821472167969, 0.10224151611328125, 0.10748481750488281, 0.11272811889648438, 0.11797142028808594, 0.1232147216796875, 0.12845802307128906, 0.13370132446289062, 0.1389446258544922, 0.14418792724609375, 0.1494312286376953, 0.15467453002929688, 0.15991783142089844, 0.1651611328125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 1.0, 4.0, 7.0, 5.0, 8.0, 11.0, 8.0, 9.0, 12.0, 19.0, 25.0, 25.0, 23.0, 21.0, 30.0, 28.0, 33.0, 31.0, 35.0, 35.0, 35.0, 24.0, 31.0, 47.0, 1059.0, 42.0, 35.0, 28.0, 45.0, 29.0, 32.0, 27.0, 34.0, 22.0, 15.0, 27.0, 19.0, 21.0, 12.0, 9.0, 13.0, 14.0, 4.0, 8.0, 8.0, 9.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-2.435546875, -2.3642578125, -2.29296875, -2.2216796875, -2.150390625, -2.0791015625, -2.0078125, -1.9365234375, -1.865234375, -1.7939453125, -1.72265625, -1.6513671875, -1.580078125, -1.5087890625, -1.4375, -1.3662109375, -1.294921875, -1.2236328125, -1.15234375, -1.0810546875, -1.009765625, -0.9384765625, -0.8671875, -0.7958984375, -0.724609375, -0.6533203125, -0.58203125, -0.5107421875, -0.439453125, -0.3681640625, -0.296875, -0.2255859375, -0.154296875, -0.0830078125, -0.01171875, 0.0595703125, 0.130859375, 0.2021484375, 0.2734375, 0.3447265625, 0.416015625, 0.4873046875, 0.55859375, 0.6298828125, 0.701171875, 0.7724609375, 0.84375, 0.9150390625, 0.986328125, 1.0576171875, 1.12890625, 1.2001953125, 1.271484375, 1.3427734375, 1.4140625, 1.4853515625, 1.556640625, 1.6279296875, 1.69921875, 1.7705078125, 1.841796875, 1.9130859375, 1.984375, 2.0556640625, 2.126953125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 1.0, 5.0, 13.0, 21.0, 27.0, 46.0, 56.0, 113.0, 170.0, 272.0, 440.0, 682.0, 1061.0, 1625.0, 2707.0, 4259.0, 6952.0, 11342.0, 18354.0, 30352.0, 50682.0, 89929.0, 185379.0, 1356142.0, 148150.0, 76623.0, 43434.0, 26301.0, 15918.0, 9888.0, 6123.0, 3728.0, 2366.0, 1442.0, 954.0, 577.0, 374.0, 204.0, 157.0, 98.0, 61.0, 29.0, 26.0, 19.0, 16.0, 9.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0931396484375, -0.09042930603027344, -0.08771896362304688, -0.08500862121582031, -0.08229827880859375, -0.07958793640136719, -0.07687759399414062, -0.07416725158691406, -0.0714569091796875, -0.06874656677246094, -0.06603622436523438, -0.06332588195800781, -0.06061553955078125, -0.05790519714355469, -0.055194854736328125, -0.05248451232910156, -0.049774169921875, -0.04706382751464844, -0.044353485107421875, -0.04164314270019531, -0.03893280029296875, -0.03622245788574219, -0.033512115478515625, -0.030801773071289062, -0.0280914306640625, -0.025381088256835938, -0.022670745849609375, -0.019960403442382812, -0.01725006103515625, -0.014539718627929688, -0.011829376220703125, -0.009119033813476562, -0.00640869140625, -0.0036983489990234375, -0.000988006591796875, 0.0017223358154296875, 0.00443267822265625, 0.0071430206298828125, 0.009853363037109375, 0.012563705444335938, 0.0152740478515625, 0.017984390258789062, 0.020694732666015625, 0.023405075073242188, 0.02611541748046875, 0.028825759887695312, 0.031536102294921875, 0.03424644470214844, 0.036956787109375, 0.03966712951660156, 0.042377471923828125, 0.04508781433105469, 0.04779815673828125, 0.05050849914550781, 0.053218841552734375, 0.05592918395996094, 0.0586395263671875, 0.06134986877441406, 0.06406021118164062, 0.06677055358886719, 0.06948089599609375, 0.07219123840332031, 0.07490158081054688, 0.07761192321777344, 0.080322265625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 13.0, 6.0, 8.0, 16.0, 20.0, 14.0, 29.0, 21.0, 38.0, 48.0, 38.0, 48.0, 51.0, 40.0, 43.0, 48.0, 54.0, 44.0, 53.0, 46.0, 46.0, 25.0, 30.0, 39.0, 30.0, 20.0, 23.0, 14.0, 12.0, 19.0, 15.0, 7.0, 9.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.629922866821289e-05, -3.520585596561432e-05, -3.411248326301575e-05, -3.3019110560417175e-05, -3.1925737857818604e-05, -3.083236515522003e-05, -2.973899245262146e-05, -2.8645619750022888e-05, -2.7552247047424316e-05, -2.6458874344825745e-05, -2.5365501642227173e-05, -2.42721289396286e-05, -2.317875623703003e-05, -2.2085383534431458e-05, -2.0992010831832886e-05, -1.9898638129234314e-05, -1.8805265426635742e-05, -1.771189272403717e-05, -1.66185200214386e-05, -1.5525147318840027e-05, -1.4431774616241455e-05, -1.3338401913642883e-05, -1.2245029211044312e-05, -1.115165650844574e-05, -1.0058283805847168e-05, -8.964911103248596e-06, -7.871538400650024e-06, -6.778165698051453e-06, -5.684792995452881e-06, -4.591420292854309e-06, -3.4980475902557373e-06, -2.4046748876571655e-06, -1.3113021850585938e-06, -2.1792948246002197e-07, 8.754432201385498e-07, 1.9688159227371216e-06, 3.0621886253356934e-06, 4.155561327934265e-06, 5.248934030532837e-06, 6.342306733131409e-06, 7.4356794357299805e-06, 8.529052138328552e-06, 9.622424840927124e-06, 1.0715797543525696e-05, 1.1809170246124268e-05, 1.290254294872284e-05, 1.3995915651321411e-05, 1.5089288353919983e-05, 1.6182661056518555e-05, 1.7276033759117126e-05, 1.8369406461715698e-05, 1.946277916431427e-05, 2.0556151866912842e-05, 2.1649524569511414e-05, 2.2742897272109985e-05, 2.3836269974708557e-05, 2.492964267730713e-05, 2.60230153799057e-05, 2.7116388082504272e-05, 2.8209760785102844e-05, 2.9303133487701416e-05, 3.0396506190299988e-05, 3.148987889289856e-05, 3.258325159549713e-05, 3.36766242980957e-05]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 6.0, 10.0, 4.0, 8.0, 7.0, 10.0, 12.0, 16.0, 25.0, 34.0, 33.0, 50.0, 49.0, 59.0, 80.0, 110.0, 104.0, 136.0, 140.0, 175.0, 331.0, 2120.0, 193166.0, 838969.0, 11151.0, 578.0, 207.0, 172.0, 123.0, 98.0, 92.0, 89.0, 58.0, 62.0, 46.0, 49.0, 50.0, 21.0, 26.0, 23.0, 11.0, 15.0, 9.0, 2.0, 5.0, 4.0, 2.0, 5.0, 3.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005736351013183594, -0.0005552619695663452, -0.0005368888378143311, -0.0005185157060623169, -0.0005001425743103027, -0.0004817694425582886, -0.0004633963108062744, -0.00044502317905426025, -0.0004266500473022461, -0.00040827691555023193, -0.0003899037837982178, -0.0003715306520462036, -0.00035315752029418945, -0.0003347843885421753, -0.00031641125679016113, -0.00029803812503814697, -0.0002796649932861328, -0.00026129186153411865, -0.0002429187297821045, -0.00022454559803009033, -0.00020617246627807617, -0.000187799334526062, -0.00016942620277404785, -0.0001510530710220337, -0.00013267993927001953, -0.00011430680751800537, -9.593367576599121e-05, -7.756054401397705e-05, -5.918741226196289e-05, -4.081428050994873e-05, -2.244114875793457e-05, -4.06801700592041e-06, 1.430511474609375e-05, 3.267824649810791e-05, 5.105137825012207e-05, 6.942451000213623e-05, 8.779764175415039e-05, 0.00010617077350616455, 0.0001245439052581787, 0.00014291703701019287, 0.00016129016876220703, 0.0001796633005142212, 0.00019803643226623535, 0.0002164095640182495, 0.00023478269577026367, 0.00025315582752227783, 0.000271528959274292, 0.00028990209102630615, 0.0003082752227783203, 0.00032664835453033447, 0.00034502148628234863, 0.0003633946180343628, 0.00038176774978637695, 0.0004001408815383911, 0.0004185140132904053, 0.00043688714504241943, 0.0004552602767944336, 0.00047363340854644775, 0.0004920065402984619, 0.0005103796720504761, 0.0005287528038024902, 0.0005471259355545044, 0.0005654990673065186, 0.0005838721990585327, 0.0006022453308105469]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 23.0, 37.0, 130.0, 315.0, 326.0, 127.0, 42.0, 8.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.350548210320994e-05, -5.9986017731716856e-05, -5.646655336022377e-05, -5.2947088988730684e-05, -4.94276246172376e-05, -4.590816024574451e-05, -4.2388695874251425e-05, -3.886923150275834e-05, -3.534976713126525e-05, -3.1830302759772167e-05, -2.831083838827908e-05, -2.4791374016785994e-05, -2.1271909645292908e-05, -1.7752445273799822e-05, -1.4232980902306736e-05, -1.071351653081365e-05, -7.194052159320563e-06, -3.674587787827477e-06, -1.5512341633439064e-07, 3.3643409551586956e-06, 6.883805326651782e-06, 1.0403269698144868e-05, 1.3922734069637954e-05, 1.744219844113104e-05, 2.0961662812624127e-05, 2.4481127184117213e-05, 2.80005915556103e-05, 3.1520055927103385e-05, 3.503952029859647e-05, 3.855898467008956e-05, 4.2078449041582644e-05, 4.559791341307573e-05, 4.911738506052643e-05, 5.263684943201952e-05, 5.61563138035126e-05, 5.967577817500569e-05, 6.319524254649878e-05, 6.671471055597067e-05, 7.023417128948495e-05, 7.375363202299923e-05, 7.727310003247112e-05, 8.079256804194301e-05, 8.431202877545729e-05, 8.783148950897157e-05, 9.135095751844347e-05, 9.487042552791536e-05, 9.838988626142964e-05, 0.00010190934699494392, 0.00010542881500441581, 0.0001089482830138877, 0.00011246774374740198, 0.00011598720448091626, 0.00011950667249038815, 0.00012302614049986005, 0.00012654560850933194, 0.0001300650619668886, 0.0001335845299763605, 0.0001371039979858324, 0.00014062345144338906, 0.00014414291945286095, 0.00014766238746233284, 0.00015118185547180474, 0.00015470132348127663, 0.0001582207769388333, 0.0001617402449483052]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 7.0, 9.0, 17.0, 24.0, 27.0, 31.0, 35.0, 41.0, 33.0, 43.0, 47.0, 44.0, 49.0, 71.0, 54.0, 55.0, 53.0, 45.0, 40.0, 41.0, 50.0, 36.0, 29.0, 29.0, 23.0, 15.0, 12.0, 7.0, 9.0, 3.0, 4.0, 2.0, 3.0, 5.0, 0.0, 4.0], "bins": [-4.178285598754883e-05, -4.078727215528488e-05, -3.9791688323020935e-05, -3.879610449075699e-05, -3.780052065849304e-05, -3.6804936826229095e-05, -3.580935299396515e-05, -3.48137691617012e-05, -3.3818185329437256e-05, -3.282260149717331e-05, -3.182701766490936e-05, -3.0831433832645416e-05, -2.983585000038147e-05, -2.8840266168117523e-05, -2.7844682335853577e-05, -2.684909850358963e-05, -2.5853514671325684e-05, -2.4857930839061737e-05, -2.386234700679779e-05, -2.2866763174533844e-05, -2.1871179342269897e-05, -2.087559551000595e-05, -1.9880011677742004e-05, -1.8884427845478058e-05, -1.788884401321411e-05, -1.6893260180950165e-05, -1.5897676348686218e-05, -1.4902092516422272e-05, -1.3906508684158325e-05, -1.2910924851894379e-05, -1.1915341019630432e-05, -1.0919757187366486e-05, -9.924173355102539e-06, -8.928589522838593e-06, -7.933005690574646e-06, -6.9374218583106995e-06, -5.941838026046753e-06, -4.946254193782806e-06, -3.95067036151886e-06, -2.9550865292549133e-06, -1.959502696990967e-06, -9.639188647270203e-07, 3.166496753692627e-08, 1.0272487998008728e-06, 2.0228326320648193e-06, 3.018416464328766e-06, 4.014000296592712e-06, 5.009584128856659e-06, 6.0051679611206055e-06, 7.000751793384552e-06, 7.996335625648499e-06, 8.991919457912445e-06, 9.987503290176392e-06, 1.0983087122440338e-05, 1.1978670954704285e-05, 1.2974254786968231e-05, 1.3969838619232178e-05, 1.4965422451496124e-05, 1.596100628376007e-05, 1.6956590116024017e-05, 1.7952173948287964e-05, 1.894775778055191e-05, 1.9943341612815857e-05, 2.0938925445079803e-05, 2.193450927734375e-05]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 2.0, 3.0, 3.0, 4.0, 15.0, 19.0, 22.0, 22.0, 31.0, 37.0, 40.0, 40.0, 42.0, 54.0, 54.0, 51.0, 63.0, 59.0, 57.0, 48.0, 52.0, 59.0, 37.0, 35.0, 26.0, 29.0, 12.0, 19.0, 15.0, 10.0, 10.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.814453125, -3.690277099609375, -3.56610107421875, -3.441925048828125, -3.3177490234375, -3.193572998046875, -3.06939697265625, -2.945220947265625, -2.821044921875, -2.696868896484375, -2.57269287109375, -2.448516845703125, -2.3243408203125, -2.200164794921875, -2.07598876953125, -1.951812744140625, -1.82763671875, -1.703460693359375, -1.57928466796875, -1.455108642578125, -1.3309326171875, -1.206756591796875, -1.08258056640625, -0.958404541015625, -0.834228515625, -0.710052490234375, -0.58587646484375, -0.461700439453125, -0.3375244140625, -0.213348388671875, -0.08917236328125, 0.035003662109375, 0.1591796875, 0.283355712890625, 0.40753173828125, 0.531707763671875, 0.6558837890625, 0.780059814453125, 0.90423583984375, 1.028411865234375, 1.152587890625, 1.276763916015625, 1.40093994140625, 1.525115966796875, 1.6492919921875, 1.773468017578125, 1.89764404296875, 2.021820068359375, 2.14599609375, 2.270172119140625, 2.39434814453125, 2.518524169921875, 2.6427001953125, 2.766876220703125, 2.89105224609375, 3.015228271484375, 3.139404296875, 3.263580322265625, 3.38775634765625, 3.511932373046875, 3.6361083984375, 3.760284423828125, 3.88446044921875, 4.008636474609375, 4.1328125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 14.0, 19.0, 10.0, 14.0, 32.0, 36.0, 66.0, 107.0, 128.0, 261.0, 394.0, 692.0, 1155.0, 1950.0, 3639.0, 7437.0, 16537.0, 44904.0, 163382.0, 547517.0, 177570.0, 48302.0, 17704.0, 7744.0, 3960.0, 2047.0, 1081.0, 674.0, 399.0, 270.0, 150.0, 123.0, 76.0, 50.0, 33.0, 20.0, 7.0, 15.0, 6.0, 6.0, 0.0, 1.0, 3.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.734375, -3.612060546875, -3.48974609375, -3.367431640625, -3.2451171875, -3.122802734375, -3.00048828125, -2.878173828125, -2.755859375, -2.633544921875, -2.51123046875, -2.388916015625, -2.2666015625, -2.144287109375, -2.02197265625, -1.899658203125, -1.77734375, -1.655029296875, -1.53271484375, -1.410400390625, -1.2880859375, -1.165771484375, -1.04345703125, -0.921142578125, -0.798828125, -0.676513671875, -0.55419921875, -0.431884765625, -0.3095703125, -0.187255859375, -0.06494140625, 0.057373046875, 0.1796875, 0.302001953125, 0.42431640625, 0.546630859375, 0.6689453125, 0.791259765625, 0.91357421875, 1.035888671875, 1.158203125, 1.280517578125, 1.40283203125, 1.525146484375, 1.6474609375, 1.769775390625, 1.89208984375, 2.014404296875, 2.13671875, 2.259033203125, 2.38134765625, 2.503662109375, 2.6259765625, 2.748291015625, 2.87060546875, 2.992919921875, 3.115234375, 3.237548828125, 3.35986328125, 3.482177734375, 3.6044921875, 3.726806640625, 3.84912109375, 3.971435546875, 4.09375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 6.0, 6.0, 7.0, 9.0, 10.0, 13.0, 13.0, 18.0, 19.0, 19.0, 29.0, 37.0, 31.0, 33.0, 39.0, 49.0, 46.0, 60.0, 126.0, 1810.0, 172.0, 76.0, 50.0, 54.0, 43.0, 36.0, 42.0, 28.0, 22.0, 22.0, 22.0, 28.0, 16.0, 15.0, 8.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.5234375, -13.14306640625, -12.7626953125, -12.38232421875, -12.001953125, -11.62158203125, -11.2412109375, -10.86083984375, -10.48046875, -10.10009765625, -9.7197265625, -9.33935546875, -8.958984375, -8.57861328125, -8.1982421875, -7.81787109375, -7.4375, -7.05712890625, -6.6767578125, -6.29638671875, -5.916015625, -5.53564453125, -5.1552734375, -4.77490234375, -4.39453125, -4.01416015625, -3.6337890625, -3.25341796875, -2.873046875, -2.49267578125, -2.1123046875, -1.73193359375, -1.3515625, -0.97119140625, -0.5908203125, -0.21044921875, 0.169921875, 0.55029296875, 0.9306640625, 1.31103515625, 1.69140625, 2.07177734375, 2.4521484375, 2.83251953125, 3.212890625, 3.59326171875, 3.9736328125, 4.35400390625, 4.734375, 5.11474609375, 5.4951171875, 5.87548828125, 6.255859375, 6.63623046875, 7.0166015625, 7.39697265625, 7.77734375, 8.15771484375, 8.5380859375, 8.91845703125, 9.298828125, 9.67919921875, 10.0595703125, 10.43994140625, 10.8203125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 11.0, 13.0, 13.0, 28.0, 23.0, 22.0, 24.0, 39.0, 48.0, 61.0, 90.0, 170.0, 315.0, 968.0, 8565.0, 3025223.0, 106440.0, 2382.0, 527.0, 225.0, 120.0, 72.0, 55.0, 50.0, 37.0, 30.0, 18.0, 18.0, 20.0, 11.0, 15.0, 7.0, 7.0, 7.0, 8.0, 4.0, 8.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.921875, -21.102783203125, -20.28369140625, -19.464599609375, -18.6455078125, -17.826416015625, -17.00732421875, -16.188232421875, -15.369140625, -14.550048828125, -13.73095703125, -12.911865234375, -12.0927734375, -11.273681640625, -10.45458984375, -9.635498046875, -8.81640625, -7.997314453125, -7.17822265625, -6.359130859375, -5.5400390625, -4.720947265625, -3.90185546875, -3.082763671875, -2.263671875, -1.444580078125, -0.62548828125, 0.193603515625, 1.0126953125, 1.831787109375, 2.65087890625, 3.469970703125, 4.2890625, 5.108154296875, 5.92724609375, 6.746337890625, 7.5654296875, 8.384521484375, 9.20361328125, 10.022705078125, 10.841796875, 11.660888671875, 12.47998046875, 13.299072265625, 14.1181640625, 14.937255859375, 15.75634765625, 16.575439453125, 17.39453125, 18.213623046875, 19.03271484375, 19.851806640625, 20.6708984375, 21.489990234375, 22.30908203125, 23.128173828125, 23.947265625, 24.766357421875, 25.58544921875, 26.404541015625, 27.2236328125, 28.042724609375, 28.86181640625, 29.680908203125, 30.5]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [3.0, 96.0, 917.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.43546199798584, -6.46983528137207, -1.5042085647583008, 3.4614181518554688, 8.427044868469238, 13.392670631408691, 18.358299255371094, 23.323925018310547, 28.28955078125, 33.25517654418945, 38.220802307128906, 43.186431884765625, 48.15205764770508, 53.11768341064453, 58.08331298828125, 63.0489387512207, 68.01456451416016, 72.98019409179688, 77.94581604003906, 82.91144561767578, 87.8770751953125, 92.84269714355469, 97.8083267211914, 102.77395629882812, 107.73957824707031, 112.70520782470703, 117.67082977294922, 122.63645935058594, 127.60208129882812, 132.56771850585938, 137.53334045410156, 142.49896240234375, 147.464599609375, 152.4302215576172, 157.39585876464844, 162.36148071289062, 167.3271026611328, 172.292724609375, 177.25836181640625, 182.22398376464844, 187.18960571289062, 192.1552276611328, 197.12086486816406, 202.08648681640625, 207.05210876464844, 212.01773071289062, 216.98336791992188, 221.94898986816406, 226.9146270751953, 231.8802490234375, 236.84588623046875, 241.81150817871094, 246.77713012695312, 251.74276733398438, 256.7083740234375, 261.67401123046875, 266.6396484375, 271.60528564453125, 276.5708923339844, 281.5365295410156, 286.5021667480469, 291.4677734375, 296.43341064453125, 301.3990478515625, 306.3646545410156]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 3.0, 7.0, 16.0, 14.0, 10.0, 15.0, 21.0, 28.0, 24.0, 31.0, 32.0, 31.0, 43.0, 49.0, 32.0, 49.0, 33.0, 51.0, 43.0, 37.0, 45.0, 46.0, 51.0, 34.0, 38.0, 34.0, 29.0, 32.0, 15.0, 19.0, 15.0, 23.0, 13.0, 6.0, 6.0, 3.0, 4.0, 0.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.51384735107422, -37.267852783203125, -36.0218620300293, -34.77587127685547, -33.529876708984375, -32.28388214111328, -31.037891387939453, -29.791898727416992, -28.54590606689453, -27.29991340637207, -26.05392074584961, -24.80792808532715, -23.561935424804688, -22.315942764282227, -21.069950103759766, -19.823957443237305, -18.577964782714844, -17.331972122192383, -16.085979461669922, -14.839986801147461, -13.593994140625, -12.348001480102539, -11.102008819580078, -9.856016159057617, -8.610023498535156, -7.364030838012695, -6.118038177490234, -4.872045516967773, -3.6260528564453125, -2.3800601959228516, -1.1340675354003906, 0.11192512512207031, 1.3579216003417969, 2.603914260864258, 3.8499069213867188, 5.09589958190918, 6.341892242431641, 7.587884902954102, 8.833877563476562, 10.079870223999023, 11.325862884521484, 12.571855545043945, 13.817848205566406, 15.063840866088867, 16.309833526611328, 17.55582618713379, 18.80181884765625, 20.04781150817871, 21.293804168701172, 22.539796829223633, 23.785789489746094, 25.031782150268555, 26.277774810791016, 27.523767471313477, 28.769760131835938, 30.0157527923584, 31.26174545288086, 32.50773620605469, 33.75373077392578, 34.999725341796875, 36.2457160949707, 37.49170684814453, 38.737701416015625, 39.98369598388672, 41.22968673706055]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 2.0, 5.0, 2.0, 2.0, 5.0, 4.0, 14.0, 19.0, 22.0, 24.0, 30.0, 33.0, 34.0, 51.0, 38.0, 49.0, 57.0, 52.0, 55.0, 65.0, 55.0, 46.0, 60.0, 50.0, 45.0, 31.0, 31.0, 24.0, 17.0, 21.0, 11.0, 12.0, 10.0, 5.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.853515625, -3.728424072265625, -3.60333251953125, -3.478240966796875, -3.3531494140625, -3.228057861328125, -3.10296630859375, -2.977874755859375, -2.852783203125, -2.727691650390625, -2.60260009765625, -2.477508544921875, -2.3524169921875, -2.227325439453125, -2.10223388671875, -1.977142333984375, -1.85205078125, -1.726959228515625, -1.60186767578125, -1.476776123046875, -1.3516845703125, -1.226593017578125, -1.10150146484375, -0.976409912109375, -0.851318359375, -0.726226806640625, -0.60113525390625, -0.476043701171875, -0.3509521484375, -0.225860595703125, -0.10076904296875, 0.024322509765625, 0.1494140625, 0.274505615234375, 0.39959716796875, 0.524688720703125, 0.6497802734375, 0.774871826171875, 0.89996337890625, 1.025054931640625, 1.150146484375, 1.275238037109375, 1.40032958984375, 1.525421142578125, 1.6505126953125, 1.775604248046875, 1.90069580078125, 2.025787353515625, 2.15087890625, 2.275970458984375, 2.40106201171875, 2.526153564453125, 2.6512451171875, 2.776336669921875, 2.90142822265625, 3.026519775390625, 3.151611328125, 3.276702880859375, 3.40179443359375, 3.526885986328125, 3.6519775390625, 3.777069091796875, 3.90216064453125, 4.027252197265625, 4.15234375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 8.0, 12.0, 12.0, 21.0, 20.0, 24.0, 60.0, 70.0, 132.0, 220.0, 346.0, 673.0, 1483.0, 4891.0, 46422.0, 3867666.0, 257849.0, 10115.0, 2146.0, 954.0, 475.0, 251.0, 160.0, 101.0, 46.0, 45.0, 23.0, 20.0, 9.0, 7.0, 5.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.46875, -33.446044921875, -32.42333984375, -31.400634765625, -30.3779296875, -29.355224609375, -28.33251953125, -27.309814453125, -26.287109375, -25.264404296875, -24.24169921875, -23.218994140625, -22.1962890625, -21.173583984375, -20.15087890625, -19.128173828125, -18.10546875, -17.082763671875, -16.06005859375, -15.037353515625, -14.0146484375, -12.991943359375, -11.96923828125, -10.946533203125, -9.923828125, -8.901123046875, -7.87841796875, -6.855712890625, -5.8330078125, -4.810302734375, -3.78759765625, -2.764892578125, -1.7421875, -0.719482421875, 0.30322265625, 1.325927734375, 2.3486328125, 3.371337890625, 4.39404296875, 5.416748046875, 6.439453125, 7.462158203125, 8.48486328125, 9.507568359375, 10.5302734375, 11.552978515625, 12.57568359375, 13.598388671875, 14.62109375, 15.643798828125, 16.66650390625, 17.689208984375, 18.7119140625, 19.734619140625, 20.75732421875, 21.780029296875, 22.802734375, 23.825439453125, 24.84814453125, 25.870849609375, 26.8935546875, 27.916259765625, 28.93896484375, 29.961669921875, 30.984375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 5.0, 5.0, 11.0, 15.0, 18.0, 20.0, 37.0, 45.0, 53.0, 58.0, 101.0, 131.0, 196.0, 259.0, 342.0, 477.0, 597.0, 405.0, 347.0, 242.0, 161.0, 127.0, 98.0, 87.0, 60.0, 38.0, 26.0, 24.0, 22.0, 11.0, 12.0, 5.0, 10.0, 10.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.890625, -9.5948486328125, -9.299072265625, -9.0032958984375, -8.70751953125, -8.4117431640625, -8.115966796875, -7.8201904296875, -7.5244140625, -7.2286376953125, -6.932861328125, -6.6370849609375, -6.34130859375, -6.0455322265625, -5.749755859375, -5.4539794921875, -5.158203125, -4.8624267578125, -4.566650390625, -4.2708740234375, -3.97509765625, -3.6793212890625, -3.383544921875, -3.0877685546875, -2.7919921875, -2.4962158203125, -2.200439453125, -1.9046630859375, -1.60888671875, -1.3131103515625, -1.017333984375, -0.7215576171875, -0.42578125, -0.1300048828125, 0.165771484375, 0.4615478515625, 0.75732421875, 1.0531005859375, 1.348876953125, 1.6446533203125, 1.9404296875, 2.2362060546875, 2.531982421875, 2.8277587890625, 3.12353515625, 3.4193115234375, 3.715087890625, 4.0108642578125, 4.306640625, 4.6024169921875, 4.898193359375, 5.1939697265625, 5.48974609375, 5.7855224609375, 6.081298828125, 6.3770751953125, 6.6728515625, 6.9686279296875, 7.264404296875, 7.5601806640625, 7.85595703125, 8.1517333984375, 8.447509765625, 8.7432861328125, 9.0390625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 7.0, 7.0, 10.0, 11.0, 20.0, 35.0, 53.0, 63.0, 110.0, 153.0, 277.0, 463.0, 782.0, 1347.0, 2513.0, 5393.0, 12594.0, 34346.0, 119232.0, 649131.0, 2726503.0, 492161.0, 98073.0, 29513.0, 11190.0, 4877.0, 2387.0, 1224.0, 723.0, 406.0, 259.0, 145.0, 88.0, 67.0, 38.0, 30.0, 13.0, 15.0, 5.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.09375, -17.5682373046875, -17.042724609375, -16.5172119140625, -15.99169921875, -15.4661865234375, -14.940673828125, -14.4151611328125, -13.8896484375, -13.3641357421875, -12.838623046875, -12.3131103515625, -11.78759765625, -11.2620849609375, -10.736572265625, -10.2110595703125, -9.685546875, -9.1600341796875, -8.634521484375, -8.1090087890625, -7.58349609375, -7.0579833984375, -6.532470703125, -6.0069580078125, -5.4814453125, -4.9559326171875, -4.430419921875, -3.9049072265625, -3.37939453125, -2.8538818359375, -2.328369140625, -1.8028564453125, -1.27734375, -0.7518310546875, -0.226318359375, 0.2991943359375, 0.82470703125, 1.3502197265625, 1.875732421875, 2.4012451171875, 2.9267578125, 3.4522705078125, 3.977783203125, 4.5032958984375, 5.02880859375, 5.5543212890625, 6.079833984375, 6.6053466796875, 7.130859375, 7.6563720703125, 8.181884765625, 8.7073974609375, 9.23291015625, 9.7584228515625, 10.283935546875, 10.8094482421875, 11.3349609375, 11.8604736328125, 12.385986328125, 12.9114990234375, 13.43701171875, 13.9625244140625, 14.488037109375, 15.0135498046875, 15.5390625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 9.0, 17.0, 23.0, 24.0, 24.0, 50.0, 57.0, 63.0, 72.0, 89.0, 84.0, 84.0, 61.0, 57.0, 73.0, 45.0, 38.0, 24.0, 29.0, 15.0, 8.0, 10.0, 16.0, 7.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.29800796508789, -47.07801818847656, -45.858028411865234, -44.638038635253906, -43.41804885864258, -42.19805908203125, -40.97806930541992, -39.758079528808594, -38.538089752197266, -37.31809997558594, -36.09811019897461, -34.87812042236328, -33.65813064575195, -32.438140869140625, -31.218151092529297, -29.99816131591797, -28.778169631958008, -27.55817985534668, -26.33819007873535, -25.118200302124023, -23.898210525512695, -22.678220748901367, -21.458229064941406, -20.238239288330078, -19.01824951171875, -17.798259735107422, -16.578269958496094, -15.358280181884766, -14.138290405273438, -12.91830062866211, -11.698309898376465, -10.478320121765137, -9.258329391479492, -8.038339614868164, -6.818349838256836, -5.59835958480835, -4.3783698081970215, -3.1583800315856934, -1.938389778137207, -0.7184000015258789, 0.5015897750854492, 1.721579670906067, 2.9415695667266846, 4.161559581756592, 5.38154935836792, 6.601539134979248, 7.821529388427734, 9.041519165039062, 10.26150894165039, 11.481498718261719, 12.701488494873047, 13.921478271484375, 15.141468048095703, 16.36145782470703, 17.58144760131836, 18.801437377929688, 20.021427154541016, 21.241416931152344, 22.461406707763672, 23.681396484375, 24.901386260986328, 26.121376037597656, 27.341365814208984, 28.561355590820312, 29.781347274780273]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 2.0, 3.0, 10.0, 10.0, 14.0, 12.0, 13.0, 18.0, 18.0, 18.0, 27.0, 27.0, 25.0, 32.0, 40.0, 53.0, 39.0, 34.0, 52.0, 36.0, 44.0, 44.0, 41.0, 34.0, 34.0, 43.0, 43.0, 32.0, 35.0, 34.0, 19.0, 19.0, 19.0, 18.0, 9.0, 5.0, 7.0, 8.0, 14.0, 4.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.27893829345703, -34.19860076904297, -33.118263244628906, -32.03792953491211, -30.957592010498047, -29.877254486083984, -28.796918869018555, -27.716583251953125, -26.636245727539062, -25.555908203125, -24.47557258605957, -23.39523696899414, -22.314899444580078, -21.234561920166016, -20.154226303100586, -19.073890686035156, -17.993553161621094, -16.91321563720703, -15.832880020141602, -14.752543449401855, -13.67220687866211, -12.591870307922363, -11.511533737182617, -10.431197166442871, -9.350860595703125, -8.270524024963379, -7.190187454223633, -6.109850883483887, -5.029514312744141, -3.9491777420043945, -2.8688411712646484, -1.7885046005249023, -0.7081718444824219, 0.3721647262573242, 1.4525012969970703, 2.5328378677368164, 3.6131744384765625, 4.693511009216309, 5.773847579956055, 6.854184150695801, 7.934520721435547, 9.014857292175293, 10.095193862915039, 11.175530433654785, 12.255867004394531, 13.336203575134277, 14.416540145874023, 15.49687671661377, 16.577213287353516, 17.657550811767578, 18.737886428833008, 19.818222045898438, 20.8985595703125, 21.978897094726562, 23.059232711791992, 24.139568328857422, 25.219905853271484, 26.300243377685547, 27.380578994750977, 28.460914611816406, 29.54125213623047, 30.62158966064453, 31.70192527770996, 32.78226089477539, 33.86259841918945]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 5.0, 2.0, 13.0, 14.0, 13.0, 13.0, 23.0, 26.0, 35.0, 30.0, 45.0, 63.0, 48.0, 47.0, 54.0, 47.0, 43.0, 54.0, 49.0, 61.0, 51.0, 50.0, 43.0, 36.0, 32.0, 22.0, 15.0, 15.0, 10.0, 10.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0078125, -3.87908935546875, -3.7503662109375, -3.62164306640625, -3.492919921875, -3.36419677734375, -3.2354736328125, -3.10675048828125, -2.97802734375, -2.84930419921875, -2.7205810546875, -2.59185791015625, -2.463134765625, -2.33441162109375, -2.2056884765625, -2.07696533203125, -1.9482421875, -1.81951904296875, -1.6907958984375, -1.56207275390625, -1.433349609375, -1.30462646484375, -1.1759033203125, -1.04718017578125, -0.91845703125, -0.78973388671875, -0.6610107421875, -0.53228759765625, -0.403564453125, -0.27484130859375, -0.1461181640625, -0.01739501953125, 0.111328125, 0.24005126953125, 0.3687744140625, 0.49749755859375, 0.626220703125, 0.75494384765625, 0.8836669921875, 1.01239013671875, 1.14111328125, 1.26983642578125, 1.3985595703125, 1.52728271484375, 1.656005859375, 1.78472900390625, 1.9134521484375, 2.04217529296875, 2.1708984375, 2.29962158203125, 2.4283447265625, 2.55706787109375, 2.685791015625, 2.81451416015625, 2.9432373046875, 3.07196044921875, 3.20068359375, 3.32940673828125, 3.4581298828125, 3.58685302734375, 3.715576171875, 3.84429931640625, 3.9730224609375, 4.10174560546875, 4.23046875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 6.0, 10.0, 10.0, 12.0, 14.0, 29.0, 23.0, 39.0, 58.0, 91.0, 123.0, 179.0, 226.0, 356.0, 485.0, 666.0, 997.0, 1523.0, 2328.0, 3473.0, 5645.0, 9071.0, 14842.0, 26161.0, 46669.0, 89180.0, 193891.0, 326692.0, 153572.0, 74716.0, 39622.0, 22377.0, 13117.0, 7870.0, 4935.0, 3119.0, 2084.0, 1357.0, 929.0, 636.0, 420.0, 272.0, 220.0, 144.0, 93.0, 78.0, 59.0, 43.0, 30.0, 19.0, 23.0, 13.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0], "bins": [-0.14599609375, -0.14148521423339844, -0.13697433471679688, -0.1324634552001953, -0.12795257568359375, -0.12344169616699219, -0.11893081665039062, -0.11441993713378906, -0.1099090576171875, -0.10539817810058594, -0.10088729858398438, -0.09637641906738281, -0.09186553955078125, -0.08735466003417969, -0.08284378051757812, -0.07833290100097656, -0.073822021484375, -0.06931114196777344, -0.06480026245117188, -0.06028938293457031, -0.05577850341796875, -0.05126762390136719, -0.046756744384765625, -0.04224586486816406, -0.0377349853515625, -0.03322410583496094, -0.028713226318359375, -0.024202346801757812, -0.01969146728515625, -0.015180587768554688, -0.010669708251953125, -0.0061588287353515625, -0.00164794921875, 0.0028629302978515625, 0.007373809814453125, 0.011884689331054688, 0.01639556884765625, 0.020906448364257812, 0.025417327880859375, 0.029928207397460938, 0.0344390869140625, 0.03894996643066406, 0.043460845947265625, 0.04797172546386719, 0.05248260498046875, 0.05699348449707031, 0.061504364013671875, 0.06601524353027344, 0.070526123046875, 0.07503700256347656, 0.07954788208007812, 0.08405876159667969, 0.08856964111328125, 0.09308052062988281, 0.09759140014648438, 0.10210227966308594, 0.1066131591796875, 0.11112403869628906, 0.11563491821289062, 0.12014579772949219, 0.12465667724609375, 0.1291675567626953, 0.13367843627929688, 0.13818931579589844, 0.1427001953125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 10.0, 7.0, 4.0, 5.0, 3.0, 10.0, 17.0, 10.0, 17.0, 16.0, 19.0, 28.0, 28.0, 24.0, 28.0, 25.0, 30.0, 29.0, 34.0, 34.0, 40.0, 36.0, 40.0, 1062.0, 34.0, 35.0, 35.0, 38.0, 32.0, 37.0, 18.0, 34.0, 27.0, 30.0, 28.0, 20.0, 20.0, 14.0, 8.0, 12.0, 11.0, 9.0, 7.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0], "bins": [-2.537109375, -2.462982177734375, -2.38885498046875, -2.314727783203125, -2.2406005859375, -2.166473388671875, -2.09234619140625, -2.018218994140625, -1.944091796875, -1.869964599609375, -1.79583740234375, -1.721710205078125, -1.6475830078125, -1.573455810546875, -1.49932861328125, -1.425201416015625, -1.35107421875, -1.276947021484375, -1.20281982421875, -1.128692626953125, -1.0545654296875, -0.980438232421875, -0.90631103515625, -0.832183837890625, -0.758056640625, -0.683929443359375, -0.60980224609375, -0.535675048828125, -0.4615478515625, -0.387420654296875, -0.31329345703125, -0.239166259765625, -0.1650390625, -0.090911865234375, -0.01678466796875, 0.057342529296875, 0.1314697265625, 0.205596923828125, 0.27972412109375, 0.353851318359375, 0.427978515625, 0.502105712890625, 0.57623291015625, 0.650360107421875, 0.7244873046875, 0.798614501953125, 0.87274169921875, 0.946868896484375, 1.02099609375, 1.095123291015625, 1.16925048828125, 1.243377685546875, 1.3175048828125, 1.391632080078125, 1.46575927734375, 1.539886474609375, 1.614013671875, 1.688140869140625, 1.76226806640625, 1.836395263671875, 1.9105224609375, 1.984649658203125, 2.05877685546875, 2.132904052734375, 2.20703125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 9.0, 10.0, 27.0, 31.0, 41.0, 61.0, 92.0, 168.0, 223.0, 355.0, 583.0, 873.0, 1236.0, 1945.0, 3136.0, 4818.0, 7752.0, 12431.0, 20251.0, 32867.0, 54987.0, 97655.0, 208681.0, 1337840.0, 133417.0, 69802.0, 41526.0, 25050.0, 15091.0, 9646.0, 5929.0, 3785.0, 2357.0, 1549.0, 957.0, 699.0, 427.0, 268.0, 208.0, 127.0, 76.0, 50.0, 31.0, 22.0, 24.0, 8.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 4.0], "bins": [-0.09344482421875, -0.0907144546508789, -0.08798408508300781, -0.08525371551513672, -0.08252334594726562, -0.07979297637939453, -0.07706260681152344, -0.07433223724365234, -0.07160186767578125, -0.06887149810791016, -0.06614112854003906, -0.06341075897216797, -0.060680389404296875, -0.05795001983642578, -0.05521965026855469, -0.052489280700683594, -0.0497589111328125, -0.047028541564941406, -0.04429817199707031, -0.04156780242919922, -0.038837432861328125, -0.03610706329345703, -0.03337669372558594, -0.030646324157714844, -0.02791595458984375, -0.025185585021972656, -0.022455215454101562, -0.01972484588623047, -0.016994476318359375, -0.014264106750488281, -0.011533737182617188, -0.008803367614746094, -0.006072998046875, -0.0033426284790039062, -0.0006122589111328125, 0.0021181106567382812, 0.004848480224609375, 0.007578849792480469, 0.010309219360351562, 0.013039588928222656, 0.01576995849609375, 0.018500328063964844, 0.021230697631835938, 0.02396106719970703, 0.026691436767578125, 0.02942180633544922, 0.03215217590332031, 0.034882545471191406, 0.0376129150390625, 0.040343284606933594, 0.04307365417480469, 0.04580402374267578, 0.048534393310546875, 0.05126476287841797, 0.05399513244628906, 0.056725502014160156, 0.05945587158203125, 0.062186241149902344, 0.06491661071777344, 0.06764698028564453, 0.07037734985351562, 0.07310771942138672, 0.07583808898925781, 0.0785684585571289, 0.081298828125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 4.0, 4.0, 3.0, 15.0, 13.0, 17.0, 17.0, 26.0, 27.0, 31.0, 36.0, 38.0, 35.0, 37.0, 42.0, 38.0, 63.0, 58.0, 52.0, 48.0, 46.0, 36.0, 48.0, 43.0, 32.0, 28.0, 28.0, 25.0, 22.0, 18.0, 16.0, 12.0, 7.0, 9.0, 2.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.24249267578125e-05, -3.144051879644394e-05, -3.045611083507538e-05, -2.9471702873706818e-05, -2.8487294912338257e-05, -2.7502886950969696e-05, -2.6518478989601135e-05, -2.5534071028232574e-05, -2.4549663066864014e-05, -2.3565255105495453e-05, -2.2580847144126892e-05, -2.159643918275833e-05, -2.061203122138977e-05, -1.962762326002121e-05, -1.864321529865265e-05, -1.7658807337284088e-05, -1.6674399375915527e-05, -1.5689991414546967e-05, -1.4705583453178406e-05, -1.3721175491809845e-05, -1.2736767530441284e-05, -1.1752359569072723e-05, -1.0767951607704163e-05, -9.783543646335602e-06, -8.799135684967041e-06, -7.81472772359848e-06, -6.8303197622299194e-06, -5.845911800861359e-06, -4.861503839492798e-06, -3.877095878124237e-06, -2.8926879167556763e-06, -1.9082799553871155e-06, -9.238719940185547e-07, 6.05359673500061e-08, 1.044943928718567e-06, 2.0293518900871277e-06, 3.0137598514556885e-06, 3.998167812824249e-06, 4.98257577419281e-06, 5.966983735561371e-06, 6.951391696929932e-06, 7.935799658298492e-06, 8.920207619667053e-06, 9.904615581035614e-06, 1.0889023542404175e-05, 1.1873431503772736e-05, 1.2857839465141296e-05, 1.3842247426509857e-05, 1.4826655387878418e-05, 1.581106334924698e-05, 1.679547131061554e-05, 1.77798792719841e-05, 1.876428723335266e-05, 1.9748695194721222e-05, 2.0733103156089783e-05, 2.1717511117458344e-05, 2.2701919078826904e-05, 2.3686327040195465e-05, 2.4670735001564026e-05, 2.5655142962932587e-05, 2.6639550924301147e-05, 2.7623958885669708e-05, 2.860836684703827e-05, 2.959277480840683e-05, 3.057718276977539e-05]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 7.0, 0.0, 8.0, 13.0, 8.0, 18.0, 17.0, 20.0, 30.0, 23.0, 35.0, 43.0, 52.0, 72.0, 93.0, 115.0, 132.0, 129.0, 205.0, 416.0, 1738.0, 28865.0, 682789.0, 321816.0, 9637.0, 979.0, 326.0, 181.0, 141.0, 112.0, 92.0, 81.0, 69.0, 70.0, 60.0, 37.0, 27.0, 13.0, 17.0, 12.0, 11.0, 14.0, 7.0, 4.0, 5.0, 1.0, 5.0, 1.0, 4.0, 5.0, 2.0, 2.0, 1.0], "bins": [-0.0004813671112060547, -0.00046714022755622864, -0.0004529133439064026, -0.00043868646025657654, -0.0004244595766067505, -0.00041023269295692444, -0.0003960058093070984, -0.00038177892565727234, -0.0003675520420074463, -0.00035332515835762024, -0.0003390982747077942, -0.00032487139105796814, -0.0003106445074081421, -0.00029641762375831604, -0.00028219074010849, -0.00026796385645866394, -0.0002537369728088379, -0.00023951008915901184, -0.0002252832055091858, -0.00021105632185935974, -0.0001968294382095337, -0.00018260255455970764, -0.0001683756709098816, -0.00015414878726005554, -0.0001399219036102295, -0.00012569501996040344, -0.00011146813631057739, -9.724125266075134e-05, -8.301436901092529e-05, -6.878748536109924e-05, -5.456060171127319e-05, -4.0333718061447144e-05, -2.6106834411621094e-05, -1.1879950761795044e-05, 2.346932888031006e-06, 1.6573816537857056e-05, 3.0800700187683105e-05, 4.5027583837509155e-05, 5.9254467487335205e-05, 7.348135113716125e-05, 8.77082347869873e-05, 0.00010193511843681335, 0.0001161620020866394, 0.00013038888573646545, 0.0001446157693862915, 0.00015884265303611755, 0.0001730695366859436, 0.00018729642033576965, 0.0002015233039855957, 0.00021575018763542175, 0.0002299770712852478, 0.00024420395493507385, 0.0002584308385848999, 0.00027265772223472595, 0.000286884605884552, 0.00030111148953437805, 0.0003153383731842041, 0.00032956525683403015, 0.0003437921404838562, 0.00035801902413368225, 0.0003722459077835083, 0.00038647279143333435, 0.0004006996750831604, 0.00041492655873298645, 0.0004291534423828125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 8.0, 50.0, 188.0, 383.0, 289.0, 76.0, 12.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.816213863203302e-05, -6.351246702251956e-05, -5.886279177502729e-05, -5.421312016551383e-05, -4.956344491802156e-05, -4.49137733085081e-05, -4.0264101698994637e-05, -3.561442645150237e-05, -3.0964754841988906e-05, -2.631508141348604e-05, -2.1665407984983176e-05, -1.7015736375469714e-05, -1.236606294696685e-05, -7.716389518463984e-06, -3.0667179089505225e-06, 1.5829573385417461e-06, 6.232628948055208e-06, 1.0882302376558073e-05, 1.5531975805060938e-05, 2.01816474145744e-05, 2.4831320843077265e-05, 2.948099427158013e-05, 3.413066588109359e-05, 3.878034112858586e-05, 4.343001273809932e-05, 4.807968434761278e-05, 5.272935959510505e-05, 5.7379031204618514e-05, 6.202870281413198e-05, 6.667837442364544e-05, 7.13280460331589e-05, 7.597772491862997e-05, 8.062738925218582e-05, 8.527706086169928e-05, 8.992673247121274e-05, 9.45764040807262e-05, 9.922608296619728e-05, 0.00010387575457571074, 0.0001085254261852242, 0.00011317510507069528, 0.00011782477668020874, 0.0001224744482897222, 0.00012712411989923567, 0.00013177379150874913, 0.0001364234631182626, 0.00014107313472777605, 0.00014572282088920474, 0.0001503724924987182, 0.00015502216410823166, 0.00015967183571774513, 0.0001643215073272586, 0.00016897117893677205, 0.0001736208505462855, 0.0001782705367077142, 0.00018292019376531243, 0.00018756987992674112, 0.00019221953698433936, 0.00019686920859385282, 0.00020151888020336628, 0.00020616855181287974, 0.0002108182234223932, 0.0002154679095838219, 0.00022011756664142013, 0.00022476725280284882, 0.00022941692441236228]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 4.0, 6.0, 5.0, 5.0, 7.0, 9.0, 11.0, 17.0, 10.0, 15.0, 21.0, 24.0, 43.0, 35.0, 35.0, 30.0, 31.0, 25.0, 33.0, 45.0, 44.0, 34.0, 50.0, 31.0, 42.0, 45.0, 37.0, 38.0, 35.0, 43.0, 23.0, 26.0, 23.0, 21.0, 12.0, 20.0, 15.0, 12.0, 9.0, 5.0, 6.0, 4.0, 6.0, 0.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.0265579223632812e-05, -1.968536525964737e-05, -1.9105151295661926e-05, -1.8524937331676483e-05, -1.794472336769104e-05, -1.7364509403705597e-05, -1.6784295439720154e-05, -1.620408147573471e-05, -1.5623867511749268e-05, -1.5043653547763824e-05, -1.4463439583778381e-05, -1.3883225619792938e-05, -1.3303011655807495e-05, -1.2722797691822052e-05, -1.2142583727836609e-05, -1.1562369763851166e-05, -1.0982155799865723e-05, -1.040194183588028e-05, -9.821727871894836e-06, -9.241513907909393e-06, -8.66129994392395e-06, -8.081085979938507e-06, -7.500872015953064e-06, -6.920658051967621e-06, -6.340444087982178e-06, -5.760230123996735e-06, -5.1800161600112915e-06, -4.599802196025848e-06, -4.019588232040405e-06, -3.439374268054962e-06, -2.859160304069519e-06, -2.278946340084076e-06, -1.6987323760986328e-06, -1.1185184121131897e-06, -5.383044481277466e-07, 4.190951585769653e-08, 6.221234798431396e-07, 1.2023374438285828e-06, 1.7825514078140259e-06, 2.362765371799469e-06, 2.942979335784912e-06, 3.5231932997703552e-06, 4.103407263755798e-06, 4.6836212277412415e-06, 5.2638351917266846e-06, 5.844049155712128e-06, 6.424263119697571e-06, 7.004477083683014e-06, 7.584691047668457e-06, 8.1649050116539e-06, 8.745118975639343e-06, 9.325332939624786e-06, 9.90554690361023e-06, 1.0485760867595673e-05, 1.1065974831581116e-05, 1.1646188795566559e-05, 1.2226402759552002e-05, 1.2806616723537445e-05, 1.3386830687522888e-05, 1.3967044651508331e-05, 1.4547258615493774e-05, 1.5127472579479218e-05, 1.570768654346466e-05, 1.6287900507450104e-05, 1.6868114471435547e-05]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 5.0, 2.0, 13.0, 14.0, 13.0, 13.0, 23.0, 26.0, 35.0, 30.0, 45.0, 63.0, 48.0, 47.0, 54.0, 47.0, 43.0, 54.0, 49.0, 61.0, 51.0, 50.0, 43.0, 36.0, 32.0, 22.0, 15.0, 15.0, 10.0, 10.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0078125, -3.87908935546875, -3.7503662109375, -3.62164306640625, -3.492919921875, -3.36419677734375, -3.2354736328125, -3.10675048828125, -2.97802734375, -2.84930419921875, -2.7205810546875, -2.59185791015625, -2.463134765625, -2.33441162109375, -2.2056884765625, -2.07696533203125, -1.9482421875, -1.81951904296875, -1.6907958984375, -1.56207275390625, -1.433349609375, -1.30462646484375, -1.1759033203125, -1.04718017578125, -0.91845703125, -0.78973388671875, -0.6610107421875, -0.53228759765625, -0.403564453125, -0.27484130859375, -0.1461181640625, -0.01739501953125, 0.111328125, 0.24005126953125, 0.3687744140625, 0.49749755859375, 0.626220703125, 0.75494384765625, 0.8836669921875, 1.01239013671875, 1.14111328125, 1.26983642578125, 1.3985595703125, 1.52728271484375, 1.656005859375, 1.78472900390625, 1.9134521484375, 2.04217529296875, 2.1708984375, 2.29962158203125, 2.4283447265625, 2.55706787109375, 2.685791015625, 2.81451416015625, 2.9432373046875, 3.07196044921875, 3.20068359375, 3.32940673828125, 3.4581298828125, 3.58685302734375, 3.715576171875, 3.84429931640625, 3.9730224609375, 4.10174560546875, 4.23046875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 5.0, 11.0, 16.0, 15.0, 21.0, 31.0, 48.0, 71.0, 111.0, 173.0, 273.0, 434.0, 812.0, 1555.0, 3019.0, 6489.0, 14187.0, 35086.0, 107381.0, 509123.0, 258646.0, 66680.0, 23959.0, 10385.0, 4753.0, 2382.0, 1208.0, 674.0, 356.0, 217.0, 136.0, 63.0, 50.0, 46.0, 37.0, 18.0, 21.0, 15.0, 11.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.9921875, -2.900970458984375, -2.80975341796875, -2.718536376953125, -2.6273193359375, -2.536102294921875, -2.44488525390625, -2.353668212890625, -2.262451171875, -2.171234130859375, -2.08001708984375, -1.988800048828125, -1.8975830078125, -1.806365966796875, -1.71514892578125, -1.623931884765625, -1.53271484375, -1.441497802734375, -1.35028076171875, -1.259063720703125, -1.1678466796875, -1.076629638671875, -0.98541259765625, -0.894195556640625, -0.802978515625, -0.711761474609375, -0.62054443359375, -0.529327392578125, -0.4381103515625, -0.346893310546875, -0.25567626953125, -0.164459228515625, -0.0732421875, 0.017974853515625, 0.10919189453125, 0.200408935546875, 0.2916259765625, 0.382843017578125, 0.47406005859375, 0.565277099609375, 0.656494140625, 0.747711181640625, 0.83892822265625, 0.930145263671875, 1.0213623046875, 1.112579345703125, 1.20379638671875, 1.295013427734375, 1.38623046875, 1.477447509765625, 1.56866455078125, 1.659881591796875, 1.7510986328125, 1.842315673828125, 1.93353271484375, 2.024749755859375, 2.115966796875, 2.207183837890625, 2.29840087890625, 2.389617919921875, 2.4808349609375, 2.572052001953125, 2.66326904296875, 2.754486083984375, 2.845703125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 3.0, 10.0, 10.0, 11.0, 17.0, 17.0, 12.0, 21.0, 23.0, 23.0, 37.0, 48.0, 33.0, 50.0, 45.0, 44.0, 62.0, 85.0, 1976.0, 72.0, 53.0, 37.0, 42.0, 36.0, 41.0, 41.0, 29.0, 26.0, 20.0, 21.0, 16.0, 10.0, 11.0, 13.0, 11.0, 7.0, 5.0, 10.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.171875, -11.7840576171875, -11.396240234375, -11.0084228515625, -10.62060546875, -10.2327880859375, -9.844970703125, -9.4571533203125, -9.0693359375, -8.6815185546875, -8.293701171875, -7.9058837890625, -7.51806640625, -7.1302490234375, -6.742431640625, -6.3546142578125, -5.966796875, -5.5789794921875, -5.191162109375, -4.8033447265625, -4.41552734375, -4.0277099609375, -3.639892578125, -3.2520751953125, -2.8642578125, -2.4764404296875, -2.088623046875, -1.7008056640625, -1.31298828125, -0.9251708984375, -0.537353515625, -0.1495361328125, 0.23828125, 0.6260986328125, 1.013916015625, 1.4017333984375, 1.78955078125, 2.1773681640625, 2.565185546875, 2.9530029296875, 3.3408203125, 3.7286376953125, 4.116455078125, 4.5042724609375, 4.89208984375, 5.2799072265625, 5.667724609375, 6.0555419921875, 6.443359375, 6.8311767578125, 7.218994140625, 7.6068115234375, 7.99462890625, 8.3824462890625, 8.770263671875, 9.1580810546875, 9.5458984375, 9.9337158203125, 10.321533203125, 10.7093505859375, 11.09716796875, 11.4849853515625, 11.872802734375, 12.2606201171875, 12.6484375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 11.0, 3.0, 6.0, 11.0, 15.0, 7.0, 16.0, 16.0, 17.0, 25.0, 27.0, 31.0, 44.0, 67.0, 86.0, 157.0, 351.0, 983.0, 8534.0, 3084602.0, 47605.0, 1898.0, 519.0, 203.0, 136.0, 53.0, 67.0, 38.0, 29.0, 24.0, 19.0, 13.0, 18.0, 17.0, 13.0, 11.0, 8.0, 7.0, 1.0, 8.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-27.296875, -26.462158203125, -25.62744140625, -24.792724609375, -23.9580078125, -23.123291015625, -22.28857421875, -21.453857421875, -20.619140625, -19.784423828125, -18.94970703125, -18.114990234375, -17.2802734375, -16.445556640625, -15.61083984375, -14.776123046875, -13.94140625, -13.106689453125, -12.27197265625, -11.437255859375, -10.6025390625, -9.767822265625, -8.93310546875, -8.098388671875, -7.263671875, -6.428955078125, -5.59423828125, -4.759521484375, -3.9248046875, -3.090087890625, -2.25537109375, -1.420654296875, -0.5859375, 0.248779296875, 1.08349609375, 1.918212890625, 2.7529296875, 3.587646484375, 4.42236328125, 5.257080078125, 6.091796875, 6.926513671875, 7.76123046875, 8.595947265625, 9.4306640625, 10.265380859375, 11.10009765625, 11.934814453125, 12.76953125, 13.604248046875, 14.43896484375, 15.273681640625, 16.1083984375, 16.943115234375, 17.77783203125, 18.612548828125, 19.447265625, 20.281982421875, 21.11669921875, 21.951416015625, 22.7861328125, 23.620849609375, 24.45556640625, 25.290283203125, 26.125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [32.0, 973.0, 15.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.357064247131348, -2.43745756149292, 3.482149124145508, 9.401755332946777, 15.321362495422363, 21.240970611572266, 27.16057586669922, 33.08018493652344, 38.99979019165039, 44.919395446777344, 50.83900451660156, 56.758609771728516, 62.67821502685547, 68.59782409667969, 74.51742553710938, 80.43704223632812, 86.35664367675781, 92.27625274658203, 98.19585418701172, 104.11546325683594, 110.03507232666016, 115.95468139648438, 121.87428283691406, 127.79389190673828, 133.7135009765625, 139.6331024169922, 145.55271911621094, 151.47232055664062, 157.3919219970703, 163.31153869628906, 169.23114013671875, 175.1507568359375, 181.0703582763672, 186.98995971679688, 192.90957641601562, 198.8291778564453, 204.748779296875, 210.66839599609375, 216.58799743652344, 222.50759887695312, 228.42721557617188, 234.34681701660156, 240.2664337158203, 246.18603515625, 252.1056365966797, 258.0252380371094, 263.9448547363281, 269.8644714355469, 275.7840576171875, 281.70367431640625, 287.6232604980469, 293.5428771972656, 299.4624938964844, 305.382080078125, 311.30169677734375, 317.2213134765625, 323.14093017578125, 329.060546875, 334.9801330566406, 340.8997497558594, 346.8193664550781, 352.73895263671875, 358.6585693359375, 364.57818603515625, 370.4977722167969]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 3.0, 6.0, 5.0, 9.0, 8.0, 14.0, 24.0, 19.0, 23.0, 22.0, 23.0, 35.0, 25.0, 28.0, 24.0, 46.0, 60.0, 36.0, 36.0, 40.0, 41.0, 38.0, 37.0, 49.0, 43.0, 38.0, 28.0, 33.0, 33.0, 26.0, 22.0, 19.0, 14.0, 15.0, 19.0, 16.0, 8.0, 11.0, 3.0, 9.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.23114776611328, -36.970375061035156, -35.7096061706543, -34.44883728027344, -33.18806457519531, -31.92729377746582, -30.666522979736328, -29.405752182006836, -28.144981384277344, -26.88421058654785, -25.62343978881836, -24.362668991088867, -23.101898193359375, -21.841127395629883, -20.58035659790039, -19.3195858001709, -18.058815002441406, -16.798044204711914, -15.537273406982422, -14.27650260925293, -13.015731811523438, -11.754961013793945, -10.494190216064453, -9.233419418334961, -7.972648620605469, -6.711877822875977, -5.451107025146484, -4.190336227416992, -2.9295654296875, -1.6687946319580078, -0.4080238342285156, 0.8527469635009766, 2.113513946533203, 3.3742847442626953, 4.6350555419921875, 5.89582633972168, 7.156597137451172, 8.417367935180664, 9.678138732910156, 10.938909530639648, 12.19968032836914, 13.460451126098633, 14.721221923828125, 15.981992721557617, 17.24276351928711, 18.5035343170166, 19.764305114746094, 21.025075912475586, 22.285846710205078, 23.54661750793457, 24.807388305664062, 26.068159103393555, 27.328929901123047, 28.58970069885254, 29.85047149658203, 31.111242294311523, 32.372013092041016, 33.632781982421875, 34.8935546875, 36.154327392578125, 37.415096282958984, 38.675865173339844, 39.93663787841797, 41.197410583496094, 42.45817947387695]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 5.0, 2.0, 2.0, 4.0, 8.0, 13.0, 13.0, 14.0, 21.0, 23.0, 28.0, 35.0, 27.0, 50.0, 56.0, 54.0, 48.0, 45.0, 53.0, 48.0, 54.0, 53.0, 55.0, 49.0, 52.0, 34.0, 41.0, 28.0, 18.0, 15.0, 14.0, 7.0, 11.0, 8.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.998046875, -3.868194580078125, -3.73834228515625, -3.608489990234375, -3.4786376953125, -3.348785400390625, -3.21893310546875, -3.089080810546875, -2.959228515625, -2.829376220703125, -2.69952392578125, -2.569671630859375, -2.4398193359375, -2.309967041015625, -2.18011474609375, -2.050262451171875, -1.92041015625, -1.790557861328125, -1.66070556640625, -1.530853271484375, -1.4010009765625, -1.271148681640625, -1.14129638671875, -1.011444091796875, -0.881591796875, -0.751739501953125, -0.62188720703125, -0.492034912109375, -0.3621826171875, -0.232330322265625, -0.10247802734375, 0.027374267578125, 0.1572265625, 0.287078857421875, 0.41693115234375, 0.546783447265625, 0.6766357421875, 0.806488037109375, 0.93634033203125, 1.066192626953125, 1.196044921875, 1.325897216796875, 1.45574951171875, 1.585601806640625, 1.7154541015625, 1.845306396484375, 1.97515869140625, 2.105010986328125, 2.23486328125, 2.364715576171875, 2.49456787109375, 2.624420166015625, 2.7542724609375, 2.884124755859375, 3.01397705078125, 3.143829345703125, 3.273681640625, 3.403533935546875, 3.53338623046875, 3.663238525390625, 3.7930908203125, 3.922943115234375, 4.05279541015625, 4.182647705078125, 4.3125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 5.0, 15.0, 15.0, 22.0, 27.0, 38.0, 60.0, 70.0, 104.0, 143.0, 192.0, 299.0, 476.0, 773.0, 1520.0, 3456.0, 10084.0, 51824.0, 795749.0, 3169264.0, 131434.0, 18727.0, 5194.0, 2057.0, 1022.0, 581.0, 345.0, 237.0, 156.0, 119.0, 83.0, 51.0, 38.0, 30.0, 20.0, 8.0, 16.0, 6.0, 8.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.984375, -19.400146484375, -18.81591796875, -18.231689453125, -17.6474609375, -17.063232421875, -16.47900390625, -15.894775390625, -15.310546875, -14.726318359375, -14.14208984375, -13.557861328125, -12.9736328125, -12.389404296875, -11.80517578125, -11.220947265625, -10.63671875, -10.052490234375, -9.46826171875, -8.884033203125, -8.2998046875, -7.715576171875, -7.13134765625, -6.547119140625, -5.962890625, -5.378662109375, -4.79443359375, -4.210205078125, -3.6259765625, -3.041748046875, -2.45751953125, -1.873291015625, -1.2890625, -0.704833984375, -0.12060546875, 0.463623046875, 1.0478515625, 1.632080078125, 2.21630859375, 2.800537109375, 3.384765625, 3.968994140625, 4.55322265625, 5.137451171875, 5.7216796875, 6.305908203125, 6.89013671875, 7.474365234375, 8.05859375, 8.642822265625, 9.22705078125, 9.811279296875, 10.3955078125, 10.979736328125, 11.56396484375, 12.148193359375, 12.732421875, 13.316650390625, 13.90087890625, 14.485107421875, 15.0693359375, 15.653564453125, 16.23779296875, 16.822021484375, 17.40625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 7.0, 7.0, 11.0, 13.0, 25.0, 28.0, 48.0, 84.0, 114.0, 201.0, 259.0, 421.0, 692.0, 733.0, 521.0, 311.0, 200.0, 141.0, 88.0, 59.0, 27.0, 22.0, 25.0, 11.0, 10.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0, -17.5623779296875, -17.124755859375, -16.6871337890625, -16.24951171875, -15.8118896484375, -15.374267578125, -14.9366455078125, -14.4990234375, -14.0614013671875, -13.623779296875, -13.1861572265625, -12.74853515625, -12.3109130859375, -11.873291015625, -11.4356689453125, -10.998046875, -10.5604248046875, -10.122802734375, -9.6851806640625, -9.24755859375, -8.8099365234375, -8.372314453125, -7.9346923828125, -7.4970703125, -7.0594482421875, -6.621826171875, -6.1842041015625, -5.74658203125, -5.3089599609375, -4.871337890625, -4.4337158203125, -3.99609375, -3.5584716796875, -3.120849609375, -2.6832275390625, -2.24560546875, -1.8079833984375, -1.370361328125, -0.9327392578125, -0.4951171875, -0.0574951171875, 0.380126953125, 0.8177490234375, 1.25537109375, 1.6929931640625, 2.130615234375, 2.5682373046875, 3.005859375, 3.4434814453125, 3.881103515625, 4.3187255859375, 4.75634765625, 5.1939697265625, 5.631591796875, 6.0692138671875, 6.5068359375, 6.9444580078125, 7.382080078125, 7.8197021484375, 8.25732421875, 8.6949462890625, 9.132568359375, 9.5701904296875, 10.0078125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 9.0, 25.0, 26.0, 52.0, 81.0, 129.0, 228.0, 484.0, 1026.0, 2355.0, 6422.0, 22540.0, 124853.0, 1828834.0, 2039116.0, 133362.0, 23529.0, 6668.0, 2445.0, 989.0, 492.0, 216.0, 157.0, 87.0, 68.0, 33.0, 12.0, 10.0, 9.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.328125, -19.481689453125, -18.63525390625, -17.788818359375, -16.9423828125, -16.095947265625, -15.24951171875, -14.403076171875, -13.556640625, -12.710205078125, -11.86376953125, -11.017333984375, -10.1708984375, -9.324462890625, -8.47802734375, -7.631591796875, -6.78515625, -5.938720703125, -5.09228515625, -4.245849609375, -3.3994140625, -2.552978515625, -1.70654296875, -0.860107421875, -0.013671875, 0.832763671875, 1.67919921875, 2.525634765625, 3.3720703125, 4.218505859375, 5.06494140625, 5.911376953125, 6.7578125, 7.604248046875, 8.45068359375, 9.297119140625, 10.1435546875, 10.989990234375, 11.83642578125, 12.682861328125, 13.529296875, 14.375732421875, 15.22216796875, 16.068603515625, 16.9150390625, 17.761474609375, 18.60791015625, 19.454345703125, 20.30078125, 21.147216796875, 21.99365234375, 22.840087890625, 23.6865234375, 24.532958984375, 25.37939453125, 26.225830078125, 27.072265625, 27.918701171875, 28.76513671875, 29.611572265625, 30.4580078125, 31.304443359375, 32.15087890625, 32.997314453125, 33.84375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 13.0, 22.0, 39.0, 67.0, 98.0, 151.0, 152.0, 163.0, 111.0, 76.0, 58.0, 28.0, 18.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.28873825073242, -34.372779846191406, -31.456823348999023, -28.540864944458008, -25.624908447265625, -22.70895004272461, -19.792991638183594, -16.87703514099121, -13.961076736450195, -11.045119285583496, -8.129161834716797, -5.213203430175781, -2.297245979309082, 0.6187114715576172, 3.534669876098633, 6.450626373291016, 9.366584777832031, 12.28254222869873, 15.19849967956543, 18.114458084106445, 21.030414581298828, 23.946372985839844, 26.86233139038086, 29.778287887573242, 32.694244384765625, 35.61020278930664, 38.526161193847656, 41.442115783691406, 44.35807418823242, 47.27403259277344, 50.18999099731445, 53.10594940185547, 56.02190399169922, 58.937862396240234, 61.85382080078125, 64.769775390625, 67.68573760986328, 70.60169219970703, 73.51765441894531, 76.43360900878906, 79.34956359863281, 82.26551818847656, 85.18148040771484, 88.0974349975586, 91.01339721679688, 93.92935180664062, 96.84530639648438, 99.76126861572266, 102.67723083496094, 105.59318542480469, 108.50914764404297, 111.42510223388672, 114.341064453125, 117.25701904296875, 120.1729736328125, 123.08893585205078, 126.00489044189453, 128.9208526611328, 131.83680725097656, 134.7527618408203, 137.66871643066406, 140.58468627929688, 143.50064086914062, 146.41659545898438, 149.33255004882812]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 0.0, 4.0, 10.0, 8.0, 4.0, 10.0, 10.0, 13.0, 17.0, 16.0, 23.0, 29.0, 25.0, 23.0, 26.0, 26.0, 29.0, 38.0, 36.0, 26.0, 34.0, 42.0, 36.0, 43.0, 32.0, 38.0, 32.0, 40.0, 29.0, 27.0, 40.0, 29.0, 27.0, 28.0, 26.0, 14.0, 15.0, 8.0, 9.0, 13.0, 12.0, 11.0, 12.0, 6.0, 6.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-32.762451171875, -31.75228500366211, -30.74212074279785, -29.73195457458496, -28.72178840637207, -27.711624145507812, -26.701457977294922, -25.69129180908203, -24.68112564086914, -23.67095947265625, -22.660795211791992, -21.6506290435791, -20.64046287536621, -19.630298614501953, -18.620132446289062, -17.609966278076172, -16.599802017211914, -15.58963680267334, -14.57947063446045, -13.569305419921875, -12.559139251708984, -11.54897403717041, -10.538808822631836, -9.528642654418945, -8.518477439880371, -7.508311748504639, -6.498146057128906, -5.487980842590332, -4.4778151512146, -3.467649459838867, -2.457484245300293, -1.4473185539245605, -0.4371528625488281, 0.5730127096176147, 1.5831782817840576, 2.593343734741211, 3.6035094261169434, 4.613675117492676, 5.62384033203125, 6.634006023406982, 7.644171714782715, 8.654336929321289, 9.66450309753418, 10.674668312072754, 11.684833526611328, 12.694999694824219, 13.705164909362793, 14.715330123901367, 15.725496292114258, 16.73566246032715, 17.745826721191406, 18.755992889404297, 19.766159057617188, 20.776325225830078, 21.786489486694336, 22.796655654907227, 23.806819915771484, 24.816986083984375, 25.827150344848633, 26.837316513061523, 27.847482681274414, 28.857646942138672, 29.867813110351562, 30.877979278564453, 31.888145446777344]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 9.0, 4.0, 8.0, 6.0, 14.0, 13.0, 24.0, 20.0, 32.0, 32.0, 37.0, 29.0, 54.0, 45.0, 44.0, 60.0, 47.0, 61.0, 47.0, 45.0, 49.0, 36.0, 46.0, 46.0, 30.0, 36.0, 29.0, 23.0, 18.0, 9.0, 10.0, 10.0, 5.0, 4.0, 1.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.943359375, -3.817108154296875, -3.69085693359375, -3.564605712890625, -3.4383544921875, -3.312103271484375, -3.18585205078125, -3.059600830078125, -2.933349609375, -2.807098388671875, -2.68084716796875, -2.554595947265625, -2.4283447265625, -2.302093505859375, -2.17584228515625, -2.049591064453125, -1.92333984375, -1.797088623046875, -1.67083740234375, -1.544586181640625, -1.4183349609375, -1.292083740234375, -1.16583251953125, -1.039581298828125, -0.913330078125, -0.787078857421875, -0.66082763671875, -0.534576416015625, -0.4083251953125, -0.282073974609375, -0.15582275390625, -0.029571533203125, 0.0966796875, 0.222930908203125, 0.34918212890625, 0.475433349609375, 0.6016845703125, 0.727935791015625, 0.85418701171875, 0.980438232421875, 1.106689453125, 1.232940673828125, 1.35919189453125, 1.485443115234375, 1.6116943359375, 1.737945556640625, 1.86419677734375, 1.990447998046875, 2.11669921875, 2.242950439453125, 2.36920166015625, 2.495452880859375, 2.6217041015625, 2.747955322265625, 2.87420654296875, 3.000457763671875, 3.126708984375, 3.252960205078125, 3.37921142578125, 3.505462646484375, 3.6317138671875, 3.757965087890625, 3.88421630859375, 4.010467529296875, 4.13671875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 4.0, 5.0, 7.0, 16.0, 17.0, 33.0, 56.0, 81.0, 92.0, 158.0, 230.0, 345.0, 491.0, 778.0, 1162.0, 1830.0, 2839.0, 4751.0, 7932.0, 13744.0, 24261.0, 44829.0, 86853.0, 202127.0, 360837.0, 141689.0, 68681.0, 36248.0, 19681.0, 11333.0, 6627.0, 3933.0, 2398.0, 1510.0, 957.0, 696.0, 457.0, 276.0, 186.0, 131.0, 96.0, 63.0, 37.0, 18.0, 27.0, 16.0, 12.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.16455078125, -0.15946006774902344, -0.15436935424804688, -0.1492786407470703, -0.14418792724609375, -0.1390972137451172, -0.13400650024414062, -0.12891578674316406, -0.1238250732421875, -0.11873435974121094, -0.11364364624023438, -0.10855293273925781, -0.10346221923828125, -0.09837150573730469, -0.09328079223632812, -0.08819007873535156, -0.083099365234375, -0.07800865173339844, -0.07291793823242188, -0.06782722473144531, -0.06273651123046875, -0.05764579772949219, -0.052555084228515625, -0.04746437072753906, -0.0423736572265625, -0.03728294372558594, -0.032192230224609375, -0.027101516723632812, -0.02201080322265625, -0.016920089721679688, -0.011829376220703125, -0.0067386627197265625, -0.00164794921875, 0.0034427642822265625, 0.008533477783203125, 0.013624191284179688, 0.01871490478515625, 0.023805618286132812, 0.028896331787109375, 0.03398704528808594, 0.0390777587890625, 0.04416847229003906, 0.049259185791015625, 0.05434989929199219, 0.05944061279296875, 0.06453132629394531, 0.06962203979492188, 0.07471275329589844, 0.079803466796875, 0.08489418029785156, 0.08998489379882812, 0.09507560729980469, 0.10016632080078125, 0.10525703430175781, 0.11034774780273438, 0.11543846130371094, 0.1205291748046875, 0.12561988830566406, 0.13071060180664062, 0.1358013153076172, 0.14089202880859375, 0.1459827423095703, 0.15107345581054688, 0.15616416931152344, 0.1612548828125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 1.0, 5.0, 3.0, 7.0, 8.0, 5.0, 11.0, 18.0, 19.0, 15.0, 29.0, 14.0, 28.0, 23.0, 26.0, 28.0, 38.0, 39.0, 31.0, 35.0, 34.0, 49.0, 1066.0, 35.0, 38.0, 44.0, 40.0, 37.0, 30.0, 29.0, 34.0, 23.0, 25.0, 24.0, 21.0, 22.0, 23.0, 14.0, 11.0, 8.0, 7.0, 5.0, 7.0, 2.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-2.70703125, -2.62725830078125, -2.5474853515625, -2.46771240234375, -2.387939453125, -2.30816650390625, -2.2283935546875, -2.14862060546875, -2.06884765625, -1.98907470703125, -1.9093017578125, -1.82952880859375, -1.749755859375, -1.66998291015625, -1.5902099609375, -1.51043701171875, -1.4306640625, -1.35089111328125, -1.2711181640625, -1.19134521484375, -1.111572265625, -1.03179931640625, -0.9520263671875, -0.87225341796875, -0.79248046875, -0.71270751953125, -0.6329345703125, -0.55316162109375, -0.473388671875, -0.39361572265625, -0.3138427734375, -0.23406982421875, -0.154296875, -0.07452392578125, 0.0052490234375, 0.08502197265625, 0.164794921875, 0.24456787109375, 0.3243408203125, 0.40411376953125, 0.48388671875, 0.56365966796875, 0.6434326171875, 0.72320556640625, 0.802978515625, 0.88275146484375, 0.9625244140625, 1.04229736328125, 1.1220703125, 1.20184326171875, 1.2816162109375, 1.36138916015625, 1.441162109375, 1.52093505859375, 1.6007080078125, 1.68048095703125, 1.76025390625, 1.84002685546875, 1.9197998046875, 1.99957275390625, 2.079345703125, 2.15911865234375, 2.2388916015625, 2.31866455078125, 2.3984375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 5.0, 15.0, 18.0, 30.0, 42.0, 65.0, 106.0, 172.0, 251.0, 391.0, 566.0, 935.0, 1407.0, 2345.0, 3780.0, 5881.0, 9740.0, 16122.0, 26587.0, 44801.0, 79425.0, 165451.0, 1367679.0, 173045.0, 82262.0, 45954.0, 27384.0, 16249.0, 9897.0, 6220.0, 3755.0, 2341.0, 1514.0, 950.0, 610.0, 413.0, 253.0, 167.0, 101.0, 85.0, 40.0, 25.0, 12.0, 15.0, 11.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0986328125, -0.09569072723388672, -0.09274864196777344, -0.08980655670166016, -0.08686447143554688, -0.0839223861694336, -0.08098030090332031, -0.07803821563720703, -0.07509613037109375, -0.07215404510498047, -0.06921195983886719, -0.0662698745727539, -0.06332778930664062, -0.060385704040527344, -0.05744361877441406, -0.05450153350830078, -0.0515594482421875, -0.04861736297607422, -0.04567527770996094, -0.042733192443847656, -0.039791107177734375, -0.036849021911621094, -0.03390693664550781, -0.03096485137939453, -0.02802276611328125, -0.02508068084716797, -0.022138595581054688, -0.019196510314941406, -0.016254425048828125, -0.013312339782714844, -0.010370254516601562, -0.007428169250488281, -0.004486083984375, -0.0015439987182617188, 0.0013980865478515625, 0.004340171813964844, 0.007282257080078125, 0.010224342346191406, 0.013166427612304688, 0.01610851287841797, 0.01905059814453125, 0.02199268341064453, 0.024934768676757812, 0.027876853942871094, 0.030818939208984375, 0.033761024475097656, 0.03670310974121094, 0.03964519500732422, 0.0425872802734375, 0.04552936553955078, 0.04847145080566406, 0.051413536071777344, 0.054355621337890625, 0.057297706604003906, 0.06023979187011719, 0.06318187713623047, 0.06612396240234375, 0.06906604766845703, 0.07200813293457031, 0.0749502182006836, 0.07789230346679688, 0.08083438873291016, 0.08377647399902344, 0.08671855926513672, 0.08966064453125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 2.0, 1.0, 6.0, 5.0, 4.0, 7.0, 13.0, 7.0, 14.0, 13.0, 12.0, 23.0, 10.0, 26.0, 20.0, 23.0, 31.0, 35.0, 39.0, 51.0, 48.0, 45.0, 55.0, 55.0, 39.0, 53.0, 27.0, 37.0, 34.0, 46.0, 24.0, 17.0, 28.0, 32.0, 19.0, 19.0, 12.0, 12.0, 17.0, 7.0, 9.0, 7.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.5881996154785156e-05, -3.4800730645656586e-05, -3.3719465136528015e-05, -3.2638199627399445e-05, -3.1556934118270874e-05, -3.0475668609142303e-05, -2.9394403100013733e-05, -2.8313137590885162e-05, -2.7231872081756592e-05, -2.615060657262802e-05, -2.506934106349945e-05, -2.398807555437088e-05, -2.290681004524231e-05, -2.182554453611374e-05, -2.074427902698517e-05, -1.9663013517856598e-05, -1.8581748008728027e-05, -1.7500482499599457e-05, -1.6419216990470886e-05, -1.5337951481342316e-05, -1.4256685972213745e-05, -1.3175420463085175e-05, -1.2094154953956604e-05, -1.1012889444828033e-05, -9.931623935699463e-06, -8.850358426570892e-06, -7.769092917442322e-06, -6.687827408313751e-06, -5.606561899185181e-06, -4.52529639005661e-06, -3.4440308809280396e-06, -2.362765371799469e-06, -1.2814998626708984e-06, -2.0023435354232788e-07, 8.810311555862427e-07, 1.9622966647148132e-06, 3.043562173843384e-06, 4.124827682971954e-06, 5.206093192100525e-06, 6.2873587012290955e-06, 7.368624210357666e-06, 8.449889719486237e-06, 9.531155228614807e-06, 1.0612420737743378e-05, 1.1693686246871948e-05, 1.2774951756000519e-05, 1.385621726512909e-05, 1.493748277425766e-05, 1.601874828338623e-05, 1.71000137925148e-05, 1.818127930164337e-05, 1.9262544810771942e-05, 2.0343810319900513e-05, 2.1425075829029083e-05, 2.2506341338157654e-05, 2.3587606847286224e-05, 2.4668872356414795e-05, 2.5750137865543365e-05, 2.6831403374671936e-05, 2.7912668883800507e-05, 2.8993934392929077e-05, 3.0075199902057648e-05, 3.115646541118622e-05, 3.223773092031479e-05, 3.331899642944336e-05]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 10.0, 9.0, 8.0, 14.0, 19.0, 16.0, 26.0, 35.0, 31.0, 47.0, 59.0, 63.0, 67.0, 75.0, 142.0, 151.0, 241.0, 447.0, 2517.0, 58363.0, 761932.0, 215289.0, 7065.0, 764.0, 299.0, 174.0, 131.0, 113.0, 93.0, 74.0, 63.0, 40.0, 28.0, 29.0, 24.0, 23.0, 14.0, 11.0, 10.0, 17.0, 5.0, 5.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-0.0005521774291992188, -0.0005357861518859863, -0.0005193948745727539, -0.0005030035972595215, -0.00048661231994628906, -0.00047022104263305664, -0.0004538297653198242, -0.0004374384880065918, -0.0004210472106933594, -0.00040465593338012695, -0.00038826465606689453, -0.0003718733787536621, -0.0003554821014404297, -0.00033909082412719727, -0.00032269954681396484, -0.0003063082695007324, -0.0002899169921875, -0.0002735257148742676, -0.00025713443756103516, -0.00024074316024780273, -0.0002243518829345703, -0.0002079606056213379, -0.00019156932830810547, -0.00017517805099487305, -0.00015878677368164062, -0.0001423954963684082, -0.00012600421905517578, -0.00010961294174194336, -9.322166442871094e-05, -7.683038711547852e-05, -6.0439109802246094e-05, -4.404783248901367e-05, -2.765655517578125e-05, -1.1265277862548828e-05, 5.125999450683594e-06, 2.1517276763916016e-05, 3.790855407714844e-05, 5.429983139038086e-05, 7.069110870361328e-05, 8.70823860168457e-05, 0.00010347366333007812, 0.00011986494064331055, 0.00013625621795654297, 0.0001526474952697754, 0.0001690387725830078, 0.00018543004989624023, 0.00020182132720947266, 0.00021821260452270508, 0.0002346038818359375, 0.0002509951591491699, 0.00026738643646240234, 0.00028377771377563477, 0.0003001689910888672, 0.0003165602684020996, 0.00033295154571533203, 0.00034934282302856445, 0.0003657341003417969, 0.0003821253776550293, 0.0003985166549682617, 0.00041490793228149414, 0.00043129920959472656, 0.000447690486907959, 0.0004640817642211914, 0.00048047304153442383, 0.0004968643188476562]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 14.0, 38.0, 138.0, 291.0, 313.0, 149.0, 57.0, 12.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.985628664959222e-05, -8.512732165399939e-05, -8.039835665840656e-05, -7.566939166281372e-05, -7.094042666722089e-05, -6.621146167162806e-05, -6.148248940007761e-05, -5.675352440448478e-05, -5.2024559408891946e-05, -4.7295594413299114e-05, -4.256662941770628e-05, -3.783766078413464e-05, -3.310869578854181e-05, -2.8379730792948976e-05, -2.365076397836674e-05, -1.8921797163784504e-05, -1.4192832168191671e-05, -9.463866263104137e-06, -4.734900358016603e-06, -5.934452929068357e-09, 4.723031452158466e-06, 9.451996447751299e-06, 1.4180963262333535e-05, 1.890993007691577e-05, 2.3638895072508603e-05, 2.8367860068101436e-05, 3.309682506369427e-05, 3.782579369726591e-05, 4.255475869285874e-05, 4.728372368845157e-05, 5.201269232202321e-05, 5.6741657317616045e-05, 6.14706368651241e-05, 6.619960186071694e-05, 7.092856685630977e-05, 7.56575318519026e-05, 8.038649684749544e-05, 8.511546184308827e-05, 8.984443411463872e-05, 9.457339911023155e-05, 9.930236410582438e-05, 0.00010403132910141721, 0.00010876029409701005, 0.00011348925909260288, 0.00011821823136415333, 0.00012294719635974616, 0.000127676161355339, 0.00013240512635093182, 0.00013713409134652466, 0.0001418630563421175, 0.00014659202133771032, 0.00015132098633330315, 0.00015604995132889599, 0.00016077891632448882, 0.00016550788132008165, 0.0001702368608675897, 0.00017496582586318254, 0.00017969479085877538, 0.0001844237558543682, 0.00018915272084996104, 0.00019388168584555387, 0.0001986106508411467, 0.00020333961583673954, 0.00020806858083233237, 0.0002127975458279252]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 9.0, 2.0, 17.0, 12.0, 10.0, 16.0, 24.0, 16.0, 19.0, 24.0, 28.0, 32.0, 25.0, 39.0, 35.0, 43.0, 38.0, 46.0, 39.0, 42.0, 32.0, 30.0, 42.0, 36.0, 34.0, 29.0, 32.0, 35.0, 25.0, 26.0, 28.0, 20.0, 22.0, 17.0, 8.0, 8.0, 10.0, 7.0, 16.0, 6.0, 7.0, 3.0, 0.0, 8.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.6524066925048828e-05, -2.5663524866104126e-05, -2.4802982807159424e-05, -2.394244074821472e-05, -2.308189868927002e-05, -2.2221356630325317e-05, -2.1360814571380615e-05, -2.0500272512435913e-05, -1.963973045349121e-05, -1.877918839454651e-05, -1.7918646335601807e-05, -1.7058104276657104e-05, -1.6197562217712402e-05, -1.53370201587677e-05, -1.4476478099822998e-05, -1.3615936040878296e-05, -1.2755393981933594e-05, -1.1894851922988892e-05, -1.103430986404419e-05, -1.0173767805099487e-05, -9.313225746154785e-06, -8.452683687210083e-06, -7.592141628265381e-06, -6.731599569320679e-06, -5.8710575103759766e-06, -5.010515451431274e-06, -4.149973392486572e-06, -3.28943133354187e-06, -2.428889274597168e-06, -1.5683472156524658e-06, -7.078051567077637e-07, 1.5273690223693848e-07, 1.0132789611816406e-06, 1.8738210201263428e-06, 2.734363079071045e-06, 3.594905138015747e-06, 4.455447196960449e-06, 5.315989255905151e-06, 6.1765313148498535e-06, 7.037073373794556e-06, 7.897615432739258e-06, 8.75815749168396e-06, 9.618699550628662e-06, 1.0479241609573364e-05, 1.1339783668518066e-05, 1.2200325727462769e-05, 1.306086778640747e-05, 1.3921409845352173e-05, 1.4781951904296875e-05, 1.5642493963241577e-05, 1.650303602218628e-05, 1.736357808113098e-05, 1.8224120140075684e-05, 1.9084662199020386e-05, 1.9945204257965088e-05, 2.080574631690979e-05, 2.1666288375854492e-05, 2.2526830434799194e-05, 2.3387372493743896e-05, 2.42479145526886e-05, 2.51084566116333e-05, 2.5968998670578003e-05, 2.6829540729522705e-05, 2.7690082788467407e-05, 2.855062484741211e-05]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 9.0, 4.0, 8.0, 6.0, 14.0, 13.0, 24.0, 20.0, 32.0, 32.0, 37.0, 29.0, 54.0, 45.0, 44.0, 60.0, 47.0, 61.0, 47.0, 45.0, 49.0, 36.0, 46.0, 46.0, 30.0, 36.0, 29.0, 23.0, 18.0, 9.0, 10.0, 10.0, 5.0, 4.0, 1.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.943359375, -3.817108154296875, -3.69085693359375, -3.564605712890625, -3.4383544921875, -3.312103271484375, -3.18585205078125, -3.059600830078125, -2.933349609375, -2.807098388671875, -2.68084716796875, -2.554595947265625, -2.4283447265625, -2.302093505859375, -2.17584228515625, -2.049591064453125, -1.92333984375, -1.797088623046875, -1.67083740234375, -1.544586181640625, -1.4183349609375, -1.292083740234375, -1.16583251953125, -1.039581298828125, -0.913330078125, -0.787078857421875, -0.66082763671875, -0.534576416015625, -0.4083251953125, -0.282073974609375, -0.15582275390625, -0.029571533203125, 0.0966796875, 0.222930908203125, 0.34918212890625, 0.475433349609375, 0.6016845703125, 0.727935791015625, 0.85418701171875, 0.980438232421875, 1.106689453125, 1.232940673828125, 1.35919189453125, 1.485443115234375, 1.6116943359375, 1.737945556640625, 1.86419677734375, 1.990447998046875, 2.11669921875, 2.242950439453125, 2.36920166015625, 2.495452880859375, 2.6217041015625, 2.747955322265625, 2.87420654296875, 3.000457763671875, 3.126708984375, 3.252960205078125, 3.37921142578125, 3.505462646484375, 3.6317138671875, 3.757965087890625, 3.88421630859375, 4.010467529296875, 4.13671875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 1.0, 4.0, 5.0, 2.0, 6.0, 8.0, 6.0, 13.0, 15.0, 18.0, 19.0, 27.0, 71.0, 73.0, 160.0, 258.0, 516.0, 976.0, 1994.0, 4427.0, 11258.0, 37488.0, 286310.0, 628004.0, 52285.0, 14460.0, 5299.0, 2318.0, 1160.0, 592.0, 298.0, 197.0, 88.0, 58.0, 41.0, 22.0, 16.0, 20.0, 9.0, 11.0, 7.0, 3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.203125, -7.939453125, -7.67578125, -7.412109375, -7.1484375, -6.884765625, -6.62109375, -6.357421875, -6.09375, -5.830078125, -5.56640625, -5.302734375, -5.0390625, -4.775390625, -4.51171875, -4.248046875, -3.984375, -3.720703125, -3.45703125, -3.193359375, -2.9296875, -2.666015625, -2.40234375, -2.138671875, -1.875, -1.611328125, -1.34765625, -1.083984375, -0.8203125, -0.556640625, -0.29296875, -0.029296875, 0.234375, 0.498046875, 0.76171875, 1.025390625, 1.2890625, 1.552734375, 1.81640625, 2.080078125, 2.34375, 2.607421875, 2.87109375, 3.134765625, 3.3984375, 3.662109375, 3.92578125, 4.189453125, 4.453125, 4.716796875, 4.98046875, 5.244140625, 5.5078125, 5.771484375, 6.03515625, 6.298828125, 6.5625, 6.826171875, 7.08984375, 7.353515625, 7.6171875, 7.880859375, 8.14453125, 8.408203125, 8.671875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 8.0, 3.0, 10.0, 7.0, 11.0, 8.0, 22.0, 14.0, 19.0, 21.0, 18.0, 24.0, 36.0, 37.0, 45.0, 44.0, 36.0, 47.0, 66.0, 89.0, 1688.0, 243.0, 98.0, 64.0, 48.0, 42.0, 46.0, 41.0, 24.0, 20.0, 33.0, 29.0, 18.0, 21.0, 11.0, 13.0, 18.0, 10.0, 5.0, 5.0, 7.0, 4.0, 4.0, 2.0, 1.0], "bins": [-14.859375, -14.487060546875, -14.11474609375, -13.742431640625, -13.3701171875, -12.997802734375, -12.62548828125, -12.253173828125, -11.880859375, -11.508544921875, -11.13623046875, -10.763916015625, -10.3916015625, -10.019287109375, -9.64697265625, -9.274658203125, -8.90234375, -8.530029296875, -8.15771484375, -7.785400390625, -7.4130859375, -7.040771484375, -6.66845703125, -6.296142578125, -5.923828125, -5.551513671875, -5.17919921875, -4.806884765625, -4.4345703125, -4.062255859375, -3.68994140625, -3.317626953125, -2.9453125, -2.572998046875, -2.20068359375, -1.828369140625, -1.4560546875, -1.083740234375, -0.71142578125, -0.339111328125, 0.033203125, 0.405517578125, 0.77783203125, 1.150146484375, 1.5224609375, 1.894775390625, 2.26708984375, 2.639404296875, 3.01171875, 3.384033203125, 3.75634765625, 4.128662109375, 4.5009765625, 4.873291015625, 5.24560546875, 5.617919921875, 5.990234375, 6.362548828125, 6.73486328125, 7.107177734375, 7.4794921875, 7.851806640625, 8.22412109375, 8.596435546875, 8.96875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 7.0, 12.0, 12.0, 10.0, 11.0, 16.0, 18.0, 20.0, 27.0, 48.0, 46.0, 65.0, 149.0, 244.0, 506.0, 1011.0, 2394.0, 6506.0, 24956.0, 191066.0, 2782992.0, 108203.0, 17973.0, 5430.0, 2012.0, 876.0, 437.0, 227.0, 117.0, 74.0, 47.0, 30.0, 23.0, 24.0, 23.0, 18.0, 18.0, 10.0, 10.0, 7.0, 6.0, 4.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.046875, -11.59033203125, -11.1337890625, -10.67724609375, -10.220703125, -9.76416015625, -9.3076171875, -8.85107421875, -8.39453125, -7.93798828125, -7.4814453125, -7.02490234375, -6.568359375, -6.11181640625, -5.6552734375, -5.19873046875, -4.7421875, -4.28564453125, -3.8291015625, -3.37255859375, -2.916015625, -2.45947265625, -2.0029296875, -1.54638671875, -1.08984375, -0.63330078125, -0.1767578125, 0.27978515625, 0.736328125, 1.19287109375, 1.6494140625, 2.10595703125, 2.5625, 3.01904296875, 3.4755859375, 3.93212890625, 4.388671875, 4.84521484375, 5.3017578125, 5.75830078125, 6.21484375, 6.67138671875, 7.1279296875, 7.58447265625, 8.041015625, 8.49755859375, 8.9541015625, 9.41064453125, 9.8671875, 10.32373046875, 10.7802734375, 11.23681640625, 11.693359375, 12.14990234375, 12.6064453125, 13.06298828125, 13.51953125, 13.97607421875, 14.4326171875, 14.88916015625, 15.345703125, 15.80224609375, 16.2587890625, 16.71533203125, 17.171875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [476.0, 542.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4761323928833, -0.3498659133911133, 11.776400566101074, 23.902667999267578, 36.028934478759766, 48.15520095825195, 60.28146743774414, 72.40773010253906, 84.53399658203125, 96.66026306152344, 108.78652954101562, 120.91279602050781, 133.0390625, 145.1653289794922, 157.29159545898438, 169.41786193847656, 181.54412841796875, 193.67039489746094, 205.79666137695312, 217.9229278564453, 230.0491943359375, 242.1754608154297, 254.30172729492188, 266.427978515625, 278.55426025390625, 290.6805419921875, 302.8067932128906, 314.93304443359375, 327.059326171875, 339.18560791015625, 351.3118591308594, 363.4381103515625, 375.56439208984375, 387.690673828125, 399.8169250488281, 411.94317626953125, 424.0694580078125, 436.19573974609375, 448.3219909667969, 460.4482421875, 472.57452392578125, 484.7008056640625, 496.8270568847656, 508.95330810546875, 521.07958984375, 533.2058715820312, 545.3321533203125, 557.4583740234375, 569.5846557617188, 581.7109375, 593.837158203125, 605.9634399414062, 618.0897216796875, 630.2160034179688, 642.34228515625, 654.468505859375, 666.5947875976562, 678.7210693359375, 690.8472900390625, 702.9735717773438, 715.099853515625, 727.2261352539062, 739.3524169921875, 751.4786376953125, 763.6049194335938]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 4.0, 10.0, 12.0, 13.0, 9.0, 15.0, 22.0, 19.0, 21.0, 24.0, 27.0, 38.0, 33.0, 36.0, 37.0, 43.0, 46.0, 45.0, 41.0, 31.0, 35.0, 37.0, 47.0, 36.0, 29.0, 35.0, 39.0, 22.0, 34.0, 14.0, 27.0, 15.0, 19.0, 9.0, 8.0, 6.0, 12.0, 11.0, 8.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.21539306640625, -32.09511184692383, -30.974830627441406, -29.854549407958984, -28.734268188476562, -27.61398696899414, -26.49370574951172, -25.373424530029297, -24.253143310546875, -23.132862091064453, -22.01258087158203, -20.89229965209961, -19.772018432617188, -18.651737213134766, -17.531455993652344, -16.411174774169922, -15.2908935546875, -14.170612335205078, -13.050331115722656, -11.930049896240234, -10.809768676757812, -9.68948745727539, -8.569206237792969, -7.448925018310547, -6.328643798828125, -5.208362579345703, -4.088081359863281, -2.9678001403808594, -1.8475189208984375, -0.7272377014160156, 0.39304351806640625, 1.5133247375488281, 2.6336021423339844, 3.7538833618164062, 4.874164581298828, 5.99444580078125, 7.114727020263672, 8.235008239746094, 9.355289459228516, 10.475570678710938, 11.59585189819336, 12.716133117675781, 13.836414337158203, 14.956695556640625, 16.076976776123047, 17.19725799560547, 18.31753921508789, 19.437820434570312, 20.558101654052734, 21.678382873535156, 22.798664093017578, 23.9189453125, 25.039226531982422, 26.159507751464844, 27.279788970947266, 28.400070190429688, 29.52035140991211, 30.64063262939453, 31.760913848876953, 32.881195068359375, 34.0014762878418, 35.12175750732422, 36.24203872680664, 37.36231994628906, 38.482601165771484]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 7.0, 6.0, 4.0, 16.0, 13.0, 14.0, 25.0, 24.0, 36.0, 37.0, 36.0, 40.0, 48.0, 52.0, 55.0, 46.0, 54.0, 51.0, 53.0, 58.0, 42.0, 41.0, 37.0, 43.0, 36.0, 25.0, 28.0, 12.0, 12.0, 12.0, 8.0, 7.0, 2.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.140625, -4.00933837890625, -3.8780517578125, -3.74676513671875, -3.615478515625, -3.48419189453125, -3.3529052734375, -3.22161865234375, -3.09033203125, -2.95904541015625, -2.8277587890625, -2.69647216796875, -2.565185546875, -2.43389892578125, -2.3026123046875, -2.17132568359375, -2.0400390625, -1.90875244140625, -1.7774658203125, -1.64617919921875, -1.514892578125, -1.38360595703125, -1.2523193359375, -1.12103271484375, -0.98974609375, -0.85845947265625, -0.7271728515625, -0.59588623046875, -0.464599609375, -0.33331298828125, -0.2020263671875, -0.07073974609375, 0.060546875, 0.19183349609375, 0.3231201171875, 0.45440673828125, 0.585693359375, 0.71697998046875, 0.8482666015625, 0.97955322265625, 1.11083984375, 1.24212646484375, 1.3734130859375, 1.50469970703125, 1.635986328125, 1.76727294921875, 1.8985595703125, 2.02984619140625, 2.1611328125, 2.29241943359375, 2.4237060546875, 2.55499267578125, 2.686279296875, 2.81756591796875, 2.9488525390625, 3.08013916015625, 3.21142578125, 3.34271240234375, 3.4739990234375, 3.60528564453125, 3.736572265625, 3.86785888671875, 3.9991455078125, 4.13043212890625, 4.26171875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 10.0, 8.0, 10.0, 12.0, 20.0, 20.0, 37.0, 63.0, 80.0, 115.0, 213.0, 310.0, 519.0, 1024.0, 2377.0, 7127.0, 33864.0, 385613.0, 3541840.0, 189311.0, 22389.0, 5332.0, 1949.0, 853.0, 432.0, 263.0, 163.0, 109.0, 69.0, 49.0, 30.0, 19.0, 21.0, 15.0, 4.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.75, -20.146484375, -19.54296875, -18.939453125, -18.3359375, -17.732421875, -17.12890625, -16.525390625, -15.921875, -15.318359375, -14.71484375, -14.111328125, -13.5078125, -12.904296875, -12.30078125, -11.697265625, -11.09375, -10.490234375, -9.88671875, -9.283203125, -8.6796875, -8.076171875, -7.47265625, -6.869140625, -6.265625, -5.662109375, -5.05859375, -4.455078125, -3.8515625, -3.248046875, -2.64453125, -2.041015625, -1.4375, -0.833984375, -0.23046875, 0.373046875, 0.9765625, 1.580078125, 2.18359375, 2.787109375, 3.390625, 3.994140625, 4.59765625, 5.201171875, 5.8046875, 6.408203125, 7.01171875, 7.615234375, 8.21875, 8.822265625, 9.42578125, 10.029296875, 10.6328125, 11.236328125, 11.83984375, 12.443359375, 13.046875, 13.650390625, 14.25390625, 14.857421875, 15.4609375, 16.064453125, 16.66796875, 17.271484375, 17.875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 6.0, 5.0, 4.0, 6.0, 9.0, 11.0, 11.0, 20.0, 36.0, 46.0, 60.0, 103.0, 126.0, 240.0, 319.0, 556.0, 714.0, 631.0, 391.0, 251.0, 156.0, 113.0, 64.0, 52.0, 36.0, 40.0, 18.0, 9.0, 14.0, 7.0, 5.0, 2.0, 6.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0, -12.613525390625, -12.22705078125, -11.840576171875, -11.4541015625, -11.067626953125, -10.68115234375, -10.294677734375, -9.908203125, -9.521728515625, -9.13525390625, -8.748779296875, -8.3623046875, -7.975830078125, -7.58935546875, -7.202880859375, -6.81640625, -6.429931640625, -6.04345703125, -5.656982421875, -5.2705078125, -4.884033203125, -4.49755859375, -4.111083984375, -3.724609375, -3.338134765625, -2.95166015625, -2.565185546875, -2.1787109375, -1.792236328125, -1.40576171875, -1.019287109375, -0.6328125, -0.246337890625, 0.14013671875, 0.526611328125, 0.9130859375, 1.299560546875, 1.68603515625, 2.072509765625, 2.458984375, 2.845458984375, 3.23193359375, 3.618408203125, 4.0048828125, 4.391357421875, 4.77783203125, 5.164306640625, 5.55078125, 5.937255859375, 6.32373046875, 6.710205078125, 7.0966796875, 7.483154296875, 7.86962890625, 8.256103515625, 8.642578125, 9.029052734375, 9.41552734375, 9.802001953125, 10.1884765625, 10.574951171875, 10.96142578125, 11.347900390625, 11.734375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 13.0, 7.0, 9.0, 22.0, 19.0, 30.0, 46.0, 72.0, 106.0, 137.0, 233.0, 387.0, 561.0, 876.0, 1571.0, 2805.0, 5018.0, 10631.0, 25361.0, 75727.0, 323234.0, 2324375.0, 1154188.0, 183175.0, 49902.0, 18122.0, 7968.0, 4109.0, 2209.0, 1274.0, 761.0, 469.0, 303.0, 182.0, 115.0, 89.0, 59.0, 38.0, 25.0, 14.0, 14.0, 8.0, 6.0, 8.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-15.6328125, -15.1256103515625, -14.618408203125, -14.1112060546875, -13.60400390625, -13.0968017578125, -12.589599609375, -12.0823974609375, -11.5751953125, -11.0679931640625, -10.560791015625, -10.0535888671875, -9.54638671875, -9.0391845703125, -8.531982421875, -8.0247802734375, -7.517578125, -7.0103759765625, -6.503173828125, -5.9959716796875, -5.48876953125, -4.9815673828125, -4.474365234375, -3.9671630859375, -3.4599609375, -2.9527587890625, -2.445556640625, -1.9383544921875, -1.43115234375, -0.9239501953125, -0.416748046875, 0.0904541015625, 0.59765625, 1.1048583984375, 1.612060546875, 2.1192626953125, 2.62646484375, 3.1336669921875, 3.640869140625, 4.1480712890625, 4.6552734375, 5.1624755859375, 5.669677734375, 6.1768798828125, 6.68408203125, 7.1912841796875, 7.698486328125, 8.2056884765625, 8.712890625, 9.2200927734375, 9.727294921875, 10.2344970703125, 10.74169921875, 11.2489013671875, 11.756103515625, 12.2633056640625, 12.7705078125, 13.2777099609375, 13.784912109375, 14.2921142578125, 14.79931640625, 15.3065185546875, 15.813720703125, 16.3209228515625, 16.828125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 11.0, 11.0, 11.0, 24.0, 26.0, 36.0, 59.0, 72.0, 86.0, 93.0, 111.0, 68.0, 98.0, 81.0, 65.0, 42.0, 32.0, 26.0, 19.0, 14.0, 11.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.32262420654297, -39.52180480957031, -37.720985412597656, -35.920166015625, -34.119346618652344, -32.31852722167969, -30.51770782470703, -28.716888427734375, -26.91606903076172, -25.115249633789062, -23.314430236816406, -21.51361083984375, -19.712791442871094, -17.911972045898438, -16.11115264892578, -14.310334205627441, -12.509515762329102, -10.708696365356445, -8.907876968383789, -7.107058048248291, -5.306238651275635, -3.5054197311401367, -1.7046003341674805, 0.09621906280517578, 1.897038459777832, 3.6978578567504883, 5.4986772537231445, 7.299496173858643, 9.10031509399414, 10.901134490966797, 12.701953887939453, 14.50277328491211, 16.303592681884766, 18.104412078857422, 19.905231475830078, 21.706050872802734, 23.50687026977539, 25.307689666748047, 27.108509063720703, 28.90932846069336, 30.710147857666016, 32.51096725463867, 34.31178665161133, 36.112606048583984, 37.91342544555664, 39.7142448425293, 41.51506423950195, 43.31588363647461, 45.11669921875, 46.917518615722656, 48.71833801269531, 50.51915740966797, 52.319976806640625, 54.12079620361328, 55.92161560058594, 57.722434997558594, 59.52325439453125, 61.324073791503906, 63.12489318847656, 64.92571258544922, 66.72653198242188, 68.52735137939453, 70.32817077636719, 72.12899017333984, 73.9298095703125]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 3.0, 8.0, 9.0, 9.0, 10.0, 10.0, 9.0, 12.0, 20.0, 17.0, 20.0, 18.0, 21.0, 22.0, 27.0, 36.0, 26.0, 25.0, 23.0, 31.0, 35.0, 45.0, 31.0, 53.0, 39.0, 35.0, 36.0, 28.0, 29.0, 35.0, 27.0, 23.0, 25.0, 28.0, 20.0, 19.0, 13.0, 25.0, 14.0, 14.0, 12.0, 8.0, 9.0, 9.0, 9.0, 4.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0], "bins": [-32.93708038330078, -31.973960876464844, -31.010839462280273, -30.047718048095703, -29.084598541259766, -28.121479034423828, -27.158357620239258, -26.195236206054688, -25.23211669921875, -24.268997192382812, -23.305875778198242, -22.342754364013672, -21.379634857177734, -20.416515350341797, -19.453393936157227, -18.490272521972656, -17.52715301513672, -16.56403350830078, -15.600912094116211, -14.637791633605957, -13.674671173095703, -12.71155071258545, -11.748430252075195, -10.785309791564941, -9.822189331054688, -8.859068870544434, -7.89594841003418, -6.932827949523926, -5.969707489013672, -5.006587028503418, -4.043466567993164, -3.08034610748291, -2.1172256469726562, -1.1541051864624023, -0.19098472595214844, 0.7721357345581055, 1.7352561950683594, 2.6983766555786133, 3.661497116088867, 4.624617576599121, 5.587738037109375, 6.550858497619629, 7.513978958129883, 8.477099418640137, 9.44021987915039, 10.403340339660645, 11.366460800170898, 12.329581260681152, 13.292701721191406, 14.25582218170166, 15.218942642211914, 16.182064056396484, 17.145183563232422, 18.10830307006836, 19.07142448425293, 20.0345458984375, 20.997665405273438, 21.960784912109375, 22.923906326293945, 23.887027740478516, 24.850147247314453, 25.81326675415039, 26.77638816833496, 27.73950958251953, 28.70262908935547]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 6.0, 5.0, 12.0, 17.0, 17.0, 23.0, 20.0, 32.0, 29.0, 35.0, 38.0, 60.0, 46.0, 52.0, 49.0, 57.0, 54.0, 47.0, 60.0, 57.0, 33.0, 41.0, 33.0, 31.0, 29.0, 29.0, 12.0, 15.0, 12.0, 11.0, 8.0, 3.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.888671875, -3.753387451171875, -3.61810302734375, -3.482818603515625, -3.3475341796875, -3.212249755859375, -3.07696533203125, -2.941680908203125, -2.806396484375, -2.671112060546875, -2.53582763671875, -2.400543212890625, -2.2652587890625, -2.129974365234375, -1.99468994140625, -1.859405517578125, -1.72412109375, -1.588836669921875, -1.45355224609375, -1.318267822265625, -1.1829833984375, -1.047698974609375, -0.91241455078125, -0.777130126953125, -0.641845703125, -0.506561279296875, -0.37127685546875, -0.235992431640625, -0.1007080078125, 0.034576416015625, 0.16986083984375, 0.305145263671875, 0.4404296875, 0.575714111328125, 0.71099853515625, 0.846282958984375, 0.9815673828125, 1.116851806640625, 1.25213623046875, 1.387420654296875, 1.522705078125, 1.657989501953125, 1.79327392578125, 1.928558349609375, 2.0638427734375, 2.199127197265625, 2.33441162109375, 2.469696044921875, 2.60498046875, 2.740264892578125, 2.87554931640625, 3.010833740234375, 3.1461181640625, 3.281402587890625, 3.41668701171875, 3.551971435546875, 3.687255859375, 3.822540283203125, 3.95782470703125, 4.093109130859375, 4.2283935546875, 4.363677978515625, 4.49896240234375, 4.634246826171875, 4.76953125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 6.0, 9.0, 3.0, 19.0, 18.0, 29.0, 40.0, 67.0, 86.0, 121.0, 180.0, 262.0, 419.0, 610.0, 880.0, 1434.0, 2221.0, 3443.0, 5736.0, 9151.0, 15231.0, 25663.0, 44516.0, 82539.0, 179696.0, 335406.0, 161136.0, 76462.0, 41338.0, 24251.0, 14168.0, 8681.0, 5327.0, 3287.0, 2164.0, 1330.0, 898.0, 581.0, 382.0, 261.0, 169.0, 113.0, 80.0, 56.0, 29.0, 20.0, 12.0, 12.0, 6.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1368408203125, -0.13219261169433594, -0.12754440307617188, -0.12289619445800781, -0.11824798583984375, -0.11359977722167969, -0.10895156860351562, -0.10430335998535156, -0.0996551513671875, -0.09500694274902344, -0.09035873413085938, -0.08571052551269531, -0.08106231689453125, -0.07641410827636719, -0.07176589965820312, -0.06711769104003906, -0.062469482421875, -0.05782127380371094, -0.053173065185546875, -0.04852485656738281, -0.04387664794921875, -0.03922843933105469, -0.034580230712890625, -0.029932022094726562, -0.0252838134765625, -0.020635604858398438, -0.015987396240234375, -0.011339187622070312, -0.00669097900390625, -0.0020427703857421875, 0.002605438232421875, 0.0072536468505859375, 0.01190185546875, 0.016550064086914062, 0.021198272705078125, 0.025846481323242188, 0.03049468994140625, 0.03514289855957031, 0.039791107177734375, 0.04443931579589844, 0.0490875244140625, 0.05373573303222656, 0.058383941650390625, 0.06303215026855469, 0.06768035888671875, 0.07232856750488281, 0.07697677612304688, 0.08162498474121094, 0.086273193359375, 0.09092140197753906, 0.09556961059570312, 0.10021781921386719, 0.10486602783203125, 0.10951423645019531, 0.11416244506835938, 0.11881065368652344, 0.1234588623046875, 0.12810707092285156, 0.13275527954101562, 0.1374034881591797, 0.14205169677734375, 0.1466999053955078, 0.15134811401367188, 0.15599632263183594, 0.16064453125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 7.0, 6.0, 5.0, 4.0, 2.0, 12.0, 15.0, 14.0, 12.0, 16.0, 17.0, 18.0, 21.0, 30.0, 20.0, 32.0, 41.0, 26.0, 35.0, 37.0, 31.0, 41.0, 42.0, 1064.0, 32.0, 36.0, 35.0, 39.0, 36.0, 39.0, 26.0, 27.0, 25.0, 31.0, 14.0, 17.0, 24.0, 15.0, 12.0, 6.0, 8.0, 13.0, 11.0, 5.0, 4.0, 5.0, 3.0, 5.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.46484375, -2.38568115234375, -2.3065185546875, -2.22735595703125, -2.148193359375, -2.06903076171875, -1.9898681640625, -1.91070556640625, -1.83154296875, -1.75238037109375, -1.6732177734375, -1.59405517578125, -1.514892578125, -1.43572998046875, -1.3565673828125, -1.27740478515625, -1.1982421875, -1.11907958984375, -1.0399169921875, -0.96075439453125, -0.881591796875, -0.80242919921875, -0.7232666015625, -0.64410400390625, -0.56494140625, -0.48577880859375, -0.4066162109375, -0.32745361328125, -0.248291015625, -0.16912841796875, -0.0899658203125, -0.01080322265625, 0.068359375, 0.14752197265625, 0.2266845703125, 0.30584716796875, 0.385009765625, 0.46417236328125, 0.5433349609375, 0.62249755859375, 0.70166015625, 0.78082275390625, 0.8599853515625, 0.93914794921875, 1.018310546875, 1.09747314453125, 1.1766357421875, 1.25579833984375, 1.3349609375, 1.41412353515625, 1.4932861328125, 1.57244873046875, 1.651611328125, 1.73077392578125, 1.8099365234375, 1.88909912109375, 1.96826171875, 2.04742431640625, 2.1265869140625, 2.20574951171875, 2.284912109375, 2.36407470703125, 2.4432373046875, 2.52239990234375, 2.6015625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 14.0, 16.0, 26.0, 40.0, 49.0, 104.0, 137.0, 197.0, 305.0, 436.0, 687.0, 1036.0, 1437.0, 2214.0, 3465.0, 5139.0, 7939.0, 12158.0, 19333.0, 30943.0, 51656.0, 91474.0, 190019.0, 1341728.0, 144494.0, 74943.0, 43106.0, 26353.0, 16652.0, 10681.0, 6866.0, 4546.0, 2918.0, 1977.0, 1347.0, 843.0, 639.0, 421.0, 236.0, 186.0, 125.0, 93.0, 51.0, 31.0, 24.0, 12.0, 9.0, 10.0, 5.0, 1.0, 4.0, 0.0, 3.0, 2.0, 3.0], "bins": [-0.0919189453125, -0.08907604217529297, -0.08623313903808594, -0.0833902359008789, -0.08054733276367188, -0.07770442962646484, -0.07486152648925781, -0.07201862335205078, -0.06917572021484375, -0.06633281707763672, -0.06348991394042969, -0.060647010803222656, -0.057804107666015625, -0.054961204528808594, -0.05211830139160156, -0.04927539825439453, -0.0464324951171875, -0.04358959197998047, -0.04074668884277344, -0.037903785705566406, -0.035060882568359375, -0.032217979431152344, -0.029375076293945312, -0.02653217315673828, -0.02368927001953125, -0.02084636688232422, -0.018003463745117188, -0.015160560607910156, -0.012317657470703125, -0.009474754333496094, -0.0066318511962890625, -0.0037889480590820312, -0.000946044921875, 0.0018968582153320312, 0.0047397613525390625, 0.007582664489746094, 0.010425567626953125, 0.013268470764160156, 0.016111373901367188, 0.01895427703857422, 0.02179718017578125, 0.02464008331298828, 0.027482986450195312, 0.030325889587402344, 0.033168792724609375, 0.036011695861816406, 0.03885459899902344, 0.04169750213623047, 0.0445404052734375, 0.04738330841064453, 0.05022621154785156, 0.053069114685058594, 0.055912017822265625, 0.058754920959472656, 0.06159782409667969, 0.06444072723388672, 0.06728363037109375, 0.07012653350830078, 0.07296943664550781, 0.07581233978271484, 0.07865524291992188, 0.0814981460571289, 0.08434104919433594, 0.08718395233154297, 0.09002685546875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 3.0, 3.0, 7.0, 12.0, 16.0, 9.0, 17.0, 19.0, 19.0, 29.0, 35.0, 33.0, 49.0, 36.0, 55.0, 51.0, 61.0, 69.0, 54.0, 50.0, 50.0, 48.0, 45.0, 44.0, 30.0, 24.0, 30.0, 24.0, 26.0, 12.0, 11.0, 6.0, 8.0, 11.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.83393669128418e-05, -4.682410508394241e-05, -4.530884325504303e-05, -4.3793581426143646e-05, -4.227831959724426e-05, -4.076305776834488e-05, -3.9247795939445496e-05, -3.773253411054611e-05, -3.621727228164673e-05, -3.4702010452747345e-05, -3.318674862384796e-05, -3.167148679494858e-05, -3.0156224966049194e-05, -2.864096313714981e-05, -2.7125701308250427e-05, -2.5610439479351044e-05, -2.409517765045166e-05, -2.2579915821552277e-05, -2.1064653992652893e-05, -1.954939216375351e-05, -1.8034130334854126e-05, -1.6518868505954742e-05, -1.5003606677055359e-05, -1.3488344848155975e-05, -1.1973083019256592e-05, -1.0457821190357208e-05, -8.942559361457825e-06, -7.427297532558441e-06, -5.912035703659058e-06, -4.396773874759674e-06, -2.8815120458602905e-06, -1.366250216960907e-06, 1.4901161193847656e-07, 1.6642734408378601e-06, 3.1795352697372437e-06, 4.694797098636627e-06, 6.210058927536011e-06, 7.725320756435394e-06, 9.240582585334778e-06, 1.0755844414234161e-05, 1.2271106243133545e-05, 1.3786368072032928e-05, 1.5301629900932312e-05, 1.6816891729831696e-05, 1.833215355873108e-05, 1.9847415387630463e-05, 2.1362677216529846e-05, 2.287793904542923e-05, 2.4393200874328613e-05, 2.5908462703227997e-05, 2.742372453212738e-05, 2.8938986361026764e-05, 3.0454248189926147e-05, 3.196951001882553e-05, 3.3484771847724915e-05, 3.50000336766243e-05, 3.651529550552368e-05, 3.8030557334423065e-05, 3.954581916332245e-05, 4.106108099222183e-05, 4.2576342821121216e-05, 4.40916046500206e-05, 4.560686647891998e-05, 4.7122128307819366e-05, 4.863739013671875e-05]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 4.0, 7.0, 13.0, 12.0, 11.0, 35.0, 26.0, 28.0, 45.0, 67.0, 76.0, 90.0, 129.0, 167.0, 301.0, 838.0, 5846.0, 115159.0, 797818.0, 119979.0, 5964.0, 880.0, 310.0, 176.0, 140.0, 96.0, 76.0, 53.0, 46.0, 41.0, 22.0, 24.0, 18.0, 14.0, 7.0, 13.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0006532669067382812, -0.0006343349814414978, -0.0006154030561447144, -0.0005964711308479309, -0.0005775392055511475, -0.000558607280254364, -0.0005396753549575806, -0.0005207434296607971, -0.0005018115043640137, -0.0004828795790672302, -0.0004639476537704468, -0.00044501572847366333, -0.0004260838031768799, -0.00040715187788009644, -0.000388219952583313, -0.00036928802728652954, -0.0003503561019897461, -0.00033142417669296265, -0.0003124922513961792, -0.00029356032609939575, -0.0002746284008026123, -0.00025569647550582886, -0.0002367645502090454, -0.00021783262491226196, -0.00019890069961547852, -0.00017996877431869507, -0.00016103684902191162, -0.00014210492372512817, -0.00012317299842834473, -0.00010424107313156128, -8.530914783477783e-05, -6.637722253799438e-05, -4.744529724121094e-05, -2.851337194442749e-05, -9.581446647644043e-06, 9.350478649139404e-06, 2.828240394592285e-05, 4.72143292427063e-05, 6.614625453948975e-05, 8.50781798362732e-05, 0.00010401010513305664, 0.0001229420304298401, 0.00014187395572662354, 0.00016080588102340698, 0.00017973780632019043, 0.00019866973161697388, 0.00021760165691375732, 0.00023653358221054077, 0.0002554655075073242, 0.00027439743280410767, 0.0002933293581008911, 0.00031226128339767456, 0.000331193208694458, 0.00035012513399124146, 0.0003690570592880249, 0.00038798898458480835, 0.0004069209098815918, 0.00042585283517837524, 0.0004447847604751587, 0.00046371668577194214, 0.0004826486110687256, 0.000501580536365509, 0.0005205124616622925, 0.0005394443869590759, 0.0005583763122558594]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 6.0, 8.0, 9.0, 19.0, 23.0, 19.0, 42.0, 42.0, 54.0, 59.0, 82.0, 82.0, 79.0, 94.0, 58.0, 57.0, 54.0, 42.0, 38.0, 27.0, 30.0, 13.0, 10.0, 12.0, 10.0, 8.0, 3.0, 6.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.65196137863677e-05, -3.532379196258262e-05, -3.4127973776776344e-05, -3.293215195299126e-05, -3.173633012920618e-05, -3.0540511943399906e-05, -2.9344690119614825e-05, -2.8148870114819147e-05, -2.695305011002347e-05, -2.575723010522779e-05, -2.4561410100432113e-05, -2.336558827664703e-05, -2.2169768271851353e-05, -2.0973948267055675e-05, -1.9778126443270594e-05, -1.8582306438474916e-05, -1.7386486433679238e-05, -1.619066642888356e-05, -1.499484551459318e-05, -1.37990246003028e-05, -1.2603204595507123e-05, -1.1407384590711445e-05, -1.0211563676421065e-05, -9.015742762130685e-06, -7.819922757335007e-06, -6.624102297791978e-06, -5.4282818382489495e-06, -4.232461378705921e-06, -3.036640919162892e-06, -1.840820459619863e-06, -6.450000000768341e-07, 5.508209142135456e-07, 1.7466445569880307e-06, 2.9424650165310595e-06, 4.138285476074088e-06, 5.334105935617117e-06, 6.529926395160146e-06, 7.725746399955824e-06, 8.921567314246204e-06, 1.0117388228536583e-05, 1.1313208233332261e-05, 1.250902823812794e-05, 1.3704849152418319e-05, 1.4900670066708699e-05, 1.6096490071504377e-05, 1.7292310076300055e-05, 1.8488131900085136e-05, 1.9683951904880814e-05, 2.0879771909676492e-05, 2.207559191447217e-05, 2.3271411919267848e-05, 2.446723374305293e-05, 2.5663053747848608e-05, 2.6858873752644286e-05, 2.8054695576429367e-05, 2.9250515581225045e-05, 3.0446335586020723e-05, 3.1642157409805804e-05, 3.283797559561208e-05, 3.403379741939716e-05, 3.522961924318224e-05, 3.6425437428988516e-05, 3.76212592527736e-05, 3.881708107655868e-05, 4.0012899262364954e-05]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 8.0, 4.0, 10.0, 6.0, 12.0, 13.0, 12.0, 16.0, 13.0, 30.0, 30.0, 29.0, 32.0, 26.0, 40.0, 45.0, 50.0, 46.0, 64.0, 42.0, 48.0, 51.0, 32.0, 36.0, 49.0, 33.0, 32.0, 34.0, 29.0, 17.0, 24.0, 21.0, 9.0, 14.0, 12.0, 8.0, 10.0, 8.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9921531677246094e-05, -2.8954818844795227e-05, -2.798810601234436e-05, -2.7021393179893494e-05, -2.6054680347442627e-05, -2.508796751499176e-05, -2.4121254682540894e-05, -2.3154541850090027e-05, -2.218782901763916e-05, -2.1221116185188293e-05, -2.0254403352737427e-05, -1.928769052028656e-05, -1.8320977687835693e-05, -1.7354264855384827e-05, -1.638755202293396e-05, -1.5420839190483093e-05, -1.4454126358032227e-05, -1.348741352558136e-05, -1.2520700693130493e-05, -1.1553987860679626e-05, -1.058727502822876e-05, -9.620562195777893e-06, -8.653849363327026e-06, -7.68713653087616e-06, -6.720423698425293e-06, -5.753710865974426e-06, -4.7869980335235596e-06, -3.820285201072693e-06, -2.853572368621826e-06, -1.8868595361709595e-06, -9.201467037200928e-07, 4.6566128730773926e-08, 1.0132789611816406e-06, 1.9799917936325073e-06, 2.946704626083374e-06, 3.913417458534241e-06, 4.880130290985107e-06, 5.846843123435974e-06, 6.813555955886841e-06, 7.780268788337708e-06, 8.746981620788574e-06, 9.713694453239441e-06, 1.0680407285690308e-05, 1.1647120118141174e-05, 1.2613832950592041e-05, 1.3580545783042908e-05, 1.4547258615493774e-05, 1.551397144794464e-05, 1.6480684280395508e-05, 1.7447397112846375e-05, 1.841410994529724e-05, 1.9380822777748108e-05, 2.0347535610198975e-05, 2.131424844264984e-05, 2.2280961275100708e-05, 2.3247674107551575e-05, 2.421438694000244e-05, 2.5181099772453308e-05, 2.6147812604904175e-05, 2.711452543735504e-05, 2.8081238269805908e-05, 2.9047951102256775e-05, 3.001466393470764e-05, 3.098137676715851e-05, 3.1948089599609375e-05]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 6.0, 5.0, 12.0, 17.0, 17.0, 23.0, 20.0, 32.0, 29.0, 35.0, 38.0, 60.0, 46.0, 52.0, 49.0, 57.0, 54.0, 47.0, 60.0, 57.0, 33.0, 41.0, 33.0, 31.0, 29.0, 29.0, 12.0, 15.0, 12.0, 11.0, 8.0, 3.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.888671875, -3.753387451171875, -3.61810302734375, -3.482818603515625, -3.3475341796875, -3.212249755859375, -3.07696533203125, -2.941680908203125, -2.806396484375, -2.671112060546875, -2.53582763671875, -2.400543212890625, -2.2652587890625, -2.129974365234375, -1.99468994140625, -1.859405517578125, -1.72412109375, -1.588836669921875, -1.45355224609375, -1.318267822265625, -1.1829833984375, -1.047698974609375, -0.91241455078125, -0.777130126953125, -0.641845703125, -0.506561279296875, -0.37127685546875, -0.235992431640625, -0.1007080078125, 0.034576416015625, 0.16986083984375, 0.305145263671875, 0.4404296875, 0.575714111328125, 0.71099853515625, 0.846282958984375, 0.9815673828125, 1.116851806640625, 1.25213623046875, 1.387420654296875, 1.522705078125, 1.657989501953125, 1.79327392578125, 1.928558349609375, 2.0638427734375, 2.199127197265625, 2.33441162109375, 2.469696044921875, 2.60498046875, 2.740264892578125, 2.87554931640625, 3.010833740234375, 3.1461181640625, 3.281402587890625, 3.41668701171875, 3.551971435546875, 3.687255859375, 3.822540283203125, 3.95782470703125, 4.093109130859375, 4.2283935546875, 4.363677978515625, 4.49896240234375, 4.634246826171875, 4.76953125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 6.0, 5.0, 10.0, 16.0, 17.0, 29.0, 26.0, 45.0, 71.0, 108.0, 202.0, 373.0, 649.0, 1314.0, 2906.0, 6914.0, 17908.0, 61423.0, 654826.0, 243003.0, 36821.0, 12499.0, 4984.0, 2082.0, 1024.0, 516.0, 306.0, 161.0, 91.0, 63.0, 38.0, 32.0, 13.0, 19.0, 8.0, 5.0, 11.0, 2.0, 4.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5625, -6.3424072265625, -6.122314453125, -5.9022216796875, -5.68212890625, -5.4620361328125, -5.241943359375, -5.0218505859375, -4.8017578125, -4.5816650390625, -4.361572265625, -4.1414794921875, -3.92138671875, -3.7012939453125, -3.481201171875, -3.2611083984375, -3.041015625, -2.8209228515625, -2.600830078125, -2.3807373046875, -2.16064453125, -1.9405517578125, -1.720458984375, -1.5003662109375, -1.2802734375, -1.0601806640625, -0.840087890625, -0.6199951171875, -0.39990234375, -0.1798095703125, 0.040283203125, 0.2603759765625, 0.48046875, 0.7005615234375, 0.920654296875, 1.1407470703125, 1.36083984375, 1.5809326171875, 1.801025390625, 2.0211181640625, 2.2412109375, 2.4613037109375, 2.681396484375, 2.9014892578125, 3.12158203125, 3.3416748046875, 3.561767578125, 3.7818603515625, 4.001953125, 4.2220458984375, 4.442138671875, 4.6622314453125, 4.88232421875, 5.1024169921875, 5.322509765625, 5.5426025390625, 5.7626953125, 5.9827880859375, 6.202880859375, 6.4229736328125, 6.64306640625, 6.8631591796875, 7.083251953125, 7.3033447265625, 7.5234375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 12.0, 12.0, 15.0, 10.0, 21.0, 23.0, 24.0, 33.0, 30.0, 35.0, 40.0, 29.0, 55.0, 47.0, 75.0, 164.0, 1811.0, 146.0, 54.0, 45.0, 54.0, 40.0, 39.0, 35.0, 26.0, 29.0, 18.0, 15.0, 19.0, 18.0, 12.0, 14.0, 5.0, 6.0, 8.0, 7.0, 3.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4140625, -12.972900390625, -12.53173828125, -12.090576171875, -11.6494140625, -11.208251953125, -10.76708984375, -10.325927734375, -9.884765625, -9.443603515625, -9.00244140625, -8.561279296875, -8.1201171875, -7.678955078125, -7.23779296875, -6.796630859375, -6.35546875, -5.914306640625, -5.47314453125, -5.031982421875, -4.5908203125, -4.149658203125, -3.70849609375, -3.267333984375, -2.826171875, -2.385009765625, -1.94384765625, -1.502685546875, -1.0615234375, -0.620361328125, -0.17919921875, 0.261962890625, 0.703125, 1.144287109375, 1.58544921875, 2.026611328125, 2.4677734375, 2.908935546875, 3.35009765625, 3.791259765625, 4.232421875, 4.673583984375, 5.11474609375, 5.555908203125, 5.9970703125, 6.438232421875, 6.87939453125, 7.320556640625, 7.76171875, 8.202880859375, 8.64404296875, 9.085205078125, 9.5263671875, 9.967529296875, 10.40869140625, 10.849853515625, 11.291015625, 11.732177734375, 12.17333984375, 12.614501953125, 13.0556640625, 13.496826171875, 13.93798828125, 14.379150390625, 14.8203125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 7.0, 5.0, 11.0, 16.0, 22.0, 11.0, 12.0, 20.0, 32.0, 39.0, 65.0, 87.0, 143.0, 225.0, 511.0, 1799.0, 13369.0, 1161683.0, 1950115.0, 14508.0, 1769.0, 525.0, 242.0, 135.0, 83.0, 56.0, 45.0, 27.0, 32.0, 21.0, 17.0, 19.0, 10.0, 10.0, 8.0, 8.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.046875, -24.310546875, -23.57421875, -22.837890625, -22.1015625, -21.365234375, -20.62890625, -19.892578125, -19.15625, -18.419921875, -17.68359375, -16.947265625, -16.2109375, -15.474609375, -14.73828125, -14.001953125, -13.265625, -12.529296875, -11.79296875, -11.056640625, -10.3203125, -9.583984375, -8.84765625, -8.111328125, -7.375, -6.638671875, -5.90234375, -5.166015625, -4.4296875, -3.693359375, -2.95703125, -2.220703125, -1.484375, -0.748046875, -0.01171875, 0.724609375, 1.4609375, 2.197265625, 2.93359375, 3.669921875, 4.40625, 5.142578125, 5.87890625, 6.615234375, 7.3515625, 8.087890625, 8.82421875, 9.560546875, 10.296875, 11.033203125, 11.76953125, 12.505859375, 13.2421875, 13.978515625, 14.71484375, 15.451171875, 16.1875, 16.923828125, 17.66015625, 18.396484375, 19.1328125, 19.869140625, 20.60546875, 21.341796875, 22.078125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 11.0, 93.0, 464.0, 379.0, 66.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.226112365722656, -37.10015869140625, -33.974205017089844, -30.84825325012207, -27.722299575805664, -24.596345901489258, -21.470394134521484, -18.344440460205078, -15.218486785888672, -12.092533111572266, -8.966580390930176, -5.840627670288086, -2.7146739959716797, 0.41127967834472656, 3.5372314453125, 6.663185119628906, 9.789138793945312, 12.915092468261719, 16.041046142578125, 19.1669979095459, 22.292951583862305, 25.41890525817871, 28.544857025146484, 31.67081069946289, 34.7967643737793, 37.9227180480957, 41.04867172241211, 44.17462158203125, 47.300575256347656, 50.42652893066406, 53.55248260498047, 56.678436279296875, 59.80438232421875, 62.930335998535156, 66.05628967285156, 69.18224334716797, 72.30819702148438, 75.43415069580078, 78.56010437011719, 81.68605041503906, 84.81201171875, 87.9379653930664, 91.06391906738281, 94.18987274169922, 97.31582641601562, 100.44178009033203, 103.56773376464844, 106.69367980957031, 109.81963348388672, 112.94558715820312, 116.07154083251953, 119.19749450683594, 122.32344818115234, 125.44940185546875, 128.57534790039062, 131.70130920410156, 134.82725524902344, 137.9532012939453, 141.07916259765625, 144.20510864257812, 147.33106994628906, 150.45701599121094, 153.58297729492188, 156.70892333984375, 159.8348846435547]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 16.0, 5.0, 6.0, 7.0, 11.0, 8.0, 21.0, 22.0, 22.0, 23.0, 36.0, 26.0, 23.0, 38.0, 32.0, 30.0, 30.0, 41.0, 34.0, 54.0, 46.0, 45.0, 48.0, 52.0, 45.0, 44.0, 27.0, 25.0, 41.0, 21.0, 25.0, 23.0, 14.0, 10.0, 8.0, 15.0, 10.0, 11.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.94865417480469, -44.49686813354492, -43.045082092285156, -41.593299865722656, -40.14151382446289, -38.689727783203125, -37.23794174194336, -35.786155700683594, -34.334373474121094, -32.88258743286133, -31.430803298950195, -29.97901725769043, -28.527233123779297, -27.07544708251953, -25.623661041259766, -24.171875, -22.720088958740234, -21.26830291748047, -19.816518783569336, -18.36473274230957, -16.912948608398438, -15.461162567138672, -14.009376525878906, -12.557591438293457, -11.105806350708008, -9.654021263122559, -8.20223617553711, -6.750450134277344, -5.2986650466918945, -3.8468799591064453, -2.3950939178466797, -0.9433088302612305, 0.5084800720214844, 1.9602653980255127, 3.412050724029541, 4.863836288452148, 6.315621376037598, 7.767406463623047, 9.219192504882812, 10.670977592468262, 12.122762680053711, 13.57454776763916, 15.02633285522461, 16.478118896484375, 17.92990493774414, 19.381689071655273, 20.83347511291504, 22.285259246826172, 23.737045288085938, 25.188831329345703, 26.640615463256836, 28.0924015045166, 29.544185638427734, 30.9959716796875, 32.447757720947266, 33.89954376220703, 35.35132598876953, 36.8031120300293, 38.25489807128906, 39.70668029785156, 41.15846633911133, 42.610252380371094, 44.06203842163086, 45.513824462890625, 46.96561050415039]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 4.0, 14.0, 13.0, 17.0, 15.0, 20.0, 21.0, 36.0, 36.0, 29.0, 53.0, 54.0, 46.0, 59.0, 47.0, 53.0, 58.0, 50.0, 58.0, 38.0, 40.0, 38.0, 37.0, 32.0, 21.0, 31.0, 8.0, 11.0, 12.0, 12.0, 5.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.912109375, -3.773773193359375, -3.63543701171875, -3.497100830078125, -3.3587646484375, -3.220428466796875, -3.08209228515625, -2.943756103515625, -2.805419921875, -2.667083740234375, -2.52874755859375, -2.390411376953125, -2.2520751953125, -2.113739013671875, -1.97540283203125, -1.837066650390625, -1.69873046875, -1.560394287109375, -1.42205810546875, -1.283721923828125, -1.1453857421875, -1.007049560546875, -0.86871337890625, -0.730377197265625, -0.592041015625, -0.453704833984375, -0.31536865234375, -0.177032470703125, -0.0386962890625, 0.099639892578125, 0.23797607421875, 0.376312255859375, 0.5146484375, 0.652984619140625, 0.79132080078125, 0.929656982421875, 1.0679931640625, 1.206329345703125, 1.34466552734375, 1.483001708984375, 1.621337890625, 1.759674072265625, 1.89801025390625, 2.036346435546875, 2.1746826171875, 2.313018798828125, 2.45135498046875, 2.589691162109375, 2.72802734375, 2.866363525390625, 3.00469970703125, 3.143035888671875, 3.2813720703125, 3.419708251953125, 3.55804443359375, 3.696380615234375, 3.834716796875, 3.973052978515625, 4.11138916015625, 4.249725341796875, 4.3880615234375, 4.526397705078125, 4.66473388671875, 4.803070068359375, 4.94140625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 5.0, 3.0, 9.0, 10.0, 16.0, 13.0, 24.0, 24.0, 36.0, 42.0, 54.0, 90.0, 108.0, 162.0, 236.0, 352.0, 570.0, 953.0, 1874.0, 4088.0, 10835.0, 37135.0, 194947.0, 2483680.0, 1296123.0, 120783.0, 26298.0, 8408.0, 3365.0, 1655.0, 854.0, 489.0, 317.0, 204.0, 141.0, 97.0, 81.0, 46.0, 45.0, 36.0, 17.0, 15.0, 9.0, 12.0, 6.0, 3.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.9375, -13.5260009765625, -13.114501953125, -12.7030029296875, -12.29150390625, -11.8800048828125, -11.468505859375, -11.0570068359375, -10.6455078125, -10.2340087890625, -9.822509765625, -9.4110107421875, -8.99951171875, -8.5880126953125, -8.176513671875, -7.7650146484375, -7.353515625, -6.9420166015625, -6.530517578125, -6.1190185546875, -5.70751953125, -5.2960205078125, -4.884521484375, -4.4730224609375, -4.0615234375, -3.6500244140625, -3.238525390625, -2.8270263671875, -2.41552734375, -2.0040283203125, -1.592529296875, -1.1810302734375, -0.76953125, -0.3580322265625, 0.053466796875, 0.4649658203125, 0.87646484375, 1.2879638671875, 1.699462890625, 2.1109619140625, 2.5224609375, 2.9339599609375, 3.345458984375, 3.7569580078125, 4.16845703125, 4.5799560546875, 4.991455078125, 5.4029541015625, 5.814453125, 6.2259521484375, 6.637451171875, 7.0489501953125, 7.46044921875, 7.8719482421875, 8.283447265625, 8.6949462890625, 9.1064453125, 9.5179443359375, 9.929443359375, 10.3409423828125, 10.75244140625, 11.1639404296875, 11.575439453125, 11.9869384765625, 12.3984375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 1.0, 6.0, 6.0, 7.0, 10.0, 14.0, 16.0, 24.0, 29.0, 30.0, 43.0, 64.0, 88.0, 126.0, 164.0, 270.0, 345.0, 495.0, 608.0, 494.0, 341.0, 256.0, 167.0, 108.0, 98.0, 75.0, 50.0, 35.0, 30.0, 20.0, 13.0, 7.0, 7.0, 6.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-12.15625, -11.83935546875, -11.5224609375, -11.20556640625, -10.888671875, -10.57177734375, -10.2548828125, -9.93798828125, -9.62109375, -9.30419921875, -8.9873046875, -8.67041015625, -8.353515625, -8.03662109375, -7.7197265625, -7.40283203125, -7.0859375, -6.76904296875, -6.4521484375, -6.13525390625, -5.818359375, -5.50146484375, -5.1845703125, -4.86767578125, -4.55078125, -4.23388671875, -3.9169921875, -3.60009765625, -3.283203125, -2.96630859375, -2.6494140625, -2.33251953125, -2.015625, -1.69873046875, -1.3818359375, -1.06494140625, -0.748046875, -0.43115234375, -0.1142578125, 0.20263671875, 0.51953125, 0.83642578125, 1.1533203125, 1.47021484375, 1.787109375, 2.10400390625, 2.4208984375, 2.73779296875, 3.0546875, 3.37158203125, 3.6884765625, 4.00537109375, 4.322265625, 4.63916015625, 4.9560546875, 5.27294921875, 5.58984375, 5.90673828125, 6.2236328125, 6.54052734375, 6.857421875, 7.17431640625, 7.4912109375, 7.80810546875, 8.125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 9.0, 28.0, 44.0, 53.0, 102.0, 163.0, 308.0, 548.0, 936.0, 1830.0, 3944.0, 9193.0, 26594.0, 99671.0, 543485.0, 2767601.0, 588887.0, 105367.0, 28030.0, 9535.0, 3939.0, 1722.0, 982.0, 540.0, 326.0, 176.0, 99.0, 65.0, 49.0, 19.0, 11.0, 10.0, 6.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.453125, -15.895751953125, -15.33837890625, -14.781005859375, -14.2236328125, -13.666259765625, -13.10888671875, -12.551513671875, -11.994140625, -11.436767578125, -10.87939453125, -10.322021484375, -9.7646484375, -9.207275390625, -8.64990234375, -8.092529296875, -7.53515625, -6.977783203125, -6.42041015625, -5.863037109375, -5.3056640625, -4.748291015625, -4.19091796875, -3.633544921875, -3.076171875, -2.518798828125, -1.96142578125, -1.404052734375, -0.8466796875, -0.289306640625, 0.26806640625, 0.825439453125, 1.3828125, 1.940185546875, 2.49755859375, 3.054931640625, 3.6123046875, 4.169677734375, 4.72705078125, 5.284423828125, 5.841796875, 6.399169921875, 6.95654296875, 7.513916015625, 8.0712890625, 8.628662109375, 9.18603515625, 9.743408203125, 10.30078125, 10.858154296875, 11.41552734375, 11.972900390625, 12.5302734375, 13.087646484375, 13.64501953125, 14.202392578125, 14.759765625, 15.317138671875, 15.87451171875, 16.431884765625, 16.9892578125, 17.546630859375, 18.10400390625, 18.661376953125, 19.21875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 8.0, 13.0, 21.0, 25.0, 59.0, 78.0, 75.0, 132.0, 129.0, 120.0, 111.0, 80.0, 73.0, 30.0, 23.0, 11.0, 11.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.62012481689453, -88.22784423828125, -85.83556365966797, -83.44329071044922, -81.05101013183594, -78.65872955322266, -76.26644897460938, -73.8741683959961, -71.48188781738281, -69.08960723876953, -66.69732666015625, -64.3050537109375, -61.91277313232422, -59.52049255371094, -57.128211975097656, -54.735931396484375, -52.343658447265625, -49.951377868652344, -47.55910110473633, -45.16682052612305, -42.77454376220703, -40.38226318359375, -37.98998260498047, -35.59770202636719, -33.20542526245117, -30.813146591186523, -28.420867919921875, -26.028587341308594, -23.636308670043945, -21.244029998779297, -18.851749420166016, -16.459470748901367, -14.06719970703125, -11.674921035766602, -9.282641410827637, -6.89036226272583, -4.498083114624023, -2.105804443359375, 0.28647518157958984, 2.6787548065185547, 5.071033477783203, 7.46331262588501, 9.855591773986816, 12.247871398925781, 14.64015007019043, 17.032428741455078, 19.42470932006836, 21.816987991333008, 24.209266662597656, 26.601545333862305, 28.993824005126953, 31.386104583740234, 33.77838134765625, 36.17066192626953, 38.56294250488281, 40.955223083496094, 43.34749984741211, 45.73978042602539, 48.132057189941406, 50.52433776855469, 52.91661834716797, 55.308895111083984, 57.701175689697266, 60.09345245361328, 62.48573303222656]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 7.0, 4.0, 9.0, 11.0, 19.0, 16.0, 13.0, 14.0, 21.0, 25.0, 31.0, 28.0, 34.0, 34.0, 47.0, 35.0, 50.0, 44.0, 48.0, 52.0, 46.0, 45.0, 33.0, 44.0, 41.0, 31.0, 33.0, 32.0, 29.0, 25.0, 22.0, 10.0, 17.0, 13.0, 10.0, 6.0, 5.0, 10.0, 2.0, 7.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.43781280517578, -27.305179595947266, -26.17254638671875, -25.039913177490234, -23.90727996826172, -22.774646759033203, -21.64201545715332, -20.509382247924805, -19.37674903869629, -18.244115829467773, -17.111482620239258, -15.978850364685059, -14.846217155456543, -13.713583946228027, -12.580951690673828, -11.448318481445312, -10.315685272216797, -9.183052062988281, -8.050418853759766, -6.917786598205566, -5.785153388977051, -4.652520179748535, -3.5198874473571777, -2.3872547149658203, -1.2546215057373047, -0.12198853492736816, 1.0106444358825684, 2.143277406692505, 3.2759103775024414, 4.408543586730957, 5.5411763191223145, 6.673809051513672, 7.8064422607421875, 8.939075469970703, 10.071708679199219, 11.204340934753418, 12.336974143981934, 13.46960735321045, 14.602239608764648, 15.734872817993164, 16.86750602722168, 18.000139236450195, 19.13277244567871, 20.265405654907227, 21.39803695678711, 22.530670166015625, 23.66330337524414, 24.795936584472656, 25.928569793701172, 27.061203002929688, 28.193836212158203, 29.32646942138672, 30.459102630615234, 31.59173583984375, 32.724369049072266, 33.85700225830078, 34.98963165283203, 36.12226486206055, 37.25489807128906, 38.38753128051758, 39.520164489746094, 40.65279769897461, 41.785430908203125, 42.918060302734375, 44.050697326660156]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 11.0, 8.0, 18.0, 12.0, 19.0, 23.0, 22.0, 28.0, 26.0, 39.0, 47.0, 57.0, 55.0, 49.0, 60.0, 57.0, 66.0, 59.0, 45.0, 47.0, 46.0, 39.0, 26.0, 25.0, 24.0, 16.0, 13.0, 5.0, 12.0, 9.0, 7.0, 6.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.928955078125, -3.78369140625, -3.638427734375, -3.4931640625, -3.347900390625, -3.20263671875, -3.057373046875, -2.912109375, -2.766845703125, -2.62158203125, -2.476318359375, -2.3310546875, -2.185791015625, -2.04052734375, -1.895263671875, -1.75, -1.604736328125, -1.45947265625, -1.314208984375, -1.1689453125, -1.023681640625, -0.87841796875, -0.733154296875, -0.587890625, -0.442626953125, -0.29736328125, -0.152099609375, -0.0068359375, 0.138427734375, 0.28369140625, 0.428955078125, 0.57421875, 0.719482421875, 0.86474609375, 1.010009765625, 1.1552734375, 1.300537109375, 1.44580078125, 1.591064453125, 1.736328125, 1.881591796875, 2.02685546875, 2.172119140625, 2.3173828125, 2.462646484375, 2.60791015625, 2.753173828125, 2.8984375, 3.043701171875, 3.18896484375, 3.334228515625, 3.4794921875, 3.624755859375, 3.77001953125, 3.915283203125, 4.060546875, 4.205810546875, 4.35107421875, 4.496337890625, 4.6416015625, 4.786865234375, 4.93212890625, 5.077392578125, 5.22265625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 17.0, 12.0, 24.0, 47.0, 72.0, 79.0, 144.0, 217.0, 314.0, 566.0, 848.0, 1409.0, 2380.0, 3919.0, 6377.0, 10913.0, 19197.0, 35894.0, 71492.0, 173669.0, 401817.0, 167831.0, 70319.0, 34976.0, 18902.0, 10935.0, 6340.0, 3791.0, 2297.0, 1395.0, 880.0, 512.0, 329.0, 234.0, 137.0, 86.0, 55.0, 36.0, 21.0, 25.0, 12.0, 12.0, 4.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1732177734375, -0.1673431396484375, -0.161468505859375, -0.1555938720703125, -0.14971923828125, -0.1438446044921875, -0.137969970703125, -0.1320953369140625, -0.126220703125, -0.1203460693359375, -0.114471435546875, -0.1085968017578125, -0.10272216796875, -0.0968475341796875, -0.090972900390625, -0.0850982666015625, -0.0792236328125, -0.0733489990234375, -0.067474365234375, -0.0615997314453125, -0.05572509765625, -0.0498504638671875, -0.043975830078125, -0.0381011962890625, -0.0322265625, -0.0263519287109375, -0.020477294921875, -0.0146026611328125, -0.00872802734375, -0.0028533935546875, 0.003021240234375, 0.0088958740234375, 0.0147705078125, 0.0206451416015625, 0.026519775390625, 0.0323944091796875, 0.03826904296875, 0.0441436767578125, 0.050018310546875, 0.0558929443359375, 0.061767578125, 0.0676422119140625, 0.073516845703125, 0.0793914794921875, 0.08526611328125, 0.0911407470703125, 0.097015380859375, 0.1028900146484375, 0.1087646484375, 0.1146392822265625, 0.120513916015625, 0.1263885498046875, 0.13226318359375, 0.1381378173828125, 0.144012451171875, 0.1498870849609375, 0.15576171875, 0.1616363525390625, 0.167510986328125, 0.1733856201171875, 0.17926025390625, 0.1851348876953125, 0.191009521484375, 0.1968841552734375, 0.2027587890625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 5.0, 5.0, 1.0, 6.0, 4.0, 7.0, 5.0, 4.0, 15.0, 18.0, 22.0, 15.0, 19.0, 19.0, 26.0, 32.0, 26.0, 32.0, 15.0, 36.0, 38.0, 33.0, 32.0, 45.0, 40.0, 1062.0, 45.0, 37.0, 38.0, 39.0, 29.0, 34.0, 30.0, 25.0, 23.0, 17.0, 26.0, 13.0, 16.0, 14.0, 13.0, 9.0, 16.0, 5.0, 13.0, 5.0, 3.0, 2.0, 4.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.4140625, -2.337371826171875, -2.26068115234375, -2.183990478515625, -2.1072998046875, -2.030609130859375, -1.95391845703125, -1.877227783203125, -1.800537109375, -1.723846435546875, -1.64715576171875, -1.570465087890625, -1.4937744140625, -1.417083740234375, -1.34039306640625, -1.263702392578125, -1.18701171875, -1.110321044921875, -1.03363037109375, -0.956939697265625, -0.8802490234375, -0.803558349609375, -0.72686767578125, -0.650177001953125, -0.573486328125, -0.496795654296875, -0.42010498046875, -0.343414306640625, -0.2667236328125, -0.190032958984375, -0.11334228515625, -0.036651611328125, 0.0400390625, 0.116729736328125, 0.19342041015625, 0.270111083984375, 0.3468017578125, 0.423492431640625, 0.50018310546875, 0.576873779296875, 0.653564453125, 0.730255126953125, 0.80694580078125, 0.883636474609375, 0.9603271484375, 1.037017822265625, 1.11370849609375, 1.190399169921875, 1.26708984375, 1.343780517578125, 1.42047119140625, 1.497161865234375, 1.5738525390625, 1.650543212890625, 1.72723388671875, 1.803924560546875, 1.880615234375, 1.957305908203125, 2.03399658203125, 2.110687255859375, 2.1873779296875, 2.264068603515625, 2.34075927734375, 2.417449951171875, 2.494140625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 3.0, 12.0, 13.0, 18.0, 31.0, 56.0, 96.0, 122.0, 195.0, 282.0, 393.0, 624.0, 920.0, 1398.0, 2062.0, 3192.0, 4920.0, 7545.0, 11559.0, 18265.0, 28626.0, 47529.0, 82902.0, 170920.0, 1348750.0, 163330.0, 79823.0, 45600.0, 28087.0, 17304.0, 11259.0, 7372.0, 4710.0, 3104.0, 2043.0, 1362.0, 872.0, 607.0, 423.0, 267.0, 167.0, 131.0, 81.0, 65.0, 32.0, 16.0, 12.0, 9.0, 11.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.087158203125, -0.08438873291015625, -0.0816192626953125, -0.07884979248046875, -0.076080322265625, -0.07331085205078125, -0.0705413818359375, -0.06777191162109375, -0.06500244140625, -0.06223297119140625, -0.0594635009765625, -0.05669403076171875, -0.053924560546875, -0.05115509033203125, -0.0483856201171875, -0.04561614990234375, -0.0428466796875, -0.04007720947265625, -0.0373077392578125, -0.03453826904296875, -0.031768798828125, -0.02899932861328125, -0.0262298583984375, -0.02346038818359375, -0.02069091796875, -0.01792144775390625, -0.0151519775390625, -0.01238250732421875, -0.009613037109375, -0.00684356689453125, -0.0040740966796875, -0.00130462646484375, 0.00146484375, 0.00423431396484375, 0.0070037841796875, 0.00977325439453125, 0.012542724609375, 0.01531219482421875, 0.0180816650390625, 0.02085113525390625, 0.02362060546875, 0.02639007568359375, 0.0291595458984375, 0.03192901611328125, 0.034698486328125, 0.03746795654296875, 0.0402374267578125, 0.04300689697265625, 0.0457763671875, 0.04854583740234375, 0.0513153076171875, 0.05408477783203125, 0.056854248046875, 0.05962371826171875, 0.0623931884765625, 0.06516265869140625, 0.06793212890625, 0.07070159912109375, 0.0734710693359375, 0.07624053955078125, 0.079010009765625, 0.08177947998046875, 0.0845489501953125, 0.08731842041015625, 0.090087890625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 2.0, 5.0, 5.0, 7.0, 8.0, 14.0, 14.0, 15.0, 19.0, 18.0, 26.0, 16.0, 27.0, 37.0, 35.0, 51.0, 38.0, 38.0, 38.0, 39.0, 39.0, 37.0, 39.0, 40.0, 39.0, 39.0, 39.0, 31.0, 18.0, 29.0, 35.0, 27.0, 22.0, 20.0, 20.0, 14.0, 8.0, 12.0, 11.0, 1.0, 5.0, 5.0, 5.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.1365623474121094e-05, -4.0121376514434814e-05, -3.8877129554748535e-05, -3.7632882595062256e-05, -3.6388635635375977e-05, -3.51443886756897e-05, -3.390014171600342e-05, -3.265589475631714e-05, -3.141164779663086e-05, -3.016740083694458e-05, -2.89231538772583e-05, -2.767890691757202e-05, -2.6434659957885742e-05, -2.5190412998199463e-05, -2.3946166038513184e-05, -2.2701919078826904e-05, -2.1457672119140625e-05, -2.0213425159454346e-05, -1.8969178199768066e-05, -1.7724931240081787e-05, -1.6480684280395508e-05, -1.5236437320709229e-05, -1.399219036102295e-05, -1.274794340133667e-05, -1.150369644165039e-05, -1.0259449481964111e-05, -9.015202522277832e-06, -7.770955562591553e-06, -6.5267086029052734e-06, -5.282461643218994e-06, -4.038214683532715e-06, -2.7939677238464355e-06, -1.5497207641601562e-06, -3.0547380447387695e-07, 9.387731552124023e-07, 2.1830201148986816e-06, 3.427267074584961e-06, 4.67151403427124e-06, 5.9157609939575195e-06, 7.160007953643799e-06, 8.404254913330078e-06, 9.648501873016357e-06, 1.0892748832702637e-05, 1.2136995792388916e-05, 1.3381242752075195e-05, 1.4625489711761475e-05, 1.5869736671447754e-05, 1.7113983631134033e-05, 1.8358230590820312e-05, 1.9602477550506592e-05, 2.084672451019287e-05, 2.209097146987915e-05, 2.333521842956543e-05, 2.457946538925171e-05, 2.5823712348937988e-05, 2.7067959308624268e-05, 2.8312206268310547e-05, 2.9556453227996826e-05, 3.0800700187683105e-05, 3.2044947147369385e-05, 3.3289194107055664e-05, 3.453344106674194e-05, 3.577768802642822e-05, 3.70219349861145e-05, 3.826618194580078e-05]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 6.0, 5.0, 3.0, 5.0, 14.0, 4.0, 18.0, 38.0, 24.0, 43.0, 42.0, 55.0, 69.0, 80.0, 117.0, 154.0, 254.0, 473.0, 2195.0, 30540.0, 521802.0, 463598.0, 25702.0, 1839.0, 509.0, 274.0, 171.0, 111.0, 92.0, 58.0, 49.0, 46.0, 26.0, 30.0, 22.0, 18.0, 14.0, 8.0, 9.0, 8.0, 5.0, 4.0, 2.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005526542663574219, -0.0005342140793800354, -0.0005157738924026489, -0.0004973337054252625, -0.000478893518447876, -0.0004604533314704895, -0.00044201314449310303, -0.00042357295751571655, -0.0004051327705383301, -0.0003866925835609436, -0.00036825239658355713, -0.00034981220960617065, -0.0003313720226287842, -0.0003129318356513977, -0.00029449164867401123, -0.00027605146169662476, -0.0002576112747192383, -0.0002391710877418518, -0.00022073090076446533, -0.00020229071378707886, -0.00018385052680969238, -0.0001654103398323059, -0.00014697015285491943, -0.00012852996587753296, -0.00011008977890014648, -9.164959192276001e-05, -7.320940494537354e-05, -5.476921796798706e-05, -3.6329030990600586e-05, -1.788884401321411e-05, 5.513429641723633e-07, 1.8991529941558838e-05, 3.743171691894531e-05, 5.587190389633179e-05, 7.431209087371826e-05, 9.275227785110474e-05, 0.00011119246482849121, 0.00012963265180587769, 0.00014807283878326416, 0.00016651302576065063, 0.0001849532127380371, 0.00020339339971542358, 0.00022183358669281006, 0.00024027377367019653, 0.000258713960647583, 0.0002771541476249695, 0.00029559433460235596, 0.00031403452157974243, 0.0003324747085571289, 0.0003509148955345154, 0.00036935508251190186, 0.00038779526948928833, 0.0004062354564666748, 0.0004246756434440613, 0.00044311583042144775, 0.00046155601739883423, 0.0004799962043762207, 0.0004984363913536072, 0.0005168765783309937, 0.0005353167653083801, 0.0005537569522857666, 0.0005721971392631531, 0.0005906373262405396, 0.000609077513217926, 0.0006275177001953125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 33.0, 224.0, 521.0, 197.0, 33.0, 3.0, 1.0, 1.0], "bins": [-0.0005321917124092579, -0.0005230947863310575, -0.0005139978602528572, -0.0005049009341746569, -0.0004958040080964565, -0.0004867070820182562, -0.00047761015594005585, -0.0004685132298618555, -0.00045941630378365517, -0.0004503193777054548, -0.0004412224516272545, -0.00043212552554905415, -0.0004230285994708538, -0.00041393167339265347, -0.0004048347473144531, -0.0003957378212362528, -0.000386640866054222, -0.00037754393997602165, -0.0003684470138978213, -0.00035935008781962097, -0.0003502531617414206, -0.0003411562356632203, -0.00033205930958501995, -0.00032296235440298915, -0.0003138654283247888, -0.00030476850224658847, -0.00029567157616838813, -0.0002865746500901878, -0.00027747772401198745, -0.0002683807979337871, -0.00025928387185558677, -0.0002501869457773864, -0.0002410900196991861, -0.00023199309362098575, -0.0002228961675427854, -0.00021379924146458507, -0.00020470231538638473, -0.00019560538930818439, -0.00018650844867806882, -0.00017741152259986848, -0.00016831459652166814, -0.0001592176704434678, -0.00015012074436526746, -0.00014102381828706712, -0.00013192687765695155, -0.0001228299515787512, -0.00011373302550055087, -0.00010463609942235053, -9.553917334415019e-05, -8.644224726594985e-05, -7.73453211877495e-05, -6.824838783359155e-05, -5.915146175539121e-05, -5.005453567719087e-05, -4.095760596101172e-05, -3.1860676244832575e-05, -2.2763750166632235e-05, -1.3666822269442491e-05, -4.569894372252747e-06, 4.527033524936996e-06, 1.362396142212674e-05, 2.272088750032708e-05, 3.181781721650623e-05, 4.0914746932685375e-05, 5.0011673010885715e-05]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 4.0, 12.0, 12.0, 12.0, 12.0, 14.0, 19.0, 23.0, 27.0, 39.0, 38.0, 23.0, 48.0, 36.0, 45.0, 38.0, 40.0, 37.0, 37.0, 38.0, 37.0, 44.0, 39.0, 41.0, 40.0, 27.0, 31.0, 29.0, 34.0, 12.0, 18.0, 15.0, 10.0, 13.0, 15.0, 13.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.950429916381836e-05, -2.8464943170547485e-05, -2.742558717727661e-05, -2.6386231184005737e-05, -2.5346875190734863e-05, -2.430751919746399e-05, -2.3268163204193115e-05, -2.222880721092224e-05, -2.1189451217651367e-05, -2.0150095224380493e-05, -1.911073923110962e-05, -1.8071383237838745e-05, -1.703202724456787e-05, -1.5992671251296997e-05, -1.4953315258026123e-05, -1.3913959264755249e-05, -1.2874603271484375e-05, -1.1835247278213501e-05, -1.0795891284942627e-05, -9.756535291671753e-06, -8.717179298400879e-06, -7.677823305130005e-06, -6.638467311859131e-06, -5.599111318588257e-06, -4.559755325317383e-06, -3.520399332046509e-06, -2.4810433387756348e-06, -1.4416873455047607e-06, -4.023313522338867e-07, 6.370246410369873e-07, 1.6763806343078613e-06, 2.7157366275787354e-06, 3.7550926208496094e-06, 4.794448614120483e-06, 5.833804607391357e-06, 6.8731606006622314e-06, 7.912516593933105e-06, 8.95187258720398e-06, 9.991228580474854e-06, 1.1030584573745728e-05, 1.2069940567016602e-05, 1.3109296560287476e-05, 1.414865255355835e-05, 1.5188008546829224e-05, 1.6227364540100098e-05, 1.726672053337097e-05, 1.8306076526641846e-05, 1.934543251991272e-05, 2.0384788513183594e-05, 2.1424144506454468e-05, 2.2463500499725342e-05, 2.3502856492996216e-05, 2.454221248626709e-05, 2.5581568479537964e-05, 2.6620924472808838e-05, 2.7660280466079712e-05, 2.8699636459350586e-05, 2.973899245262146e-05, 3.0778348445892334e-05, 3.181770443916321e-05, 3.285706043243408e-05, 3.3896416425704956e-05, 3.493577241897583e-05, 3.5975128412246704e-05, 3.701448440551758e-05]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 11.0, 8.0, 18.0, 12.0, 19.0, 23.0, 22.0, 28.0, 26.0, 39.0, 47.0, 57.0, 55.0, 49.0, 60.0, 57.0, 66.0, 59.0, 45.0, 47.0, 46.0, 39.0, 26.0, 25.0, 24.0, 16.0, 13.0, 5.0, 12.0, 9.0, 7.0, 6.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.928955078125, -3.78369140625, -3.638427734375, -3.4931640625, -3.347900390625, -3.20263671875, -3.057373046875, -2.912109375, -2.766845703125, -2.62158203125, -2.476318359375, -2.3310546875, -2.185791015625, -2.04052734375, -1.895263671875, -1.75, -1.604736328125, -1.45947265625, -1.314208984375, -1.1689453125, -1.023681640625, -0.87841796875, -0.733154296875, -0.587890625, -0.442626953125, -0.29736328125, -0.152099609375, -0.0068359375, 0.138427734375, 0.28369140625, 0.428955078125, 0.57421875, 0.719482421875, 0.86474609375, 1.010009765625, 1.1552734375, 1.300537109375, 1.44580078125, 1.591064453125, 1.736328125, 1.881591796875, 2.02685546875, 2.172119140625, 2.3173828125, 2.462646484375, 2.60791015625, 2.753173828125, 2.8984375, 3.043701171875, 3.18896484375, 3.334228515625, 3.4794921875, 3.624755859375, 3.77001953125, 3.915283203125, 4.060546875, 4.205810546875, 4.35107421875, 4.496337890625, 4.6416015625, 4.786865234375, 4.93212890625, 5.077392578125, 5.22265625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 9.0, 10.0, 16.0, 20.0, 27.0, 34.0, 53.0, 82.0, 127.0, 156.0, 231.0, 383.0, 556.0, 820.0, 1283.0, 1919.0, 3054.0, 4938.0, 8307.0, 15069.0, 29085.0, 61713.0, 156102.0, 399820.0, 208913.0, 77165.0, 35325.0, 17937.0, 9815.0, 5843.0, 3380.0, 2184.0, 1372.0, 921.0, 579.0, 410.0, 265.0, 180.0, 154.0, 75.0, 67.0, 60.0, 21.0, 17.0, 18.0, 14.0, 10.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8046875, -2.713134765625, -2.62158203125, -2.530029296875, -2.4384765625, -2.346923828125, -2.25537109375, -2.163818359375, -2.072265625, -1.980712890625, -1.88916015625, -1.797607421875, -1.7060546875, -1.614501953125, -1.52294921875, -1.431396484375, -1.33984375, -1.248291015625, -1.15673828125, -1.065185546875, -0.9736328125, -0.882080078125, -0.79052734375, -0.698974609375, -0.607421875, -0.515869140625, -0.42431640625, -0.332763671875, -0.2412109375, -0.149658203125, -0.05810546875, 0.033447265625, 0.125, 0.216552734375, 0.30810546875, 0.399658203125, 0.4912109375, 0.582763671875, 0.67431640625, 0.765869140625, 0.857421875, 0.948974609375, 1.04052734375, 1.132080078125, 1.2236328125, 1.315185546875, 1.40673828125, 1.498291015625, 1.58984375, 1.681396484375, 1.77294921875, 1.864501953125, 1.9560546875, 2.047607421875, 2.13916015625, 2.230712890625, 2.322265625, 2.413818359375, 2.50537109375, 2.596923828125, 2.6884765625, 2.780029296875, 2.87158203125, 2.963134765625, 3.0546875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 8.0, 5.0, 3.0, 4.0, 9.0, 5.0, 7.0, 14.0, 16.0, 22.0, 18.0, 24.0, 17.0, 24.0, 29.0, 24.0, 27.0, 32.0, 28.0, 42.0, 47.0, 57.0, 77.0, 150.0, 1530.0, 269.0, 119.0, 53.0, 40.0, 29.0, 42.0, 29.0, 36.0, 28.0, 32.0, 29.0, 11.0, 22.0, 11.0, 8.0, 11.0, 6.0, 6.0, 10.0, 7.0, 11.0, 8.0, 5.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0], "bins": [-11.4921875, -11.1513671875, -10.810546875, -10.4697265625, -10.12890625, -9.7880859375, -9.447265625, -9.1064453125, -8.765625, -8.4248046875, -8.083984375, -7.7431640625, -7.40234375, -7.0615234375, -6.720703125, -6.3798828125, -6.0390625, -5.6982421875, -5.357421875, -5.0166015625, -4.67578125, -4.3349609375, -3.994140625, -3.6533203125, -3.3125, -2.9716796875, -2.630859375, -2.2900390625, -1.94921875, -1.6083984375, -1.267578125, -0.9267578125, -0.5859375, -0.2451171875, 0.095703125, 0.4365234375, 0.77734375, 1.1181640625, 1.458984375, 1.7998046875, 2.140625, 2.4814453125, 2.822265625, 3.1630859375, 3.50390625, 3.8447265625, 4.185546875, 4.5263671875, 4.8671875, 5.2080078125, 5.548828125, 5.8896484375, 6.23046875, 6.5712890625, 6.912109375, 7.2529296875, 7.59375, 7.9345703125, 8.275390625, 8.6162109375, 8.95703125, 9.2978515625, 9.638671875, 9.9794921875, 10.3203125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 10.0, 7.0, 10.0, 6.0, 8.0, 9.0, 13.0, 14.0, 17.0, 33.0, 26.0, 44.0, 58.0, 77.0, 100.0, 175.0, 214.0, 449.0, 1119.0, 4205.0, 28873.0, 966115.0, 2099111.0, 37332.0, 5038.0, 1214.0, 481.0, 263.0, 180.0, 113.0, 65.0, 58.0, 45.0, 45.0, 32.0, 29.0, 24.0, 23.0, 14.0, 10.0, 4.0, 7.0, 7.0, 5.0, 3.0, 7.0, 3.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-16.625, -16.07177734375, -15.5185546875, -14.96533203125, -14.412109375, -13.85888671875, -13.3056640625, -12.75244140625, -12.19921875, -11.64599609375, -11.0927734375, -10.53955078125, -9.986328125, -9.43310546875, -8.8798828125, -8.32666015625, -7.7734375, -7.22021484375, -6.6669921875, -6.11376953125, -5.560546875, -5.00732421875, -4.4541015625, -3.90087890625, -3.34765625, -2.79443359375, -2.2412109375, -1.68798828125, -1.134765625, -0.58154296875, -0.0283203125, 0.52490234375, 1.078125, 1.63134765625, 2.1845703125, 2.73779296875, 3.291015625, 3.84423828125, 4.3974609375, 4.95068359375, 5.50390625, 6.05712890625, 6.6103515625, 7.16357421875, 7.716796875, 8.27001953125, 8.8232421875, 9.37646484375, 9.9296875, 10.48291015625, 11.0361328125, 11.58935546875, 12.142578125, 12.69580078125, 13.2490234375, 13.80224609375, 14.35546875, 14.90869140625, 15.4619140625, 16.01513671875, 16.568359375, 17.12158203125, 17.6748046875, 18.22802734375, 18.78125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 53.0, 520.0, 425.0, 22.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.337419509887695, -9.378410339355469, -4.419402122497559, 0.5396060943603516, 5.498615264892578, 10.457624435424805, 15.416631698608398, 20.375642776489258, 25.33465003967285, 30.293659210205078, 35.25266647338867, 40.21167755126953, 45.170684814453125, 50.12969207763672, 55.08869934082031, 60.04771423339844, 65.00672149658203, 69.96572875976562, 74.92473602294922, 79.88374328613281, 84.84275817871094, 89.80176544189453, 94.76077270507812, 99.71978759765625, 104.67878723144531, 109.6377944946289, 114.5968017578125, 119.55581665039062, 124.51482391357422, 129.4738311767578, 134.43283081054688, 139.391845703125, 144.35084533691406, 149.3098602294922, 154.26885986328125, 159.22787475585938, 164.18687438964844, 169.14588928222656, 174.10488891601562, 179.06390380859375, 184.02291870117188, 188.98193359375, 193.94093322753906, 198.8999481201172, 203.85894775390625, 208.81796264648438, 213.7769775390625, 218.73597717285156, 223.69497680664062, 228.65399169921875, 233.6129913330078, 238.57200622558594, 243.531005859375, 248.49002075195312, 253.44903564453125, 258.4080505371094, 263.3670654296875, 268.3260803222656, 273.28509521484375, 278.24407958984375, 283.2030944824219, 288.162109375, 293.1211242675781, 298.08013916015625, 303.03912353515625]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 4.0, 11.0, 12.0, 4.0, 13.0, 13.0, 12.0, 20.0, 13.0, 22.0, 21.0, 31.0, 26.0, 25.0, 40.0, 45.0, 47.0, 44.0, 25.0, 36.0, 37.0, 36.0, 30.0, 48.0, 31.0, 41.0, 31.0, 36.0, 26.0, 28.0, 28.0, 21.0, 26.0, 20.0, 15.0, 12.0, 15.0, 13.0, 3.0, 5.0, 9.0, 8.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.43107604980469, -36.24427032470703, -35.05746078491211, -33.87065124511719, -32.68384552001953, -31.497037887573242, -30.310230255126953, -29.123422622680664, -27.936614990234375, -26.749807357788086, -25.562999725341797, -24.376192092895508, -23.18938446044922, -22.00257682800293, -20.81576919555664, -19.62896156311035, -18.442153930664062, -17.255346298217773, -16.068538665771484, -14.881731033325195, -13.694923400878906, -12.508115768432617, -11.321308135986328, -10.134500503540039, -8.94769287109375, -7.760885238647461, -6.574077606201172, -5.387269973754883, -4.200462341308594, -3.0136547088623047, -1.8268470764160156, -0.6400394439697266, 0.5467720031738281, 1.7335796356201172, 2.9203872680664062, 4.107194900512695, 5.294002532958984, 6.480810165405273, 7.6676177978515625, 8.854425430297852, 10.04123306274414, 11.22804069519043, 12.414848327636719, 13.601655960083008, 14.788463592529297, 15.975271224975586, 17.162078857421875, 18.348886489868164, 19.535694122314453, 20.722501754760742, 21.90930938720703, 23.09611701965332, 24.28292465209961, 25.4697322845459, 26.656539916992188, 27.843347549438477, 29.030155181884766, 30.216962814331055, 31.403770446777344, 32.590576171875, 33.77738571166992, 34.964195251464844, 36.1510009765625, 37.337806701660156, 38.52461624145508]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 10.0, 6.0, 8.0, 9.0, 11.0, 22.0, 18.0, 15.0, 21.0, 19.0, 26.0, 38.0, 29.0, 43.0, 66.0, 51.0, 44.0, 57.0, 54.0, 61.0, 55.0, 48.0, 39.0, 46.0, 33.0, 31.0, 20.0, 19.0, 22.0, 19.0, 10.0, 8.0, 7.0, 8.0, 4.0, 7.0, 6.0, 2.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.93359375, -3.79736328125, -3.6611328125, -3.52490234375, -3.388671875, -3.25244140625, -3.1162109375, -2.97998046875, -2.84375, -2.70751953125, -2.5712890625, -2.43505859375, -2.298828125, -2.16259765625, -2.0263671875, -1.89013671875, -1.75390625, -1.61767578125, -1.4814453125, -1.34521484375, -1.208984375, -1.07275390625, -0.9365234375, -0.80029296875, -0.6640625, -0.52783203125, -0.3916015625, -0.25537109375, -0.119140625, 0.01708984375, 0.1533203125, 0.28955078125, 0.42578125, 0.56201171875, 0.6982421875, 0.83447265625, 0.970703125, 1.10693359375, 1.2431640625, 1.37939453125, 1.515625, 1.65185546875, 1.7880859375, 1.92431640625, 2.060546875, 2.19677734375, 2.3330078125, 2.46923828125, 2.60546875, 2.74169921875, 2.8779296875, 3.01416015625, 3.150390625, 3.28662109375, 3.4228515625, 3.55908203125, 3.6953125, 3.83154296875, 3.9677734375, 4.10400390625, 4.240234375, 4.37646484375, 4.5126953125, 4.64892578125, 4.78515625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 5.0, 4.0, 14.0, 10.0, 27.0, 31.0, 35.0, 55.0, 96.0, 140.0, 218.0, 489.0, 871.0, 2081.0, 6880.0, 30870.0, 272511.0, 3409860.0, 416115.0, 40825.0, 8569.0, 2562.0, 917.0, 441.0, 246.0, 137.0, 84.0, 60.0, 46.0, 35.0, 18.0, 18.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.46875, -19.876708984375, -19.28466796875, -18.692626953125, -18.1005859375, -17.508544921875, -16.91650390625, -16.324462890625, -15.732421875, -15.140380859375, -14.54833984375, -13.956298828125, -13.3642578125, -12.772216796875, -12.18017578125, -11.588134765625, -10.99609375, -10.404052734375, -9.81201171875, -9.219970703125, -8.6279296875, -8.035888671875, -7.44384765625, -6.851806640625, -6.259765625, -5.667724609375, -5.07568359375, -4.483642578125, -3.8916015625, -3.299560546875, -2.70751953125, -2.115478515625, -1.5234375, -0.931396484375, -0.33935546875, 0.252685546875, 0.8447265625, 1.436767578125, 2.02880859375, 2.620849609375, 3.212890625, 3.804931640625, 4.39697265625, 4.989013671875, 5.5810546875, 6.173095703125, 6.76513671875, 7.357177734375, 7.94921875, 8.541259765625, 9.13330078125, 9.725341796875, 10.3173828125, 10.909423828125, 11.50146484375, 12.093505859375, 12.685546875, 13.277587890625, 13.86962890625, 14.461669921875, 15.0537109375, 15.645751953125, 16.23779296875, 16.829833984375, 17.421875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 4.0, 9.0, 11.0, 15.0, 24.0, 24.0, 35.0, 38.0, 71.0, 96.0, 118.0, 143.0, 259.0, 326.0, 453.0, 573.0, 503.0, 390.0, 274.0, 198.0, 139.0, 92.0, 79.0, 55.0, 39.0, 33.0, 21.0, 15.0, 10.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8671875, -10.5338134765625, -10.200439453125, -9.8670654296875, -9.53369140625, -9.2003173828125, -8.866943359375, -8.5335693359375, -8.2001953125, -7.8668212890625, -7.533447265625, -7.2000732421875, -6.86669921875, -6.5333251953125, -6.199951171875, -5.8665771484375, -5.533203125, -5.1998291015625, -4.866455078125, -4.5330810546875, -4.19970703125, -3.8663330078125, -3.532958984375, -3.1995849609375, -2.8662109375, -2.5328369140625, -2.199462890625, -1.8660888671875, -1.53271484375, -1.1993408203125, -0.865966796875, -0.5325927734375, -0.19921875, 0.1341552734375, 0.467529296875, 0.8009033203125, 1.13427734375, 1.4676513671875, 1.801025390625, 2.1343994140625, 2.4677734375, 2.8011474609375, 3.134521484375, 3.4678955078125, 3.80126953125, 4.1346435546875, 4.468017578125, 4.8013916015625, 5.134765625, 5.4681396484375, 5.801513671875, 6.1348876953125, 6.46826171875, 6.8016357421875, 7.135009765625, 7.4683837890625, 7.8017578125, 8.1351318359375, 8.468505859375, 8.8018798828125, 9.13525390625, 9.4686279296875, 9.802001953125, 10.1353759765625, 10.46875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 12.0, 12.0, 19.0, 45.0, 70.0, 83.0, 149.0, 244.0, 369.0, 624.0, 1063.0, 2008.0, 4012.0, 8599.0, 20123.0, 54053.0, 173617.0, 710912.0, 2291608.0, 672942.0, 165671.0, 52058.0, 19403.0, 8184.0, 3747.0, 1950.0, 1108.0, 601.0, 369.0, 218.0, 149.0, 79.0, 54.0, 45.0, 27.0, 16.0, 17.0, 6.0, 0.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.390625, -11.9703369140625, -11.550048828125, -11.1297607421875, -10.70947265625, -10.2891845703125, -9.868896484375, -9.4486083984375, -9.0283203125, -8.6080322265625, -8.187744140625, -7.7674560546875, -7.34716796875, -6.9268798828125, -6.506591796875, -6.0863037109375, -5.666015625, -5.2457275390625, -4.825439453125, -4.4051513671875, -3.98486328125, -3.5645751953125, -3.144287109375, -2.7239990234375, -2.3037109375, -1.8834228515625, -1.463134765625, -1.0428466796875, -0.62255859375, -0.2022705078125, 0.218017578125, 0.6383056640625, 1.05859375, 1.4788818359375, 1.899169921875, 2.3194580078125, 2.73974609375, 3.1600341796875, 3.580322265625, 4.0006103515625, 4.4208984375, 4.8411865234375, 5.261474609375, 5.6817626953125, 6.10205078125, 6.5223388671875, 6.942626953125, 7.3629150390625, 7.783203125, 8.2034912109375, 8.623779296875, 9.0440673828125, 9.46435546875, 9.8846435546875, 10.304931640625, 10.7252197265625, 11.1455078125, 11.5657958984375, 11.986083984375, 12.4063720703125, 12.82666015625, 13.2469482421875, 13.667236328125, 14.0875244140625, 14.5078125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 11.0, 15.0, 40.0, 79.0, 114.0, 136.0, 161.0, 150.0, 111.0, 88.0, 50.0, 21.0, 16.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-107.01962280273438, -104.02365112304688, -101.0276870727539, -98.0317153930664, -95.0357437133789, -92.0397720336914, -89.04380798339844, -86.04783630371094, -83.05186462402344, -80.05589294433594, -77.05992889404297, -74.06395721435547, -71.06798553466797, -68.07201385498047, -65.0760498046875, -62.080078125, -59.084110260009766, -56.08814239501953, -53.09217071533203, -50.0962028503418, -47.1002311706543, -44.10426330566406, -41.10829162597656, -38.11232376098633, -35.116355895996094, -32.12038803100586, -29.12441635131836, -26.128448486328125, -23.132476806640625, -20.13650894165039, -17.140539169311523, -14.144569396972656, -11.148597717285156, -8.152627944946289, -5.15665864944458, -2.160689353942871, 0.8352804183959961, 3.8312501907348633, 6.827219009399414, 9.823188781738281, 12.819158554077148, 15.815128326416016, 18.811098098754883, 21.80706787109375, 24.803035736083984, 27.799007415771484, 30.79497528076172, 33.79094696044922, 36.78691482543945, 39.78288269042969, 42.77885437011719, 45.77482223510742, 48.77079391479492, 51.766761779785156, 54.762733459472656, 57.75870132446289, 60.754669189453125, 63.75063705444336, 66.7466049194336, 69.7425765991211, 72.7385482788086, 75.7345199584961, 78.73048400878906, 81.72645568847656, 84.72242736816406]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 2.0, 2.0, 5.0, 9.0, 8.0, 10.0, 12.0, 16.0, 20.0, 20.0, 18.0, 24.0, 25.0, 30.0, 40.0, 27.0, 29.0, 43.0, 34.0, 38.0, 37.0, 42.0, 30.0, 49.0, 41.0, 45.0, 36.0, 39.0, 31.0, 23.0, 30.0, 29.0, 17.0, 18.0, 27.0, 14.0, 12.0, 16.0, 15.0, 8.0, 7.0, 5.0, 5.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-34.2264404296875, -33.20804214477539, -32.18964767456055, -31.17125129699707, -30.152854919433594, -29.134456634521484, -28.116060256958008, -27.09766387939453, -26.079267501831055, -25.060871124267578, -24.0424747467041, -23.024078369140625, -22.005680084228516, -20.987285614013672, -19.968887329101562, -18.950490951538086, -17.93209457397461, -16.913698196411133, -15.895301818847656, -14.876904487609863, -13.858508110046387, -12.84011173248291, -11.821714401245117, -10.80331802368164, -9.784921646118164, -8.766525268554688, -7.748128414154053, -6.729731559753418, -5.711335182189941, -4.692938804626465, -3.67454195022583, -2.6561450958251953, -1.6377487182617188, -0.6193521022796631, 0.3990445137023926, 1.4174411296844482, 2.435837745666504, 3.4542341232299805, 4.472630977630615, 5.49102783203125, 6.509424209594727, 7.527820587158203, 8.54621696472168, 9.564614295959473, 10.58301067352295, 11.601407051086426, 12.619804382324219, 13.638200759887695, 14.656597137451172, 15.674993515014648, 16.693389892578125, 17.7117862701416, 18.730182647705078, 19.748580932617188, 20.766977310180664, 21.78537368774414, 22.803770065307617, 23.822166442871094, 24.84056282043457, 25.858959197998047, 26.877357482910156, 27.895751953125, 28.91415023803711, 29.932546615600586, 30.950942993164062]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 10.0, 7.0, 12.0, 12.0, 14.0, 19.0, 11.0, 24.0, 23.0, 38.0, 48.0, 49.0, 34.0, 43.0, 54.0, 43.0, 63.0, 63.0, 57.0, 37.0, 48.0, 42.0, 40.0, 29.0, 35.0, 23.0, 25.0, 23.0, 13.0, 12.0, 7.0, 5.0, 5.0, 8.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.47265625, -4.33099365234375, -4.1893310546875, -4.04766845703125, -3.906005859375, -3.76434326171875, -3.6226806640625, -3.48101806640625, -3.33935546875, -3.19769287109375, -3.0560302734375, -2.91436767578125, -2.772705078125, -2.63104248046875, -2.4893798828125, -2.34771728515625, -2.2060546875, -2.06439208984375, -1.9227294921875, -1.78106689453125, -1.639404296875, -1.49774169921875, -1.3560791015625, -1.21441650390625, -1.07275390625, -0.93109130859375, -0.7894287109375, -0.64776611328125, -0.506103515625, -0.36444091796875, -0.2227783203125, -0.08111572265625, 0.060546875, 0.20220947265625, 0.3438720703125, 0.48553466796875, 0.627197265625, 0.76885986328125, 0.9105224609375, 1.05218505859375, 1.19384765625, 1.33551025390625, 1.4771728515625, 1.61883544921875, 1.760498046875, 1.90216064453125, 2.0438232421875, 2.18548583984375, 2.3271484375, 2.46881103515625, 2.6104736328125, 2.75213623046875, 2.893798828125, 3.03546142578125, 3.1771240234375, 3.31878662109375, 3.46044921875, 3.60211181640625, 3.7437744140625, 3.88543701171875, 4.027099609375, 4.16876220703125, 4.3104248046875, 4.45208740234375, 4.59375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 7.0, 15.0, 16.0, 28.0, 33.0, 44.0, 95.0, 121.0, 151.0, 230.0, 345.0, 572.0, 790.0, 1283.0, 1993.0, 3209.0, 5252.0, 8830.0, 15010.0, 26915.0, 51252.0, 106727.0, 291301.0, 304120.0, 110772.0, 52800.0, 27622.0, 15670.0, 8928.0, 5266.0, 3230.0, 2038.0, 1354.0, 821.0, 561.0, 361.0, 245.0, 174.0, 109.0, 85.0, 54.0, 42.0, 21.0, 15.0, 15.0, 7.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1788330078125, -0.173248291015625, -0.16766357421875, -0.162078857421875, -0.156494140625, -0.150909423828125, -0.14532470703125, -0.139739990234375, -0.1341552734375, -0.128570556640625, -0.12298583984375, -0.117401123046875, -0.11181640625, -0.106231689453125, -0.10064697265625, -0.095062255859375, -0.0894775390625, -0.083892822265625, -0.07830810546875, -0.072723388671875, -0.067138671875, -0.061553955078125, -0.05596923828125, -0.050384521484375, -0.0447998046875, -0.039215087890625, -0.03363037109375, -0.028045654296875, -0.0224609375, -0.016876220703125, -0.01129150390625, -0.005706787109375, -0.0001220703125, 0.005462646484375, 0.01104736328125, 0.016632080078125, 0.022216796875, 0.027801513671875, 0.03338623046875, 0.038970947265625, 0.0445556640625, 0.050140380859375, 0.05572509765625, 0.061309814453125, 0.06689453125, 0.072479248046875, 0.07806396484375, 0.083648681640625, 0.0892333984375, 0.094818115234375, 0.10040283203125, 0.105987548828125, 0.111572265625, 0.117156982421875, 0.12274169921875, 0.128326416015625, 0.1339111328125, 0.139495849609375, 0.14508056640625, 0.150665283203125, 0.15625, 0.161834716796875, 0.16741943359375, 0.173004150390625, 0.1785888671875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 7.0, 13.0, 5.0, 13.0, 13.0, 12.0, 16.0, 28.0, 27.0, 25.0, 39.0, 34.0, 43.0, 38.0, 38.0, 38.0, 34.0, 1063.0, 33.0, 44.0, 50.0, 31.0, 33.0, 37.0, 41.0, 30.0, 37.0, 31.0, 22.0, 18.0, 17.0, 13.0, 21.0, 10.0, 16.0, 9.0, 11.0, 7.0, 6.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.716796875, -2.63177490234375, -2.5467529296875, -2.46173095703125, -2.376708984375, -2.29168701171875, -2.2066650390625, -2.12164306640625, -2.03662109375, -1.95159912109375, -1.8665771484375, -1.78155517578125, -1.696533203125, -1.61151123046875, -1.5264892578125, -1.44146728515625, -1.3564453125, -1.27142333984375, -1.1864013671875, -1.10137939453125, -1.016357421875, -0.93133544921875, -0.8463134765625, -0.76129150390625, -0.67626953125, -0.59124755859375, -0.5062255859375, -0.42120361328125, -0.336181640625, -0.25115966796875, -0.1661376953125, -0.08111572265625, 0.00390625, 0.08892822265625, 0.1739501953125, 0.25897216796875, 0.343994140625, 0.42901611328125, 0.5140380859375, 0.59906005859375, 0.68408203125, 0.76910400390625, 0.8541259765625, 0.93914794921875, 1.024169921875, 1.10919189453125, 1.1942138671875, 1.27923583984375, 1.3642578125, 1.44927978515625, 1.5343017578125, 1.61932373046875, 1.704345703125, 1.78936767578125, 1.8743896484375, 1.95941162109375, 2.04443359375, 2.12945556640625, 2.2144775390625, 2.29949951171875, 2.384521484375, 2.46954345703125, 2.5545654296875, 2.63958740234375, 2.724609375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 10.0, 5.0, 12.0, 23.0, 37.0, 51.0, 71.0, 111.0, 202.0, 317.0, 464.0, 761.0, 1179.0, 1870.0, 2889.0, 4740.0, 7753.0, 12763.0, 21273.0, 36231.0, 65661.0, 127659.0, 1324445.0, 240167.0, 108662.0, 57744.0, 32338.0, 19404.0, 11401.0, 7089.0, 4390.0, 2716.0, 1700.0, 1099.0, 684.0, 439.0, 260.0, 180.0, 106.0, 78.0, 52.0, 34.0, 27.0, 10.0, 11.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0982666015625, -0.0951852798461914, -0.09210395812988281, -0.08902263641357422, -0.08594131469726562, -0.08285999298095703, -0.07977867126464844, -0.07669734954833984, -0.07361602783203125, -0.07053470611572266, -0.06745338439941406, -0.06437206268310547, -0.061290740966796875, -0.05820941925048828, -0.05512809753417969, -0.052046775817871094, -0.0489654541015625, -0.045884132385253906, -0.04280281066894531, -0.03972148895263672, -0.036640167236328125, -0.03355884552001953, -0.030477523803710938, -0.027396202087402344, -0.02431488037109375, -0.021233558654785156, -0.018152236938476562, -0.015070915222167969, -0.011989593505859375, -0.008908271789550781, -0.0058269500732421875, -0.0027456283569335938, 0.000335693359375, 0.0034170150756835938, 0.0064983367919921875, 0.009579658508300781, 0.012660980224609375, 0.01574230194091797, 0.018823623657226562, 0.021904945373535156, 0.02498626708984375, 0.028067588806152344, 0.031148910522460938, 0.03423023223876953, 0.037311553955078125, 0.04039287567138672, 0.04347419738769531, 0.046555519104003906, 0.0496368408203125, 0.052718162536621094, 0.05579948425292969, 0.05888080596923828, 0.061962127685546875, 0.06504344940185547, 0.06812477111816406, 0.07120609283447266, 0.07428741455078125, 0.07736873626708984, 0.08045005798339844, 0.08353137969970703, 0.08661270141601562, 0.08969402313232422, 0.09277534484863281, 0.0958566665649414, 0.09893798828125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 9.0, 9.0, 13.0, 19.0, 29.0, 24.0, 32.0, 25.0, 37.0, 42.0, 40.0, 57.0, 68.0, 57.0, 53.0, 61.0, 53.0, 42.0, 41.0, 41.0, 36.0, 33.0, 34.0, 30.0, 27.0, 14.0, 13.0, 18.0, 8.0, 8.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.875659942626953e-05, -4.7369860112667084e-05, -4.5983120799064636e-05, -4.459638148546219e-05, -4.320964217185974e-05, -4.1822902858257294e-05, -4.0436163544654846e-05, -3.90494242310524e-05, -3.766268491744995e-05, -3.6275945603847504e-05, -3.4889206290245056e-05, -3.350246697664261e-05, -3.211572766304016e-05, -3.0728988349437714e-05, -2.9342249035835266e-05, -2.795550972223282e-05, -2.656877040863037e-05, -2.5182031095027924e-05, -2.3795291781425476e-05, -2.240855246782303e-05, -2.102181315422058e-05, -1.9635073840618134e-05, -1.8248334527015686e-05, -1.686159521341324e-05, -1.547485589981079e-05, -1.4088116586208344e-05, -1.2701377272605896e-05, -1.1314637959003448e-05, -9.927898645401001e-06, -8.541159331798553e-06, -7.154420018196106e-06, -5.7676807045936584e-06, -4.380941390991211e-06, -2.9942020773887634e-06, -1.607462763786316e-06, -2.207234501838684e-07, 1.166015863418579e-06, 2.5527551770210266e-06, 3.939494490623474e-06, 5.326233804225922e-06, 6.712973117828369e-06, 8.099712431430817e-06, 9.486451745033264e-06, 1.0873191058635712e-05, 1.225993037223816e-05, 1.3646669685840607e-05, 1.5033408999443054e-05, 1.6420148313045502e-05, 1.780688762664795e-05, 1.9193626940250397e-05, 2.0580366253852844e-05, 2.1967105567455292e-05, 2.335384488105774e-05, 2.4740584194660187e-05, 2.6127323508262634e-05, 2.7514062821865082e-05, 2.890080213546753e-05, 3.0287541449069977e-05, 3.1674280762672424e-05, 3.306102007627487e-05, 3.444775938987732e-05, 3.583449870347977e-05, 3.7221238017082214e-05, 3.860797733068466e-05, 3.999471664428711e-05]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 14.0, 12.0, 14.0, 15.0, 19.0, 22.0, 16.0, 27.0, 32.0, 43.0, 61.0, 105.0, 162.0, 372.0, 1433.0, 19053.0, 409140.0, 580801.0, 34058.0, 2136.0, 451.0, 176.0, 107.0, 62.0, 52.0, 34.0, 30.0, 23.0, 25.0, 14.0, 16.0, 5.0, 0.0, 10.0, 4.0, 1.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006575584411621094, -0.0006357058882713318, -0.0006138533353805542, -0.0005920007824897766, -0.000570148229598999, -0.0005482956767082214, -0.0005264431238174438, -0.0005045905709266663, -0.00048273801803588867, -0.0004608854651451111, -0.0004390329122543335, -0.0004171803593635559, -0.0003953278064727783, -0.00037347525358200073, -0.00035162270069122314, -0.00032977014780044556, -0.00030791759490966797, -0.0002860650420188904, -0.0002642124891281128, -0.0002423599362373352, -0.00022050738334655762, -0.00019865483045578003, -0.00017680227756500244, -0.00015494972467422485, -0.00013309717178344727, -0.00011124461889266968, -8.939206600189209e-05, -6.75395131111145e-05, -4.5686960220336914e-05, -2.3834407329559326e-05, -1.9818544387817383e-06, 1.987069845199585e-05, 4.172325134277344e-05, 6.357580423355103e-05, 8.542835712432861e-05, 0.0001072809100151062, 0.0001291334629058838, 0.00015098601579666138, 0.00017283856868743896, 0.00019469112157821655, 0.00021654367446899414, 0.00023839622735977173, 0.0002602487802505493, 0.0002821013331413269, 0.0003039538860321045, 0.0003258064389228821, 0.00034765899181365967, 0.00036951154470443726, 0.00039136409759521484, 0.00041321665048599243, 0.00043506920337677, 0.0004569217562675476, 0.0004787743091583252, 0.0005006268620491028, 0.0005224794149398804, 0.000544331967830658, 0.0005661845207214355, 0.0005880370736122131, 0.0006098896265029907, 0.0006317421793937683, 0.0006535947322845459, 0.0006754472851753235, 0.0006972998380661011, 0.0007191523909568787, 0.0007410049438476562]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 15.0, 30.0, 63.0, 150.0, 229.0, 244.0, 165.0, 69.0, 28.0, 13.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.304213482304476e-05, -4.825156429433264e-05, -4.346099740359932e-05, -3.86704268748872e-05, -3.3879856346175075e-05, -2.908928581746295e-05, -2.429871710774023e-05, -1.950814839801751e-05, -1.4717577869305387e-05, -9.927008250087965e-06, -5.136438630870543e-06, -3.4586901165312156e-07, 4.4447006075643e-06, 9.235271136276424e-06, 1.4025839845999144e-05, 1.8816408555721864e-05, 2.3606979084433988e-05, 2.839754961314611e-05, 3.318811650387943e-05, 3.797868703259155e-05, 4.2769257561303675e-05, 4.75598280900158e-05, 5.235039861872792e-05, 5.714096550946124e-05, 6.193153967615217e-05, 6.67221102048643e-05, 7.151268073357642e-05, 7.630325126228854e-05, 8.109382179100066e-05, 8.588438504375517e-05, 9.06749555724673e-05, 9.546552610117942e-05, 0.00010025608935393393, 0.00010504665988264605, 0.00010983723041135818, 0.0001146278009400703, 0.00011941837146878242, 0.00012420893472153693, 0.00012899951252620667, 0.00013379007577896118, 0.00013858065358363092, 0.00014337121683638543, 0.00014816179464105517, 0.00015295235789380968, 0.00015774293569847941, 0.00016253349895123392, 0.00016732407675590366, 0.00017211464000865817, 0.00017690520326141268, 0.0001816957665141672, 0.00018648634431883693, 0.00019127690757159144, 0.00019606748537626117, 0.00020085804862901568, 0.00020564862643368542, 0.00021043918968643993, 0.00021522975293919444, 0.00022002031619194895, 0.0002248108939966187, 0.0002296014572493732, 0.00023439203505404294, 0.00023918259830679744, 0.00024397317611146718, 0.0002487637393642217, 0.00025355431716889143]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 4.0, 8.0, 9.0, 7.0, 11.0, 9.0, 21.0, 23.0, 21.0, 18.0, 27.0, 22.0, 36.0, 38.0, 31.0, 40.0, 41.0, 54.0, 48.0, 43.0, 54.0, 45.0, 26.0, 38.0, 50.0, 46.0, 26.0, 28.0, 29.0, 27.0, 18.0, 16.0, 18.0, 18.0, 12.0, 11.0, 6.0, 9.0, 6.0, 1.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.0279159545898438e-05, -2.928357571363449e-05, -2.8287991881370544e-05, -2.7292408049106598e-05, -2.629682421684265e-05, -2.5301240384578705e-05, -2.4305656552314758e-05, -2.3310072720050812e-05, -2.2314488887786865e-05, -2.131890505552292e-05, -2.0323321223258972e-05, -1.9327737390995026e-05, -1.833215355873108e-05, -1.7336569726467133e-05, -1.6340985894203186e-05, -1.534540206193924e-05, -1.4349818229675293e-05, -1.3354234397411346e-05, -1.23586505651474e-05, -1.1363066732883453e-05, -1.0367482900619507e-05, -9.37189906835556e-06, -8.376315236091614e-06, -7.380731403827667e-06, -6.385147571563721e-06, -5.389563739299774e-06, -4.393979907035828e-06, -3.398396074771881e-06, -2.4028122425079346e-06, -1.407228410243988e-06, -4.116445779800415e-07, 5.83939254283905e-07, 1.5795230865478516e-06, 2.575106918811798e-06, 3.5706907510757446e-06, 4.566274583339691e-06, 5.561858415603638e-06, 6.557442247867584e-06, 7.553026080131531e-06, 8.548609912395477e-06, 9.544193744659424e-06, 1.053977757692337e-05, 1.1535361409187317e-05, 1.2530945241451263e-05, 1.352652907371521e-05, 1.4522112905979156e-05, 1.5517696738243103e-05, 1.651328057050705e-05, 1.7508864402770996e-05, 1.8504448235034943e-05, 1.950003206729889e-05, 2.0495615899562836e-05, 2.1491199731826782e-05, 2.248678356409073e-05, 2.3482367396354675e-05, 2.4477951228618622e-05, 2.547353506088257e-05, 2.6469118893146515e-05, 2.746470272541046e-05, 2.8460286557674408e-05, 2.9455870389938354e-05, 3.04514542222023e-05, 3.144703805446625e-05, 3.2442621886730194e-05, 3.343820571899414e-05]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 10.0, 7.0, 12.0, 12.0, 14.0, 19.0, 11.0, 24.0, 23.0, 38.0, 48.0, 49.0, 34.0, 43.0, 54.0, 43.0, 63.0, 63.0, 57.0, 37.0, 48.0, 42.0, 40.0, 29.0, 35.0, 23.0, 25.0, 23.0, 13.0, 12.0, 7.0, 5.0, 5.0, 8.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.47265625, -4.33099365234375, -4.1893310546875, -4.04766845703125, -3.906005859375, -3.76434326171875, -3.6226806640625, -3.48101806640625, -3.33935546875, -3.19769287109375, -3.0560302734375, -2.91436767578125, -2.772705078125, -2.63104248046875, -2.4893798828125, -2.34771728515625, -2.2060546875, -2.06439208984375, -1.9227294921875, -1.78106689453125, -1.639404296875, -1.49774169921875, -1.3560791015625, -1.21441650390625, -1.07275390625, -0.93109130859375, -0.7894287109375, -0.64776611328125, -0.506103515625, -0.36444091796875, -0.2227783203125, -0.08111572265625, 0.060546875, 0.20220947265625, 0.3438720703125, 0.48553466796875, 0.627197265625, 0.76885986328125, 0.9105224609375, 1.05218505859375, 1.19384765625, 1.33551025390625, 1.4771728515625, 1.61883544921875, 1.760498046875, 1.90216064453125, 2.0438232421875, 2.18548583984375, 2.3271484375, 2.46881103515625, 2.6104736328125, 2.75213623046875, 2.893798828125, 3.03546142578125, 3.1771240234375, 3.31878662109375, 3.46044921875, 3.60211181640625, 3.7437744140625, 3.88543701171875, 4.027099609375, 4.16876220703125, 4.3104248046875, 4.45208740234375, 4.59375]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 8.0, 5.0, 4.0, 15.0, 8.0, 16.0, 14.0, 27.0, 36.0, 41.0, 68.0, 91.0, 166.0, 234.0, 484.0, 1029.0, 2487.0, 8328.0, 41038.0, 798738.0, 166975.0, 20407.0, 4903.0, 1705.0, 723.0, 396.0, 194.0, 124.0, 72.0, 58.0, 50.0, 22.0, 19.0, 11.0, 16.0, 12.0, 10.0, 2.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5859375, -13.1141357421875, -12.642333984375, -12.1705322265625, -11.69873046875, -11.2269287109375, -10.755126953125, -10.2833251953125, -9.8115234375, -9.3397216796875, -8.867919921875, -8.3961181640625, -7.92431640625, -7.4525146484375, -6.980712890625, -6.5089111328125, -6.037109375, -5.5653076171875, -5.093505859375, -4.6217041015625, -4.14990234375, -3.6781005859375, -3.206298828125, -2.7344970703125, -2.2626953125, -1.7908935546875, -1.319091796875, -0.8472900390625, -0.37548828125, 0.0963134765625, 0.568115234375, 1.0399169921875, 1.51171875, 1.9835205078125, 2.455322265625, 2.9271240234375, 3.39892578125, 3.8707275390625, 4.342529296875, 4.8143310546875, 5.2861328125, 5.7579345703125, 6.229736328125, 6.7015380859375, 7.17333984375, 7.6451416015625, 8.116943359375, 8.5887451171875, 9.060546875, 9.5323486328125, 10.004150390625, 10.4759521484375, 10.94775390625, 11.4195556640625, 11.891357421875, 12.3631591796875, 12.8349609375, 13.3067626953125, 13.778564453125, 14.2503662109375, 14.72216796875, 15.1939697265625, 15.665771484375, 16.1375732421875, 16.609375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 0.0, 4.0, 3.0, 7.0, 6.0, 15.0, 8.0, 9.0, 22.0, 14.0, 28.0, 25.0, 34.0, 19.0, 23.0, 44.0, 35.0, 33.0, 52.0, 52.0, 95.0, 191.0, 1679.0, 132.0, 84.0, 57.0, 47.0, 42.0, 38.0, 33.0, 39.0, 21.0, 31.0, 13.0, 20.0, 17.0, 12.0, 14.0, 13.0, 12.0, 8.0, 5.0, 11.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5, -13.08203125, -12.6640625, -12.24609375, -11.828125, -11.41015625, -10.9921875, -10.57421875, -10.15625, -9.73828125, -9.3203125, -8.90234375, -8.484375, -8.06640625, -7.6484375, -7.23046875, -6.8125, -6.39453125, -5.9765625, -5.55859375, -5.140625, -4.72265625, -4.3046875, -3.88671875, -3.46875, -3.05078125, -2.6328125, -2.21484375, -1.796875, -1.37890625, -0.9609375, -0.54296875, -0.125, 0.29296875, 0.7109375, 1.12890625, 1.546875, 1.96484375, 2.3828125, 2.80078125, 3.21875, 3.63671875, 4.0546875, 4.47265625, 4.890625, 5.30859375, 5.7265625, 6.14453125, 6.5625, 6.98046875, 7.3984375, 7.81640625, 8.234375, 8.65234375, 9.0703125, 9.48828125, 9.90625, 10.32421875, 10.7421875, 11.16015625, 11.578125, 11.99609375, 12.4140625, 12.83203125, 13.25]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 6.0, 8.0, 8.0, 10.0, 8.0, 14.0, 10.0, 18.0, 22.0, 19.0, 37.0, 50.0, 70.0, 94.0, 128.0, 205.0, 338.0, 943.0, 3496.0, 19726.0, 223352.0, 2811749.0, 72684.0, 9216.0, 2017.0, 616.0, 266.0, 166.0, 104.0, 75.0, 50.0, 40.0, 33.0, 30.0, 22.0, 21.0, 11.0, 12.0, 12.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-26.46875, -25.673828125, -24.87890625, -24.083984375, -23.2890625, -22.494140625, -21.69921875, -20.904296875, -20.109375, -19.314453125, -18.51953125, -17.724609375, -16.9296875, -16.134765625, -15.33984375, -14.544921875, -13.75, -12.955078125, -12.16015625, -11.365234375, -10.5703125, -9.775390625, -8.98046875, -8.185546875, -7.390625, -6.595703125, -5.80078125, -5.005859375, -4.2109375, -3.416015625, -2.62109375, -1.826171875, -1.03125, -0.236328125, 0.55859375, 1.353515625, 2.1484375, 2.943359375, 3.73828125, 4.533203125, 5.328125, 6.123046875, 6.91796875, 7.712890625, 8.5078125, 9.302734375, 10.09765625, 10.892578125, 11.6875, 12.482421875, 13.27734375, 14.072265625, 14.8671875, 15.662109375, 16.45703125, 17.251953125, 18.046875, 18.841796875, 19.63671875, 20.431640625, 21.2265625, 22.021484375, 22.81640625, 23.611328125, 24.40625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [2.0, 44.0, 320.0, 533.0, 116.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.23528480529785, -13.414440155029297, -7.593595504760742, -1.7727508544921875, 4.048093795776367, 9.868938446044922, 15.689783096313477, 21.5106258392334, 27.331472396850586, 33.15231704711914, 38.97315979003906, 44.79400634765625, 50.61485290527344, 56.43569564819336, 62.25653839111328, 68.07738494873047, 73.89823150634766, 79.71907806396484, 85.5399169921875, 91.36076354980469, 97.18161010742188, 103.00245666503906, 108.82330322265625, 114.6441421508789, 120.4649887084961, 126.28583526611328, 132.10667419433594, 137.92752075195312, 143.7483673095703, 149.5692138671875, 155.3900604248047, 161.21090698242188, 167.03173828125, 172.8525848388672, 178.67343139648438, 184.49427795410156, 190.31512451171875, 196.13595581054688, 201.95680236816406, 207.77764892578125, 213.59849548339844, 219.41934204101562, 225.2401885986328, 231.06103515625, 236.88186645507812, 242.7027130126953, 248.5235595703125, 254.3444061279297, 260.1652526855469, 265.986083984375, 271.80694580078125, 277.6277770996094, 283.4486389160156, 289.26947021484375, 295.09033203125, 300.9111633300781, 306.73199462890625, 312.5528259277344, 318.3736877441406, 324.19451904296875, 330.015380859375, 335.8362121582031, 341.6570739746094, 347.4779052734375, 353.29876708984375]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 8.0, 6.0, 10.0, 3.0, 15.0, 13.0, 15.0, 12.0, 15.0, 15.0, 25.0, 28.0, 20.0, 20.0, 26.0, 27.0, 28.0, 32.0, 32.0, 34.0, 35.0, 47.0, 39.0, 33.0, 46.0, 32.0, 38.0, 33.0, 40.0, 33.0, 25.0, 30.0, 26.0, 26.0, 22.0, 17.0, 15.0, 17.0, 12.0, 7.0, 10.0, 3.0, 6.0, 4.0, 6.0, 3.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-33.14991760253906, -32.12135696411133, -31.092798233032227, -30.064239501953125, -29.03567886352539, -28.007118225097656, -26.978559494018555, -25.950000762939453, -24.92144012451172, -23.892879486083984, -22.864320755004883, -21.83576202392578, -20.807201385498047, -19.778640747070312, -18.75008201599121, -17.72152328491211, -16.692962646484375, -15.664402961730957, -14.635843276977539, -13.607283592224121, -12.578723907470703, -11.550164222717285, -10.521604537963867, -9.49304485321045, -8.464485168457031, -7.435925483703613, -6.407365798950195, -5.378806114196777, -4.350246429443359, -3.3216867446899414, -2.2931270599365234, -1.2645673751831055, -0.2360076904296875, 0.7925519943237305, 1.8211116790771484, 2.8496713638305664, 3.8782310485839844, 4.906790733337402, 5.93535041809082, 6.963910102844238, 7.992469787597656, 9.021029472351074, 10.049589157104492, 11.07814884185791, 12.106708526611328, 13.135268211364746, 14.163827896118164, 15.192387580871582, 16.220947265625, 17.249507904052734, 18.278066635131836, 19.306625366210938, 20.335186004638672, 21.363746643066406, 22.392305374145508, 23.42086410522461, 24.449424743652344, 25.477985382080078, 26.50654411315918, 27.53510284423828, 28.563663482666016, 29.59222412109375, 30.62078285217285, 31.649341583251953, 32.67790222167969]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 3.0, 16.0, 6.0, 9.0, 15.0, 14.0, 17.0, 18.0, 22.0, 29.0, 31.0, 45.0, 50.0, 48.0, 43.0, 35.0, 54.0, 67.0, 73.0, 50.0, 40.0, 59.0, 34.0, 35.0, 32.0, 34.0, 20.0, 21.0, 18.0, 17.0, 9.0, 6.0, 10.0, 5.0, 8.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.9375, -4.784912109375, -4.63232421875, -4.479736328125, -4.3271484375, -4.174560546875, -4.02197265625, -3.869384765625, -3.716796875, -3.564208984375, -3.41162109375, -3.259033203125, -3.1064453125, -2.953857421875, -2.80126953125, -2.648681640625, -2.49609375, -2.343505859375, -2.19091796875, -2.038330078125, -1.8857421875, -1.733154296875, -1.58056640625, -1.427978515625, -1.275390625, -1.122802734375, -0.97021484375, -0.817626953125, -0.6650390625, -0.512451171875, -0.35986328125, -0.207275390625, -0.0546875, 0.097900390625, 0.25048828125, 0.403076171875, 0.5556640625, 0.708251953125, 0.86083984375, 1.013427734375, 1.166015625, 1.318603515625, 1.47119140625, 1.623779296875, 1.7763671875, 1.928955078125, 2.08154296875, 2.234130859375, 2.38671875, 2.539306640625, 2.69189453125, 2.844482421875, 2.9970703125, 3.149658203125, 3.30224609375, 3.454833984375, 3.607421875, 3.760009765625, 3.91259765625, 4.065185546875, 4.2177734375, 4.370361328125, 4.52294921875, 4.675537109375, 4.828125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 7.0, 13.0, 16.0, 19.0, 18.0, 29.0, 54.0, 67.0, 103.0, 149.0, 205.0, 365.0, 592.0, 1222.0, 2686.0, 6845.0, 22918.0, 114857.0, 1381724.0, 2435739.0, 178863.0, 32382.0, 8993.0, 3184.0, 1372.0, 749.0, 368.0, 235.0, 175.0, 99.0, 74.0, 46.0, 36.0, 20.0, 12.0, 9.0, 6.0, 4.0, 8.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-15.578125, -15.1214599609375, -14.664794921875, -14.2081298828125, -13.75146484375, -13.2947998046875, -12.838134765625, -12.3814697265625, -11.9248046875, -11.4681396484375, -11.011474609375, -10.5548095703125, -10.09814453125, -9.6414794921875, -9.184814453125, -8.7281494140625, -8.271484375, -7.8148193359375, -7.358154296875, -6.9014892578125, -6.44482421875, -5.9881591796875, -5.531494140625, -5.0748291015625, -4.6181640625, -4.1614990234375, -3.704833984375, -3.2481689453125, -2.79150390625, -2.3348388671875, -1.878173828125, -1.4215087890625, -0.96484375, -0.5081787109375, -0.051513671875, 0.4051513671875, 0.86181640625, 1.3184814453125, 1.775146484375, 2.2318115234375, 2.6884765625, 3.1451416015625, 3.601806640625, 4.0584716796875, 4.51513671875, 4.9718017578125, 5.428466796875, 5.8851318359375, 6.341796875, 6.7984619140625, 7.255126953125, 7.7117919921875, 8.16845703125, 8.6251220703125, 9.081787109375, 9.5384521484375, 9.9951171875, 10.4517822265625, 10.908447265625, 11.3651123046875, 11.82177734375, 12.2784423828125, 12.735107421875, 13.1917724609375, 13.6484375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 6.0, 9.0, 5.0, 7.0, 13.0, 17.0, 29.0, 33.0, 54.0, 60.0, 91.0, 124.0, 199.0, 305.0, 492.0, 649.0, 619.0, 422.0, 279.0, 186.0, 157.0, 83.0, 53.0, 53.0, 34.0, 28.0, 15.0, 19.0, 13.0, 5.0, 4.0, 5.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0], "bins": [-15.375, -14.9990234375, -14.623046875, -14.2470703125, -13.87109375, -13.4951171875, -13.119140625, -12.7431640625, -12.3671875, -11.9912109375, -11.615234375, -11.2392578125, -10.86328125, -10.4873046875, -10.111328125, -9.7353515625, -9.359375, -8.9833984375, -8.607421875, -8.2314453125, -7.85546875, -7.4794921875, -7.103515625, -6.7275390625, -6.3515625, -5.9755859375, -5.599609375, -5.2236328125, -4.84765625, -4.4716796875, -4.095703125, -3.7197265625, -3.34375, -2.9677734375, -2.591796875, -2.2158203125, -1.83984375, -1.4638671875, -1.087890625, -0.7119140625, -0.3359375, 0.0400390625, 0.416015625, 0.7919921875, 1.16796875, 1.5439453125, 1.919921875, 2.2958984375, 2.671875, 3.0478515625, 3.423828125, 3.7998046875, 4.17578125, 4.5517578125, 4.927734375, 5.3037109375, 5.6796875, 6.0556640625, 6.431640625, 6.8076171875, 7.18359375, 7.5595703125, 7.935546875, 8.3115234375, 8.6875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 6.0, 11.0, 14.0, 35.0, 45.0, 81.0, 127.0, 212.0, 442.0, 925.0, 2168.0, 6158.0, 22615.0, 121455.0, 1385244.0, 2421325.0, 189721.0, 30884.0, 7944.0, 2693.0, 1037.0, 527.0, 247.0, 131.0, 93.0, 40.0, 21.0, 30.0, 7.0, 6.0, 9.0, 7.0, 1.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.328125, -17.59814453125, -16.8681640625, -16.13818359375, -15.408203125, -14.67822265625, -13.9482421875, -13.21826171875, -12.48828125, -11.75830078125, -11.0283203125, -10.29833984375, -9.568359375, -8.83837890625, -8.1083984375, -7.37841796875, -6.6484375, -5.91845703125, -5.1884765625, -4.45849609375, -3.728515625, -2.99853515625, -2.2685546875, -1.53857421875, -0.80859375, -0.07861328125, 0.6513671875, 1.38134765625, 2.111328125, 2.84130859375, 3.5712890625, 4.30126953125, 5.03125, 5.76123046875, 6.4912109375, 7.22119140625, 7.951171875, 8.68115234375, 9.4111328125, 10.14111328125, 10.87109375, 11.60107421875, 12.3310546875, 13.06103515625, 13.791015625, 14.52099609375, 15.2509765625, 15.98095703125, 16.7109375, 17.44091796875, 18.1708984375, 18.90087890625, 19.630859375, 20.36083984375, 21.0908203125, 21.82080078125, 22.55078125, 23.28076171875, 24.0107421875, 24.74072265625, 25.470703125, 26.20068359375, 26.9306640625, 27.66064453125, 28.390625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 13.0, 33.0, 72.0, 128.0, 198.0, 206.0, 165.0, 100.0, 48.0, 23.0, 13.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.10198974609375, -78.23880767822266, -74.37561798095703, -70.51243591308594, -66.64924621582031, -62.78606414794922, -58.92287826538086, -55.0596923828125, -51.196510314941406, -47.33332443237305, -43.47013854980469, -39.606956481933594, -35.743770599365234, -31.880584716796875, -28.017398834228516, -24.15421485900879, -20.291027069091797, -16.427841186523438, -12.564657211303711, -8.701471328735352, -4.838286399841309, -0.9751014709472656, 2.8880844116210938, 6.75126838684082, 10.61445426940918, 14.477639198303223, 18.340824127197266, 22.204010009765625, 26.067195892333984, 29.93037986755371, 33.79356384277344, 37.6567497253418, 41.519935607910156, 45.383121490478516, 49.246307373046875, 53.10948944091797, 56.97267532348633, 60.83586120605469, 64.69905090332031, 68.5622329711914, 72.4254150390625, 76.2885971069336, 80.15178680419922, 84.01496887207031, 87.87815856933594, 91.74134063720703, 95.60452270507812, 99.46771240234375, 103.33090209960938, 107.19408416748047, 111.0572738647461, 114.92045593261719, 118.78364562988281, 122.6468276977539, 126.510009765625, 130.37319946289062, 134.2363739013672, 138.0995635986328, 141.96273803710938, 145.825927734375, 149.68911743164062, 153.55230712890625, 157.4154815673828, 161.27867126464844, 165.14186096191406]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 4.0, 5.0, 11.0, 9.0, 12.0, 9.0, 16.0, 14.0, 21.0, 23.0, 37.0, 30.0, 33.0, 30.0, 51.0, 49.0, 43.0, 37.0, 42.0, 44.0, 49.0, 48.0, 35.0, 51.0, 22.0, 31.0, 41.0, 37.0, 32.0, 25.0, 20.0, 13.0, 17.0, 12.0, 10.0, 5.0, 8.0, 6.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.405067443847656, -39.14799118041992, -37.89091491699219, -36.63383865356445, -35.37676239013672, -34.119686126708984, -32.86260986328125, -31.605533599853516, -30.34845733642578, -29.091381072998047, -27.834304809570312, -26.577228546142578, -25.320152282714844, -24.06307601928711, -22.805999755859375, -21.54892349243164, -20.291847229003906, -19.034770965576172, -17.777694702148438, -16.520618438720703, -15.263542175292969, -14.006465911865234, -12.7493896484375, -11.492313385009766, -10.235237121582031, -8.978160858154297, -7.7210845947265625, -6.464008331298828, -5.206932067871094, -3.9498558044433594, -2.692779541015625, -1.4357032775878906, -0.17862701416015625, 1.0784492492675781, 2.3355255126953125, 3.592601776123047, 4.849678039550781, 6.106754302978516, 7.36383056640625, 8.620906829833984, 9.877983093261719, 11.135059356689453, 12.392135620117188, 13.649211883544922, 14.906288146972656, 16.16336441040039, 17.420440673828125, 18.67751693725586, 19.934593200683594, 21.191669464111328, 22.448745727539062, 23.705821990966797, 24.96289825439453, 26.219974517822266, 27.47705078125, 28.734127044677734, 29.99120330810547, 31.248279571533203, 32.50535583496094, 33.76243209838867, 35.019508361816406, 36.27658462524414, 37.533660888671875, 38.79073715209961, 40.047813415527344]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 13.0, 16.0, 14.0, 7.0, 14.0, 16.0, 19.0, 23.0, 28.0, 44.0, 39.0, 43.0, 38.0, 40.0, 42.0, 57.0, 50.0, 50.0, 40.0, 43.0, 45.0, 36.0, 40.0, 35.0, 22.0, 39.0, 24.0, 15.0, 22.0, 14.0, 16.0, 7.0, 8.0, 1.0, 6.0, 9.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.36328125, -4.2247314453125, -4.086181640625, -3.9476318359375, -3.80908203125, -3.6705322265625, -3.531982421875, -3.3934326171875, -3.2548828125, -3.1163330078125, -2.977783203125, -2.8392333984375, -2.70068359375, -2.5621337890625, -2.423583984375, -2.2850341796875, -2.146484375, -2.0079345703125, -1.869384765625, -1.7308349609375, -1.59228515625, -1.4537353515625, -1.315185546875, -1.1766357421875, -1.0380859375, -0.8995361328125, -0.760986328125, -0.6224365234375, -0.48388671875, -0.3453369140625, -0.206787109375, -0.0682373046875, 0.0703125, 0.2088623046875, 0.347412109375, 0.4859619140625, 0.62451171875, 0.7630615234375, 0.901611328125, 1.0401611328125, 1.1787109375, 1.3172607421875, 1.455810546875, 1.5943603515625, 1.73291015625, 1.8714599609375, 2.010009765625, 2.1485595703125, 2.287109375, 2.4256591796875, 2.564208984375, 2.7027587890625, 2.84130859375, 2.9798583984375, 3.118408203125, 3.2569580078125, 3.3955078125, 3.5340576171875, 3.672607421875, 3.8111572265625, 3.94970703125, 4.0882568359375, 4.226806640625, 4.3653564453125, 4.50390625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 3.0, 0.0, 6.0, 10.0, 24.0, 18.0, 24.0, 33.0, 69.0, 87.0, 127.0, 139.0, 202.0, 311.0, 496.0, 666.0, 981.0, 1444.0, 2193.0, 3133.0, 4710.0, 7344.0, 11070.0, 17039.0, 28089.0, 46939.0, 84986.0, 177729.0, 302649.0, 160578.0, 78640.0, 44715.0, 26631.0, 16234.0, 10546.0, 6704.0, 4332.0, 3056.0, 2011.0, 1440.0, 978.0, 676.0, 455.0, 315.0, 201.0, 163.0, 105.0, 82.0, 43.0, 42.0, 34.0, 29.0, 14.0, 4.0, 6.0, 1.0, 0.0, 3.0, 5.0, 3.0], "bins": [-0.1568603515625, -0.1520252227783203, -0.14719009399414062, -0.14235496520996094, -0.13751983642578125, -0.13268470764160156, -0.12784957885742188, -0.12301445007324219, -0.1181793212890625, -0.11334419250488281, -0.10850906372070312, -0.10367393493652344, -0.09883880615234375, -0.09400367736816406, -0.08916854858398438, -0.08433341979980469, -0.079498291015625, -0.07466316223144531, -0.06982803344726562, -0.06499290466308594, -0.06015777587890625, -0.05532264709472656, -0.050487518310546875, -0.04565238952636719, -0.0408172607421875, -0.03598213195800781, -0.031147003173828125, -0.026311874389648438, -0.02147674560546875, -0.016641616821289062, -0.011806488037109375, -0.0069713592529296875, -0.00213623046875, 0.0026988983154296875, 0.007534027099609375, 0.012369155883789062, 0.01720428466796875, 0.022039413452148438, 0.026874542236328125, 0.03170967102050781, 0.0365447998046875, 0.04137992858886719, 0.046215057373046875, 0.05105018615722656, 0.05588531494140625, 0.06072044372558594, 0.06555557250976562, 0.07039070129394531, 0.075225830078125, 0.08006095886230469, 0.08489608764648438, 0.08973121643066406, 0.09456634521484375, 0.09940147399902344, 0.10423660278320312, 0.10907173156738281, 0.1139068603515625, 0.11874198913574219, 0.12357711791992188, 0.12841224670410156, 0.13324737548828125, 0.13808250427246094, 0.14291763305664062, 0.1477527618408203, 0.152587890625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 8.0, 11.0, 7.0, 14.0, 17.0, 13.0, 18.0, 26.0, 22.0, 29.0, 22.0, 40.0, 39.0, 32.0, 51.0, 36.0, 44.0, 46.0, 1053.0, 45.0, 43.0, 37.0, 36.0, 39.0, 26.0, 33.0, 30.0, 34.0, 26.0, 15.0, 14.0, 19.0, 18.0, 17.0, 13.0, 11.0, 11.0, 9.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.392578125, -3.29278564453125, -3.1929931640625, -3.09320068359375, -2.993408203125, -2.89361572265625, -2.7938232421875, -2.69403076171875, -2.59423828125, -2.49444580078125, -2.3946533203125, -2.29486083984375, -2.195068359375, -2.09527587890625, -1.9954833984375, -1.89569091796875, -1.7958984375, -1.69610595703125, -1.5963134765625, -1.49652099609375, -1.396728515625, -1.29693603515625, -1.1971435546875, -1.09735107421875, -0.99755859375, -0.89776611328125, -0.7979736328125, -0.69818115234375, -0.598388671875, -0.49859619140625, -0.3988037109375, -0.29901123046875, -0.19921875, -0.09942626953125, 0.0003662109375, 0.10015869140625, 0.199951171875, 0.29974365234375, 0.3995361328125, 0.49932861328125, 0.59912109375, 0.69891357421875, 0.7987060546875, 0.89849853515625, 0.998291015625, 1.09808349609375, 1.1978759765625, 1.29766845703125, 1.3974609375, 1.49725341796875, 1.5970458984375, 1.69683837890625, 1.796630859375, 1.89642333984375, 1.9962158203125, 2.09600830078125, 2.19580078125, 2.29559326171875, 2.3953857421875, 2.49517822265625, 2.594970703125, 2.69476318359375, 2.7945556640625, 2.89434814453125, 2.994140625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 16.0, 19.0, 30.0, 49.0, 58.0, 87.0, 144.0, 224.0, 392.0, 574.0, 943.0, 1538.0, 2391.0, 4000.0, 6460.0, 10819.0, 17999.0, 30070.0, 52158.0, 97659.0, 219327.0, 1353054.0, 135608.0, 67844.0, 38124.0, 22626.0, 13698.0, 8061.0, 4969.0, 3177.0, 1838.0, 1178.0, 718.0, 473.0, 292.0, 164.0, 117.0, 80.0, 48.0, 25.0, 29.0, 20.0, 13.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1243896484375, -0.12075519561767578, -0.11712074279785156, -0.11348628997802734, -0.10985183715820312, -0.1062173843383789, -0.10258293151855469, -0.09894847869873047, -0.09531402587890625, -0.09167957305908203, -0.08804512023925781, -0.0844106674194336, -0.08077621459960938, -0.07714176177978516, -0.07350730895996094, -0.06987285614013672, -0.0662384033203125, -0.06260395050048828, -0.05896949768066406, -0.055335044860839844, -0.051700592041015625, -0.048066139221191406, -0.04443168640136719, -0.04079723358154297, -0.03716278076171875, -0.03352832794189453, -0.029893875122070312, -0.026259422302246094, -0.022624969482421875, -0.018990516662597656, -0.015356063842773438, -0.011721611022949219, -0.008087158203125, -0.004452705383300781, -0.0008182525634765625, 0.0028162002563476562, 0.006450653076171875, 0.010085105895996094, 0.013719558715820312, 0.01735401153564453, 0.02098846435546875, 0.02462291717529297, 0.028257369995117188, 0.031891822814941406, 0.035526275634765625, 0.039160728454589844, 0.04279518127441406, 0.04642963409423828, 0.0500640869140625, 0.05369853973388672, 0.05733299255371094, 0.060967445373535156, 0.06460189819335938, 0.0682363510131836, 0.07187080383300781, 0.07550525665283203, 0.07913970947265625, 0.08277416229248047, 0.08640861511230469, 0.0900430679321289, 0.09367752075195312, 0.09731197357177734, 0.10094642639160156, 0.10458087921142578, 0.10821533203125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 6.0, 15.0, 17.0, 17.0, 16.0, 19.0, 15.0, 30.0, 33.0, 35.0, 39.0, 58.0, 60.0, 61.0, 68.0, 61.0, 56.0, 50.0, 47.0, 55.0, 50.0, 22.0, 22.0, 15.0, 20.0, 18.0, 12.0, 13.0, 11.0, 14.0, 5.0, 3.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.365776062011719e-05, -6.189383566379547e-05, -6.0129910707473755e-05, -5.836598575115204e-05, -5.660206079483032e-05, -5.4838135838508606e-05, -5.307421088218689e-05, -5.131028592586517e-05, -4.954636096954346e-05, -4.778243601322174e-05, -4.6018511056900024e-05, -4.425458610057831e-05, -4.249066114425659e-05, -4.0726736187934875e-05, -3.896281123161316e-05, -3.719888627529144e-05, -3.5434961318969727e-05, -3.367103636264801e-05, -3.1907111406326294e-05, -3.0143186450004578e-05, -2.837926149368286e-05, -2.6615336537361145e-05, -2.485141158103943e-05, -2.3087486624717712e-05, -2.1323561668395996e-05, -1.955963671207428e-05, -1.7795711755752563e-05, -1.6031786799430847e-05, -1.4267861843109131e-05, -1.2503936886787415e-05, -1.0740011930465698e-05, -8.976086974143982e-06, -7.212162017822266e-06, -5.448237061500549e-06, -3.684312105178833e-06, -1.9203871488571167e-06, -1.564621925354004e-07, 1.607462763786316e-06, 3.3713877201080322e-06, 5.1353126764297485e-06, 6.899237632751465e-06, 8.663162589073181e-06, 1.0427087545394897e-05, 1.2191012501716614e-05, 1.395493745803833e-05, 1.5718862414360046e-05, 1.7482787370681763e-05, 1.924671232700348e-05, 2.1010637283325195e-05, 2.277456223964691e-05, 2.4538487195968628e-05, 2.6302412152290344e-05, 2.806633710861206e-05, 2.9830262064933777e-05, 3.159418702125549e-05, 3.335811197757721e-05, 3.5122036933898926e-05, 3.688596189022064e-05, 3.864988684654236e-05, 4.0413811802864075e-05, 4.217773675918579e-05, 4.394166171550751e-05, 4.5705586671829224e-05, 4.746951162815094e-05, 4.9233436584472656e-05]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 6.0, 5.0, 5.0, 7.0, 12.0, 12.0, 15.0, 7.0, 25.0, 23.0, 29.0, 44.0, 64.0, 112.0, 221.0, 483.0, 3732.0, 189390.0, 822548.0, 29800.0, 1186.0, 328.0, 171.0, 93.0, 62.0, 22.0, 26.0, 26.0, 23.0, 16.0, 10.0, 16.0, 13.0, 7.0, 2.0, 0.0, 2.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007991790771484375, -0.000769883394241333, -0.0007405877113342285, -0.000711292028427124, -0.0006819963455200195, -0.000652700662612915, -0.0006234049797058105, -0.0005941092967987061, -0.0005648136138916016, -0.0005355179309844971, -0.0005062222480773926, -0.0004769265651702881, -0.0004476308822631836, -0.0004183351993560791, -0.0003890395164489746, -0.0003597438335418701, -0.0003304481506347656, -0.00030115246772766113, -0.00027185678482055664, -0.00024256110191345215, -0.00021326541900634766, -0.00018396973609924316, -0.00015467405319213867, -0.00012537837028503418, -9.608268737792969e-05, -6.67870044708252e-05, -3.74913215637207e-05, -8.195638656616211e-06, 2.110004425048828e-05, 5.0395727157592773e-05, 7.969141006469727e-05, 0.00010898709297180176, 0.00013828277587890625, 0.00016757845878601074, 0.00019687414169311523, 0.00022616982460021973, 0.0002554655075073242, 0.0002847611904144287, 0.0003140568733215332, 0.0003433525562286377, 0.0003726482391357422, 0.0004019439220428467, 0.00043123960494995117, 0.00046053528785705566, 0.0004898309707641602, 0.0005191266536712646, 0.0005484223365783691, 0.0005777180194854736, 0.0006070137023925781, 0.0006363093852996826, 0.0006656050682067871, 0.0006949007511138916, 0.0007241964340209961, 0.0007534921169281006, 0.0007827877998352051, 0.0008120834827423096, 0.0008413791656494141, 0.0008706748485565186, 0.000899970531463623, 0.0009292662143707275, 0.000958561897277832, 0.0009878575801849365, 0.001017153263092041, 0.0010464489459991455, 0.00107574462890625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 16.0, 44.0, 99.0, 231.0, 269.0, 197.0, 99.0, 36.0, 15.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3341970012988895e-05, -3.8189984479686245e-05, -3.3037998946383595e-05, -2.788600977510214e-05, -2.273402424179949e-05, -1.758203870849684e-05, -1.2430049537215382e-05, -7.278064003912732e-06, -2.126078470610082e-06, 3.0259079721872695e-06, 8.177894414984621e-06, 1.3329881767276675e-05, 1.8481867300579324e-05, 2.3633852833881974e-05, 2.878584200516343e-05, 3.393782753846608e-05, 3.908981307176873e-05, 4.424179860507138e-05, 4.939378413837403e-05, 5.454577330965549e-05, 5.969775884295814e-05, 6.484974437626079e-05, 7.000173354754224e-05, 7.515371544286609e-05, 8.030570461414754e-05, 8.5457693785429e-05, 9.060967568075284e-05, 9.57616648520343e-05, 0.00010091364674735814, 0.0001060656359186396, 0.00011121762508992106, 0.00011636961426120251, 0.00012152158888056874, 0.0001266735780518502, 0.00013182556722313166, 0.00013697755639441311, 0.00014212953101377934, 0.0001472815201850608, 0.00015243350935634226, 0.0001575854985276237, 0.00016273747314698994, 0.0001678894623182714, 0.00017304145148955286, 0.0001781934406608343, 0.00018334541528020054, 0.000188497404451482, 0.00019364939362276345, 0.0001988013827940449, 0.00020395337196532637, 0.00020910536113660783, 0.00021425735030788928, 0.0002194093249272555, 0.00022456131409853697, 0.00022971330326981843, 0.00023486529244109988, 0.00024001728161238134, 0.0002451692707836628, 0.00025032125995494425, 0.0002554732491262257, 0.00026062523829750717, 0.0002657772274687886, 0.0002709291875362396, 0.00027608120581135154, 0.00028123316587880254, 0.000286385155050084]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 4.0, 4.0, 5.0, 9.0, 7.0, 6.0, 6.0, 12.0, 17.0, 13.0, 22.0, 15.0, 36.0, 30.0, 37.0, 33.0, 24.0, 43.0, 39.0, 40.0, 39.0, 40.0, 50.0, 46.0, 32.0, 52.0, 27.0, 33.0, 37.0, 47.0, 30.0, 26.0, 33.0, 22.0, 14.0, 19.0, 13.0, 7.0, 12.0, 7.0, 6.0, 4.0, 1.0, 7.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.07099723815918e-05, -3.952439874410629e-05, -3.833882510662079e-05, -3.7153251469135284e-05, -3.596767783164978e-05, -3.4782104194164276e-05, -3.359653055667877e-05, -3.241095691919327e-05, -3.1225383281707764e-05, -3.003980964422226e-05, -2.8854236006736755e-05, -2.766866236925125e-05, -2.6483088731765747e-05, -2.5297515094280243e-05, -2.411194145679474e-05, -2.2926367819309235e-05, -2.174079418182373e-05, -2.0555220544338226e-05, -1.9369646906852722e-05, -1.8184073269367218e-05, -1.6998499631881714e-05, -1.581292599439621e-05, -1.4627352356910706e-05, -1.3441778719425201e-05, -1.2256205081939697e-05, -1.1070631444454193e-05, -9.885057806968689e-06, -8.699484169483185e-06, -7.513910531997681e-06, -6.3283368945121765e-06, -5.142763257026672e-06, -3.957189619541168e-06, -2.771615982055664e-06, -1.58604234457016e-06, -4.0046870708465576e-07, 7.851049304008484e-07, 1.9706785678863525e-06, 3.1562522053718567e-06, 4.341825842857361e-06, 5.527399480342865e-06, 6.712973117828369e-06, 7.898546755313873e-06, 9.084120392799377e-06, 1.0269694030284882e-05, 1.1455267667770386e-05, 1.264084130525589e-05, 1.3826414942741394e-05, 1.5011988580226898e-05, 1.6197562217712402e-05, 1.7383135855197906e-05, 1.856870949268341e-05, 1.9754283130168915e-05, 2.093985676765442e-05, 2.2125430405139923e-05, 2.3311004042625427e-05, 2.449657768011093e-05, 2.5682151317596436e-05, 2.686772495508194e-05, 2.8053298592567444e-05, 2.9238872230052948e-05, 3.0424445867538452e-05, 3.1610019505023956e-05, 3.279559314250946e-05, 3.3981166779994965e-05, 3.516674041748047e-05]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 13.0, 16.0, 14.0, 7.0, 14.0, 16.0, 19.0, 23.0, 28.0, 44.0, 39.0, 43.0, 38.0, 40.0, 42.0, 57.0, 50.0, 50.0, 40.0, 43.0, 45.0, 36.0, 40.0, 35.0, 22.0, 39.0, 24.0, 15.0, 22.0, 14.0, 16.0, 7.0, 8.0, 1.0, 6.0, 9.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.36328125, -4.2247314453125, -4.086181640625, -3.9476318359375, -3.80908203125, -3.6705322265625, -3.531982421875, -3.3934326171875, -3.2548828125, -3.1163330078125, -2.977783203125, -2.8392333984375, -2.70068359375, -2.5621337890625, -2.423583984375, -2.2850341796875, -2.146484375, -2.0079345703125, -1.869384765625, -1.7308349609375, -1.59228515625, -1.4537353515625, -1.315185546875, -1.1766357421875, -1.0380859375, -0.8995361328125, -0.760986328125, -0.6224365234375, -0.48388671875, -0.3453369140625, -0.206787109375, -0.0682373046875, 0.0703125, 0.2088623046875, 0.347412109375, 0.4859619140625, 0.62451171875, 0.7630615234375, 0.901611328125, 1.0401611328125, 1.1787109375, 1.3172607421875, 1.455810546875, 1.5943603515625, 1.73291015625, 1.8714599609375, 2.010009765625, 2.1485595703125, 2.287109375, 2.4256591796875, 2.564208984375, 2.7027587890625, 2.84130859375, 2.9798583984375, 3.118408203125, 3.2569580078125, 3.3955078125, 3.5340576171875, 3.672607421875, 3.8111572265625, 3.94970703125, 4.0882568359375, 4.226806640625, 4.3653564453125, 4.50390625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 5.0, 7.0, 8.0, 10.0, 9.0, 21.0, 16.0, 26.0, 22.0, 27.0, 37.0, 62.0, 92.0, 115.0, 200.0, 239.0, 348.0, 662.0, 1104.0, 1981.0, 4061.0, 10252.0, 35127.0, 214414.0, 691632.0, 61142.0, 15219.0, 5522.0, 2589.0, 1396.0, 788.0, 422.0, 275.0, 197.0, 128.0, 104.0, 61.0, 52.0, 28.0, 34.0, 32.0, 18.0, 14.0, 12.0, 10.0, 8.0, 8.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.4296875, -12.9847412109375, -12.539794921875, -12.0948486328125, -11.64990234375, -11.2049560546875, -10.760009765625, -10.3150634765625, -9.8701171875, -9.4251708984375, -8.980224609375, -8.5352783203125, -8.09033203125, -7.6453857421875, -7.200439453125, -6.7554931640625, -6.310546875, -5.8656005859375, -5.420654296875, -4.9757080078125, -4.53076171875, -4.0858154296875, -3.640869140625, -3.1959228515625, -2.7509765625, -2.3060302734375, -1.861083984375, -1.4161376953125, -0.97119140625, -0.5262451171875, -0.081298828125, 0.3636474609375, 0.80859375, 1.2535400390625, 1.698486328125, 2.1434326171875, 2.58837890625, 3.0333251953125, 3.478271484375, 3.9232177734375, 4.3681640625, 4.8131103515625, 5.258056640625, 5.7030029296875, 6.14794921875, 6.5928955078125, 7.037841796875, 7.4827880859375, 7.927734375, 8.3726806640625, 8.817626953125, 9.2625732421875, 9.70751953125, 10.1524658203125, 10.597412109375, 11.0423583984375, 11.4873046875, 11.9322509765625, 12.377197265625, 12.8221435546875, 13.26708984375, 13.7120361328125, 14.156982421875, 14.6019287109375, 15.046875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 0.0, 7.0, 8.0, 17.0, 14.0, 16.0, 24.0, 15.0, 28.0, 29.0, 33.0, 40.0, 49.0, 42.0, 44.0, 62.0, 86.0, 112.0, 271.0, 1546.0, 116.0, 78.0, 68.0, 57.0, 40.0, 36.0, 39.0, 26.0, 23.0, 20.0, 22.0, 17.0, 18.0, 10.0, 6.0, 6.0, 5.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.265625, -13.775390625, -13.28515625, -12.794921875, -12.3046875, -11.814453125, -11.32421875, -10.833984375, -10.34375, -9.853515625, -9.36328125, -8.873046875, -8.3828125, -7.892578125, -7.40234375, -6.912109375, -6.421875, -5.931640625, -5.44140625, -4.951171875, -4.4609375, -3.970703125, -3.48046875, -2.990234375, -2.5, -2.009765625, -1.51953125, -1.029296875, -0.5390625, -0.048828125, 0.44140625, 0.931640625, 1.421875, 1.912109375, 2.40234375, 2.892578125, 3.3828125, 3.873046875, 4.36328125, 4.853515625, 5.34375, 5.833984375, 6.32421875, 6.814453125, 7.3046875, 7.794921875, 8.28515625, 8.775390625, 9.265625, 9.755859375, 10.24609375, 10.736328125, 11.2265625, 11.716796875, 12.20703125, 12.697265625, 13.1875, 13.677734375, 14.16796875, 14.658203125, 15.1484375, 15.638671875, 16.12890625, 16.619140625, 17.109375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 5.0, 7.0, 12.0, 10.0, 10.0, 19.0, 30.0, 27.0, 47.0, 75.0, 89.0, 144.0, 238.0, 439.0, 1047.0, 3584.0, 19184.0, 226188.0, 2790082.0, 89517.0, 10759.0, 2322.0, 774.0, 339.0, 228.0, 165.0, 100.0, 69.0, 49.0, 32.0, 32.0, 22.0, 19.0, 12.0, 7.0, 6.0, 2.0, 7.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.65625, -28.766845703125, -27.87744140625, -26.988037109375, -26.0986328125, -25.209228515625, -24.31982421875, -23.430419921875, -22.541015625, -21.651611328125, -20.76220703125, -19.872802734375, -18.9833984375, -18.093994140625, -17.20458984375, -16.315185546875, -15.42578125, -14.536376953125, -13.64697265625, -12.757568359375, -11.8681640625, -10.978759765625, -10.08935546875, -9.199951171875, -8.310546875, -7.421142578125, -6.53173828125, -5.642333984375, -4.7529296875, -3.863525390625, -2.97412109375, -2.084716796875, -1.1953125, -0.305908203125, 0.58349609375, 1.472900390625, 2.3623046875, 3.251708984375, 4.14111328125, 5.030517578125, 5.919921875, 6.809326171875, 7.69873046875, 8.588134765625, 9.4775390625, 10.366943359375, 11.25634765625, 12.145751953125, 13.03515625, 13.924560546875, 14.81396484375, 15.703369140625, 16.5927734375, 17.482177734375, 18.37158203125, 19.260986328125, 20.150390625, 21.039794921875, 21.92919921875, 22.818603515625, 23.7080078125, 24.597412109375, 25.48681640625, 26.376220703125, 27.265625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 243.0, 756.0, 19.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.11857223510742, -30.582426071166992, -17.046279907226562, -3.5101356506347656, 10.026012420654297, 23.56216049194336, 37.09830093383789, 50.63444900512695, 64.17059326171875, 77.70674133300781, 91.24288940429688, 104.7790298461914, 118.31517791748047, 131.851318359375, 145.38746643066406, 158.92361450195312, 172.4597625732422, 185.99591064453125, 199.5320587158203, 213.06820678710938, 226.60433959960938, 240.1405029296875, 253.6766357421875, 267.2127685546875, 280.7489318847656, 294.2850646972656, 307.82122802734375, 321.35736083984375, 334.8935241699219, 348.4296569824219, 361.9658203125, 375.501953125, 389.0380859375, 402.57421875, 416.1103820800781, 429.6465148925781, 443.18267822265625, 456.71881103515625, 470.25494384765625, 483.7911071777344, 497.3272705078125, 510.8634033203125, 524.3995361328125, 537.9357299804688, 551.4718627929688, 565.0079956054688, 578.5441284179688, 592.080322265625, 605.616455078125, 619.152587890625, 632.688720703125, 646.2249145507812, 659.7610473632812, 673.2971801757812, 686.8333129882812, 700.3695068359375, 713.9055786132812, 727.4417114257812, 740.9778442382812, 754.5140380859375, 768.0501708984375, 781.5863037109375, 795.1224365234375, 808.6585693359375, 822.1947631835938]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 9.0, 4.0, 4.0, 11.0, 7.0, 11.0, 15.0, 10.0, 16.0, 13.0, 30.0, 17.0, 35.0, 25.0, 34.0, 24.0, 36.0, 39.0, 40.0, 40.0, 40.0, 33.0, 43.0, 36.0, 49.0, 35.0, 44.0, 45.0, 35.0, 41.0, 25.0, 20.0, 20.0, 13.0, 25.0, 15.0, 13.0, 9.0, 17.0, 10.0, 5.0, 4.0, 4.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-50.25257873535156, -48.816070556640625, -47.37956237792969, -45.94305419921875, -44.50654220581055, -43.07003402709961, -41.63352584838867, -40.197017669677734, -38.76050567626953, -37.323997497558594, -35.887489318847656, -34.45098114013672, -33.014469146728516, -31.577960968017578, -30.14145278930664, -28.704944610595703, -27.268436431884766, -25.831928253173828, -24.395418167114258, -22.95890998840332, -21.52239990234375, -20.085891723632812, -18.649383544921875, -17.212875366210938, -15.776365280151367, -14.339856147766113, -12.90334701538086, -11.466838836669922, -10.030329704284668, -8.593820571899414, -7.157312393188477, -5.720803260803223, -4.284294128417969, -2.847785234451294, -1.4112763404846191, 0.025232315063476562, 1.4617414474487305, 2.8982505798339844, 4.334758758544922, 5.771267890930176, 7.20777702331543, 8.644286155700684, 10.080795288085938, 11.517303466796875, 12.953812599182129, 14.390321731567383, 15.82682991027832, 17.26333999633789, 18.699848175048828, 20.136356353759766, 21.572866439819336, 23.009374618530273, 24.445884704589844, 25.88239288330078, 27.31890106201172, 28.755409240722656, 30.191919326782227, 31.628427505493164, 33.064937591552734, 34.50144577026367, 35.93795394897461, 37.37446594238281, 38.81097412109375, 40.24748229980469, 41.683990478515625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 7.0, 10.0, 15.0, 10.0, 10.0, 16.0, 13.0, 21.0, 18.0, 31.0, 31.0, 42.0, 34.0, 46.0, 38.0, 52.0, 48.0, 45.0, 31.0, 50.0, 42.0, 42.0, 49.0, 34.0, 30.0, 33.0, 32.0, 33.0, 26.0, 17.0, 20.0, 19.0, 7.0, 8.0, 7.0, 4.0, 5.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.47265625, -4.3291015625, -4.185546875, -4.0419921875, -3.8984375, -3.7548828125, -3.611328125, -3.4677734375, -3.32421875, -3.1806640625, -3.037109375, -2.8935546875, -2.75, -2.6064453125, -2.462890625, -2.3193359375, -2.17578125, -2.0322265625, -1.888671875, -1.7451171875, -1.6015625, -1.4580078125, -1.314453125, -1.1708984375, -1.02734375, -0.8837890625, -0.740234375, -0.5966796875, -0.453125, -0.3095703125, -0.166015625, -0.0224609375, 0.12109375, 0.2646484375, 0.408203125, 0.5517578125, 0.6953125, 0.8388671875, 0.982421875, 1.1259765625, 1.26953125, 1.4130859375, 1.556640625, 1.7001953125, 1.84375, 1.9873046875, 2.130859375, 2.2744140625, 2.41796875, 2.5615234375, 2.705078125, 2.8486328125, 2.9921875, 3.1357421875, 3.279296875, 3.4228515625, 3.56640625, 3.7099609375, 3.853515625, 3.9970703125, 4.140625, 4.2841796875, 4.427734375, 4.5712890625, 4.71484375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 9.0, 10.0, 21.0, 18.0, 33.0, 42.0, 76.0, 113.0, 187.0, 371.0, 711.0, 1617.0, 5043.0, 20948.0, 131318.0, 2349354.0, 1563243.0, 97295.0, 16763.0, 4210.0, 1433.0, 654.0, 351.0, 164.0, 94.0, 59.0, 49.0, 28.0, 26.0, 9.0, 7.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.1875, -16.66552734375, -16.1435546875, -15.62158203125, -15.099609375, -14.57763671875, -14.0556640625, -13.53369140625, -13.01171875, -12.48974609375, -11.9677734375, -11.44580078125, -10.923828125, -10.40185546875, -9.8798828125, -9.35791015625, -8.8359375, -8.31396484375, -7.7919921875, -7.27001953125, -6.748046875, -6.22607421875, -5.7041015625, -5.18212890625, -4.66015625, -4.13818359375, -3.6162109375, -3.09423828125, -2.572265625, -2.05029296875, -1.5283203125, -1.00634765625, -0.484375, 0.03759765625, 0.5595703125, 1.08154296875, 1.603515625, 2.12548828125, 2.6474609375, 3.16943359375, 3.69140625, 4.21337890625, 4.7353515625, 5.25732421875, 5.779296875, 6.30126953125, 6.8232421875, 7.34521484375, 7.8671875, 8.38916015625, 8.9111328125, 9.43310546875, 9.955078125, 10.47705078125, 10.9990234375, 11.52099609375, 12.04296875, 12.56494140625, 13.0869140625, 13.60888671875, 14.130859375, 14.65283203125, 15.1748046875, 15.69677734375, 16.21875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 6.0, 4.0, 12.0, 7.0, 18.0, 15.0, 23.0, 44.0, 46.0, 62.0, 121.0, 148.0, 240.0, 340.0, 509.0, 642.0, 528.0, 390.0, 269.0, 175.0, 134.0, 95.0, 79.0, 56.0, 28.0, 16.0, 18.0, 9.0, 13.0, 7.0, 8.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.046875, -10.6856689453125, -10.324462890625, -9.9632568359375, -9.60205078125, -9.2408447265625, -8.879638671875, -8.5184326171875, -8.1572265625, -7.7960205078125, -7.434814453125, -7.0736083984375, -6.71240234375, -6.3511962890625, -5.989990234375, -5.6287841796875, -5.267578125, -4.9063720703125, -4.545166015625, -4.1839599609375, -3.82275390625, -3.4615478515625, -3.100341796875, -2.7391357421875, -2.3779296875, -2.0167236328125, -1.655517578125, -1.2943115234375, -0.93310546875, -0.5718994140625, -0.210693359375, 0.1505126953125, 0.51171875, 0.8729248046875, 1.234130859375, 1.5953369140625, 1.95654296875, 2.3177490234375, 2.678955078125, 3.0401611328125, 3.4013671875, 3.7625732421875, 4.123779296875, 4.4849853515625, 4.84619140625, 5.2073974609375, 5.568603515625, 5.9298095703125, 6.291015625, 6.6522216796875, 7.013427734375, 7.3746337890625, 7.73583984375, 8.0970458984375, 8.458251953125, 8.8194580078125, 9.1806640625, 9.5418701171875, 9.903076171875, 10.2642822265625, 10.62548828125, 10.9866943359375, 11.347900390625, 11.7091064453125, 12.0703125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 7.0, 14.0, 22.0, 27.0, 44.0, 51.0, 117.0, 160.0, 320.0, 520.0, 1123.0, 2581.0, 7087.0, 24092.0, 100715.0, 666013.0, 2838782.0, 448648.0, 75176.0, 18740.0, 5919.0, 2118.0, 919.0, 427.0, 224.0, 136.0, 98.0, 50.0, 36.0, 27.0, 20.0, 15.0, 7.0, 7.0, 5.0, 6.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.203125, -17.62353515625, -17.0439453125, -16.46435546875, -15.884765625, -15.30517578125, -14.7255859375, -14.14599609375, -13.56640625, -12.98681640625, -12.4072265625, -11.82763671875, -11.248046875, -10.66845703125, -10.0888671875, -9.50927734375, -8.9296875, -8.35009765625, -7.7705078125, -7.19091796875, -6.611328125, -6.03173828125, -5.4521484375, -4.87255859375, -4.29296875, -3.71337890625, -3.1337890625, -2.55419921875, -1.974609375, -1.39501953125, -0.8154296875, -0.23583984375, 0.34375, 0.92333984375, 1.5029296875, 2.08251953125, 2.662109375, 3.24169921875, 3.8212890625, 4.40087890625, 4.98046875, 5.56005859375, 6.1396484375, 6.71923828125, 7.298828125, 7.87841796875, 8.4580078125, 9.03759765625, 9.6171875, 10.19677734375, 10.7763671875, 11.35595703125, 11.935546875, 12.51513671875, 13.0947265625, 13.67431640625, 14.25390625, 14.83349609375, 15.4130859375, 15.99267578125, 16.572265625, 17.15185546875, 17.7314453125, 18.31103515625, 18.890625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 13.0, 33.0, 55.0, 76.0, 105.0, 117.0, 138.0, 141.0, 109.0, 82.0, 54.0, 28.0, 31.0, 10.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.2820816040039, -90.87358856201172, -88.46509552001953, -86.05660247802734, -83.64810943603516, -81.23961639404297, -78.83112335205078, -76.42263793945312, -74.01414489746094, -71.60565185546875, -69.19715881347656, -66.78866577148438, -64.38017272949219, -61.9716796875, -59.56319046020508, -57.15469741821289, -54.74620056152344, -52.33770751953125, -49.92921447753906, -47.520721435546875, -45.11222839355469, -42.7037353515625, -40.29524612426758, -37.88675308227539, -35.4782600402832, -33.069766998291016, -30.661273956298828, -28.252782821655273, -25.844289779663086, -23.4357967376709, -21.027305603027344, -18.618812561035156, -16.21031951904297, -13.801826477050781, -11.39333438873291, -8.984842300415039, -6.576349258422852, -4.167856216430664, -1.759364128112793, 0.6491279602050781, 3.0576210021972656, 5.466113567352295, 7.874606132507324, 10.283098220825195, 12.691591262817383, 15.10008430480957, 17.508575439453125, 19.917068481445312, 22.3255615234375, 24.734054565429688, 27.142547607421875, 29.55103874206543, 31.959531784057617, 34.36802673339844, 36.77651596069336, 39.18500900268555, 41.593502044677734, 44.00199508666992, 46.41048812866211, 48.8189811706543, 51.22747039794922, 53.635963439941406, 56.044456481933594, 58.45294952392578, 60.86144256591797]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 8.0, 7.0, 3.0, 13.0, 18.0, 20.0, 22.0, 16.0, 26.0, 26.0, 28.0, 28.0, 42.0, 35.0, 43.0, 48.0, 43.0, 48.0, 35.0, 33.0, 41.0, 50.0, 37.0, 42.0, 48.0, 30.0, 30.0, 30.0, 24.0, 28.0, 17.0, 18.0, 13.0, 13.0, 8.0, 8.0, 2.0, 4.0, 0.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.360870361328125, -34.18288803100586, -33.004905700683594, -31.826923370361328, -30.648941040039062, -29.470958709716797, -28.29297637939453, -27.114994049072266, -25.93701171875, -24.759029388427734, -23.58104705810547, -22.403064727783203, -21.225082397460938, -20.047100067138672, -18.869117736816406, -17.69113540649414, -16.513151168823242, -15.335168838500977, -14.157186508178711, -12.979204177856445, -11.80122184753418, -10.623239517211914, -9.445256233215332, -8.267273902893066, -7.089291572570801, -5.911309242248535, -4.7333269119262695, -3.5553441047668457, -2.37736177444458, -1.1993794441223145, -0.021396636962890625, 1.156585693359375, 2.3345680236816406, 3.5125503540039062, 4.690532684326172, 5.868515491485596, 7.046497821807861, 8.224479675292969, 9.40246295928955, 10.580445289611816, 11.758427619934082, 12.936409950256348, 14.114392280578613, 15.292375564575195, 16.47035789489746, 17.648340225219727, 18.826322555541992, 20.004304885864258, 21.182287216186523, 22.36026954650879, 23.538251876831055, 24.71623420715332, 25.894216537475586, 27.07219886779785, 28.25018310546875, 29.428165435791016, 30.60614776611328, 31.784130096435547, 32.96211242675781, 34.14009475708008, 35.318077087402344, 36.49605941772461, 37.674041748046875, 38.85202407836914, 40.030006408691406]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 7.0, 2.0, 5.0, 8.0, 8.0, 12.0, 14.0, 16.0, 20.0, 17.0, 8.0, 25.0, 31.0, 24.0, 45.0, 34.0, 35.0, 39.0, 50.0, 41.0, 44.0, 40.0, 36.0, 38.0, 30.0, 38.0, 31.0, 43.0, 39.0, 34.0, 29.0, 22.0, 27.0, 21.0, 13.0, 15.0, 8.0, 12.0, 12.0, 3.0, 6.0, 6.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.1328125, -3.99810791015625, -3.8634033203125, -3.72869873046875, -3.593994140625, -3.45928955078125, -3.3245849609375, -3.18988037109375, -3.05517578125, -2.92047119140625, -2.7857666015625, -2.65106201171875, -2.516357421875, -2.38165283203125, -2.2469482421875, -2.11224365234375, -1.9775390625, -1.84283447265625, -1.7081298828125, -1.57342529296875, -1.438720703125, -1.30401611328125, -1.1693115234375, -1.03460693359375, -0.89990234375, -0.76519775390625, -0.6304931640625, -0.49578857421875, -0.361083984375, -0.22637939453125, -0.0916748046875, 0.04302978515625, 0.177734375, 0.31243896484375, 0.4471435546875, 0.58184814453125, 0.716552734375, 0.85125732421875, 0.9859619140625, 1.12066650390625, 1.25537109375, 1.39007568359375, 1.5247802734375, 1.65948486328125, 1.794189453125, 1.92889404296875, 2.0635986328125, 2.19830322265625, 2.3330078125, 2.46771240234375, 2.6024169921875, 2.73712158203125, 2.871826171875, 3.00653076171875, 3.1412353515625, 3.27593994140625, 3.41064453125, 3.54534912109375, 3.6800537109375, 3.81475830078125, 3.949462890625, 4.08416748046875, 4.2188720703125, 4.35357666015625, 4.48828125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 8.0, 3.0, 5.0, 9.0, 12.0, 27.0, 41.0, 52.0, 65.0, 115.0, 178.0, 236.0, 375.0, 532.0, 792.0, 1148.0, 1822.0, 2615.0, 4046.0, 6065.0, 9212.0, 14058.0, 22074.0, 35308.0, 58223.0, 102685.0, 215080.0, 265091.0, 126167.0, 68766.0, 41086.0, 25384.0, 16153.0, 10570.0, 6864.0, 4494.0, 3049.0, 2003.0, 1438.0, 845.0, 624.0, 414.0, 285.0, 194.0, 128.0, 73.0, 54.0, 43.0, 18.0, 10.0, 11.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1529541015625, -0.14804458618164062, -0.14313507080078125, -0.13822555541992188, -0.1333160400390625, -0.12840652465820312, -0.12349700927734375, -0.11858749389648438, -0.113677978515625, -0.10876846313476562, -0.10385894775390625, -0.09894943237304688, -0.0940399169921875, -0.08913040161132812, -0.08422088623046875, -0.07931137084960938, -0.07440185546875, -0.06949234008789062, -0.06458282470703125, -0.059673309326171875, -0.0547637939453125, -0.049854278564453125, -0.04494476318359375, -0.040035247802734375, -0.035125732421875, -0.030216217041015625, -0.02530670166015625, -0.020397186279296875, -0.0154876708984375, -0.010578155517578125, -0.00566864013671875, -0.000759124755859375, 0.004150390625, 0.009059906005859375, 0.01396942138671875, 0.018878936767578125, 0.0237884521484375, 0.028697967529296875, 0.03360748291015625, 0.038516998291015625, 0.043426513671875, 0.048336029052734375, 0.05324554443359375, 0.058155059814453125, 0.0630645751953125, 0.06797409057617188, 0.07288360595703125, 0.07779312133789062, 0.08270263671875, 0.08761215209960938, 0.09252166748046875, 0.09743118286132812, 0.1023406982421875, 0.10725021362304688, 0.11215972900390625, 0.11706924438476562, 0.121978759765625, 0.12688827514648438, 0.13179779052734375, 0.13670730590820312, 0.1416168212890625, 0.14652633666992188, 0.15143585205078125, 0.15634536743164062, 0.1612548828125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 4.0, 4.0, 8.0, 13.0, 11.0, 7.0, 11.0, 18.0, 21.0, 31.0, 21.0, 31.0, 27.0, 28.0, 43.0, 32.0, 32.0, 39.0, 46.0, 41.0, 1074.0, 47.0, 46.0, 41.0, 29.0, 28.0, 33.0, 32.0, 23.0, 18.0, 19.0, 22.0, 25.0, 19.0, 14.0, 17.0, 11.0, 16.0, 8.0, 6.0, 7.0, 6.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.26953125, -3.1728515625, -3.076171875, -2.9794921875, -2.8828125, -2.7861328125, -2.689453125, -2.5927734375, -2.49609375, -2.3994140625, -2.302734375, -2.2060546875, -2.109375, -2.0126953125, -1.916015625, -1.8193359375, -1.72265625, -1.6259765625, -1.529296875, -1.4326171875, -1.3359375, -1.2392578125, -1.142578125, -1.0458984375, -0.94921875, -0.8525390625, -0.755859375, -0.6591796875, -0.5625, -0.4658203125, -0.369140625, -0.2724609375, -0.17578125, -0.0791015625, 0.017578125, 0.1142578125, 0.2109375, 0.3076171875, 0.404296875, 0.5009765625, 0.59765625, 0.6943359375, 0.791015625, 0.8876953125, 0.984375, 1.0810546875, 1.177734375, 1.2744140625, 1.37109375, 1.4677734375, 1.564453125, 1.6611328125, 1.7578125, 1.8544921875, 1.951171875, 2.0478515625, 2.14453125, 2.2412109375, 2.337890625, 2.4345703125, 2.53125, 2.6279296875, 2.724609375, 2.8212890625, 2.91796875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 13.0, 19.0, 14.0, 35.0, 44.0, 81.0, 109.0, 174.0, 263.0, 397.0, 627.0, 926.0, 1522.0, 2323.0, 3760.0, 5891.0, 9434.0, 15717.0, 25457.0, 42636.0, 74903.0, 156719.0, 1376636.0, 180505.0, 81371.0, 45960.0, 27277.0, 16879.0, 10220.0, 6358.0, 3902.0, 2515.0, 1568.0, 1018.0, 635.0, 430.0, 259.0, 189.0, 113.0, 80.0, 50.0, 36.0, 28.0, 11.0, 11.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11602783203125, -0.11246585845947266, -0.10890388488769531, -0.10534191131591797, -0.10177993774414062, -0.09821796417236328, -0.09465599060058594, -0.0910940170288086, -0.08753204345703125, -0.0839700698852539, -0.08040809631347656, -0.07684612274169922, -0.07328414916992188, -0.06972217559814453, -0.06616020202636719, -0.06259822845458984, -0.0590362548828125, -0.055474281311035156, -0.05191230773925781, -0.04835033416748047, -0.044788360595703125, -0.04122638702392578, -0.03766441345214844, -0.034102439880371094, -0.03054046630859375, -0.026978492736816406, -0.023416519165039062, -0.01985454559326172, -0.016292572021484375, -0.012730598449707031, -0.009168624877929688, -0.005606651306152344, -0.002044677734375, 0.0015172958374023438, 0.0050792694091796875, 0.008641242980957031, 0.012203216552734375, 0.01576519012451172, 0.019327163696289062, 0.022889137268066406, 0.02645111083984375, 0.030013084411621094, 0.03357505798339844, 0.03713703155517578, 0.040699005126953125, 0.04426097869873047, 0.04782295227050781, 0.051384925842285156, 0.0549468994140625, 0.058508872985839844, 0.06207084655761719, 0.06563282012939453, 0.06919479370117188, 0.07275676727294922, 0.07631874084472656, 0.0798807144165039, 0.08344268798828125, 0.0870046615600586, 0.09056663513183594, 0.09412860870361328, 0.09769058227539062, 0.10125255584716797, 0.10481452941894531, 0.10837650299072266, 0.1119384765625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 5.0, 6.0, 5.0, 2.0, 6.0, 3.0, 9.0, 12.0, 11.0, 21.0, 20.0, 24.0, 26.0, 31.0, 33.0, 42.0, 39.0, 45.0, 36.0, 33.0, 44.0, 51.0, 50.0, 38.0, 43.0, 42.0, 36.0, 42.0, 43.0, 30.0, 22.0, 26.0, 17.0, 15.0, 13.0, 15.0, 14.0, 9.0, 5.0, 5.0, 8.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0], "bins": [-4.792213439941406e-05, -4.655681550502777e-05, -4.519149661064148e-05, -4.382617771625519e-05, -4.2460858821868896e-05, -4.1095539927482605e-05, -3.9730221033096313e-05, -3.836490213871002e-05, -3.699958324432373e-05, -3.563426434993744e-05, -3.426894545555115e-05, -3.2903626561164856e-05, -3.1538307666778564e-05, -3.0172988772392273e-05, -2.880766987800598e-05, -2.744235098361969e-05, -2.60770320892334e-05, -2.4711713194847107e-05, -2.3346394300460815e-05, -2.1981075406074524e-05, -2.0615756511688232e-05, -1.925043761730194e-05, -1.788511872291565e-05, -1.6519799828529358e-05, -1.5154480934143066e-05, -1.3789162039756775e-05, -1.2423843145370483e-05, -1.1058524250984192e-05, -9.6932053565979e-06, -8.327886462211609e-06, -6.962567567825317e-06, -5.597248673439026e-06, -4.231929779052734e-06, -2.866610884666443e-06, -1.5012919902801514e-06, -1.3597309589385986e-07, 1.2293457984924316e-06, 2.594664692878723e-06, 3.959983587265015e-06, 5.325302481651306e-06, 6.690621376037598e-06, 8.05594027042389e-06, 9.42125916481018e-06, 1.0786578059196472e-05, 1.2151896953582764e-05, 1.3517215847969055e-05, 1.4882534742355347e-05, 1.6247853636741638e-05, 1.761317253112793e-05, 1.897849142551422e-05, 2.0343810319900513e-05, 2.1709129214286804e-05, 2.3074448108673096e-05, 2.4439767003059387e-05, 2.580508589744568e-05, 2.717040479183197e-05, 2.8535723686218262e-05, 2.9901042580604553e-05, 3.1266361474990845e-05, 3.2631680369377136e-05, 3.399699926376343e-05, 3.536231815814972e-05, 3.672763705253601e-05, 3.80929559469223e-05, 3.9458274841308594e-05]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 7.0, 6.0, 9.0, 9.0, 9.0, 16.0, 15.0, 16.0, 30.0, 29.0, 38.0, 74.0, 99.0, 144.0, 318.0, 855.0, 7534.0, 224995.0, 764020.0, 46811.0, 2355.0, 494.0, 188.0, 109.0, 88.0, 61.0, 42.0, 39.0, 20.0, 29.0, 12.0, 14.0, 11.0, 10.0, 4.0, 2.0, 9.0, 3.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006771087646484375, -0.0006539821624755859, -0.0006308555603027344, -0.0006077289581298828, -0.0005846023559570312, -0.0005614757537841797, -0.0005383491516113281, -0.0005152225494384766, -0.000492095947265625, -0.00046896934509277344, -0.0004458427429199219, -0.0004227161407470703, -0.00039958953857421875, -0.0003764629364013672, -0.0003533363342285156, -0.00033020973205566406, -0.0003070831298828125, -0.00028395652770996094, -0.0002608299255371094, -0.0002377033233642578, -0.00021457672119140625, -0.0001914501190185547, -0.00016832351684570312, -0.00014519691467285156, -0.0001220703125, -9.894371032714844e-05, -7.581710815429688e-05, -5.269050598144531e-05, -2.956390380859375e-05, -6.4373016357421875e-06, 1.6689300537109375e-05, 3.981590270996094e-05, 6.29425048828125e-05, 8.606910705566406e-05, 0.00010919570922851562, 0.0001323223114013672, 0.00015544891357421875, 0.0001785755157470703, 0.00020170211791992188, 0.00022482872009277344, 0.000247955322265625, 0.00027108192443847656, 0.0002942085266113281, 0.0003173351287841797, 0.00034046173095703125, 0.0003635883331298828, 0.0003867149353027344, 0.00040984153747558594, 0.0004329681396484375, 0.00045609474182128906, 0.0004792213439941406, 0.0005023479461669922, 0.0005254745483398438, 0.0005486011505126953, 0.0005717277526855469, 0.0005948543548583984, 0.00061798095703125, 0.0006411075592041016, 0.0006642341613769531, 0.0006873607635498047, 0.0007104873657226562, 0.0007336139678955078, 0.0007567405700683594, 0.0007798671722412109, 0.0008029937744140625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [5.0, 78.0, 478.0, 399.0, 54.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.225445470889099e-05, -2.1058283891761675e-05, -9.862113074632362e-06, 1.3340577424969524e-06, 1.2530228559626266e-05, 2.372639937675558e-05, 3.4922570193884894e-05, 4.611874101101421e-05, 5.731491182814352e-05, 6.851108628325164e-05, 7.970725710038096e-05, 9.090342791751027e-05, 0.00010209959873463959, 0.0001132957695517689, 0.0001244919403688982, 0.00013568811118602753, 0.00014688428200315684, 0.00015808045282028615, 0.00016927662363741547, 0.00018047279445454478, 0.0001916689652716741, 0.0002028651360888034, 0.00021406130690593272, 0.00022525747772306204, 0.00023645364854019135, 0.00024764981935732067, 0.00025884597562253475, 0.0002700421609915793, 0.00028123834636062384, 0.0002924345026258379, 0.000303630658891052, 0.00031482684426009655, 0.0003260230296291411, 0.00033721921499818563, 0.0003484153712633997, 0.0003596115275286138, 0.00037080771289765835, 0.0003820038982667029, 0.000393200054531917, 0.00040439621079713106, 0.0004155923961661756, 0.00042678858153522015, 0.00043798473780043423, 0.0004491808940656483, 0.00046037707943469286, 0.0004715732648037374, 0.0004827694210689515, 0.0004939655773341656, 0.0005051617627032101, 0.0005163579480722547, 0.0005275540752336383, 0.0005387502606026828, 0.0005499464459717274, 0.0005611426313407719, 0.0005723388167098165, 0.0005835349438712001, 0.0005947311292402446, 0.0006059273146092892, 0.0006171234417706728, 0.0006283196271397173, 0.0006395158125087619, 0.0006507119978778064, 0.000661908183246851, 0.0006731043104082346, 0.0006843004957772791]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 6.0, 10.0, 10.0, 21.0, 13.0, 18.0, 19.0, 18.0, 36.0, 22.0, 29.0, 31.0, 37.0, 32.0, 46.0, 49.0, 32.0, 46.0, 45.0, 55.0, 37.0, 44.0, 32.0, 44.0, 37.0, 32.0, 39.0, 25.0, 23.0, 19.0, 21.0, 13.0, 8.0, 7.0, 6.0, 8.0, 7.0, 5.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.921985626220703e-05, -3.806035965681076e-05, -3.690086305141449e-05, -3.574136644601822e-05, -3.458186984062195e-05, -3.342237323522568e-05, -3.226287662982941e-05, -3.1103380024433136e-05, -2.9943883419036865e-05, -2.8784386813640594e-05, -2.7624890208244324e-05, -2.6465393602848053e-05, -2.5305896997451782e-05, -2.414640039205551e-05, -2.298690378665924e-05, -2.182740718126297e-05, -2.06679105758667e-05, -1.950841397047043e-05, -1.8348917365074158e-05, -1.7189420759677887e-05, -1.6029924154281616e-05, -1.4870427548885345e-05, -1.3710930943489075e-05, -1.2551434338092804e-05, -1.1391937732696533e-05, -1.0232441127300262e-05, -9.072944521903992e-06, -7.913447916507721e-06, -6.75395131111145e-06, -5.5944547057151794e-06, -4.434958100318909e-06, -3.275461494922638e-06, -2.115964889526367e-06, -9.564682841300964e-07, 2.0302832126617432e-07, 1.362524926662445e-06, 2.522021532058716e-06, 3.6815181374549866e-06, 4.841014742851257e-06, 6.000511348247528e-06, 7.160007953643799e-06, 8.31950455904007e-06, 9.47900116443634e-06, 1.0638497769832611e-05, 1.1797994375228882e-05, 1.2957490980625153e-05, 1.4116987586021423e-05, 1.5276484191417694e-05, 1.6435980796813965e-05, 1.7595477402210236e-05, 1.8754974007606506e-05, 1.9914470613002777e-05, 2.1073967218399048e-05, 2.223346382379532e-05, 2.339296042919159e-05, 2.455245703458786e-05, 2.571195363998413e-05, 2.68714502453804e-05, 2.8030946850776672e-05, 2.9190443456172943e-05, 3.0349940061569214e-05, 3.1509436666965485e-05, 3.2668933272361755e-05, 3.3828429877758026e-05, 3.49879264831543e-05]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 7.0, 2.0, 5.0, 8.0, 8.0, 12.0, 14.0, 16.0, 20.0, 17.0, 8.0, 25.0, 31.0, 24.0, 45.0, 34.0, 35.0, 39.0, 50.0, 41.0, 44.0, 40.0, 36.0, 38.0, 30.0, 38.0, 31.0, 43.0, 39.0, 34.0, 29.0, 22.0, 27.0, 21.0, 13.0, 15.0, 8.0, 12.0, 12.0, 3.0, 6.0, 6.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.1328125, -3.99810791015625, -3.8634033203125, -3.72869873046875, -3.593994140625, -3.45928955078125, -3.3245849609375, -3.18988037109375, -3.05517578125, -2.92047119140625, -2.7857666015625, -2.65106201171875, -2.516357421875, -2.38165283203125, -2.2469482421875, -2.11224365234375, -1.9775390625, -1.84283447265625, -1.7081298828125, -1.57342529296875, -1.438720703125, -1.30401611328125, -1.1693115234375, -1.03460693359375, -0.89990234375, -0.76519775390625, -0.6304931640625, -0.49578857421875, -0.361083984375, -0.22637939453125, -0.0916748046875, 0.04302978515625, 0.177734375, 0.31243896484375, 0.4471435546875, 0.58184814453125, 0.716552734375, 0.85125732421875, 0.9859619140625, 1.12066650390625, 1.25537109375, 1.39007568359375, 1.5247802734375, 1.65948486328125, 1.794189453125, 1.92889404296875, 2.0635986328125, 2.19830322265625, 2.3330078125, 2.46771240234375, 2.6024169921875, 2.73712158203125, 2.871826171875, 3.00653076171875, 3.1412353515625, 3.27593994140625, 3.41064453125, 3.54534912109375, 3.6800537109375, 3.81475830078125, 3.949462890625, 4.08416748046875, 4.2188720703125, 4.35357666015625, 4.48828125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 8.0, 9.0, 7.0, 9.0, 21.0, 16.0, 28.0, 39.0, 45.0, 74.0, 113.0, 138.0, 256.0, 371.0, 593.0, 997.0, 1845.0, 4023.0, 11298.0, 43249.0, 293803.0, 585789.0, 77136.0, 17357.0, 5588.0, 2439.0, 1230.0, 712.0, 452.0, 269.0, 181.0, 114.0, 86.0, 75.0, 42.0, 31.0, 21.0, 17.0, 9.0, 11.0, 6.0, 10.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.7578125, -9.4344482421875, -9.111083984375, -8.7877197265625, -8.46435546875, -8.1409912109375, -7.817626953125, -7.4942626953125, -7.1708984375, -6.8475341796875, -6.524169921875, -6.2008056640625, -5.87744140625, -5.5540771484375, -5.230712890625, -4.9073486328125, -4.583984375, -4.2606201171875, -3.937255859375, -3.6138916015625, -3.29052734375, -2.9671630859375, -2.643798828125, -2.3204345703125, -1.9970703125, -1.6737060546875, -1.350341796875, -1.0269775390625, -0.70361328125, -0.3802490234375, -0.056884765625, 0.2664794921875, 0.58984375, 0.9132080078125, 1.236572265625, 1.5599365234375, 1.88330078125, 2.2066650390625, 2.530029296875, 2.8533935546875, 3.1767578125, 3.5001220703125, 3.823486328125, 4.1468505859375, 4.47021484375, 4.7935791015625, 5.116943359375, 5.4403076171875, 5.763671875, 6.0870361328125, 6.410400390625, 6.7337646484375, 7.05712890625, 7.3804931640625, 7.703857421875, 8.0272216796875, 8.3505859375, 8.6739501953125, 8.997314453125, 9.3206787109375, 9.64404296875, 9.9674072265625, 10.290771484375, 10.6141357421875, 10.9375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 9.0, 11.0, 9.0, 9.0, 18.0, 16.0, 22.0, 23.0, 24.0, 34.0, 40.0, 34.0, 49.0, 65.0, 78.0, 109.0, 253.0, 1507.0, 171.0, 103.0, 73.0, 57.0, 44.0, 42.0, 36.0, 27.0, 34.0, 29.0, 15.0, 17.0, 10.0, 8.0, 9.0, 11.0, 11.0, 7.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.15625, -16.609375, -16.0625, -15.515625, -14.96875, -14.421875, -13.875, -13.328125, -12.78125, -12.234375, -11.6875, -11.140625, -10.59375, -10.046875, -9.5, -8.953125, -8.40625, -7.859375, -7.3125, -6.765625, -6.21875, -5.671875, -5.125, -4.578125, -4.03125, -3.484375, -2.9375, -2.390625, -1.84375, -1.296875, -0.75, -0.203125, 0.34375, 0.890625, 1.4375, 1.984375, 2.53125, 3.078125, 3.625, 4.171875, 4.71875, 5.265625, 5.8125, 6.359375, 6.90625, 7.453125, 8.0, 8.546875, 9.09375, 9.640625, 10.1875, 10.734375, 11.28125, 11.828125, 12.375, 12.921875, 13.46875, 14.015625, 14.5625, 15.109375, 15.65625, 16.203125, 16.75, 17.296875, 17.84375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 8.0, 13.0, 10.0, 10.0, 11.0, 16.0, 25.0, 55.0, 37.0, 56.0, 73.0, 86.0, 128.0, 230.0, 432.0, 1107.0, 3471.0, 23261.0, 739463.0, 2332194.0, 37968.0, 4522.0, 1205.0, 484.0, 257.0, 130.0, 110.0, 84.0, 55.0, 43.0, 30.0, 23.0, 16.0, 18.0, 17.0, 15.0, 7.0, 7.0, 3.0, 5.0, 2.0, 0.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-32.53125, -31.517578125, -30.50390625, -29.490234375, -28.4765625, -27.462890625, -26.44921875, -25.435546875, -24.421875, -23.408203125, -22.39453125, -21.380859375, -20.3671875, -19.353515625, -18.33984375, -17.326171875, -16.3125, -15.298828125, -14.28515625, -13.271484375, -12.2578125, -11.244140625, -10.23046875, -9.216796875, -8.203125, -7.189453125, -6.17578125, -5.162109375, -4.1484375, -3.134765625, -2.12109375, -1.107421875, -0.09375, 0.919921875, 1.93359375, 2.947265625, 3.9609375, 4.974609375, 5.98828125, 7.001953125, 8.015625, 9.029296875, 10.04296875, 11.056640625, 12.0703125, 13.083984375, 14.09765625, 15.111328125, 16.125, 17.138671875, 18.15234375, 19.166015625, 20.1796875, 21.193359375, 22.20703125, 23.220703125, 24.234375, 25.248046875, 26.26171875, 27.275390625, 28.2890625, 29.302734375, 30.31640625, 31.330078125, 32.34375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [10.0, 522.0, 479.0, 8.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.799762725830078, -10.760702133178711, 0.27835845947265625, 11.31741714477539, 22.35647964477539, 33.39554214477539, 44.43459701538086, 55.47365951538086, 66.51272583007812, 77.55178833007812, 88.59085083007812, 99.6299057006836, 110.6689682006836, 121.7080307006836, 132.74708557128906, 143.78614807128906, 154.82521057128906, 165.86427307128906, 176.90333557128906, 187.9423828125, 198.9814453125, 210.0205078125, 221.0595703125, 232.0986328125, 243.1376953125, 254.1767578125, 265.2158203125, 276.2548828125, 287.2939453125, 298.3330078125, 309.3720703125, 320.4111328125, 331.4501953125, 342.4892578125, 353.5283203125, 364.5673828125, 375.6064453125, 386.6455078125, 397.6845703125, 408.7236328125, 419.7626953125, 430.8017578125, 441.8408203125, 452.8798828125, 463.9189453125, 474.9580078125, 485.9970703125, 497.0361328125, 508.0751647949219, 519.1141967773438, 530.1532592773438, 541.1923217773438, 552.2313842773438, 563.2704467773438, 574.3095092773438, 585.3485717773438, 596.3876342773438, 607.4266967773438, 618.4657592773438, 629.5048217773438, 640.5438842773438, 651.5829467773438, 662.6220092773438, 673.6610717773438, 684.7001342773438]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 4.0, 2.0, 18.0, 9.0, 14.0, 11.0, 17.0, 18.0, 32.0, 28.0, 18.0, 21.0, 35.0, 27.0, 39.0, 33.0, 37.0, 44.0, 50.0, 30.0, 56.0, 52.0, 41.0, 32.0, 33.0, 36.0, 31.0, 30.0, 27.0, 26.0, 25.0, 18.0, 20.0, 13.0, 10.0, 17.0, 8.0, 6.0, 3.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-47.15910339355469, -45.7601318359375, -44.36116409301758, -42.96219253540039, -41.56322479248047, -40.16425323486328, -38.765281677246094, -37.36631393432617, -35.967342376708984, -34.5683708190918, -33.169403076171875, -31.770431518554688, -30.371461868286133, -28.972492218017578, -27.573522567749023, -26.17455291748047, -24.775583267211914, -23.37661361694336, -21.977643966674805, -20.57867431640625, -19.179702758789062, -17.780733108520508, -16.381763458251953, -14.982792854309082, -13.583823204040527, -12.184853553771973, -10.785882949829102, -9.386913299560547, -7.987943172454834, -6.588973045349121, -5.190003395080566, -3.7910327911376953, -2.3920631408691406, -0.9930931329727173, 0.40587687492370605, 1.8048467636108398, 3.2038168907165527, 4.602787017822266, 6.00175666809082, 7.400727272033691, 8.799696922302246, 10.1986665725708, 11.597637176513672, 12.996606826782227, 14.395576477050781, 15.794547080993652, 17.19351577758789, 18.592487335205078, 19.991456985473633, 21.390426635742188, 22.789396286010742, 24.188365936279297, 25.587337493896484, 26.98630714416504, 28.385276794433594, 29.78424835205078, 31.183216094970703, 32.58218765258789, 33.98115539550781, 35.380126953125, 36.77909469604492, 38.17806625366211, 39.57703399658203, 40.97600555419922, 42.374977111816406]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 7.0, 13.0, 10.0, 15.0, 13.0, 14.0, 24.0, 20.0, 17.0, 31.0, 25.0, 44.0, 35.0, 46.0, 52.0, 32.0, 44.0, 49.0, 39.0, 44.0, 42.0, 39.0, 31.0, 27.0, 44.0, 33.0, 37.0, 31.0, 27.0, 20.0, 19.0, 13.0, 14.0, 9.0, 6.0, 8.0, 7.0, 5.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.48828125, -4.340576171875, -4.19287109375, -4.045166015625, -3.8974609375, -3.749755859375, -3.60205078125, -3.454345703125, -3.306640625, -3.158935546875, -3.01123046875, -2.863525390625, -2.7158203125, -2.568115234375, -2.42041015625, -2.272705078125, -2.125, -1.977294921875, -1.82958984375, -1.681884765625, -1.5341796875, -1.386474609375, -1.23876953125, -1.091064453125, -0.943359375, -0.795654296875, -0.64794921875, -0.500244140625, -0.3525390625, -0.204833984375, -0.05712890625, 0.090576171875, 0.23828125, 0.385986328125, 0.53369140625, 0.681396484375, 0.8291015625, 0.976806640625, 1.12451171875, 1.272216796875, 1.419921875, 1.567626953125, 1.71533203125, 1.863037109375, 2.0107421875, 2.158447265625, 2.30615234375, 2.453857421875, 2.6015625, 2.749267578125, 2.89697265625, 3.044677734375, 3.1923828125, 3.340087890625, 3.48779296875, 3.635498046875, 3.783203125, 3.930908203125, 4.07861328125, 4.226318359375, 4.3740234375, 4.521728515625, 4.66943359375, 4.817138671875, 4.96484375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 5.0, 7.0, 6.0, 11.0, 23.0, 31.0, 34.0, 60.0, 63.0, 91.0, 137.0, 219.0, 363.0, 606.0, 1094.0, 2424.0, 6665.0, 24079.0, 136408.0, 1989108.0, 1869003.0, 128940.0, 23221.0, 6465.0, 2351.0, 1148.0, 610.0, 352.0, 235.0, 147.0, 120.0, 64.0, 53.0, 46.0, 17.0, 18.0, 17.0, 11.0, 3.0, 4.0, 6.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0], "bins": [-16.5, -16.0145263671875, -15.529052734375, -15.0435791015625, -14.55810546875, -14.0726318359375, -13.587158203125, -13.1016845703125, -12.6162109375, -12.1307373046875, -11.645263671875, -11.1597900390625, -10.67431640625, -10.1888427734375, -9.703369140625, -9.2178955078125, -8.732421875, -8.2469482421875, -7.761474609375, -7.2760009765625, -6.79052734375, -6.3050537109375, -5.819580078125, -5.3341064453125, -4.8486328125, -4.3631591796875, -3.877685546875, -3.3922119140625, -2.90673828125, -2.4212646484375, -1.935791015625, -1.4503173828125, -0.96484375, -0.4793701171875, 0.006103515625, 0.4915771484375, 0.97705078125, 1.4625244140625, 1.947998046875, 2.4334716796875, 2.9189453125, 3.4044189453125, 3.889892578125, 4.3753662109375, 4.86083984375, 5.3463134765625, 5.831787109375, 6.3172607421875, 6.802734375, 7.2882080078125, 7.773681640625, 8.2591552734375, 8.74462890625, 9.2301025390625, 9.715576171875, 10.2010498046875, 10.6865234375, 11.1719970703125, 11.657470703125, 12.1429443359375, 12.62841796875, 13.1138916015625, 13.599365234375, 14.0848388671875, 14.5703125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 6.0, 3.0, 10.0, 9.0, 18.0, 21.0, 42.0, 70.0, 97.0, 137.0, 227.0, 374.0, 641.0, 801.0, 568.0, 347.0, 238.0, 138.0, 110.0, 66.0, 47.0, 21.0, 26.0, 15.0, 10.0, 7.0, 6.0, 5.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.140625, -11.7138671875, -11.287109375, -10.8603515625, -10.43359375, -10.0068359375, -9.580078125, -9.1533203125, -8.7265625, -8.2998046875, -7.873046875, -7.4462890625, -7.01953125, -6.5927734375, -6.166015625, -5.7392578125, -5.3125, -4.8857421875, -4.458984375, -4.0322265625, -3.60546875, -3.1787109375, -2.751953125, -2.3251953125, -1.8984375, -1.4716796875, -1.044921875, -0.6181640625, -0.19140625, 0.2353515625, 0.662109375, 1.0888671875, 1.515625, 1.9423828125, 2.369140625, 2.7958984375, 3.22265625, 3.6494140625, 4.076171875, 4.5029296875, 4.9296875, 5.3564453125, 5.783203125, 6.2099609375, 6.63671875, 7.0634765625, 7.490234375, 7.9169921875, 8.34375, 8.7705078125, 9.197265625, 9.6240234375, 10.05078125, 10.4775390625, 10.904296875, 11.3310546875, 11.7578125, 12.1845703125, 12.611328125, 13.0380859375, 13.46484375, 13.8916015625, 14.318359375, 14.7451171875, 15.171875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 11.0, 6.0, 8.0, 7.0, 20.0, 39.0, 54.0, 104.0, 189.0, 391.0, 881.0, 2298.0, 8391.0, 52721.0, 862710.0, 3095471.0, 148267.0, 16667.0, 3736.0, 1275.0, 526.0, 241.0, 112.0, 61.0, 29.0, 22.0, 17.0, 5.0, 7.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.84375, -33.931884765625, -33.02001953125, -32.108154296875, -31.1962890625, -30.284423828125, -29.37255859375, -28.460693359375, -27.548828125, -26.636962890625, -25.72509765625, -24.813232421875, -23.9013671875, -22.989501953125, -22.07763671875, -21.165771484375, -20.25390625, -19.342041015625, -18.43017578125, -17.518310546875, -16.6064453125, -15.694580078125, -14.78271484375, -13.870849609375, -12.958984375, -12.047119140625, -11.13525390625, -10.223388671875, -9.3115234375, -8.399658203125, -7.48779296875, -6.575927734375, -5.6640625, -4.752197265625, -3.84033203125, -2.928466796875, -2.0166015625, -1.104736328125, -0.19287109375, 0.718994140625, 1.630859375, 2.542724609375, 3.45458984375, 4.366455078125, 5.2783203125, 6.190185546875, 7.10205078125, 8.013916015625, 8.92578125, 9.837646484375, 10.74951171875, 11.661376953125, 12.5732421875, 13.485107421875, 14.39697265625, 15.308837890625, 16.220703125, 17.132568359375, 18.04443359375, 18.956298828125, 19.8681640625, 20.780029296875, 21.69189453125, 22.603759765625, 23.515625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [2.0, 6.0, 15.0, 18.0, 35.0, 96.0, 130.0, 165.0, 175.0, 130.0, 130.0, 63.0, 33.0, 12.0, 8.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.355392456054688, -24.0870361328125, -20.818679809570312, -17.550325393676758, -14.28196907043457, -11.013612747192383, -7.745258331298828, -4.476902008056641, -1.2085456848144531, 2.059810161590576, 5.3281660079956055, 8.596521377563477, 11.864877700805664, 15.133234024047852, 18.401588439941406, 21.669944763183594, 24.93830108642578, 28.20665740966797, 31.475013732910156, 34.743370056152344, 38.01172637939453, 41.28008270263672, 44.54843521118164, 47.81679153442383, 51.085147857666016, 54.3535041809082, 57.62186050415039, 60.89021301269531, 64.1585693359375, 67.42692565917969, 70.69528198242188, 73.96363830566406, 77.23199462890625, 80.50035095214844, 83.76870727539062, 87.03706359863281, 90.305419921875, 93.57377624511719, 96.84213256835938, 100.11048889160156, 103.37884521484375, 106.64720153808594, 109.91555786132812, 113.18391418457031, 116.4522705078125, 119.72062683105469, 122.98898315429688, 126.25733947753906, 129.52569580078125, 132.79405212402344, 136.06240844726562, 139.3307647705078, 142.59912109375, 145.8674774169922, 149.13583374023438, 152.40419006347656, 155.6725311279297, 158.94088745117188, 162.20924377441406, 165.47760009765625, 168.74595642089844, 172.01431274414062, 175.2826690673828, 178.551025390625, 181.8193817138672]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 5.0, 4.0, 12.0, 7.0, 17.0, 12.0, 6.0, 21.0, 17.0, 27.0, 23.0, 36.0, 36.0, 35.0, 38.0, 48.0, 46.0, 44.0, 48.0, 55.0, 47.0, 37.0, 39.0, 32.0, 39.0, 34.0, 32.0, 32.0, 31.0, 31.0, 24.0, 18.0, 14.0, 13.0, 8.0, 7.0, 8.0, 4.0, 4.0, 2.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-42.333343505859375, -41.19486999511719, -40.056396484375, -38.91792297363281, -37.779449462890625, -36.64097595214844, -35.50250244140625, -34.36403274536133, -33.22555923461914, -32.08708572387695, -30.948612213134766, -29.810138702392578, -28.671667098999023, -27.533193588256836, -26.39472007751465, -25.25624656677246, -24.117773056030273, -22.979299545288086, -21.8408260345459, -20.702354431152344, -19.563880920410156, -18.42540740966797, -17.28693389892578, -16.148460388183594, -15.009987831115723, -13.871514320373535, -12.733041763305664, -11.594568252563477, -10.456094741821289, -9.317622184753418, -8.17914867401123, -7.040675640106201, -5.902202606201172, -4.763729572296143, -3.625256299972534, -2.486783027648926, -1.3483099937438965, -0.2098369598388672, 0.9286365509033203, 2.0671095848083496, 3.205582618713379, 4.344055652618408, 5.4825286865234375, 6.621002197265625, 7.759475231170654, 8.897948265075684, 10.036421775817871, 11.174894332885742, 12.31336784362793, 13.451841354370117, 14.590313911437988, 15.728787422180176, 16.867259979248047, 18.005733489990234, 19.144207000732422, 20.28268051147461, 21.421154022216797, 22.559627532958984, 23.698101043701172, 24.83657455444336, 25.975046157836914, 27.1135196685791, 28.25199317932129, 29.390466690063477, 30.52893829345703]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 13.0, 15.0, 15.0, 24.0, 14.0, 20.0, 27.0, 29.0, 34.0, 44.0, 32.0, 49.0, 39.0, 49.0, 51.0, 49.0, 46.0, 55.0, 44.0, 38.0, 35.0, 37.0, 26.0, 29.0, 28.0, 33.0, 26.0, 19.0, 17.0, 12.0, 11.0, 9.0, 6.0, 4.0, 1.0, 5.0, 4.0, 0.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.28948974609375, -4.1297607421875, -3.97003173828125, -3.810302734375, -3.65057373046875, -3.4908447265625, -3.33111572265625, -3.17138671875, -3.01165771484375, -2.8519287109375, -2.69219970703125, -2.532470703125, -2.37274169921875, -2.2130126953125, -2.05328369140625, -1.8935546875, -1.73382568359375, -1.5740966796875, -1.41436767578125, -1.254638671875, -1.09490966796875, -0.9351806640625, -0.77545166015625, -0.61572265625, -0.45599365234375, -0.2962646484375, -0.13653564453125, 0.023193359375, 0.18292236328125, 0.3426513671875, 0.50238037109375, 0.662109375, 0.82183837890625, 0.9815673828125, 1.14129638671875, 1.301025390625, 1.46075439453125, 1.6204833984375, 1.78021240234375, 1.93994140625, 2.09967041015625, 2.2593994140625, 2.41912841796875, 2.578857421875, 2.73858642578125, 2.8983154296875, 3.05804443359375, 3.2177734375, 3.37750244140625, 3.5372314453125, 3.69696044921875, 3.856689453125, 4.01641845703125, 4.1761474609375, 4.33587646484375, 4.49560546875, 4.65533447265625, 4.8150634765625, 4.97479248046875, 5.134521484375, 5.29425048828125, 5.4539794921875, 5.61370849609375, 5.7734375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 7.0, 10.0, 7.0, 17.0, 24.0, 39.0, 56.0, 84.0, 115.0, 178.0, 234.0, 397.0, 505.0, 821.0, 1313.0, 1983.0, 2945.0, 4402.0, 6827.0, 10695.0, 17071.0, 28016.0, 48060.0, 87986.0, 197711.0, 318661.0, 145463.0, 70661.0, 39941.0, 23580.0, 14344.0, 9179.0, 5884.0, 3860.0, 2431.0, 1668.0, 1127.0, 739.0, 480.0, 330.0, 234.0, 129.0, 102.0, 73.0, 47.0, 37.0, 27.0, 22.0, 7.0, 9.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.179443359375, -0.17371559143066406, -0.16798782348632812, -0.1622600555419922, -0.15653228759765625, -0.1508045196533203, -0.14507675170898438, -0.13934898376464844, -0.1336212158203125, -0.12789344787597656, -0.12216567993164062, -0.11643791198730469, -0.11071014404296875, -0.10498237609863281, -0.09925460815429688, -0.09352684020996094, -0.087799072265625, -0.08207130432128906, -0.07634353637695312, -0.07061576843261719, -0.06488800048828125, -0.05916023254394531, -0.053432464599609375, -0.04770469665527344, -0.0419769287109375, -0.03624916076660156, -0.030521392822265625, -0.024793624877929688, -0.01906585693359375, -0.013338088989257812, -0.007610321044921875, -0.0018825531005859375, 0.00384521484375, 0.009572982788085938, 0.015300750732421875, 0.021028518676757812, 0.02675628662109375, 0.03248405456542969, 0.038211822509765625, 0.04393959045410156, 0.0496673583984375, 0.05539512634277344, 0.061122894287109375, 0.06685066223144531, 0.07257843017578125, 0.07830619812011719, 0.08403396606445312, 0.08976173400878906, 0.095489501953125, 0.10121726989746094, 0.10694503784179688, 0.11267280578613281, 0.11840057373046875, 0.12412834167480469, 0.12985610961914062, 0.13558387756347656, 0.1413116455078125, 0.14703941345214844, 0.15276718139648438, 0.1584949493408203, 0.16422271728515625, 0.1699504852294922, 0.17567825317382812, 0.18140602111816406, 0.1871337890625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 1.0, 12.0, 7.0, 12.0, 14.0, 13.0, 18.0, 14.0, 18.0, 12.0, 30.0, 27.0, 34.0, 40.0, 33.0, 43.0, 44.0, 35.0, 40.0, 57.0, 1066.0, 42.0, 40.0, 43.0, 40.0, 35.0, 34.0, 31.0, 27.0, 27.0, 25.0, 18.0, 18.0, 7.0, 17.0, 15.0, 12.0, 7.0, 6.0, 5.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0], "bins": [-3.8359375, -3.735137939453125, -3.63433837890625, -3.533538818359375, -3.4327392578125, -3.331939697265625, -3.23114013671875, -3.130340576171875, -3.029541015625, -2.928741455078125, -2.82794189453125, -2.727142333984375, -2.6263427734375, -2.525543212890625, -2.42474365234375, -2.323944091796875, -2.22314453125, -2.122344970703125, -2.02154541015625, -1.920745849609375, -1.8199462890625, -1.719146728515625, -1.61834716796875, -1.517547607421875, -1.416748046875, -1.315948486328125, -1.21514892578125, -1.114349365234375, -1.0135498046875, -0.912750244140625, -0.81195068359375, -0.711151123046875, -0.6103515625, -0.509552001953125, -0.40875244140625, -0.307952880859375, -0.2071533203125, -0.106353759765625, -0.00555419921875, 0.095245361328125, 0.196044921875, 0.296844482421875, 0.39764404296875, 0.498443603515625, 0.5992431640625, 0.700042724609375, 0.80084228515625, 0.901641845703125, 1.00244140625, 1.103240966796875, 1.20404052734375, 1.304840087890625, 1.4056396484375, 1.506439208984375, 1.60723876953125, 1.708038330078125, 1.808837890625, 1.909637451171875, 2.01043701171875, 2.111236572265625, 2.2120361328125, 2.312835693359375, 2.41363525390625, 2.514434814453125, 2.615234375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 7.0, 5.0, 13.0, 18.0, 29.0, 48.0, 70.0, 115.0, 201.0, 294.0, 487.0, 881.0, 1402.0, 2270.0, 3889.0, 6312.0, 10522.0, 18061.0, 30635.0, 54454.0, 106646.0, 254652.0, 1341012.0, 121572.0, 61052.0, 33638.0, 19726.0, 11656.0, 6957.0, 4084.0, 2516.0, 1502.0, 932.0, 598.0, 329.0, 208.0, 133.0, 74.0, 47.0, 26.0, 20.0, 11.0, 9.0, 7.0, 3.0, 8.0, 1.0, 2.0, 3.0], "bins": [-0.1365966796875, -0.13291358947753906, -0.12923049926757812, -0.1255474090576172, -0.12186431884765625, -0.11818122863769531, -0.11449813842773438, -0.11081504821777344, -0.1071319580078125, -0.10344886779785156, -0.09976577758789062, -0.09608268737792969, -0.09239959716796875, -0.08871650695800781, -0.08503341674804688, -0.08135032653808594, -0.077667236328125, -0.07398414611816406, -0.07030105590820312, -0.06661796569824219, -0.06293487548828125, -0.05925178527832031, -0.055568695068359375, -0.05188560485839844, -0.0482025146484375, -0.04451942443847656, -0.040836334228515625, -0.03715324401855469, -0.03347015380859375, -0.029787063598632812, -0.026103973388671875, -0.022420883178710938, -0.01873779296875, -0.015054702758789062, -0.011371612548828125, -0.0076885223388671875, -0.00400543212890625, -0.0003223419189453125, 0.003360748291015625, 0.0070438385009765625, 0.0107269287109375, 0.014410018920898438, 0.018093109130859375, 0.021776199340820312, 0.02545928955078125, 0.029142379760742188, 0.032825469970703125, 0.03650856018066406, 0.040191650390625, 0.04387474060058594, 0.047557830810546875, 0.05124092102050781, 0.05492401123046875, 0.05860710144042969, 0.062290191650390625, 0.06597328186035156, 0.0696563720703125, 0.07333946228027344, 0.07702255249023438, 0.08070564270019531, 0.08438873291015625, 0.08807182312011719, 0.09175491333007812, 0.09543800354003906, 0.09912109375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 7.0, 4.0, 4.0, 11.0, 9.0, 19.0, 23.0, 26.0, 27.0, 29.0, 39.0, 33.0, 53.0, 53.0, 67.0, 55.0, 51.0, 66.0, 70.0, 53.0, 43.0, 46.0, 37.0, 31.0, 21.0, 26.0, 18.0, 19.0, 17.0, 7.0, 10.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.817413330078125e-05, -5.6619755923748016e-05, -5.506537854671478e-05, -5.351100116968155e-05, -5.1956623792648315e-05, -5.040224641561508e-05, -4.884786903858185e-05, -4.7293491661548615e-05, -4.573911428451538e-05, -4.418473690748215e-05, -4.2630359530448914e-05, -4.107598215341568e-05, -3.9521604776382446e-05, -3.796722739934921e-05, -3.641285002231598e-05, -3.4858472645282745e-05, -3.330409526824951e-05, -3.174971789121628e-05, -3.0195340514183044e-05, -2.864096313714981e-05, -2.7086585760116577e-05, -2.5532208383083344e-05, -2.397783100605011e-05, -2.2423453629016876e-05, -2.0869076251983643e-05, -1.931469887495041e-05, -1.7760321497917175e-05, -1.620594412088394e-05, -1.4651566743850708e-05, -1.3097189366817474e-05, -1.154281198978424e-05, -9.988434612751007e-06, -8.434057235717773e-06, -6.87967985868454e-06, -5.325302481651306e-06, -3.7709251046180725e-06, -2.216547727584839e-06, -6.621703505516052e-07, 8.922070264816284e-07, 2.446584403514862e-06, 4.000961780548096e-06, 5.555339157581329e-06, 7.109716534614563e-06, 8.664093911647797e-06, 1.021847128868103e-05, 1.1772848665714264e-05, 1.3327226042747498e-05, 1.4881603419780731e-05, 1.6435980796813965e-05, 1.79903581738472e-05, 1.9544735550880432e-05, 2.1099112927913666e-05, 2.26534903049469e-05, 2.4207867681980133e-05, 2.5762245059013367e-05, 2.73166224360466e-05, 2.8870999813079834e-05, 3.0425377190113068e-05, 3.19797545671463e-05, 3.3534131944179535e-05, 3.508850932121277e-05, 3.6642886698246e-05, 3.8197264075279236e-05, 3.975164145231247e-05, 4.13060188293457e-05]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 5.0, 1.0, 5.0, 10.0, 4.0, 8.0, 18.0, 15.0, 19.0, 29.0, 27.0, 35.0, 48.0, 74.0, 135.0, 410.0, 1807.0, 31345.0, 701802.0, 302274.0, 8959.0, 892.0, 252.0, 110.0, 58.0, 43.0, 33.0, 24.0, 41.0, 15.0, 12.0, 7.0, 11.0, 8.0, 5.0, 5.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0007033348083496094, -0.0006780475378036499, -0.0006527602672576904, -0.000627472996711731, -0.0006021857261657715, -0.000576898455619812, -0.0005516111850738525, -0.0005263239145278931, -0.0005010366439819336, -0.0004757493734359741, -0.00045046210289001465, -0.0004251748323440552, -0.0003998875617980957, -0.00037460029125213623, -0.00034931302070617676, -0.0003240257501602173, -0.0002987384796142578, -0.00027345120906829834, -0.00024816393852233887, -0.0002228766679763794, -0.00019758939743041992, -0.00017230212688446045, -0.00014701485633850098, -0.0001217275857925415, -9.644031524658203e-05, -7.115304470062256e-05, -4.5865774154663086e-05, -2.0578503608703613e-05, 4.708766937255859e-06, 2.9996037483215332e-05, 5.5283308029174805e-05, 8.057057857513428e-05, 0.00010585784912109375, 0.00013114511966705322, 0.0001564323902130127, 0.00018171966075897217, 0.00020700693130493164, 0.0002322942018508911, 0.0002575814723968506, 0.00028286874294281006, 0.00030815601348876953, 0.000333443284034729, 0.0003587305545806885, 0.00038401782512664795, 0.0004093050956726074, 0.0004345923662185669, 0.00045987963676452637, 0.00048516690731048584, 0.0005104541778564453, 0.0005357414484024048, 0.0005610287189483643, 0.0005863159894943237, 0.0006116032600402832, 0.0006368905305862427, 0.0006621778011322021, 0.0006874650716781616, 0.0007127523422241211, 0.0007380396127700806, 0.00076332688331604, 0.0007886141538619995, 0.000813901424407959, 0.0008391886949539185, 0.0008644759654998779, 0.0008897632360458374, 0.0009150505065917969]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 10.0, 19.0, 34.0, 88.0, 156.0, 258.0, 233.0, 134.0, 50.0, 16.0, 11.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.847589687211439e-05, -3.4081738704117015e-05, -2.968758053611964e-05, -2.5293424187111668e-05, -2.0899266019114293e-05, -1.6505107851116918e-05, -1.2110951502108946e-05, -7.716793334111571e-06, -3.322635166114196e-06, 1.071522547135828e-06, 5.465680260385852e-06, 9.859837518888526e-06, 1.42539956868859e-05, 1.8648153854883276e-05, 2.3042310203891248e-05, 2.7436468371888623e-05, 3.1830626539886e-05, 3.622478470788337e-05, 4.061894287588075e-05, 4.5013097405899316e-05, 4.94072592118755e-05, 5.3801413741894066e-05, 5.819557190989144e-05, 6.258973007788882e-05, 6.6983891883865e-05, 7.137804641388357e-05, 7.577220821985975e-05, 8.016636274987832e-05, 8.45605245558545e-05, 8.895467908587307e-05, 9.334883361589164e-05, 9.774299542186782e-05, 0.00010213714267592877, 0.00010653129720594734, 0.00011092545901192352, 0.00011531961354194209, 0.00011971377534791827, 0.00012410792987793684, 0.0001285020844079554, 0.00013289623893797398, 0.00013729040801990777, 0.00014168456254992634, 0.0001460787170799449, 0.0001504728861618787, 0.00015486704069189727, 0.00015926119522191584, 0.0001636553497519344, 0.00016804950428195298, 0.00017244365881197155, 0.0001768378133419901, 0.00018123196787200868, 0.00018562613695394248, 0.00019002029148396105, 0.00019441444601397961, 0.00019880860054399818, 0.00020320276962593198, 0.00020759692415595055, 0.00021199107868596911, 0.00021638523321598768, 0.00022077940229792148, 0.00022517355682794005, 0.00022956771135795861, 0.00023396186588797718, 0.00023835603496991098, 0.00024275018949992955]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 6.0, 11.0, 19.0, 17.0, 15.0, 24.0, 23.0, 23.0, 18.0, 29.0, 35.0, 39.0, 28.0, 19.0, 55.0, 48.0, 40.0, 40.0, 51.0, 39.0, 34.0, 26.0, 34.0, 37.0, 30.0, 30.0, 27.0, 26.0, 30.0, 26.0, 12.0, 15.0, 7.0, 13.0, 12.0, 11.0, 9.0, 5.0, 4.0, 1.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5212764739990234e-05, -2.442300319671631e-05, -2.3633241653442383e-05, -2.2843480110168457e-05, -2.205371856689453e-05, -2.1263957023620605e-05, -2.047419548034668e-05, -1.9684433937072754e-05, -1.8894672393798828e-05, -1.8104910850524902e-05, -1.7315149307250977e-05, -1.652538776397705e-05, -1.5735626220703125e-05, -1.49458646774292e-05, -1.4156103134155273e-05, -1.3366341590881348e-05, -1.2576580047607422e-05, -1.1786818504333496e-05, -1.099705696105957e-05, -1.0207295417785645e-05, -9.417533874511719e-06, -8.627772331237793e-06, -7.838010787963867e-06, -7.048249244689941e-06, -6.258487701416016e-06, -5.46872615814209e-06, -4.678964614868164e-06, -3.889203071594238e-06, -3.0994415283203125e-06, -2.3096799850463867e-06, -1.519918441772461e-06, -7.301568984985352e-07, 5.960464477539063e-08, 8.493661880493164e-07, 1.6391277313232422e-06, 2.428889274597168e-06, 3.2186508178710938e-06, 4.0084123611450195e-06, 4.798173904418945e-06, 5.587935447692871e-06, 6.377696990966797e-06, 7.167458534240723e-06, 7.957220077514648e-06, 8.746981620788574e-06, 9.5367431640625e-06, 1.0326504707336426e-05, 1.1116266250610352e-05, 1.1906027793884277e-05, 1.2695789337158203e-05, 1.3485550880432129e-05, 1.4275312423706055e-05, 1.506507396697998e-05, 1.5854835510253906e-05, 1.6644597053527832e-05, 1.7434358596801758e-05, 1.8224120140075684e-05, 1.901388168334961e-05, 1.9803643226623535e-05, 2.059340476989746e-05, 2.1383166313171387e-05, 2.2172927856445312e-05, 2.2962689399719238e-05, 2.3752450942993164e-05, 2.454221248626709e-05, 2.5331974029541016e-05]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 13.0, 15.0, 15.0, 24.0, 14.0, 20.0, 27.0, 29.0, 34.0, 44.0, 32.0, 49.0, 39.0, 49.0, 51.0, 49.0, 46.0, 55.0, 44.0, 38.0, 35.0, 37.0, 26.0, 29.0, 28.0, 33.0, 26.0, 19.0, 17.0, 12.0, 11.0, 9.0, 6.0, 4.0, 1.0, 5.0, 4.0, 0.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.28948974609375, -4.1297607421875, -3.97003173828125, -3.810302734375, -3.65057373046875, -3.4908447265625, -3.33111572265625, -3.17138671875, -3.01165771484375, -2.8519287109375, -2.69219970703125, -2.532470703125, -2.37274169921875, -2.2130126953125, -2.05328369140625, -1.8935546875, -1.73382568359375, -1.5740966796875, -1.41436767578125, -1.254638671875, -1.09490966796875, -0.9351806640625, -0.77545166015625, -0.61572265625, -0.45599365234375, -0.2962646484375, -0.13653564453125, 0.023193359375, 0.18292236328125, 0.3426513671875, 0.50238037109375, 0.662109375, 0.82183837890625, 0.9815673828125, 1.14129638671875, 1.301025390625, 1.46075439453125, 1.6204833984375, 1.78021240234375, 1.93994140625, 2.09967041015625, 2.2593994140625, 2.41912841796875, 2.578857421875, 2.73858642578125, 2.8983154296875, 3.05804443359375, 3.2177734375, 3.37750244140625, 3.5372314453125, 3.69696044921875, 3.856689453125, 4.01641845703125, 4.1761474609375, 4.33587646484375, 4.49560546875, 4.65533447265625, 4.8150634765625, 4.97479248046875, 5.134521484375, 5.29425048828125, 5.4539794921875, 5.61370849609375, 5.7734375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 8.0, 8.0, 15.0, 32.0, 42.0, 61.0, 87.0, 137.0, 261.0, 493.0, 889.0, 1781.0, 3720.0, 8184.0, 20411.0, 55810.0, 242920.0, 578874.0, 85191.0, 28612.0, 11416.0, 4787.0, 2283.0, 1096.0, 580.0, 326.0, 171.0, 134.0, 79.0, 36.0, 33.0, 20.0, 15.0, 11.0, 2.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.5809326171875, -8.286865234375, -7.9927978515625, -7.69873046875, -7.4046630859375, -7.110595703125, -6.8165283203125, -6.5224609375, -6.2283935546875, -5.934326171875, -5.6402587890625, -5.34619140625, -5.0521240234375, -4.758056640625, -4.4639892578125, -4.169921875, -3.8758544921875, -3.581787109375, -3.2877197265625, -2.99365234375, -2.6995849609375, -2.405517578125, -2.1114501953125, -1.8173828125, -1.5233154296875, -1.229248046875, -0.9351806640625, -0.64111328125, -0.3470458984375, -0.052978515625, 0.2410888671875, 0.53515625, 0.8292236328125, 1.123291015625, 1.4173583984375, 1.71142578125, 2.0054931640625, 2.299560546875, 2.5936279296875, 2.8876953125, 3.1817626953125, 3.475830078125, 3.7698974609375, 4.06396484375, 4.3580322265625, 4.652099609375, 4.9461669921875, 5.240234375, 5.5343017578125, 5.828369140625, 6.1224365234375, 6.41650390625, 6.7105712890625, 7.004638671875, 7.2987060546875, 7.5927734375, 7.8868408203125, 8.180908203125, 8.4749755859375, 8.76904296875, 9.0631103515625, 9.357177734375, 9.6512451171875, 9.9453125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 3.0, 3.0, 2.0, 4.0, 10.0, 5.0, 7.0, 12.0, 11.0, 28.0, 21.0, 19.0, 34.0, 41.0, 40.0, 45.0, 58.0, 64.0, 105.0, 116.0, 269.0, 1542.0, 110.0, 86.0, 78.0, 60.0, 51.0, 38.0, 44.0, 22.0, 23.0, 16.0, 20.0, 17.0, 15.0, 11.0, 8.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.25, -18.700439453125, -18.15087890625, -17.601318359375, -17.0517578125, -16.502197265625, -15.95263671875, -15.403076171875, -14.853515625, -14.303955078125, -13.75439453125, -13.204833984375, -12.6552734375, -12.105712890625, -11.55615234375, -11.006591796875, -10.45703125, -9.907470703125, -9.35791015625, -8.808349609375, -8.2587890625, -7.709228515625, -7.15966796875, -6.610107421875, -6.060546875, -5.510986328125, -4.96142578125, -4.411865234375, -3.8623046875, -3.312744140625, -2.76318359375, -2.213623046875, -1.6640625, -1.114501953125, -0.56494140625, -0.015380859375, 0.5341796875, 1.083740234375, 1.63330078125, 2.182861328125, 2.732421875, 3.281982421875, 3.83154296875, 4.381103515625, 4.9306640625, 5.480224609375, 6.02978515625, 6.579345703125, 7.12890625, 7.678466796875, 8.22802734375, 8.777587890625, 9.3271484375, 9.876708984375, 10.42626953125, 10.975830078125, 11.525390625, 12.074951171875, 12.62451171875, 13.174072265625, 13.7236328125, 14.273193359375, 14.82275390625, 15.372314453125, 15.921875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 1.0, 7.0, 8.0, 15.0, 11.0, 13.0, 27.0, 28.0, 38.0, 59.0, 76.0, 116.0, 162.0, 311.0, 730.0, 3116.0, 36942.0, 2732105.0, 356503.0, 12536.0, 1598.0, 529.0, 267.0, 133.0, 91.0, 73.0, 58.0, 39.0, 33.0, 22.0, 12.0, 5.0, 10.0, 8.0, 7.0, 7.0, 2.0, 1.0, 1.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.9375, -34.73193359375, -33.5263671875, -32.32080078125, -31.115234375, -29.90966796875, -28.7041015625, -27.49853515625, -26.29296875, -25.08740234375, -23.8818359375, -22.67626953125, -21.470703125, -20.26513671875, -19.0595703125, -17.85400390625, -16.6484375, -15.44287109375, -14.2373046875, -13.03173828125, -11.826171875, -10.62060546875, -9.4150390625, -8.20947265625, -7.00390625, -5.79833984375, -4.5927734375, -3.38720703125, -2.181640625, -0.97607421875, 0.2294921875, 1.43505859375, 2.640625, 3.84619140625, 5.0517578125, 6.25732421875, 7.462890625, 8.66845703125, 9.8740234375, 11.07958984375, 12.28515625, 13.49072265625, 14.6962890625, 15.90185546875, 17.107421875, 18.31298828125, 19.5185546875, 20.72412109375, 21.9296875, 23.13525390625, 24.3408203125, 25.54638671875, 26.751953125, 27.95751953125, 29.1630859375, 30.36865234375, 31.57421875, 32.77978515625, 33.9853515625, 35.19091796875, 36.396484375, 37.60205078125, 38.8076171875, 40.01318359375, 41.21875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 8.0, 49.0, 252.0, 460.0, 210.0, 35.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.912212371826172, -21.15459442138672, -16.3969783782959, -11.639361381530762, -6.881744384765625, -2.124126434326172, 2.6334896087646484, 7.391105651855469, 12.148723602294922, 16.906341552734375, 21.663957595825195, 26.421573638916016, 31.17919158935547, 35.93680953979492, 40.694427490234375, 45.45204162597656, 50.209659576416016, 54.96727752685547, 59.724891662597656, 64.48251342773438, 69.24012756347656, 73.99774169921875, 78.75536346435547, 83.51297760009766, 88.27059936523438, 93.02821350097656, 97.78583526611328, 102.54344940185547, 107.30107116699219, 112.05868530273438, 116.81629943847656, 121.57391357421875, 126.33154296875, 131.0891571044922, 135.84677124023438, 140.60440063476562, 145.3620147705078, 150.11962890625, 154.8772430419922, 159.63485717773438, 164.39248657226562, 169.1501007080078, 173.90771484375, 178.66534423828125, 183.42295837402344, 188.18057250976562, 192.9381866455078, 197.69580078125, 202.4534149169922, 207.21102905273438, 211.96864318847656, 216.7262725830078, 221.48388671875, 226.2415008544922, 230.99911499023438, 235.75672912597656, 240.51434326171875, 245.27195739746094, 250.02957153320312, 254.78720092773438, 259.5447998046875, 264.30242919921875, 269.06005859375, 273.8176574707031, 278.5752868652344]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 8.0, 3.0, 12.0, 9.0, 11.0, 12.0, 12.0, 24.0, 21.0, 27.0, 22.0, 22.0, 29.0, 34.0, 39.0, 40.0, 44.0, 39.0, 32.0, 52.0, 34.0, 39.0, 39.0, 45.0, 35.0, 37.0, 27.0, 28.0, 25.0, 28.0, 25.0, 24.0, 18.0, 16.0, 7.0, 7.0, 13.0, 11.0, 12.0, 9.0, 6.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-41.16782760620117, -39.84314727783203, -38.518463134765625, -37.193782806396484, -35.869102478027344, -34.54441833496094, -33.2197380065918, -31.895055770874023, -30.57037353515625, -29.245691299438477, -27.921009063720703, -26.596328735351562, -25.27164649963379, -23.946964263916016, -22.622283935546875, -21.2976016998291, -19.972919464111328, -18.648237228393555, -17.32355499267578, -15.99887466430664, -14.674192428588867, -13.349510192871094, -12.024828910827637, -10.70014762878418, -9.375465393066406, -8.050783157348633, -6.726101875305176, -5.4014201164245605, -4.076738357543945, -2.75205659866333, -1.4273748397827148, -0.10269355773925781, 1.22198486328125, 2.5466666221618652, 3.8713483810424805, 5.196030139923096, 6.520711898803711, 7.845393657684326, 9.170075416564941, 10.494756698608398, 11.819438934326172, 13.144121170043945, 14.468802452087402, 15.79348373413086, 17.118165969848633, 18.442848205566406, 19.767528533935547, 21.09221076965332, 22.416893005371094, 23.741575241088867, 25.06625747680664, 26.39093780517578, 27.715620040893555, 29.040302276611328, 30.36498260498047, 31.689664840698242, 33.014347076416016, 34.339027404785156, 35.66371154785156, 36.9883918762207, 38.313072204589844, 39.63775634765625, 40.96243667602539, 42.28711700439453, 43.61180114746094]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 6.0, 13.0, 9.0, 16.0, 24.0, 24.0, 18.0, 28.0, 24.0, 41.0, 40.0, 41.0, 44.0, 44.0, 44.0, 41.0, 46.0, 52.0, 45.0, 40.0, 42.0, 38.0, 32.0, 30.0, 27.0, 37.0, 27.0, 22.0, 14.0, 28.0, 12.0, 7.0, 5.0, 14.0, 5.0, 3.0, 5.0, 2.0, 6.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.38385009765625, -4.2208251953125, -4.05780029296875, -3.894775390625, -3.73175048828125, -3.5687255859375, -3.40570068359375, -3.24267578125, -3.07965087890625, -2.9166259765625, -2.75360107421875, -2.590576171875, -2.42755126953125, -2.2645263671875, -2.10150146484375, -1.9384765625, -1.77545166015625, -1.6124267578125, -1.44940185546875, -1.286376953125, -1.12335205078125, -0.9603271484375, -0.79730224609375, -0.63427734375, -0.47125244140625, -0.3082275390625, -0.14520263671875, 0.017822265625, 0.18084716796875, 0.3438720703125, 0.50689697265625, 0.669921875, 0.83294677734375, 0.9959716796875, 1.15899658203125, 1.322021484375, 1.48504638671875, 1.6480712890625, 1.81109619140625, 1.97412109375, 2.13714599609375, 2.3001708984375, 2.46319580078125, 2.626220703125, 2.78924560546875, 2.9522705078125, 3.11529541015625, 3.2783203125, 3.44134521484375, 3.6043701171875, 3.76739501953125, 3.930419921875, 4.09344482421875, 4.2564697265625, 4.41949462890625, 4.58251953125, 4.74554443359375, 4.9085693359375, 5.07159423828125, 5.234619140625, 5.39764404296875, 5.5606689453125, 5.72369384765625, 5.88671875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 11.0, 6.0, 16.0, 32.0, 36.0, 57.0, 86.0, 154.0, 255.0, 526.0, 1178.0, 3119.0, 9427.0, 42049.0, 354452.0, 3159282.0, 548661.0, 56511.0, 11826.0, 3645.0, 1477.0, 633.0, 342.0, 194.0, 96.0, 57.0, 42.0, 36.0, 20.0, 11.0, 13.0, 7.0, 7.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-17.4375, -16.918212890625, -16.39892578125, -15.879638671875, -15.3603515625, -14.841064453125, -14.32177734375, -13.802490234375, -13.283203125, -12.763916015625, -12.24462890625, -11.725341796875, -11.2060546875, -10.686767578125, -10.16748046875, -9.648193359375, -9.12890625, -8.609619140625, -8.09033203125, -7.571044921875, -7.0517578125, -6.532470703125, -6.01318359375, -5.493896484375, -4.974609375, -4.455322265625, -3.93603515625, -3.416748046875, -2.8974609375, -2.378173828125, -1.85888671875, -1.339599609375, -0.8203125, -0.301025390625, 0.21826171875, 0.737548828125, 1.2568359375, 1.776123046875, 2.29541015625, 2.814697265625, 3.333984375, 3.853271484375, 4.37255859375, 4.891845703125, 5.4111328125, 5.930419921875, 6.44970703125, 6.968994140625, 7.48828125, 8.007568359375, 8.52685546875, 9.046142578125, 9.5654296875, 10.084716796875, 10.60400390625, 11.123291015625, 11.642578125, 12.161865234375, 12.68115234375, 13.200439453125, 13.7197265625, 14.239013671875, 14.75830078125, 15.277587890625, 15.796875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 8.0, 14.0, 25.0, 21.0, 37.0, 47.0, 51.0, 87.0, 118.0, 156.0, 227.0, 313.0, 427.0, 550.0, 548.0, 400.0, 272.0, 186.0, 147.0, 105.0, 92.0, 62.0, 41.0, 30.0, 23.0, 19.0, 15.0, 7.0, 6.0, 5.0, 3.0, 7.0, 1.0, 1.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3046875, -9.9715576171875, -9.638427734375, -9.3052978515625, -8.97216796875, -8.6390380859375, -8.305908203125, -7.9727783203125, -7.6396484375, -7.3065185546875, -6.973388671875, -6.6402587890625, -6.30712890625, -5.9739990234375, -5.640869140625, -5.3077392578125, -4.974609375, -4.6414794921875, -4.308349609375, -3.9752197265625, -3.64208984375, -3.3089599609375, -2.975830078125, -2.6427001953125, -2.3095703125, -1.9764404296875, -1.643310546875, -1.3101806640625, -0.97705078125, -0.6439208984375, -0.310791015625, 0.0223388671875, 0.35546875, 0.6885986328125, 1.021728515625, 1.3548583984375, 1.68798828125, 2.0211181640625, 2.354248046875, 2.6873779296875, 3.0205078125, 3.3536376953125, 3.686767578125, 4.0198974609375, 4.35302734375, 4.6861572265625, 5.019287109375, 5.3524169921875, 5.685546875, 6.0186767578125, 6.351806640625, 6.6849365234375, 7.01806640625, 7.3511962890625, 7.684326171875, 8.0174560546875, 8.3505859375, 8.6837158203125, 9.016845703125, 9.3499755859375, 9.68310546875, 10.0162353515625, 10.349365234375, 10.6824951171875, 11.015625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 4.0, 3.0, 1.0, 5.0, 9.0, 8.0, 11.0, 14.0, 18.0, 26.0, 33.0, 43.0, 102.0, 118.0, 215.0, 410.0, 1164.0, 4262.0, 26937.0, 356218.0, 3467679.0, 306452.0, 24526.0, 3936.0, 1059.0, 456.0, 217.0, 118.0, 68.0, 57.0, 34.0, 24.0, 20.0, 8.0, 8.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.515625, -28.547119140625, -27.57861328125, -26.610107421875, -25.6416015625, -24.673095703125, -23.70458984375, -22.736083984375, -21.767578125, -20.799072265625, -19.83056640625, -18.862060546875, -17.8935546875, -16.925048828125, -15.95654296875, -14.988037109375, -14.01953125, -13.051025390625, -12.08251953125, -11.114013671875, -10.1455078125, -9.177001953125, -8.20849609375, -7.239990234375, -6.271484375, -5.302978515625, -4.33447265625, -3.365966796875, -2.3974609375, -1.428955078125, -0.46044921875, 0.508056640625, 1.4765625, 2.445068359375, 3.41357421875, 4.382080078125, 5.3505859375, 6.319091796875, 7.28759765625, 8.256103515625, 9.224609375, 10.193115234375, 11.16162109375, 12.130126953125, 13.0986328125, 14.067138671875, 15.03564453125, 16.004150390625, 16.97265625, 17.941162109375, 18.90966796875, 19.878173828125, 20.8466796875, 21.815185546875, 22.78369140625, 23.752197265625, 24.720703125, 25.689208984375, 26.65771484375, 27.626220703125, 28.5947265625, 29.563232421875, 30.53173828125, 31.500244140625, 32.46875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 16.0, 39.0, 67.0, 127.0, 178.0, 188.0, 168.0, 102.0, 66.0, 32.0, 13.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.212127685546875, -53.722389221191406, -50.23265075683594, -46.74291229248047, -43.253173828125, -39.76343536376953, -36.27370071411133, -32.78396224975586, -29.29422378540039, -25.804485321044922, -22.314746856689453, -18.825010299682617, -15.335271835327148, -11.84553337097168, -8.355796813964844, -4.866058349609375, -1.3763198852539062, 2.1134181022644043, 5.603156089782715, 9.092893600463867, 12.582632064819336, 16.072370529174805, 19.56210708618164, 23.05184555053711, 26.541584014892578, 30.031322479248047, 33.521060943603516, 37.01079559326172, 40.50053405761719, 43.990272521972656, 47.480010986328125, 50.969749450683594, 54.45948791503906, 57.94922637939453, 61.43896484375, 64.92870330810547, 68.41844177246094, 71.9081802368164, 75.39791870117188, 78.88764953613281, 82.37739562988281, 85.86713409423828, 89.35687255859375, 92.84661102294922, 96.33634948730469, 99.82608795166016, 103.31582641601562, 106.80555725097656, 110.29529571533203, 113.7850341796875, 117.27477264404297, 120.76451110839844, 124.2542495727539, 127.74398803710938, 131.2337188720703, 134.7234649658203, 138.21319580078125, 141.7029266357422, 145.1926727294922, 148.68240356445312, 152.17214965820312, 155.66188049316406, 159.15162658691406, 162.641357421875, 166.131103515625]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 5.0, 8.0, 10.0, 10.0, 10.0, 17.0, 17.0, 17.0, 21.0, 23.0, 24.0, 28.0, 38.0, 38.0, 35.0, 37.0, 31.0, 40.0, 38.0, 39.0, 37.0, 40.0, 38.0, 39.0, 31.0, 29.0, 34.0, 33.0, 30.0, 26.0, 22.0, 23.0, 10.0, 15.0, 9.0, 16.0, 14.0, 7.0, 13.0, 8.0, 8.0, 9.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.246986389160156, -27.224376678466797, -26.201766967773438, -25.179157257080078, -24.15654754638672, -23.13393783569336, -22.111330032348633, -21.088720321655273, -20.066110610961914, -19.043500900268555, -18.020891189575195, -16.998281478881836, -15.975672721862793, -14.953063011169434, -13.93045425415039, -12.907844543457031, -11.885234832763672, -10.862625122070312, -9.840015411376953, -8.81740665435791, -7.794796943664551, -6.772187232971191, -5.74957799911499, -4.726968765258789, -3.7043590545654297, -2.6817495822906494, -1.6591401100158691, -0.6365306377410889, 0.3860788345336914, 1.4086885452270508, 2.431297779083252, 3.453907012939453, 4.4765167236328125, 5.499126434326172, 6.521735668182373, 7.544344902038574, 8.566954612731934, 9.589564323425293, 10.612173080444336, 11.634782791137695, 12.657392501831055, 13.680002212524414, 14.702611923217773, 15.725220680236816, 16.74782943725586, 17.77043914794922, 18.793048858642578, 19.815658569335938, 20.838268280029297, 21.860877990722656, 22.883487701416016, 23.906097412109375, 24.928707122802734, 25.951316833496094, 26.97392463684082, 27.99653434753418, 29.01914405822754, 30.0417537689209, 31.064363479614258, 32.086971282958984, 33.109580993652344, 34.1321907043457, 35.15480041503906, 36.17741012573242, 37.20001983642578]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 8.0, 10.0, 13.0, 17.0, 18.0, 14.0, 20.0, 25.0, 37.0, 49.0, 34.0, 38.0, 46.0, 44.0, 46.0, 48.0, 48.0, 44.0, 48.0, 45.0, 37.0, 54.0, 32.0, 40.0, 35.0, 21.0, 22.0, 24.0, 21.0, 14.0, 6.0, 10.0, 6.0, 2.0, 5.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0078125, -4.83251953125, -4.6572265625, -4.48193359375, -4.306640625, -4.13134765625, -3.9560546875, -3.78076171875, -3.60546875, -3.43017578125, -3.2548828125, -3.07958984375, -2.904296875, -2.72900390625, -2.5537109375, -2.37841796875, -2.203125, -2.02783203125, -1.8525390625, -1.67724609375, -1.501953125, -1.32666015625, -1.1513671875, -0.97607421875, -0.80078125, -0.62548828125, -0.4501953125, -0.27490234375, -0.099609375, 0.07568359375, 0.2509765625, 0.42626953125, 0.6015625, 0.77685546875, 0.9521484375, 1.12744140625, 1.302734375, 1.47802734375, 1.6533203125, 1.82861328125, 2.00390625, 2.17919921875, 2.3544921875, 2.52978515625, 2.705078125, 2.88037109375, 3.0556640625, 3.23095703125, 3.40625, 3.58154296875, 3.7568359375, 3.93212890625, 4.107421875, 4.28271484375, 4.4580078125, 4.63330078125, 4.80859375, 4.98388671875, 5.1591796875, 5.33447265625, 5.509765625, 5.68505859375, 5.8603515625, 6.03564453125, 6.2109375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 14.0, 16.0, 24.0, 26.0, 35.0, 59.0, 105.0, 146.0, 198.0, 300.0, 480.0, 754.0, 1155.0, 1739.0, 2644.0, 4034.0, 6275.0, 9340.0, 14454.0, 23424.0, 37426.0, 63245.0, 117009.0, 255787.0, 240895.0, 110011.0, 60016.0, 36389.0, 22185.0, 13904.0, 9245.0, 5880.0, 3903.0, 2458.0, 1701.0, 1086.0, 745.0, 484.0, 297.0, 218.0, 129.0, 107.0, 74.0, 46.0, 32.0, 14.0, 17.0, 9.0, 8.0, 2.0, 6.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.18505859375, -0.179443359375, -0.173828125, -0.168212890625, -0.16259765625, -0.156982421875, -0.1513671875, -0.145751953125, -0.14013671875, -0.134521484375, -0.12890625, -0.123291015625, -0.11767578125, -0.112060546875, -0.1064453125, -0.100830078125, -0.09521484375, -0.089599609375, -0.083984375, -0.078369140625, -0.07275390625, -0.067138671875, -0.0615234375, -0.055908203125, -0.05029296875, -0.044677734375, -0.0390625, -0.033447265625, -0.02783203125, -0.022216796875, -0.0166015625, -0.010986328125, -0.00537109375, 0.000244140625, 0.005859375, 0.011474609375, 0.01708984375, 0.022705078125, 0.0283203125, 0.033935546875, 0.03955078125, 0.045166015625, 0.05078125, 0.056396484375, 0.06201171875, 0.067626953125, 0.0732421875, 0.078857421875, 0.08447265625, 0.090087890625, 0.095703125, 0.101318359375, 0.10693359375, 0.112548828125, 0.1181640625, 0.123779296875, 0.12939453125, 0.135009765625, 0.140625, 0.146240234375, 0.15185546875, 0.157470703125, 0.1630859375, 0.168701171875, 0.17431640625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 7.0, 3.0, 9.0, 7.0, 9.0, 8.0, 17.0, 17.0, 11.0, 12.0, 18.0, 16.0, 23.0, 30.0, 31.0, 39.0, 43.0, 31.0, 41.0, 37.0, 40.0, 43.0, 1070.0, 38.0, 34.0, 38.0, 37.0, 37.0, 32.0, 36.0, 31.0, 18.0, 28.0, 18.0, 25.0, 12.0, 17.0, 6.0, 9.0, 14.0, 4.0, 12.0, 6.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-3.017578125, -2.923431396484375, -2.82928466796875, -2.735137939453125, -2.6409912109375, -2.546844482421875, -2.45269775390625, -2.358551025390625, -2.264404296875, -2.170257568359375, -2.07611083984375, -1.981964111328125, -1.8878173828125, -1.793670654296875, -1.69952392578125, -1.605377197265625, -1.51123046875, -1.417083740234375, -1.32293701171875, -1.228790283203125, -1.1346435546875, -1.040496826171875, -0.94635009765625, -0.852203369140625, -0.758056640625, -0.663909912109375, -0.56976318359375, -0.475616455078125, -0.3814697265625, -0.287322998046875, -0.19317626953125, -0.099029541015625, -0.0048828125, 0.089263916015625, 0.18341064453125, 0.277557373046875, 0.3717041015625, 0.465850830078125, 0.55999755859375, 0.654144287109375, 0.748291015625, 0.842437744140625, 0.93658447265625, 1.030731201171875, 1.1248779296875, 1.219024658203125, 1.31317138671875, 1.407318115234375, 1.50146484375, 1.595611572265625, 1.68975830078125, 1.783905029296875, 1.8780517578125, 1.972198486328125, 2.06634521484375, 2.160491943359375, 2.254638671875, 2.348785400390625, 2.44293212890625, 2.537078857421875, 2.6312255859375, 2.725372314453125, 2.81951904296875, 2.913665771484375, 3.0078125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 10.0, 11.0, 19.0, 31.0, 55.0, 76.0, 94.0, 162.0, 220.0, 327.0, 516.0, 783.0, 1155.0, 1813.0, 2755.0, 4259.0, 6873.0, 10393.0, 16771.0, 27771.0, 47806.0, 88292.0, 189562.0, 1354932.0, 156821.0, 76449.0, 42025.0, 24847.0, 15438.0, 9503.0, 5949.0, 3988.0, 2573.0, 1612.0, 1090.0, 725.0, 452.0, 327.0, 225.0, 145.0, 88.0, 70.0, 43.0, 25.0, 16.0, 11.0, 10.0, 3.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.10638427734375, -0.10299491882324219, -0.09960556030273438, -0.09621620178222656, -0.09282684326171875, -0.08943748474121094, -0.08604812622070312, -0.08265876770019531, -0.0792694091796875, -0.07588005065917969, -0.07249069213867188, -0.06910133361816406, -0.06571197509765625, -0.06232261657714844, -0.058933258056640625, -0.05554389953613281, -0.052154541015625, -0.04876518249511719, -0.045375823974609375, -0.04198646545410156, -0.03859710693359375, -0.03520774841308594, -0.031818389892578125, -0.028429031372070312, -0.0250396728515625, -0.021650314331054688, -0.018260955810546875, -0.014871597290039062, -0.01148223876953125, -0.008092880249023438, -0.004703521728515625, -0.0013141632080078125, 0.0020751953125, 0.0054645538330078125, 0.008853912353515625, 0.012243270874023438, 0.01563262939453125, 0.019021987915039062, 0.022411346435546875, 0.025800704956054688, 0.0291900634765625, 0.03257942199707031, 0.035968780517578125, 0.03935813903808594, 0.04274749755859375, 0.04613685607910156, 0.049526214599609375, 0.05291557312011719, 0.056304931640625, 0.05969429016113281, 0.06308364868164062, 0.06647300720214844, 0.06986236572265625, 0.07325172424316406, 0.07664108276367188, 0.08003044128417969, 0.0834197998046875, 0.08680915832519531, 0.09019851684570312, 0.09358787536621094, 0.09697723388671875, 0.10036659240722656, 0.10375595092773438, 0.10714530944824219, 0.11053466796875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 18.0, 7.0, 18.0, 15.0, 33.0, 39.0, 26.0, 37.0, 50.0, 37.0, 58.0, 49.0, 58.0, 50.0, 40.0, 59.0, 62.0, 45.0, 39.0, 37.0, 38.0, 25.0, 19.0, 26.0, 21.0, 12.0, 13.0, 7.0, 8.0, 14.0, 9.0, 5.0, 3.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-3.975629806518555e-05, -3.861915320158005e-05, -3.748200833797455e-05, -3.634486347436905e-05, -3.520771861076355e-05, -3.407057374715805e-05, -3.293342888355255e-05, -3.179628401994705e-05, -3.065913915634155e-05, -2.9521994292736053e-05, -2.8384849429130554e-05, -2.7247704565525055e-05, -2.6110559701919556e-05, -2.4973414838314056e-05, -2.3836269974708557e-05, -2.2699125111103058e-05, -2.156198024749756e-05, -2.042483538389206e-05, -1.928769052028656e-05, -1.815054565668106e-05, -1.701340079307556e-05, -1.5876255929470062e-05, -1.4739111065864563e-05, -1.3601966202259064e-05, -1.2464821338653564e-05, -1.1327676475048065e-05, -1.0190531611442566e-05, -9.053386747837067e-06, -7.916241884231567e-06, -6.779097020626068e-06, -5.641952157020569e-06, -4.50480729341507e-06, -3.3676624298095703e-06, -2.230517566204071e-06, -1.0933727025985718e-06, 4.377216100692749e-08, 1.1809170246124268e-06, 2.318061888217926e-06, 3.4552067518234253e-06, 4.5923516154289246e-06, 5.729496479034424e-06, 6.866641342639923e-06, 8.003786206245422e-06, 9.140931069850922e-06, 1.0278075933456421e-05, 1.141522079706192e-05, 1.255236566066742e-05, 1.3689510524272919e-05, 1.4826655387878418e-05, 1.5963800251483917e-05, 1.7100945115089417e-05, 1.8238089978694916e-05, 1.9375234842300415e-05, 2.0512379705905914e-05, 2.1649524569511414e-05, 2.2786669433116913e-05, 2.3923814296722412e-05, 2.506095916032791e-05, 2.619810402393341e-05, 2.733524888753891e-05, 2.847239375114441e-05, 2.960953861474991e-05, 3.074668347835541e-05, 3.188382834196091e-05, 3.3020973205566406e-05]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 1.0, 8.0, 6.0, 13.0, 15.0, 11.0, 13.0, 17.0, 17.0, 22.0, 20.0, 41.0, 53.0, 84.0, 139.0, 249.0, 878.0, 10655.0, 284167.0, 702358.0, 46564.0, 2272.0, 418.0, 174.0, 91.0, 51.0, 41.0, 36.0, 32.0, 23.0, 18.0, 16.0, 13.0, 11.0, 7.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006003379821777344, -0.0005804747343063354, -0.0005606114864349365, -0.0005407482385635376, -0.0005208849906921387, -0.0005010217428207397, -0.0004811584949493408, -0.0004612952470779419, -0.00044143199920654297, -0.00042156875133514404, -0.0004017055034637451, -0.0003818422555923462, -0.00036197900772094727, -0.00034211575984954834, -0.0003222525119781494, -0.0003023892641067505, -0.00028252601623535156, -0.00026266276836395264, -0.0002427995204925537, -0.00022293627262115479, -0.00020307302474975586, -0.00018320977687835693, -0.000163346529006958, -0.00014348328113555908, -0.00012362003326416016, -0.00010375678539276123, -8.38935375213623e-05, -6.403028964996338e-05, -4.416704177856445e-05, -2.4303793907165527e-05, -4.4405460357666016e-06, 1.5422701835632324e-05, 3.528594970703125e-05, 5.5149197578430176e-05, 7.50124454498291e-05, 9.487569332122803e-05, 0.00011473894119262695, 0.00013460218906402588, 0.0001544654369354248, 0.00017432868480682373, 0.00019419193267822266, 0.00021405518054962158, 0.0002339184284210205, 0.00025378167629241943, 0.00027364492416381836, 0.0002935081720352173, 0.0003133714199066162, 0.00033323466777801514, 0.00035309791564941406, 0.000372961163520813, 0.0003928244113922119, 0.00041268765926361084, 0.00043255090713500977, 0.0004524141550064087, 0.0004722774028778076, 0.0004921406507492065, 0.0005120038986206055, 0.0005318671464920044, 0.0005517303943634033, 0.0005715936422348022, 0.0005914568901062012, 0.0006113201379776001, 0.000631183385848999, 0.000651046633720398, 0.0006709098815917969]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 21.0, 111.0, 332.0, 371.0, 130.0, 35.0, 11.0], "bins": [-0.0003826766333077103, -0.00037630938459187746, -0.0003699421067722142, -0.00036357485805638134, -0.0003572076093405485, -0.00035084033152088523, -0.0003444730828050524, -0.00033810583408921957, -0.00033173858537338674, -0.0003253713366575539, -0.0003190040588378906, -0.0003126368101220578, -0.00030626956140622497, -0.0002999022835865617, -0.00029353503487072885, -0.000287167786154896, -0.00028080050833523273, -0.0002744332596193999, -0.0002680659817997366, -0.0002616987330839038, -0.00025533148436807096, -0.00024896423565223813, -0.00024259695783257484, -0.00023622970911674201, -0.00022986246040090919, -0.00022349519713316113, -0.0002171279484173283, -0.00021076068514958024, -0.0002043934364337474, -0.00019802617316599935, -0.0001916589098982513, -0.00018529166118241847, -0.00017892441246658564, -0.00017255714919883758, -0.00016618990048300475, -0.0001598226372152567, -0.00015345538849942386, -0.0001470881252316758, -0.00014072086196392775, -0.00013435361324809492, -0.00012798634998034686, -0.00012161909398855641, -0.00011525183799676597, -0.00010888457472901791, -0.00010251731873722747, -9.615006274543703e-05, -8.978280675364658e-05, -8.341555076185614e-05, -7.70482947700657e-05, -7.068103877827525e-05, -6.431378278648481e-05, -5.794652315671556e-05, -5.1579263526946306e-05, -4.521200753515586e-05, -3.884475154336542e-05, -3.247749191359617e-05, -2.611023410281632e-05, -1.9742976292036474e-05, -1.3375719390751328e-05, -7.008462489466183e-06, -6.412046786863357e-07, 5.7260531320935115e-06, 1.2093309123883955e-05, 1.8460568753653206e-05, 2.482782474544365e-05]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 8.0, 7.0, 11.0, 19.0, 19.0, 18.0, 25.0, 26.0, 27.0, 33.0, 28.0, 28.0, 42.0, 31.0, 36.0, 36.0, 36.0, 45.0, 52.0, 49.0, 51.0, 37.0, 39.0, 42.0, 38.0, 36.0, 23.0, 25.0, 29.0, 17.0, 15.0, 17.0, 9.0, 7.0, 12.0, 6.0, 6.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.895427703857422e-05, -1.8271617591381073e-05, -1.7588958144187927e-05, -1.690629869699478e-05, -1.6223639249801636e-05, -1.554097980260849e-05, -1.4858320355415344e-05, -1.4175660908222198e-05, -1.3493001461029053e-05, -1.2810342013835907e-05, -1.2127682566642761e-05, -1.1445023119449615e-05, -1.076236367225647e-05, -1.0079704225063324e-05, -9.397044777870178e-06, -8.714385330677032e-06, -8.031725883483887e-06, -7.349066436290741e-06, -6.666406989097595e-06, -5.9837475419044495e-06, -5.301088094711304e-06, -4.618428647518158e-06, -3.935769200325012e-06, -3.2531097531318665e-06, -2.5704503059387207e-06, -1.887790858745575e-06, -1.2051314115524292e-06, -5.224719643592834e-07, 1.601874828338623e-07, 8.428469300270081e-07, 1.5255063772201538e-06, 2.2081658244132996e-06, 2.8908252716064453e-06, 3.573484718799591e-06, 4.256144165992737e-06, 4.9388036131858826e-06, 5.621463060379028e-06, 6.304122507572174e-06, 6.98678195476532e-06, 7.669441401958466e-06, 8.352100849151611e-06, 9.034760296344757e-06, 9.717419743537903e-06, 1.0400079190731049e-05, 1.1082738637924194e-05, 1.176539808511734e-05, 1.2448057532310486e-05, 1.3130716979503632e-05, 1.3813376426696777e-05, 1.4496035873889923e-05, 1.5178695321083069e-05, 1.5861354768276215e-05, 1.654401421546936e-05, 1.7226673662662506e-05, 1.7909333109855652e-05, 1.8591992557048798e-05, 1.9274652004241943e-05, 1.995731145143509e-05, 2.0639970898628235e-05, 2.132263034582138e-05, 2.2005289793014526e-05, 2.2687949240207672e-05, 2.3370608687400818e-05, 2.4053268134593964e-05, 2.473592758178711e-05]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 8.0, 10.0, 13.0, 17.0, 18.0, 14.0, 20.0, 25.0, 37.0, 49.0, 34.0, 38.0, 46.0, 44.0, 46.0, 48.0, 48.0, 44.0, 48.0, 45.0, 37.0, 54.0, 32.0, 40.0, 35.0, 21.0, 22.0, 24.0, 21.0, 14.0, 6.0, 10.0, 6.0, 2.0, 5.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0078125, -4.83251953125, -4.6572265625, -4.48193359375, -4.306640625, -4.13134765625, -3.9560546875, -3.78076171875, -3.60546875, -3.43017578125, -3.2548828125, -3.07958984375, -2.904296875, -2.72900390625, -2.5537109375, -2.37841796875, -2.203125, -2.02783203125, -1.8525390625, -1.67724609375, -1.501953125, -1.32666015625, -1.1513671875, -0.97607421875, -0.80078125, -0.62548828125, -0.4501953125, -0.27490234375, -0.099609375, 0.07568359375, 0.2509765625, 0.42626953125, 0.6015625, 0.77685546875, 0.9521484375, 1.12744140625, 1.302734375, 1.47802734375, 1.6533203125, 1.82861328125, 2.00390625, 2.17919921875, 2.3544921875, 2.52978515625, 2.705078125, 2.88037109375, 3.0556640625, 3.23095703125, 3.40625, 3.58154296875, 3.7568359375, 3.93212890625, 4.107421875, 4.28271484375, 4.4580078125, 4.63330078125, 4.80859375, 4.98388671875, 5.1591796875, 5.33447265625, 5.509765625, 5.68505859375, 5.8603515625, 6.03564453125, 6.2109375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 4.0, 6.0, 5.0, 7.0, 15.0, 19.0, 17.0, 32.0, 42.0, 54.0, 59.0, 89.0, 137.0, 191.0, 367.0, 482.0, 720.0, 1198.0, 2226.0, 3986.0, 8031.0, 19506.0, 59506.0, 244702.0, 508610.0, 134699.0, 36671.0, 13344.0, 6050.0, 3174.0, 1742.0, 1022.0, 612.0, 356.0, 277.0, 180.0, 110.0, 83.0, 54.0, 42.0, 22.0, 22.0, 20.0, 18.0, 5.0, 11.0, 7.0, 6.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-8.0234375, -7.7750244140625, -7.526611328125, -7.2781982421875, -7.02978515625, -6.7813720703125, -6.532958984375, -6.2845458984375, -6.0361328125, -5.7877197265625, -5.539306640625, -5.2908935546875, -5.04248046875, -4.7940673828125, -4.545654296875, -4.2972412109375, -4.048828125, -3.8004150390625, -3.552001953125, -3.3035888671875, -3.05517578125, -2.8067626953125, -2.558349609375, -2.3099365234375, -2.0615234375, -1.8131103515625, -1.564697265625, -1.3162841796875, -1.06787109375, -0.8194580078125, -0.571044921875, -0.3226318359375, -0.07421875, 0.1741943359375, 0.422607421875, 0.6710205078125, 0.91943359375, 1.1678466796875, 1.416259765625, 1.6646728515625, 1.9130859375, 2.1614990234375, 2.409912109375, 2.6583251953125, 2.90673828125, 3.1551513671875, 3.403564453125, 3.6519775390625, 3.900390625, 4.1488037109375, 4.397216796875, 4.6456298828125, 4.89404296875, 5.1424560546875, 5.390869140625, 5.6392822265625, 5.8876953125, 6.1361083984375, 6.384521484375, 6.6329345703125, 6.88134765625, 7.1297607421875, 7.378173828125, 7.6265869140625, 7.875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 9.0, 11.0, 11.0, 13.0, 14.0, 18.0, 21.0, 25.0, 21.0, 28.0, 29.0, 28.0, 43.0, 37.0, 62.0, 68.0, 102.0, 140.0, 1406.0, 311.0, 135.0, 93.0, 61.0, 52.0, 53.0, 23.0, 28.0, 32.0, 23.0, 17.0, 19.0, 18.0, 16.0, 15.0, 9.0, 11.0, 10.0, 4.0, 9.0, 4.0, 2.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-15.9140625, -15.4583740234375, -15.002685546875, -14.5469970703125, -14.09130859375, -13.6356201171875, -13.179931640625, -12.7242431640625, -12.2685546875, -11.8128662109375, -11.357177734375, -10.9014892578125, -10.44580078125, -9.9901123046875, -9.534423828125, -9.0787353515625, -8.623046875, -8.1673583984375, -7.711669921875, -7.2559814453125, -6.80029296875, -6.3446044921875, -5.888916015625, -5.4332275390625, -4.9775390625, -4.5218505859375, -4.066162109375, -3.6104736328125, -3.15478515625, -2.6990966796875, -2.243408203125, -1.7877197265625, -1.33203125, -0.8763427734375, -0.420654296875, 0.0350341796875, 0.49072265625, 0.9464111328125, 1.402099609375, 1.8577880859375, 2.3134765625, 2.7691650390625, 3.224853515625, 3.6805419921875, 4.13623046875, 4.5919189453125, 5.047607421875, 5.5032958984375, 5.958984375, 6.4146728515625, 6.870361328125, 7.3260498046875, 7.78173828125, 8.2374267578125, 8.693115234375, 9.1488037109375, 9.6044921875, 10.0601806640625, 10.515869140625, 10.9715576171875, 11.42724609375, 11.8829345703125, 12.338623046875, 12.7943115234375, 13.25]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 2.0, 9.0, 6.0, 11.0, 11.0, 17.0, 16.0, 28.0, 35.0, 36.0, 44.0, 53.0, 71.0, 75.0, 123.0, 122.0, 209.0, 298.0, 644.0, 2321.0, 16534.0, 433589.0, 2634533.0, 49475.0, 4946.0, 1063.0, 414.0, 226.0, 162.0, 142.0, 96.0, 75.0, 67.0, 53.0, 41.0, 38.0, 23.0, 15.0, 26.0, 14.0, 11.0, 6.0, 3.0, 6.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.03125, -22.21484375, -21.3984375, -20.58203125, -19.765625, -18.94921875, -18.1328125, -17.31640625, -16.5, -15.68359375, -14.8671875, -14.05078125, -13.234375, -12.41796875, -11.6015625, -10.78515625, -9.96875, -9.15234375, -8.3359375, -7.51953125, -6.703125, -5.88671875, -5.0703125, -4.25390625, -3.4375, -2.62109375, -1.8046875, -0.98828125, -0.171875, 0.64453125, 1.4609375, 2.27734375, 3.09375, 3.91015625, 4.7265625, 5.54296875, 6.359375, 7.17578125, 7.9921875, 8.80859375, 9.625, 10.44140625, 11.2578125, 12.07421875, 12.890625, 13.70703125, 14.5234375, 15.33984375, 16.15625, 16.97265625, 17.7890625, 18.60546875, 19.421875, 20.23828125, 21.0546875, 21.87109375, 22.6875, 23.50390625, 24.3203125, 25.13671875, 25.953125, 26.76953125, 27.5859375, 28.40234375, 29.21875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 18.0, 57.0, 62.0, 122.0, 150.0, 179.0, 139.0, 122.0, 77.0, 41.0, 20.0, 9.0, 4.0, 3.0, 0.0, 1.0], "bins": [-76.39627838134766, -74.9651107788086, -73.53395080566406, -72.102783203125, -70.67162322998047, -69.2404556274414, -67.80929565429688, -66.37812805175781, -64.94696044921875, -63.51579666137695, -62.084632873535156, -60.653465270996094, -59.2223014831543, -57.7911376953125, -56.3599739074707, -54.928810119628906, -53.49764633178711, -52.06648254394531, -50.635318756103516, -49.20415496826172, -47.772987365722656, -46.34182357788086, -44.91065979003906, -43.479496002197266, -42.04833221435547, -40.61716842651367, -39.186004638671875, -37.75483703613281, -36.323673248291016, -34.89250946044922, -33.46134567260742, -32.030181884765625, -30.599010467529297, -29.1678466796875, -27.73668098449707, -26.305517196655273, -24.874351501464844, -23.443187713623047, -22.01202392578125, -20.580860137939453, -19.149696350097656, -17.71853256225586, -16.28736686706543, -14.856203079223633, -13.42503833770752, -11.993873596191406, -10.56270980834961, -9.131545066833496, -7.700379371643066, -6.269214630126953, -4.838050365447998, -3.406886100769043, -1.9757213592529297, -0.5445566177368164, 0.8866071701049805, 2.3177719116210938, 3.748936653137207, 5.18010139465332, 6.611265659332275, 8.04242992401123, 9.473594665527344, 10.904759407043457, 12.335923194885254, 13.767087936401367, 15.19825267791748]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 10.0, 9.0, 4.0, 14.0, 17.0, 7.0, 13.0, 10.0, 15.0, 22.0, 21.0, 25.0, 17.0, 30.0, 18.0, 31.0, 30.0, 44.0, 45.0, 41.0, 39.0, 32.0, 31.0, 35.0, 37.0, 36.0, 30.0, 36.0, 26.0, 21.0, 20.0, 36.0, 22.0, 23.0, 27.0, 17.0, 12.0, 14.0, 12.0, 15.0, 9.0, 10.0, 9.0, 4.0, 5.0, 4.0, 2.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-36.84569549560547, -35.63563919067383, -34.42558288574219, -33.21552276611328, -32.00546646118164, -30.79541015625, -29.58535385131836, -28.375295639038086, -27.165237426757812, -25.955181121826172, -24.7451229095459, -23.535066604614258, -22.325008392333984, -21.114952087402344, -19.904895782470703, -18.69483757019043, -17.48478126525879, -16.27472496032715, -15.064666748046875, -13.854610443115234, -12.644552230834961, -11.43449592590332, -10.224438667297363, -9.014381408691406, -7.804324150085449, -6.594266891479492, -5.384209632873535, -4.174152851104736, -2.9640955924987793, -1.7540383338928223, -0.5439815521240234, 0.6660757064819336, 1.8761329650878906, 3.0861902236938477, 4.296247482299805, 5.5063042640686035, 6.7163615226745605, 7.926418781280518, 9.136475563049316, 10.346532821655273, 11.55659008026123, 12.766647338867188, 13.976704597473145, 15.186761856079102, 16.396818161010742, 17.606876373291016, 18.816932678222656, 20.026988983154297, 21.23704719543457, 22.44710350036621, 23.657161712646484, 24.867218017578125, 26.0772762298584, 27.28733253479004, 28.497390747070312, 29.707447052001953, 30.917503356933594, 32.127559661865234, 33.337615966796875, 34.54767608642578, 35.75773239135742, 36.96778869628906, 38.1778450012207, 39.387901306152344, 40.59796142578125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 8.0, 21.0, 16.0, 13.0, 18.0, 20.0, 33.0, 41.0, 50.0, 34.0, 49.0, 41.0, 41.0, 45.0, 54.0, 54.0, 42.0, 47.0, 54.0, 44.0, 38.0, 41.0, 36.0, 24.0, 22.0, 18.0, 24.0, 11.0, 9.0, 10.0, 11.0, 2.0, 6.0, 6.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.14453125, -4.96136474609375, -4.7781982421875, -4.59503173828125, -4.411865234375, -4.22869873046875, -4.0455322265625, -3.86236572265625, -3.67919921875, -3.49603271484375, -3.3128662109375, -3.12969970703125, -2.946533203125, -2.76336669921875, -2.5802001953125, -2.39703369140625, -2.2138671875, -2.03070068359375, -1.8475341796875, -1.66436767578125, -1.481201171875, -1.29803466796875, -1.1148681640625, -0.93170166015625, -0.74853515625, -0.56536865234375, -0.3822021484375, -0.19903564453125, -0.015869140625, 0.16729736328125, 0.3504638671875, 0.53363037109375, 0.716796875, 0.89996337890625, 1.0831298828125, 1.26629638671875, 1.449462890625, 1.63262939453125, 1.8157958984375, 1.99896240234375, 2.18212890625, 2.36529541015625, 2.5484619140625, 2.73162841796875, 2.914794921875, 3.09796142578125, 3.2811279296875, 3.46429443359375, 3.6474609375, 3.83062744140625, 4.0137939453125, 4.19696044921875, 4.380126953125, 4.56329345703125, 4.7464599609375, 4.92962646484375, 5.11279296875, 5.29595947265625, 5.4791259765625, 5.66229248046875, 5.845458984375, 6.02862548828125, 6.2117919921875, 6.39495849609375, 6.578125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 4.0, 7.0, 11.0, 21.0, 26.0, 42.0, 67.0, 132.0, 219.0, 438.0, 791.0, 1926.0, 5024.0, 15389.0, 62460.0, 444948.0, 3016063.0, 548449.0, 71300.0, 17231.0, 5585.0, 2156.0, 904.0, 467.0, 236.0, 147.0, 84.0, 45.0, 37.0, 21.0, 15.0, 9.0, 3.0, 1.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.0625, -13.63037109375, -13.1982421875, -12.76611328125, -12.333984375, -11.90185546875, -11.4697265625, -11.03759765625, -10.60546875, -10.17333984375, -9.7412109375, -9.30908203125, -8.876953125, -8.44482421875, -8.0126953125, -7.58056640625, -7.1484375, -6.71630859375, -6.2841796875, -5.85205078125, -5.419921875, -4.98779296875, -4.5556640625, -4.12353515625, -3.69140625, -3.25927734375, -2.8271484375, -2.39501953125, -1.962890625, -1.53076171875, -1.0986328125, -0.66650390625, -0.234375, 0.19775390625, 0.6298828125, 1.06201171875, 1.494140625, 1.92626953125, 2.3583984375, 2.79052734375, 3.22265625, 3.65478515625, 4.0869140625, 4.51904296875, 4.951171875, 5.38330078125, 5.8154296875, 6.24755859375, 6.6796875, 7.11181640625, 7.5439453125, 7.97607421875, 8.408203125, 8.84033203125, 9.2724609375, 9.70458984375, 10.13671875, 10.56884765625, 11.0009765625, 11.43310546875, 11.865234375, 12.29736328125, 12.7294921875, 13.16162109375, 13.59375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 7.0, 8.0, 11.0, 12.0, 27.0, 30.0, 44.0, 53.0, 87.0, 93.0, 152.0, 194.0, 274.0, 388.0, 587.0, 629.0, 428.0, 297.0, 197.0, 147.0, 120.0, 74.0, 69.0, 35.0, 29.0, 18.0, 17.0, 10.0, 8.0, 5.0, 7.0, 2.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1875, -9.8795166015625, -9.571533203125, -9.2635498046875, -8.95556640625, -8.6475830078125, -8.339599609375, -8.0316162109375, -7.7236328125, -7.4156494140625, -7.107666015625, -6.7996826171875, -6.49169921875, -6.1837158203125, -5.875732421875, -5.5677490234375, -5.259765625, -4.9517822265625, -4.643798828125, -4.3358154296875, -4.02783203125, -3.7198486328125, -3.411865234375, -3.1038818359375, -2.7958984375, -2.4879150390625, -2.179931640625, -1.8719482421875, -1.56396484375, -1.2559814453125, -0.947998046875, -0.6400146484375, -0.33203125, -0.0240478515625, 0.283935546875, 0.5919189453125, 0.89990234375, 1.2078857421875, 1.515869140625, 1.8238525390625, 2.1318359375, 2.4398193359375, 2.747802734375, 3.0557861328125, 3.36376953125, 3.6717529296875, 3.979736328125, 4.2877197265625, 4.595703125, 4.9036865234375, 5.211669921875, 5.5196533203125, 5.82763671875, 6.1356201171875, 6.443603515625, 6.7515869140625, 7.0595703125, 7.3675537109375, 7.675537109375, 7.9835205078125, 8.29150390625, 8.5994873046875, 8.907470703125, 9.2154541015625, 9.5234375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 11.0, 9.0, 13.0, 25.0, 22.0, 48.0, 62.0, 78.0, 146.0, 235.0, 360.0, 833.0, 2648.0, 14156.0, 145787.0, 3061031.0, 905442.0, 53665.0, 6766.0, 1524.0, 606.0, 295.0, 175.0, 93.0, 68.0, 53.0, 36.0, 22.0, 20.0, 17.0, 11.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.75, -22.895751953125, -22.04150390625, -21.187255859375, -20.3330078125, -19.478759765625, -18.62451171875, -17.770263671875, -16.916015625, -16.061767578125, -15.20751953125, -14.353271484375, -13.4990234375, -12.644775390625, -11.79052734375, -10.936279296875, -10.08203125, -9.227783203125, -8.37353515625, -7.519287109375, -6.6650390625, -5.810791015625, -4.95654296875, -4.102294921875, -3.248046875, -2.393798828125, -1.53955078125, -0.685302734375, 0.1689453125, 1.023193359375, 1.87744140625, 2.731689453125, 3.5859375, 4.440185546875, 5.29443359375, 6.148681640625, 7.0029296875, 7.857177734375, 8.71142578125, 9.565673828125, 10.419921875, 11.274169921875, 12.12841796875, 12.982666015625, 13.8369140625, 14.691162109375, 15.54541015625, 16.399658203125, 17.25390625, 18.108154296875, 18.96240234375, 19.816650390625, 20.6708984375, 21.525146484375, 22.37939453125, 23.233642578125, 24.087890625, 24.942138671875, 25.79638671875, 26.650634765625, 27.5048828125, 28.359130859375, 29.21337890625, 30.067626953125, 30.921875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 10.0, 29.0, 35.0, 47.0, 70.0, 75.0, 100.0, 117.0, 114.0, 104.0, 71.0, 62.0, 69.0, 33.0, 26.0, 11.0, 15.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.11507034301758, -56.42194747924805, -54.72882080078125, -53.03569793701172, -51.34257507324219, -49.649452209472656, -47.956329345703125, -46.26320266723633, -44.5700798034668, -42.876956939697266, -41.18383026123047, -39.49070739746094, -37.797584533691406, -36.104461669921875, -34.411338806152344, -32.71821212768555, -31.025089263916016, -29.331966400146484, -27.63884162902832, -25.945716857910156, -24.252593994140625, -22.559471130371094, -20.86634635925293, -19.173221588134766, -17.480098724365234, -15.786974906921387, -14.093851089477539, -12.400727272033691, -10.707603454589844, -9.014479637145996, -7.321355819702148, -5.628232002258301, -3.9351119995117188, -2.241988182067871, -0.5488643646240234, 1.1442594528198242, 2.837383270263672, 4.5305070877075195, 6.223630905151367, 7.916754722595215, 9.609878540039062, 11.30300235748291, 12.996126174926758, 14.689249992370605, 16.382373809814453, 18.075496673583984, 19.76862144470215, 21.461746215820312, 23.154869079589844, 24.847991943359375, 26.54111671447754, 28.234241485595703, 29.927364349365234, 31.620487213134766, 33.31361389160156, 35.006736755371094, 36.699859619140625, 38.392982482910156, 40.08610534667969, 41.779232025146484, 43.472354888916016, 45.16547775268555, 46.858604431152344, 48.551727294921875, 50.244850158691406]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 5.0, 3.0, 6.0, 4.0, 11.0, 8.0, 11.0, 10.0, 17.0, 14.0, 18.0, 20.0, 25.0, 23.0, 21.0, 31.0, 30.0, 39.0, 25.0, 27.0, 40.0, 39.0, 24.0, 32.0, 30.0, 39.0, 47.0, 22.0, 37.0, 45.0, 27.0, 31.0, 24.0, 30.0, 23.0, 26.0, 15.0, 17.0, 22.0, 10.0, 15.0, 10.0, 12.0, 8.0, 6.0, 7.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-24.57305908203125, -23.747072219848633, -22.921085357666016, -22.09510040283203, -21.269113540649414, -20.443126678466797, -19.61713981628418, -18.791152954101562, -17.965167999267578, -17.13918113708496, -16.313194274902344, -15.487208366394043, -14.661222457885742, -13.835235595703125, -13.009248733520508, -12.18326187133789, -11.357275009155273, -10.531288146972656, -9.705302238464355, -8.879315376281738, -8.053329467773438, -7.22734260559082, -6.401355743408203, -5.575369358062744, -4.749382972717285, -3.923396587371826, -3.097409963607788, -2.27142333984375, -1.445436954498291, -0.619450569152832, 0.20653629302978516, 1.0325226783752441, 1.8585090637207031, 2.684495449066162, 3.5104820728302, 4.336468696594238, 5.162455081939697, 5.988441467285156, 6.814428329467773, 7.640414714813232, 8.466401100158691, 9.292387962341309, 10.11837387084961, 10.944360733032227, 11.770347595214844, 12.596333503723145, 13.422320365905762, 14.248306274414062, 15.07429313659668, 15.900279998779297, 16.726266860961914, 17.55225372314453, 18.378238677978516, 19.204225540161133, 20.03021240234375, 20.856199264526367, 21.682186126708984, 22.5081729888916, 23.33415985107422, 24.160144805908203, 24.98613166809082, 25.812118530273438, 26.638105392456055, 27.464092254638672, 28.290077209472656]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 20.0, 13.0, 18.0, 23.0, 20.0, 24.0, 22.0, 36.0, 35.0, 45.0, 51.0, 44.0, 43.0, 35.0, 47.0, 47.0, 54.0, 37.0, 50.0, 47.0, 37.0, 46.0, 36.0, 27.0, 30.0, 19.0, 13.0, 17.0, 12.0, 12.0, 7.0, 10.0, 6.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44140625, -5.26190185546875, -5.0823974609375, -4.90289306640625, -4.723388671875, -4.54388427734375, -4.3643798828125, -4.18487548828125, -4.00537109375, -3.82586669921875, -3.6463623046875, -3.46685791015625, -3.287353515625, -3.10784912109375, -2.9283447265625, -2.74884033203125, -2.5693359375, -2.38983154296875, -2.2103271484375, -2.03082275390625, -1.851318359375, -1.67181396484375, -1.4923095703125, -1.31280517578125, -1.13330078125, -0.95379638671875, -0.7742919921875, -0.59478759765625, -0.415283203125, -0.23577880859375, -0.0562744140625, 0.12322998046875, 0.302734375, 0.48223876953125, 0.6617431640625, 0.84124755859375, 1.020751953125, 1.20025634765625, 1.3797607421875, 1.55926513671875, 1.73876953125, 1.91827392578125, 2.0977783203125, 2.27728271484375, 2.456787109375, 2.63629150390625, 2.8157958984375, 2.99530029296875, 3.1748046875, 3.35430908203125, 3.5338134765625, 3.71331787109375, 3.892822265625, 4.07232666015625, 4.2518310546875, 4.43133544921875, 4.61083984375, 4.79034423828125, 4.9698486328125, 5.14935302734375, 5.328857421875, 5.50836181640625, 5.6878662109375, 5.86737060546875, 6.046875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 2.0, 6.0, 7.0, 13.0, 13.0, 20.0, 31.0, 41.0, 58.0, 102.0, 117.0, 151.0, 222.0, 340.0, 467.0, 708.0, 1072.0, 1497.0, 2191.0, 3340.0, 5029.0, 7599.0, 11383.0, 17506.0, 27416.0, 45723.0, 78823.0, 153309.0, 287904.0, 177948.0, 88634.0, 50322.0, 30459.0, 18967.0, 12254.0, 8153.0, 5518.0, 3503.0, 2448.0, 1614.0, 1213.0, 800.0, 511.0, 349.0, 250.0, 139.0, 108.0, 71.0, 52.0, 51.0, 32.0, 22.0, 16.0, 13.0, 13.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.176513671875, -0.1709270477294922, -0.16534042358398438, -0.15975379943847656, -0.15416717529296875, -0.14858055114746094, -0.14299392700195312, -0.1374073028564453, -0.1318206787109375, -0.1262340545654297, -0.12064743041992188, -0.11506080627441406, -0.10947418212890625, -0.10388755798339844, -0.09830093383789062, -0.09271430969238281, -0.087127685546875, -0.08154106140136719, -0.07595443725585938, -0.07036781311035156, -0.06478118896484375, -0.05919456481933594, -0.053607940673828125, -0.04802131652832031, -0.0424346923828125, -0.03684806823730469, -0.031261444091796875, -0.025674819946289062, -0.02008819580078125, -0.014501571655273438, -0.008914947509765625, -0.0033283233642578125, 0.00225830078125, 0.007844924926757812, 0.013431549072265625, 0.019018173217773438, 0.02460479736328125, 0.030191421508789062, 0.035778045654296875, 0.04136466979980469, 0.0469512939453125, 0.05253791809082031, 0.058124542236328125, 0.06371116638183594, 0.06929779052734375, 0.07488441467285156, 0.08047103881835938, 0.08605766296386719, 0.091644287109375, 0.09723091125488281, 0.10281753540039062, 0.10840415954589844, 0.11399078369140625, 0.11957740783691406, 0.12516403198242188, 0.1307506561279297, 0.1363372802734375, 0.1419239044189453, 0.14751052856445312, 0.15309715270996094, 0.15868377685546875, 0.16427040100097656, 0.16985702514648438, 0.1754436492919922, 0.1810302734375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 3.0, 6.0, 5.0, 6.0, 8.0, 12.0, 17.0, 15.0, 12.0, 16.0, 23.0, 11.0, 20.0, 25.0, 38.0, 22.0, 36.0, 28.0, 44.0, 42.0, 36.0, 1068.0, 50.0, 53.0, 38.0, 41.0, 40.0, 40.0, 40.0, 35.0, 24.0, 23.0, 28.0, 25.0, 14.0, 15.0, 15.0, 13.0, 9.0, 10.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.396484375, -3.290252685546875, -3.18402099609375, -3.077789306640625, -2.9715576171875, -2.865325927734375, -2.75909423828125, -2.652862548828125, -2.546630859375, -2.440399169921875, -2.33416748046875, -2.227935791015625, -2.1217041015625, -2.015472412109375, -1.90924072265625, -1.803009033203125, -1.69677734375, -1.590545654296875, -1.48431396484375, -1.378082275390625, -1.2718505859375, -1.165618896484375, -1.05938720703125, -0.953155517578125, -0.846923828125, -0.740692138671875, -0.63446044921875, -0.528228759765625, -0.4219970703125, -0.315765380859375, -0.20953369140625, -0.103302001953125, 0.0029296875, 0.109161376953125, 0.21539306640625, 0.321624755859375, 0.4278564453125, 0.534088134765625, 0.64031982421875, 0.746551513671875, 0.852783203125, 0.959014892578125, 1.06524658203125, 1.171478271484375, 1.2777099609375, 1.383941650390625, 1.49017333984375, 1.596405029296875, 1.70263671875, 1.808868408203125, 1.91510009765625, 2.021331787109375, 2.1275634765625, 2.233795166015625, 2.34002685546875, 2.446258544921875, 2.552490234375, 2.658721923828125, 2.76495361328125, 2.871185302734375, 2.9774169921875, 3.083648681640625, 3.18988037109375, 3.296112060546875, 3.40234375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 5.0, 9.0, 12.0, 28.0, 33.0, 63.0, 73.0, 122.0, 190.0, 289.0, 474.0, 725.0, 1130.0, 1827.0, 2921.0, 4698.0, 7386.0, 12079.0, 19800.0, 33098.0, 57146.0, 113191.0, 928723.0, 656874.0, 112983.0, 58249.0, 33108.0, 19908.0, 12112.0, 7385.0, 4559.0, 2969.0, 1784.0, 1161.0, 694.0, 473.0, 293.0, 201.0, 125.0, 87.0, 49.0, 32.0, 21.0, 20.0, 8.0, 8.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.1259765625, -0.12215900421142578, -0.11834144592285156, -0.11452388763427734, -0.11070632934570312, -0.1068887710571289, -0.10307121276855469, -0.09925365447998047, -0.09543609619140625, -0.09161853790283203, -0.08780097961425781, -0.0839834213256836, -0.08016586303710938, -0.07634830474853516, -0.07253074645996094, -0.06871318817138672, -0.0648956298828125, -0.06107807159423828, -0.05726051330566406, -0.053442955017089844, -0.049625396728515625, -0.045807838439941406, -0.04199028015136719, -0.03817272186279297, -0.03435516357421875, -0.03053760528564453, -0.026720046997070312, -0.022902488708496094, -0.019084930419921875, -0.015267372131347656, -0.011449813842773438, -0.007632255554199219, -0.003814697265625, 2.86102294921875e-06, 0.0038204193115234375, 0.007637977600097656, 0.011455535888671875, 0.015273094177246094, 0.019090652465820312, 0.02290821075439453, 0.02672576904296875, 0.03054332733154297, 0.03436088562011719, 0.038178443908691406, 0.041996002197265625, 0.045813560485839844, 0.04963111877441406, 0.05344867706298828, 0.0572662353515625, 0.06108379364013672, 0.06490135192871094, 0.06871891021728516, 0.07253646850585938, 0.0763540267944336, 0.08017158508300781, 0.08398914337158203, 0.08780670166015625, 0.09162425994873047, 0.09544181823730469, 0.0992593765258789, 0.10307693481445312, 0.10689449310302734, 0.11071205139160156, 0.11452960968017578, 0.11834716796875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 3.0, 13.0, 10.0, 8.0, 15.0, 12.0, 15.0, 19.0, 19.0, 28.0, 31.0, 28.0, 38.0, 45.0, 48.0, 34.0, 49.0, 41.0, 31.0, 39.0, 47.0, 34.0, 43.0, 41.0, 36.0, 41.0, 29.0, 27.0, 24.0, 26.0, 24.0, 18.0, 16.0, 11.0, 13.0, 9.0, 6.0, 6.0, 4.0, 2.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.202127456665039e-05, -4.076492041349411e-05, -3.950856626033783e-05, -3.825221210718155e-05, -3.699585795402527e-05, -3.573950380086899e-05, -3.448314964771271e-05, -3.322679549455643e-05, -3.1970441341400146e-05, -3.0714087188243866e-05, -2.9457733035087585e-05, -2.8201378881931305e-05, -2.6945024728775024e-05, -2.5688670575618744e-05, -2.4432316422462463e-05, -2.3175962269306183e-05, -2.1919608116149902e-05, -2.0663253962993622e-05, -1.940689980983734e-05, -1.815054565668106e-05, -1.689419150352478e-05, -1.56378373503685e-05, -1.438148319721222e-05, -1.3125129044055939e-05, -1.1868774890899658e-05, -1.0612420737743378e-05, -9.356066584587097e-06, -8.099712431430817e-06, -6.843358278274536e-06, -5.587004125118256e-06, -4.330649971961975e-06, -3.0742958188056946e-06, -1.817941665649414e-06, -5.615875124931335e-07, 6.94766640663147e-07, 1.9511207938194275e-06, 3.207474946975708e-06, 4.4638291001319885e-06, 5.720183253288269e-06, 6.9765374064445496e-06, 8.23289155960083e-06, 9.48924571275711e-06, 1.0745599865913391e-05, 1.2001954019069672e-05, 1.3258308172225952e-05, 1.4514662325382233e-05, 1.5771016478538513e-05, 1.7027370631694794e-05, 1.8283724784851074e-05, 1.9540078938007355e-05, 2.0796433091163635e-05, 2.2052787244319916e-05, 2.3309141397476196e-05, 2.4565495550632477e-05, 2.5821849703788757e-05, 2.7078203856945038e-05, 2.833455801010132e-05, 2.95909121632576e-05, 3.084726631641388e-05, 3.210362046957016e-05, 3.335997462272644e-05, 3.461632877588272e-05, 3.5872682929039e-05, 3.712903708219528e-05, 3.838539123535156e-05]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 0.0, 5.0, 2.0, 1.0, 6.0, 3.0, 3.0, 4.0, 9.0, 15.0, 10.0, 6.0, 13.0, 26.0, 22.0, 28.0, 26.0, 36.0, 48.0, 53.0, 84.0, 140.0, 221.0, 673.0, 4755.0, 153984.0, 819659.0, 64934.0, 2687.0, 507.0, 190.0, 100.0, 69.0, 39.0, 34.0, 26.0, 28.0, 22.0, 22.0, 7.0, 9.0, 12.0, 11.0, 7.0, 7.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0006852149963378906, -0.0006626620888710022, -0.0006401091814041138, -0.0006175562739372253, -0.0005950033664703369, -0.0005724504590034485, -0.0005498975515365601, -0.0005273446440696716, -0.0005047917366027832, -0.0004822388291358948, -0.00045968592166900635, -0.0004371330142021179, -0.0004145801067352295, -0.00039202719926834106, -0.00036947429180145264, -0.0003469213843345642, -0.0003243684768676758, -0.00030181556940078735, -0.0002792626619338989, -0.0002567097544670105, -0.00023415684700012207, -0.00021160393953323364, -0.00018905103206634521, -0.0001664981245994568, -0.00014394521713256836, -0.00012139230966567993, -9.88394021987915e-05, -7.628649473190308e-05, -5.373358726501465e-05, -3.118067979812622e-05, -8.627772331237793e-06, 1.3925135135650635e-05, 3.647804260253906e-05, 5.903095006942749e-05, 8.158385753631592e-05, 0.00010413676500320435, 0.00012668967247009277, 0.0001492425799369812, 0.00017179548740386963, 0.00019434839487075806, 0.00021690130233764648, 0.0002394542098045349, 0.00026200711727142334, 0.00028456002473831177, 0.0003071129322052002, 0.0003296658396720886, 0.00035221874713897705, 0.0003747716546058655, 0.0003973245620727539, 0.00041987746953964233, 0.00044243037700653076, 0.0004649832844734192, 0.0004875361919403076, 0.000510089099407196, 0.0005326420068740845, 0.0005551949143409729, 0.0005777478218078613, 0.0006003007292747498, 0.0006228536367416382, 0.0006454065442085266, 0.000667959451675415, 0.0006905123591423035, 0.0007130652666091919, 0.0007356181740760803, 0.0007581710815429688]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 22.0, 345.0, 607.0, 44.0], "bins": [-0.0008578122942708433, -0.0008440157980658114, -0.0008302193018607795, -0.0008164228056557477, -0.0008026263094507158, -0.0007888298714533448, -0.000775033375248313, -0.0007612368790432811, -0.0007474403828382492, -0.0007336438866332173, -0.0007198473904281855, -0.0007060508942231536, -0.0006922543980181217, -0.0006784579018130898, -0.000664661405608058, -0.000650864967610687, -0.0006370684131979942, -0.0006232719169929624, -0.0006094754207879305, -0.0005956789245828986, -0.0005818824283778667, -0.0005680859321728349, -0.000554289435967803, -0.000540492997970432, -0.0005266965017654002, -0.0005129000055603683, -0.0004991035093553364, -0.00048530701315030456, -0.00047151054604910314, -0.00045771404984407127, -0.0004439175536390394, -0.0004301210574340075, -0.0004163245903328061, -0.00040252809412777424, -0.00038873159792274237, -0.0003749351017177105, -0.0003611386346165091, -0.0003473421384114772, -0.00033354564220644534, -0.00031974914600141346, -0.00030595267890021205, -0.0002921561826951802, -0.0002783596864901483, -0.00026456319028511643, -0.000250766723183915, -0.00023697022697888315, -0.00022317373077385128, -0.0002093772345688194, -0.00019558073836378753, -0.00018178424215875566, -0.00016798776050563902, -0.00015419126430060714, -0.0001403947826474905, -0.00012659828644245863, -0.00011280179023742676, -9.90053013083525e-05, -8.520881237927824e-05, -7.141232345020398e-05, -5.761583088315092e-05, -4.3819338316097856e-05, -3.0022849387023598e-05, -1.622636045794934e-05, -2.4298642529174685e-06, 1.1366624676156789e-05, 2.516310996725224e-05]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 9.0, 12.0, 13.0, 12.0, 22.0, 16.0, 23.0, 31.0, 29.0, 48.0, 52.0, 51.0, 51.0, 57.0, 64.0, 47.0, 59.0, 60.0, 50.0, 41.0, 46.0, 46.0, 35.0, 29.0, 21.0, 23.0, 13.0, 13.0, 11.0, 10.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9027462005615234e-05, -2.7797184884548187e-05, -2.656690776348114e-05, -2.5336630642414093e-05, -2.4106353521347046e-05, -2.287607640028e-05, -2.164579927921295e-05, -2.0415522158145905e-05, -1.9185245037078857e-05, -1.795496791601181e-05, -1.6724690794944763e-05, -1.5494413673877716e-05, -1.4264136552810669e-05, -1.3033859431743622e-05, -1.1803582310676575e-05, -1.0573305189609528e-05, -9.34302806854248e-06, -8.112750947475433e-06, -6.882473826408386e-06, -5.652196705341339e-06, -4.421919584274292e-06, -3.191642463207245e-06, -1.9613653421401978e-06, -7.310882210731506e-07, 4.991888999938965e-07, 1.7294660210609436e-06, 2.9597431421279907e-06, 4.190020263195038e-06, 5.420297384262085e-06, 6.650574505329132e-06, 7.88085162639618e-06, 9.111128747463226e-06, 1.0341405868530273e-05, 1.157168298959732e-05, 1.2801960110664368e-05, 1.4032237231731415e-05, 1.5262514352798462e-05, 1.649279147386551e-05, 1.7723068594932556e-05, 1.8953345715999603e-05, 2.018362283706665e-05, 2.1413899958133698e-05, 2.2644177079200745e-05, 2.3874454200267792e-05, 2.510473132133484e-05, 2.6335008442401886e-05, 2.7565285563468933e-05, 2.879556268453598e-05, 3.0025839805603027e-05, 3.1256116926670074e-05, 3.248639404773712e-05, 3.371667116880417e-05, 3.4946948289871216e-05, 3.617722541093826e-05, 3.740750253200531e-05, 3.863777965307236e-05, 3.9868056774139404e-05, 4.109833389520645e-05, 4.23286110162735e-05, 4.3558888137340546e-05, 4.478916525840759e-05, 4.601944237947464e-05, 4.724971950054169e-05, 4.8479996621608734e-05, 4.971027374267578e-05]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 20.0, 13.0, 18.0, 23.0, 20.0, 24.0, 22.0, 36.0, 35.0, 45.0, 51.0, 44.0, 43.0, 35.0, 47.0, 47.0, 54.0, 37.0, 50.0, 47.0, 37.0, 46.0, 36.0, 27.0, 30.0, 19.0, 13.0, 17.0, 12.0, 12.0, 7.0, 10.0, 6.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44140625, -5.26190185546875, -5.0823974609375, -4.90289306640625, -4.723388671875, -4.54388427734375, -4.3643798828125, -4.18487548828125, -4.00537109375, -3.82586669921875, -3.6463623046875, -3.46685791015625, -3.287353515625, -3.10784912109375, -2.9283447265625, -2.74884033203125, -2.5693359375, -2.38983154296875, -2.2103271484375, -2.03082275390625, -1.851318359375, -1.67181396484375, -1.4923095703125, -1.31280517578125, -1.13330078125, -0.95379638671875, -0.7742919921875, -0.59478759765625, -0.415283203125, -0.23577880859375, -0.0562744140625, 0.12322998046875, 0.302734375, 0.48223876953125, 0.6617431640625, 0.84124755859375, 1.020751953125, 1.20025634765625, 1.3797607421875, 1.55926513671875, 1.73876953125, 1.91827392578125, 2.0977783203125, 2.27728271484375, 2.456787109375, 2.63629150390625, 2.8157958984375, 2.99530029296875, 3.1748046875, 3.35430908203125, 3.5338134765625, 3.71331787109375, 3.892822265625, 4.07232666015625, 4.2518310546875, 4.43133544921875, 4.61083984375, 4.79034423828125, 4.9698486328125, 5.14935302734375, 5.328857421875, 5.50836181640625, 5.6878662109375, 5.86737060546875, 6.046875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 10.0, 9.0, 13.0, 12.0, 15.0, 31.0, 33.0, 58.0, 62.0, 122.0, 162.0, 261.0, 426.0, 652.0, 1125.0, 1866.0, 3526.0, 7285.0, 17349.0, 54823.0, 253564.0, 532893.0, 120126.0, 31109.0, 11258.0, 5180.0, 2658.0, 1480.0, 855.0, 550.0, 345.0, 228.0, 141.0, 102.0, 66.0, 43.0, 23.0, 28.0, 21.0, 9.0, 9.0, 6.0, 5.0, 2.0, 5.0, 0.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.875, -5.6871337890625, -5.499267578125, -5.3114013671875, -5.12353515625, -4.9356689453125, -4.747802734375, -4.5599365234375, -4.3720703125, -4.1842041015625, -3.996337890625, -3.8084716796875, -3.62060546875, -3.4327392578125, -3.244873046875, -3.0570068359375, -2.869140625, -2.6812744140625, -2.493408203125, -2.3055419921875, -2.11767578125, -1.9298095703125, -1.741943359375, -1.5540771484375, -1.3662109375, -1.1783447265625, -0.990478515625, -0.8026123046875, -0.61474609375, -0.4268798828125, -0.239013671875, -0.0511474609375, 0.13671875, 0.3245849609375, 0.512451171875, 0.7003173828125, 0.88818359375, 1.0760498046875, 1.263916015625, 1.4517822265625, 1.6396484375, 1.8275146484375, 2.015380859375, 2.2032470703125, 2.39111328125, 2.5789794921875, 2.766845703125, 2.9547119140625, 3.142578125, 3.3304443359375, 3.518310546875, 3.7061767578125, 3.89404296875, 4.0819091796875, 4.269775390625, 4.4576416015625, 4.6455078125, 4.8333740234375, 5.021240234375, 5.2091064453125, 5.39697265625, 5.5848388671875, 5.772705078125, 5.9605712890625, 6.1484375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 5.0, 7.0, 8.0, 5.0, 12.0, 14.0, 21.0, 16.0, 30.0, 17.0, 35.0, 23.0, 28.0, 27.0, 34.0, 46.0, 46.0, 63.0, 94.0, 322.0, 1542.0, 156.0, 76.0, 58.0, 47.0, 41.0, 29.0, 38.0, 27.0, 45.0, 18.0, 20.0, 21.0, 13.0, 18.0, 9.0, 9.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4140625, -14.9190673828125, -14.424072265625, -13.9290771484375, -13.43408203125, -12.9390869140625, -12.444091796875, -11.9490966796875, -11.4541015625, -10.9591064453125, -10.464111328125, -9.9691162109375, -9.47412109375, -8.9791259765625, -8.484130859375, -7.9891357421875, -7.494140625, -6.9991455078125, -6.504150390625, -6.0091552734375, -5.51416015625, -5.0191650390625, -4.524169921875, -4.0291748046875, -3.5341796875, -3.0391845703125, -2.544189453125, -2.0491943359375, -1.55419921875, -1.0592041015625, -0.564208984375, -0.0692138671875, 0.42578125, 0.9207763671875, 1.415771484375, 1.9107666015625, 2.40576171875, 2.9007568359375, 3.395751953125, 3.8907470703125, 4.3857421875, 4.8807373046875, 5.375732421875, 5.8707275390625, 6.36572265625, 6.8607177734375, 7.355712890625, 7.8507080078125, 8.345703125, 8.8406982421875, 9.335693359375, 9.8306884765625, 10.32568359375, 10.8206787109375, 11.315673828125, 11.8106689453125, 12.3056640625, 12.8006591796875, 13.295654296875, 13.7906494140625, 14.28564453125, 14.7806396484375, 15.275634765625, 15.7706298828125, 16.265625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 4.0, 10.0, 10.0, 14.0, 17.0, 22.0, 47.0, 36.0, 43.0, 81.0, 94.0, 118.0, 180.0, 269.0, 505.0, 1103.0, 4401.0, 43034.0, 2862960.0, 219009.0, 10116.0, 1825.0, 649.0, 364.0, 208.0, 128.0, 99.0, 75.0, 65.0, 51.0, 29.0, 29.0, 22.0, 18.0, 17.0, 14.0, 9.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0], "bins": [-27.71875, -26.896728515625, -26.07470703125, -25.252685546875, -24.4306640625, -23.608642578125, -22.78662109375, -21.964599609375, -21.142578125, -20.320556640625, -19.49853515625, -18.676513671875, -17.8544921875, -17.032470703125, -16.21044921875, -15.388427734375, -14.56640625, -13.744384765625, -12.92236328125, -12.100341796875, -11.2783203125, -10.456298828125, -9.63427734375, -8.812255859375, -7.990234375, -7.168212890625, -6.34619140625, -5.524169921875, -4.7021484375, -3.880126953125, -3.05810546875, -2.236083984375, -1.4140625, -0.592041015625, 0.22998046875, 1.052001953125, 1.8740234375, 2.696044921875, 3.51806640625, 4.340087890625, 5.162109375, 5.984130859375, 6.80615234375, 7.628173828125, 8.4501953125, 9.272216796875, 10.09423828125, 10.916259765625, 11.73828125, 12.560302734375, 13.38232421875, 14.204345703125, 15.0263671875, 15.848388671875, 16.67041015625, 17.492431640625, 18.314453125, 19.136474609375, 19.95849609375, 20.780517578125, 21.6025390625, 22.424560546875, 23.24658203125, 24.068603515625, 24.890625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [2.0, 56.0, 831.0, 127.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.220638275146484, -13.68605899810791, -5.151479721069336, 3.383098602294922, 11.917678833007812, 20.452259063720703, 28.986835479736328, 37.52141571044922, 46.05599594116211, 54.590576171875, 63.125152587890625, 71.65972900390625, 80.1943130493164, 88.72889709472656, 97.26347351074219, 105.79804992675781, 114.33262634277344, 122.86720275878906, 131.4017791748047, 139.93637084960938, 148.470947265625, 157.00552368164062, 165.54010009765625, 174.07467651367188, 182.60926818847656, 191.1438446044922, 199.6784210205078, 208.2130126953125, 216.74758911132812, 225.28216552734375, 233.81674194335938, 242.351318359375, 250.88589477539062, 259.42047119140625, 267.9550476074219, 276.4896240234375, 285.0242004394531, 293.55877685546875, 302.0933837890625, 310.6279602050781, 319.16253662109375, 327.6971130371094, 336.231689453125, 344.7662658691406, 353.30084228515625, 361.83544921875, 370.3699951171875, 378.90460205078125, 387.43914794921875, 395.9737243652344, 404.50830078125, 413.0428771972656, 421.57745361328125, 430.112060546875, 438.6466064453125, 447.18121337890625, 455.7157897949219, 464.2503662109375, 472.7849426269531, 481.31951904296875, 489.8540954589844, 498.388671875, 506.92327880859375, 515.4578247070312, 523.992431640625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 8.0, 9.0, 9.0, 5.0, 13.0, 13.0, 16.0, 26.0, 18.0, 16.0, 30.0, 33.0, 32.0, 44.0, 35.0, 43.0, 32.0, 35.0, 48.0, 37.0, 33.0, 54.0, 41.0, 45.0, 40.0, 34.0, 33.0, 22.0, 26.0, 25.0, 29.0, 21.0, 19.0, 12.0, 9.0, 15.0, 9.0, 7.0, 4.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.14728927612305, -47.708553314208984, -46.26981735229492, -44.83108139038086, -43.39234161376953, -41.95360565185547, -40.514869689941406, -39.076133728027344, -37.63739776611328, -36.19866180419922, -34.759925842285156, -33.321189880371094, -31.8824520111084, -30.443716049194336, -29.00497817993164, -27.566242218017578, -26.127506256103516, -24.688770294189453, -23.25003433227539, -21.811296463012695, -20.372560501098633, -18.93382453918457, -17.495086669921875, -16.056350708007812, -14.61761474609375, -13.178878784179688, -11.740141868591309, -10.30140495300293, -8.862668991088867, -7.4239325523376465, -5.985196113586426, -4.546459197998047, -3.1077232360839844, -1.6689867973327637, -0.23025035858154297, 1.2084860801696777, 2.6472225189208984, 4.085958957672119, 5.52469539642334, 6.963432312011719, 8.402168273925781, 9.840904235839844, 11.279641151428223, 12.718378067016602, 14.157114028930664, 15.595849990844727, 17.034587860107422, 18.473323822021484, 19.912059783935547, 21.35079574584961, 22.789531707763672, 24.228269577026367, 25.66700553894043, 27.105741500854492, 28.544479370117188, 29.98321533203125, 31.421951293945312, 32.860687255859375, 34.29942321777344, 35.7381591796875, 37.17689514160156, 38.61563491821289, 40.05437088012695, 41.493106842041016, 42.93184280395508]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 16.0, 18.0, 17.0, 18.0, 24.0, 24.0, 32.0, 37.0, 39.0, 45.0, 41.0, 53.0, 38.0, 40.0, 44.0, 56.0, 41.0, 44.0, 45.0, 51.0, 36.0, 41.0, 33.0, 27.0, 26.0, 16.0, 12.0, 17.0, 12.0, 12.0, 11.0, 5.0, 3.0, 4.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40625, -5.2254638671875, -5.044677734375, -4.8638916015625, -4.68310546875, -4.5023193359375, -4.321533203125, -4.1407470703125, -3.9599609375, -3.7791748046875, -3.598388671875, -3.4176025390625, -3.23681640625, -3.0560302734375, -2.875244140625, -2.6944580078125, -2.513671875, -2.3328857421875, -2.152099609375, -1.9713134765625, -1.79052734375, -1.6097412109375, -1.428955078125, -1.2481689453125, -1.0673828125, -0.8865966796875, -0.705810546875, -0.5250244140625, -0.34423828125, -0.1634521484375, 0.017333984375, 0.1981201171875, 0.37890625, 0.5596923828125, 0.740478515625, 0.9212646484375, 1.10205078125, 1.2828369140625, 1.463623046875, 1.6444091796875, 1.8251953125, 2.0059814453125, 2.186767578125, 2.3675537109375, 2.54833984375, 2.7291259765625, 2.909912109375, 3.0906982421875, 3.271484375, 3.4522705078125, 3.633056640625, 3.8138427734375, 3.99462890625, 4.1754150390625, 4.356201171875, 4.5369873046875, 4.7177734375, 4.8985595703125, 5.079345703125, 5.2601318359375, 5.44091796875, 5.6217041015625, 5.802490234375, 5.9832763671875, 6.1640625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 2.0, 7.0, 5.0, 7.0, 17.0, 20.0, 25.0, 31.0, 53.0, 95.0, 163.0, 205.0, 376.0, 649.0, 1288.0, 2815.0, 7086.0, 22308.0, 89969.0, 677138.0, 2852694.0, 441134.0, 68669.0, 18283.0, 6103.0, 2491.0, 1117.0, 588.0, 312.0, 249.0, 109.0, 85.0, 51.0, 41.0, 25.0, 24.0, 14.0, 7.0, 6.0, 6.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-13.484375, -13.080810546875, -12.67724609375, -12.273681640625, -11.8701171875, -11.466552734375, -11.06298828125, -10.659423828125, -10.255859375, -9.852294921875, -9.44873046875, -9.045166015625, -8.6416015625, -8.238037109375, -7.83447265625, -7.430908203125, -7.02734375, -6.623779296875, -6.22021484375, -5.816650390625, -5.4130859375, -5.009521484375, -4.60595703125, -4.202392578125, -3.798828125, -3.395263671875, -2.99169921875, -2.588134765625, -2.1845703125, -1.781005859375, -1.37744140625, -0.973876953125, -0.5703125, -0.166748046875, 0.23681640625, 0.640380859375, 1.0439453125, 1.447509765625, 1.85107421875, 2.254638671875, 2.658203125, 3.061767578125, 3.46533203125, 3.868896484375, 4.2724609375, 4.676025390625, 5.07958984375, 5.483154296875, 5.88671875, 6.290283203125, 6.69384765625, 7.097412109375, 7.5009765625, 7.904541015625, 8.30810546875, 8.711669921875, 9.115234375, 9.518798828125, 9.92236328125, 10.325927734375, 10.7294921875, 11.133056640625, 11.53662109375, 11.940185546875, 12.34375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 10.0, 22.0, 24.0, 40.0, 74.0, 112.0, 162.0, 286.0, 484.0, 761.0, 827.0, 486.0, 294.0, 183.0, 103.0, 66.0, 48.0, 32.0, 20.0, 15.0, 14.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.375, -17.927001953125, -17.47900390625, -17.031005859375, -16.5830078125, -16.135009765625, -15.68701171875, -15.239013671875, -14.791015625, -14.343017578125, -13.89501953125, -13.447021484375, -12.9990234375, -12.551025390625, -12.10302734375, -11.655029296875, -11.20703125, -10.759033203125, -10.31103515625, -9.863037109375, -9.4150390625, -8.967041015625, -8.51904296875, -8.071044921875, -7.623046875, -7.175048828125, -6.72705078125, -6.279052734375, -5.8310546875, -5.383056640625, -4.93505859375, -4.487060546875, -4.0390625, -3.591064453125, -3.14306640625, -2.695068359375, -2.2470703125, -1.799072265625, -1.35107421875, -0.903076171875, -0.455078125, -0.007080078125, 0.44091796875, 0.888916015625, 1.3369140625, 1.784912109375, 2.23291015625, 2.680908203125, 3.12890625, 3.576904296875, 4.02490234375, 4.472900390625, 4.9208984375, 5.368896484375, 5.81689453125, 6.264892578125, 6.712890625, 7.160888671875, 7.60888671875, 8.056884765625, 8.5048828125, 8.952880859375, 9.40087890625, 9.848876953125, 10.296875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 14.0, 11.0, 24.0, 22.0, 37.0, 65.0, 118.0, 230.0, 426.0, 1019.0, 10534.0, 1297104.0, 2866377.0, 16106.0, 1205.0, 428.0, 240.0, 147.0, 71.0, 42.0, 24.0, 16.0, 6.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.75, -40.083984375, -38.41796875, -36.751953125, -35.0859375, -33.419921875, -31.75390625, -30.087890625, -28.421875, -26.755859375, -25.08984375, -23.423828125, -21.7578125, -20.091796875, -18.42578125, -16.759765625, -15.09375, -13.427734375, -11.76171875, -10.095703125, -8.4296875, -6.763671875, -5.09765625, -3.431640625, -1.765625, -0.099609375, 1.56640625, 3.232421875, 4.8984375, 6.564453125, 8.23046875, 9.896484375, 11.5625, 13.228515625, 14.89453125, 16.560546875, 18.2265625, 19.892578125, 21.55859375, 23.224609375, 24.890625, 26.556640625, 28.22265625, 29.888671875, 31.5546875, 33.220703125, 34.88671875, 36.552734375, 38.21875, 39.884765625, 41.55078125, 43.216796875, 44.8828125, 46.548828125, 48.21484375, 49.880859375, 51.546875, 53.212890625, 54.87890625, 56.544921875, 58.2109375, 59.876953125, 61.54296875, 63.208984375, 64.875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 8.0, 11.0, 35.0, 57.0, 103.0, 120.0, 163.0, 157.0, 134.0, 92.0, 63.0, 29.0, 19.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.79570007324219, -81.18170928955078, -78.56771087646484, -75.95372009277344, -73.33972930908203, -70.72573852539062, -68.11174011230469, -65.49774932861328, -62.88375473022461, -60.26976013183594, -57.65576934814453, -55.04177474975586, -52.42778015136719, -49.81378936767578, -47.19979476928711, -44.58580017089844, -41.97180938720703, -39.35781478881836, -36.74382400512695, -34.12982940673828, -31.515836715698242, -28.901844024658203, -26.28784942626953, -23.673856735229492, -21.059864044189453, -18.445871353149414, -15.831877708435059, -13.217884063720703, -10.603891372680664, -7.989898681640625, -5.3759050369262695, -2.761911392211914, -0.147918701171875, 2.4660744667053223, 5.0800676345825195, 7.694060802459717, 10.308053970336914, 12.922046661376953, 15.536040306091309, 18.150033950805664, 20.764026641845703, 23.378019332885742, 25.99201202392578, 28.606006622314453, 31.219999313354492, 33.83399200439453, 36.4479866027832, 39.061981201171875, 41.67597198486328, 44.28996658325195, 46.90395736694336, 49.51795196533203, 52.13194274902344, 54.74593734741211, 57.35993194580078, 59.97392272949219, 62.58791732788086, 65.20191192626953, 67.81590270996094, 70.42989349365234, 73.04389190673828, 75.65788269042969, 78.2718734741211, 80.88587188720703, 83.49986267089844]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 5.0, 4.0, 0.0, 14.0, 11.0, 13.0, 10.0, 15.0, 10.0, 21.0, 33.0, 20.0, 31.0, 34.0, 31.0, 45.0, 36.0, 35.0, 35.0, 39.0, 40.0, 41.0, 48.0, 48.0, 45.0, 37.0, 42.0, 35.0, 29.0, 36.0, 41.0, 26.0, 18.0, 14.0, 8.0, 14.0, 7.0, 5.0, 9.0, 8.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.581565856933594, -28.5837345123291, -27.585901260375977, -26.588069915771484, -25.590238571166992, -24.5924072265625, -23.594573974609375, -22.596742630004883, -21.59891128540039, -20.6010799407959, -19.603246688842773, -18.60541534423828, -17.60758399963379, -16.609752655029297, -15.611919403076172, -14.61408805847168, -13.616254806518555, -12.618422508239746, -11.620591163635254, -10.622758865356445, -9.624927520751953, -8.627095222473145, -7.629262924194336, -6.6314311027526855, -5.633599281311035, -4.635767459869385, -3.6379354000091553, -2.640103340148926, -1.6422715187072754, -0.644439697265625, 0.3533926010131836, 1.351224422454834, 2.3490562438964844, 3.3468880653381348, 4.344719886779785, 5.342552185058594, 6.340384006500244, 7.3382158279418945, 8.336048126220703, 9.333879470825195, 10.331711769104004, 11.329544067382812, 12.327375411987305, 13.325207710266113, 14.323040008544922, 15.320871353149414, 16.318702697753906, 17.31653594970703, 18.314367294311523, 19.312198638916016, 20.31003189086914, 21.307863235473633, 22.305694580078125, 23.30352783203125, 24.301359176635742, 25.299190521240234, 26.29702377319336, 27.29485511779785, 28.292688369750977, 29.29051971435547, 30.28835105895996, 31.286182403564453, 32.28401565551758, 33.2818489074707, 34.27967834472656]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 9.0, 11.0, 21.0, 16.0, 14.0, 22.0, 25.0, 30.0, 42.0, 45.0, 29.0, 45.0, 51.0, 52.0, 48.0, 44.0, 44.0, 49.0, 56.0, 47.0, 46.0, 42.0, 41.0, 38.0, 29.0, 23.0, 18.0, 13.0, 10.0, 7.0, 14.0, 3.0, 5.0, 5.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6953125, -6.49761962890625, -6.2999267578125, -6.10223388671875, -5.904541015625, -5.70684814453125, -5.5091552734375, -5.31146240234375, -5.11376953125, -4.91607666015625, -4.7183837890625, -4.52069091796875, -4.322998046875, -4.12530517578125, -3.9276123046875, -3.72991943359375, -3.5322265625, -3.33453369140625, -3.1368408203125, -2.93914794921875, -2.741455078125, -2.54376220703125, -2.3460693359375, -2.14837646484375, -1.95068359375, -1.75299072265625, -1.5552978515625, -1.35760498046875, -1.159912109375, -0.96221923828125, -0.7645263671875, -0.56683349609375, -0.369140625, -0.17144775390625, 0.0262451171875, 0.22393798828125, 0.421630859375, 0.61932373046875, 0.8170166015625, 1.01470947265625, 1.21240234375, 1.41009521484375, 1.6077880859375, 1.80548095703125, 2.003173828125, 2.20086669921875, 2.3985595703125, 2.59625244140625, 2.7939453125, 2.99163818359375, 3.1893310546875, 3.38702392578125, 3.584716796875, 3.78240966796875, 3.9801025390625, 4.17779541015625, 4.37548828125, 4.57318115234375, 4.7708740234375, 4.96856689453125, 5.166259765625, 5.36395263671875, 5.5616455078125, 5.75933837890625, 5.95703125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 9.0, 9.0, 16.0, 31.0, 45.0, 66.0, 112.0, 180.0, 298.0, 532.0, 1012.0, 1822.0, 3335.0, 6574.0, 12826.0, 25951.0, 53807.0, 125095.0, 355700.0, 275039.0, 97897.0, 44291.0, 21171.0, 10663.0, 5750.0, 2899.0, 1518.0, 794.0, 439.0, 251.0, 135.0, 103.0, 64.0, 45.0, 26.0, 15.0, 11.0, 9.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.301025390625, -0.29213714599609375, -0.2832489013671875, -0.27436065673828125, -0.265472412109375, -0.25658416748046875, -0.2476959228515625, -0.23880767822265625, -0.22991943359375, -0.22103118896484375, -0.2121429443359375, -0.20325469970703125, -0.194366455078125, -0.18547821044921875, -0.1765899658203125, -0.16770172119140625, -0.1588134765625, -0.14992523193359375, -0.1410369873046875, -0.13214874267578125, -0.123260498046875, -0.11437225341796875, -0.1054840087890625, -0.09659576416015625, -0.08770751953125, -0.07881927490234375, -0.0699310302734375, -0.06104278564453125, -0.052154541015625, -0.04326629638671875, -0.0343780517578125, -0.02548980712890625, -0.0166015625, -0.00771331787109375, 0.0011749267578125, 0.01006317138671875, 0.018951416015625, 0.02783966064453125, 0.0367279052734375, 0.04561614990234375, 0.05450439453125, 0.06339263916015625, 0.0722808837890625, 0.08116912841796875, 0.090057373046875, 0.09894561767578125, 0.1078338623046875, 0.11672210693359375, 0.1256103515625, 0.13449859619140625, 0.1433868408203125, 0.15227508544921875, 0.161163330078125, 0.17005157470703125, 0.1789398193359375, 0.18782806396484375, 0.19671630859375, 0.20560455322265625, 0.2144927978515625, 0.22338104248046875, 0.232269287109375, 0.24115753173828125, 0.2500457763671875, 0.25893402099609375, 0.267822265625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 10.0, 5.0, 7.0, 11.0, 9.0, 15.0, 12.0, 20.0, 20.0, 17.0, 18.0, 34.0, 29.0, 36.0, 42.0, 34.0, 53.0, 48.0, 36.0, 49.0, 1069.0, 47.0, 38.0, 44.0, 40.0, 42.0, 37.0, 31.0, 35.0, 29.0, 20.0, 14.0, 16.0, 10.0, 14.0, 10.0, 9.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.525390625, -3.4085693359375, -3.291748046875, -3.1749267578125, -3.05810546875, -2.9412841796875, -2.824462890625, -2.7076416015625, -2.5908203125, -2.4739990234375, -2.357177734375, -2.2403564453125, -2.12353515625, -2.0067138671875, -1.889892578125, -1.7730712890625, -1.65625, -1.5394287109375, -1.422607421875, -1.3057861328125, -1.18896484375, -1.0721435546875, -0.955322265625, -0.8385009765625, -0.7216796875, -0.6048583984375, -0.488037109375, -0.3712158203125, -0.25439453125, -0.1375732421875, -0.020751953125, 0.0960693359375, 0.212890625, 0.3297119140625, 0.446533203125, 0.5633544921875, 0.68017578125, 0.7969970703125, 0.913818359375, 1.0306396484375, 1.1474609375, 1.2642822265625, 1.381103515625, 1.4979248046875, 1.61474609375, 1.7315673828125, 1.848388671875, 1.9652099609375, 2.08203125, 2.1988525390625, 2.315673828125, 2.4324951171875, 2.54931640625, 2.6661376953125, 2.782958984375, 2.8997802734375, 3.0166015625, 3.1334228515625, 3.250244140625, 3.3670654296875, 3.48388671875, 3.6007080078125, 3.717529296875, 3.8343505859375, 3.951171875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 7.0, 9.0, 18.0, 23.0, 26.0, 63.0, 96.0, 135.0, 216.0, 358.0, 604.0, 964.0, 1553.0, 2667.0, 4387.0, 7272.0, 12771.0, 21779.0, 39304.0, 75192.0, 165232.0, 1385593.0, 193231.0, 84725.0, 43171.0, 23892.0, 13901.0, 8093.0, 4583.0, 2864.0, 1716.0, 1026.0, 638.0, 401.0, 221.0, 148.0, 94.0, 55.0, 35.0, 23.0, 22.0, 11.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1304931640625, -0.12622642517089844, -0.12195968627929688, -0.11769294738769531, -0.11342620849609375, -0.10915946960449219, -0.10489273071289062, -0.10062599182128906, -0.0963592529296875, -0.09209251403808594, -0.08782577514648438, -0.08355903625488281, -0.07929229736328125, -0.07502555847167969, -0.07075881958007812, -0.06649208068847656, -0.062225341796875, -0.05795860290527344, -0.053691864013671875, -0.04942512512207031, -0.04515838623046875, -0.04089164733886719, -0.036624908447265625, -0.03235816955566406, -0.0280914306640625, -0.023824691772460938, -0.019557952880859375, -0.015291213989257812, -0.01102447509765625, -0.0067577362060546875, -0.002490997314453125, 0.0017757415771484375, 0.00604248046875, 0.010309219360351562, 0.014575958251953125, 0.018842697143554688, 0.02310943603515625, 0.027376174926757812, 0.031642913818359375, 0.03590965270996094, 0.0401763916015625, 0.04444313049316406, 0.048709869384765625, 0.05297660827636719, 0.05724334716796875, 0.06151008605957031, 0.06577682495117188, 0.07004356384277344, 0.074310302734375, 0.07857704162597656, 0.08284378051757812, 0.08711051940917969, 0.09137725830078125, 0.09564399719238281, 0.09991073608398438, 0.10417747497558594, 0.1084442138671875, 0.11271095275878906, 0.11697769165039062, 0.12124443054199219, 0.12551116943359375, 0.1297779083251953, 0.13404464721679688, 0.13831138610839844, 0.142578125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 5.0, 6.0, 4.0, 9.0, 8.0, 9.0, 11.0, 18.0, 13.0, 20.0, 29.0, 38.0, 36.0, 40.0, 46.0, 45.0, 53.0, 50.0, 53.0, 55.0, 52.0, 55.0, 40.0, 35.0, 44.0, 45.0, 42.0, 26.0, 21.0, 27.0, 19.0, 14.0, 10.0, 6.0, 4.0, 7.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7954578399658203e-05, -2.6697292923927307e-05, -2.544000744819641e-05, -2.4182721972465515e-05, -2.292543649673462e-05, -2.1668151021003723e-05, -2.0410865545272827e-05, -1.915358006954193e-05, -1.7896294593811035e-05, -1.663900911808014e-05, -1.5381723642349243e-05, -1.4124438166618347e-05, -1.2867152690887451e-05, -1.1609867215156555e-05, -1.035258173942566e-05, -9.095296263694763e-06, -7.838010787963867e-06, -6.580725312232971e-06, -5.323439836502075e-06, -4.066154360771179e-06, -2.808868885040283e-06, -1.5515834093093872e-06, -2.942979335784912e-07, 9.629875421524048e-07, 2.2202730178833008e-06, 3.4775584936141968e-06, 4.734843969345093e-06, 5.992129445075989e-06, 7.249414920806885e-06, 8.50670039653778e-06, 9.763985872268677e-06, 1.1021271347999573e-05, 1.2278556823730469e-05, 1.3535842299461365e-05, 1.479312777519226e-05, 1.6050413250923157e-05, 1.7307698726654053e-05, 1.856498420238495e-05, 1.9822269678115845e-05, 2.107955515384674e-05, 2.2336840629577637e-05, 2.3594126105308533e-05, 2.485141158103943e-05, 2.6108697056770325e-05, 2.736598253250122e-05, 2.8623268008232117e-05, 2.9880553483963013e-05, 3.113783895969391e-05, 3.2395124435424805e-05, 3.36524099111557e-05, 3.49096953868866e-05, 3.616698086261749e-05, 3.742426633834839e-05, 3.8681551814079285e-05, 3.993883728981018e-05, 4.119612276554108e-05, 4.245340824127197e-05, 4.371069371700287e-05, 4.4967979192733765e-05, 4.622526466846466e-05, 4.748255014419556e-05, 4.873983561992645e-05, 4.999712109565735e-05, 5.1254406571388245e-05, 5.251169204711914e-05]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 10.0, 14.0, 13.0, 15.0, 18.0, 25.0, 26.0, 42.0, 44.0, 57.0, 100.0, 190.0, 460.0, 2700.0, 105091.0, 854117.0, 82344.0, 2315.0, 400.0, 170.0, 114.0, 66.0, 47.0, 31.0, 30.0, 15.0, 22.0, 7.0, 16.0, 11.0, 7.0, 9.0, 3.0, 5.0, 4.0, 4.0, 5.0, 1.0, 1.0], "bins": [-0.0009331703186035156, -0.0009101107716560364, -0.0008870512247085571, -0.0008639916777610779, -0.0008409321308135986, -0.0008178725838661194, -0.0007948130369186401, -0.0007717534899711609, -0.0007486939430236816, -0.0007256343960762024, -0.0007025748491287231, -0.0006795153021812439, -0.0006564557552337646, -0.0006333962082862854, -0.0006103366613388062, -0.0005872771143913269, -0.0005642175674438477, -0.0005411580204963684, -0.0005180984735488892, -0.0004950389266014099, -0.00047197937965393066, -0.0004489198327064514, -0.00042586028575897217, -0.0004028007388114929, -0.00037974119186401367, -0.0003566816449165344, -0.0003336220979690552, -0.00031056255102157593, -0.0002875030040740967, -0.00026444345712661743, -0.00024138391017913818, -0.00021832436323165894, -0.0001952648162841797, -0.00017220526933670044, -0.0001491457223892212, -0.00012608617544174194, -0.0001030266284942627, -7.996708154678345e-05, -5.69075345993042e-05, -3.384798765182495e-05, -1.0788440704345703e-05, 1.2271106243133545e-05, 3.533065319061279e-05, 5.839020013809204e-05, 8.144974708557129e-05, 0.00010450929403305054, 0.00012756884098052979, 0.00015062838792800903, 0.00017368793487548828, 0.00019674748182296753, 0.00021980702877044678, 0.00024286657571792603, 0.0002659261226654053, 0.0002889856696128845, 0.00031204521656036377, 0.000335104763507843, 0.00035816431045532227, 0.0003812238574028015, 0.00040428340435028076, 0.00042734295129776, 0.00045040249824523926, 0.0004734620451927185, 0.0004965215921401978, 0.000519581139087677, 0.0005426406860351562]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 58.0, 414.0, 485.0, 56.0, 3.0], "bins": [-0.0006435181712731719, -0.0006329793250188231, -0.0006224404205568135, -0.0006119015743024647, -0.000601362728048116, -0.0005908238817937672, -0.0005802849773317575, -0.0005697461310774088, -0.00055920728482306, -0.0005486684385687113, -0.0005381295341067016, -0.0005275906878523529, -0.0005170518415980041, -0.0005065129953436553, -0.0004959740908816457, -0.0004854352446272969, -0.0004748963692691177, -0.0004643574939109385, -0.00045381864765658975, -0.00044327977229841053, -0.0004327409260440618, -0.00042220205068588257, -0.0004116632044315338, -0.0004011243290733546, -0.0003905854537151754, -0.0003800465783569962, -0.0003695077321026474, -0.0003589688567444682, -0.00034843001049011946, -0.00033789113513194025, -0.00032735225977376103, -0.0003168134135194123, -0.0003062745672650635, -0.0002957356919068843, -0.00028519684565253556, -0.00027465797029435635, -0.0002641191240400076, -0.0002535802486818284, -0.0002430413878755644, -0.0002325025270693004, -0.00022196368081495166, -0.00021142482000868767, -0.0002008859592024237, -0.00019034708384424448, -0.00017980823758989573, -0.00016926936223171651, -0.00015873050142545253, -0.00014819164061918855, -0.00013765277981292456, -0.00012711391900666058, -0.0001165750582003966, -0.000106036190118175, -9.549732931191102e-05, -8.495846850564703e-05, -7.441960042342544e-05, -6.388073961716145e-05, -5.334187517291866e-05, -4.280301072867587e-05, -3.226414992241189e-05, -2.17252854781691e-05, -1.1186424671905115e-05, -6.47563865641132e-07, 9.891304216580465e-06, 2.043016502284445e-05, 3.096902582910843e-05]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 10.0, 13.0, 5.0, 15.0, 26.0, 20.0, 23.0, 33.0, 37.0, 35.0, 40.0, 38.0, 55.0, 46.0, 64.0, 48.0, 56.0, 39.0, 55.0, 58.0, 35.0, 47.0, 25.0, 29.0, 24.0, 20.0, 17.0, 20.0, 22.0, 7.0, 12.0, 6.0, 6.0, 6.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.568960189819336e-05, -2.481415867805481e-05, -2.393871545791626e-05, -2.306327223777771e-05, -2.218782901763916e-05, -2.131238579750061e-05, -2.043694257736206e-05, -1.956149935722351e-05, -1.868605613708496e-05, -1.781061291694641e-05, -1.693516969680786e-05, -1.605972647666931e-05, -1.5184283256530762e-05, -1.4308840036392212e-05, -1.3433396816253662e-05, -1.2557953596115112e-05, -1.1682510375976562e-05, -1.0807067155838013e-05, -9.931623935699463e-06, -9.056180715560913e-06, -8.180737495422363e-06, -7.3052942752838135e-06, -6.429851055145264e-06, -5.554407835006714e-06, -4.678964614868164e-06, -3.8035213947296143e-06, -2.9280781745910645e-06, -2.0526349544525146e-06, -1.1771917343139648e-06, -3.0174851417541504e-07, 5.736947059631348e-07, 1.4491379261016846e-06, 2.3245811462402344e-06, 3.200024366378784e-06, 4.075467586517334e-06, 4.950910806655884e-06, 5.826354026794434e-06, 6.701797246932983e-06, 7.577240467071533e-06, 8.452683687210083e-06, 9.328126907348633e-06, 1.0203570127487183e-05, 1.1079013347625732e-05, 1.1954456567764282e-05, 1.2829899787902832e-05, 1.3705343008041382e-05, 1.4580786228179932e-05, 1.545622944831848e-05, 1.633167266845703e-05, 1.720711588859558e-05, 1.808255910873413e-05, 1.895800232887268e-05, 1.983344554901123e-05, 2.070888876914978e-05, 2.158433198928833e-05, 2.245977520942688e-05, 2.333521842956543e-05, 2.421066164970398e-05, 2.508610486984253e-05, 2.596154808998108e-05, 2.683699131011963e-05, 2.771243453025818e-05, 2.858787775039673e-05, 2.946332097053528e-05, 3.0338764190673828e-05]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 9.0, 11.0, 21.0, 16.0, 14.0, 22.0, 25.0, 30.0, 42.0, 45.0, 29.0, 45.0, 51.0, 52.0, 48.0, 44.0, 44.0, 49.0, 56.0, 47.0, 46.0, 42.0, 41.0, 38.0, 29.0, 23.0, 18.0, 13.0, 10.0, 7.0, 14.0, 3.0, 5.0, 5.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6953125, -6.49761962890625, -6.2999267578125, -6.10223388671875, -5.904541015625, -5.70684814453125, -5.5091552734375, -5.31146240234375, -5.11376953125, -4.91607666015625, -4.7183837890625, -4.52069091796875, -4.322998046875, -4.12530517578125, -3.9276123046875, -3.72991943359375, -3.5322265625, -3.33453369140625, -3.1368408203125, -2.93914794921875, -2.741455078125, -2.54376220703125, -2.3460693359375, -2.14837646484375, -1.95068359375, -1.75299072265625, -1.5552978515625, -1.35760498046875, -1.159912109375, -0.96221923828125, -0.7645263671875, -0.56683349609375, -0.369140625, -0.17144775390625, 0.0262451171875, 0.22393798828125, 0.421630859375, 0.61932373046875, 0.8170166015625, 1.01470947265625, 1.21240234375, 1.41009521484375, 1.6077880859375, 1.80548095703125, 2.003173828125, 2.20086669921875, 2.3985595703125, 2.59625244140625, 2.7939453125, 2.99163818359375, 3.1893310546875, 3.38702392578125, 3.584716796875, 3.78240966796875, 3.9801025390625, 4.17779541015625, 4.37548828125, 4.57318115234375, 4.7708740234375, 4.96856689453125, 5.166259765625, 5.36395263671875, 5.5616455078125, 5.75933837890625, 5.95703125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 12.0, 10.0, 16.0, 27.0, 36.0, 67.0, 106.0, 149.0, 299.0, 541.0, 1067.0, 2078.0, 4354.0, 8965.0, 20157.0, 51823.0, 224808.0, 566434.0, 107124.0, 33374.0, 14126.0, 6536.0, 3117.0, 1562.0, 771.0, 441.0, 220.0, 116.0, 76.0, 52.0, 31.0, 24.0, 16.0, 8.0, 9.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6796875, -8.458740234375, -8.23779296875, -8.016845703125, -7.7958984375, -7.574951171875, -7.35400390625, -7.133056640625, -6.912109375, -6.691162109375, -6.47021484375, -6.249267578125, -6.0283203125, -5.807373046875, -5.58642578125, -5.365478515625, -5.14453125, -4.923583984375, -4.70263671875, -4.481689453125, -4.2607421875, -4.039794921875, -3.81884765625, -3.597900390625, -3.376953125, -3.156005859375, -2.93505859375, -2.714111328125, -2.4931640625, -2.272216796875, -2.05126953125, -1.830322265625, -1.609375, -1.388427734375, -1.16748046875, -0.946533203125, -0.7255859375, -0.504638671875, -0.28369140625, -0.062744140625, 0.158203125, 0.379150390625, 0.60009765625, 0.821044921875, 1.0419921875, 1.262939453125, 1.48388671875, 1.704833984375, 1.92578125, 2.146728515625, 2.36767578125, 2.588623046875, 2.8095703125, 3.030517578125, 3.25146484375, 3.472412109375, 3.693359375, 3.914306640625, 4.13525390625, 4.356201171875, 4.5771484375, 4.798095703125, 5.01904296875, 5.239990234375, 5.4609375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 11.0, 8.0, 11.0, 12.0, 10.0, 18.0, 22.0, 25.0, 18.0, 25.0, 25.0, 41.0, 31.0, 57.0, 48.0, 78.0, 95.0, 450.0, 1477.0, 110.0, 82.0, 54.0, 42.0, 37.0, 35.0, 32.0, 34.0, 32.0, 28.0, 25.0, 17.0, 16.0, 13.0, 13.0, 8.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.765625, -17.192626953125, -16.61962890625, -16.046630859375, -15.4736328125, -14.900634765625, -14.32763671875, -13.754638671875, -13.181640625, -12.608642578125, -12.03564453125, -11.462646484375, -10.8896484375, -10.316650390625, -9.74365234375, -9.170654296875, -8.59765625, -8.024658203125, -7.45166015625, -6.878662109375, -6.3056640625, -5.732666015625, -5.15966796875, -4.586669921875, -4.013671875, -3.440673828125, -2.86767578125, -2.294677734375, -1.7216796875, -1.148681640625, -0.57568359375, -0.002685546875, 0.5703125, 1.143310546875, 1.71630859375, 2.289306640625, 2.8623046875, 3.435302734375, 4.00830078125, 4.581298828125, 5.154296875, 5.727294921875, 6.30029296875, 6.873291015625, 7.4462890625, 8.019287109375, 8.59228515625, 9.165283203125, 9.73828125, 10.311279296875, 10.88427734375, 11.457275390625, 12.0302734375, 12.603271484375, 13.17626953125, 13.749267578125, 14.322265625, 14.895263671875, 15.46826171875, 16.041259765625, 16.6142578125, 17.187255859375, 17.76025390625, 18.333251953125, 18.90625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 15.0, 14.0, 15.0, 19.0, 29.0, 34.0, 50.0, 61.0, 73.0, 123.0, 129.0, 175.0, 275.0, 519.0, 4722.0, 735728.0, 2395531.0, 6563.0, 664.0, 262.0, 164.0, 113.0, 93.0, 78.0, 51.0, 40.0, 35.0, 27.0, 26.0, 14.0, 14.0, 9.0, 10.0, 10.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-40.6875, -39.45654296875, -38.2255859375, -36.99462890625, -35.763671875, -34.53271484375, -33.3017578125, -32.07080078125, -30.83984375, -29.60888671875, -28.3779296875, -27.14697265625, -25.916015625, -24.68505859375, -23.4541015625, -22.22314453125, -20.9921875, -19.76123046875, -18.5302734375, -17.29931640625, -16.068359375, -14.83740234375, -13.6064453125, -12.37548828125, -11.14453125, -9.91357421875, -8.6826171875, -7.45166015625, -6.220703125, -4.98974609375, -3.7587890625, -2.52783203125, -1.296875, -0.06591796875, 1.1650390625, 2.39599609375, 3.626953125, 4.85791015625, 6.0888671875, 7.31982421875, 8.55078125, 9.78173828125, 11.0126953125, 12.24365234375, 13.474609375, 14.70556640625, 15.9365234375, 17.16748046875, 18.3984375, 19.62939453125, 20.8603515625, 22.09130859375, 23.322265625, 24.55322265625, 25.7841796875, 27.01513671875, 28.24609375, 29.47705078125, 30.7080078125, 31.93896484375, 33.169921875, 34.40087890625, 35.6318359375, 36.86279296875, 38.09375]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 103.0, 862.0, 53.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.199392318725586, -15.809703826904297, -9.420015335083008, -3.0303268432617188, 3.3593616485595703, 9.74905014038086, 16.13873863220215, 22.52842903137207, 28.918115615844727, 35.307804107666016, 41.69749450683594, 48.087181091308594, 54.47686767578125, 60.86655807495117, 67.2562484741211, 73.64593505859375, 80.0356216430664, 86.42530822753906, 92.81500244140625, 99.2046890258789, 105.59437561035156, 111.98406219482422, 118.37374877929688, 124.76344299316406, 131.15313720703125, 137.54283142089844, 143.93251037597656, 150.32220458984375, 156.71188354492188, 163.10157775878906, 169.49127197265625, 175.88095092773438, 182.2706298828125, 188.6603240966797, 195.0500030517578, 201.439697265625, 207.82937622070312, 214.2190704345703, 220.6087646484375, 226.99844360351562, 233.3881378173828, 239.77783203125, 246.16751098632812, 252.5572052001953, 258.9468994140625, 265.3365783691406, 271.72625732421875, 278.115966796875, 284.5056457519531, 290.89532470703125, 297.2850341796875, 303.6747131347656, 310.06439208984375, 316.4541015625, 322.8437805175781, 329.23345947265625, 335.6231689453125, 342.0128479003906, 348.4025573730469, 354.792236328125, 361.1819152832031, 367.5716247558594, 373.9613037109375, 380.3509826660156, 386.74066162109375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 5.0, 6.0, 10.0, 8.0, 15.0, 14.0, 12.0, 15.0, 20.0, 16.0, 15.0, 28.0, 22.0, 28.0, 34.0, 30.0, 26.0, 44.0, 42.0, 50.0, 31.0, 44.0, 40.0, 47.0, 38.0, 34.0, 31.0, 26.0, 28.0, 21.0, 32.0, 31.0, 22.0, 16.0, 19.0, 16.0, 14.0, 16.0, 8.0, 13.0, 9.0, 6.0, 5.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.385005950927734, -41.04255294799805, -39.700096130371094, -38.357643127441406, -37.01518630981445, -35.672733306884766, -34.33027648925781, -32.987823486328125, -31.645368576049805, -30.302913665771484, -28.960458755493164, -27.618003845214844, -26.275550842285156, -24.933094024658203, -23.590641021728516, -22.248186111450195, -20.905731201171875, -19.563276290893555, -18.220821380615234, -16.878368377685547, -15.53591251373291, -14.19345760345459, -12.851003646850586, -11.508548736572266, -10.166093826293945, -8.823638916015625, -7.481184482574463, -6.138730049133301, -4.7962751388549805, -3.45382022857666, -2.1113662719726562, -0.7689113616943359, 0.57354736328125, 1.9160020351409912, 3.2584567070007324, 4.6009111404418945, 5.943366050720215, 7.285820960998535, 8.628274917602539, 9.97072982788086, 11.31318473815918, 12.6556396484375, 13.99809455871582, 15.340548515319824, 16.683002471923828, 18.02545928955078, 19.36791229248047, 20.71036720275879, 22.05282211303711, 23.39527702331543, 24.73773193359375, 26.080184936523438, 27.42264175415039, 28.765094757080078, 30.1075496673584, 31.45000457763672, 32.792457580566406, 34.134910583496094, 35.47736740112305, 36.819820404052734, 38.16227722167969, 39.504730224609375, 40.84718322753906, 42.189640045166016, 43.53209686279297]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 7.0, 15.0, 19.0, 17.0, 20.0, 23.0, 23.0, 28.0, 40.0, 42.0, 36.0, 50.0, 51.0, 50.0, 41.0, 46.0, 35.0, 64.0, 39.0, 48.0, 47.0, 43.0, 49.0, 27.0, 29.0, 27.0, 16.0, 8.0, 16.0, 12.0, 11.0, 4.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.52734375, -6.3280029296875, -6.128662109375, -5.9293212890625, -5.72998046875, -5.5306396484375, -5.331298828125, -5.1319580078125, -4.9326171875, -4.7332763671875, -4.533935546875, -4.3345947265625, -4.13525390625, -3.9359130859375, -3.736572265625, -3.5372314453125, -3.337890625, -3.1385498046875, -2.939208984375, -2.7398681640625, -2.54052734375, -2.3411865234375, -2.141845703125, -1.9425048828125, -1.7431640625, -1.5438232421875, -1.344482421875, -1.1451416015625, -0.94580078125, -0.7464599609375, -0.547119140625, -0.3477783203125, -0.1484375, 0.0509033203125, 0.250244140625, 0.4495849609375, 0.64892578125, 0.8482666015625, 1.047607421875, 1.2469482421875, 1.4462890625, 1.6456298828125, 1.844970703125, 2.0443115234375, 2.24365234375, 2.4429931640625, 2.642333984375, 2.8416748046875, 3.041015625, 3.2403564453125, 3.439697265625, 3.6390380859375, 3.83837890625, 4.0377197265625, 4.237060546875, 4.4364013671875, 4.6357421875, 4.8350830078125, 5.034423828125, 5.2337646484375, 5.43310546875, 5.6324462890625, 5.831787109375, 6.0311279296875, 6.23046875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 8.0, 8.0, 10.0, 13.0, 21.0, 31.0, 27.0, 50.0, 44.0, 99.0, 125.0, 182.0, 266.0, 499.0, 1027.0, 2653.0, 9213.0, 40769.0, 320663.0, 3119039.0, 618588.0, 61819.0, 12562.0, 3675.0, 1322.0, 583.0, 302.0, 195.0, 118.0, 77.0, 72.0, 61.0, 37.0, 29.0, 21.0, 20.0, 13.0, 10.0, 8.0, 2.0, 3.0, 8.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.5078125, -15.017333984375, -14.52685546875, -14.036376953125, -13.5458984375, -13.055419921875, -12.56494140625, -12.074462890625, -11.583984375, -11.093505859375, -10.60302734375, -10.112548828125, -9.6220703125, -9.131591796875, -8.64111328125, -8.150634765625, -7.66015625, -7.169677734375, -6.67919921875, -6.188720703125, -5.6982421875, -5.207763671875, -4.71728515625, -4.226806640625, -3.736328125, -3.245849609375, -2.75537109375, -2.264892578125, -1.7744140625, -1.283935546875, -0.79345703125, -0.302978515625, 0.1875, 0.677978515625, 1.16845703125, 1.658935546875, 2.1494140625, 2.639892578125, 3.13037109375, 3.620849609375, 4.111328125, 4.601806640625, 5.09228515625, 5.582763671875, 6.0732421875, 6.563720703125, 7.05419921875, 7.544677734375, 8.03515625, 8.525634765625, 9.01611328125, 9.506591796875, 9.9970703125, 10.487548828125, 10.97802734375, 11.468505859375, 11.958984375, 12.449462890625, 12.93994140625, 13.430419921875, 13.9208984375, 14.411376953125, 14.90185546875, 15.392333984375, 15.8828125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 4.0, 3.0, 12.0, 18.0, 24.0, 58.0, 80.0, 137.0, 250.0, 418.0, 822.0, 927.0, 515.0, 319.0, 191.0, 122.0, 61.0, 45.0, 26.0, 19.0, 11.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.15625, -14.669921875, -14.18359375, -13.697265625, -13.2109375, -12.724609375, -12.23828125, -11.751953125, -11.265625, -10.779296875, -10.29296875, -9.806640625, -9.3203125, -8.833984375, -8.34765625, -7.861328125, -7.375, -6.888671875, -6.40234375, -5.916015625, -5.4296875, -4.943359375, -4.45703125, -3.970703125, -3.484375, -2.998046875, -2.51171875, -2.025390625, -1.5390625, -1.052734375, -0.56640625, -0.080078125, 0.40625, 0.892578125, 1.37890625, 1.865234375, 2.3515625, 2.837890625, 3.32421875, 3.810546875, 4.296875, 4.783203125, 5.26953125, 5.755859375, 6.2421875, 6.728515625, 7.21484375, 7.701171875, 8.1875, 8.673828125, 9.16015625, 9.646484375, 10.1328125, 10.619140625, 11.10546875, 11.591796875, 12.078125, 12.564453125, 13.05078125, 13.537109375, 14.0234375, 14.509765625, 14.99609375, 15.482421875, 15.96875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 12.0, 24.0, 34.0, 52.0, 86.0, 209.0, 434.0, 1269.0, 16365.0, 3758184.0, 412050.0, 4302.0, 719.0, 255.0, 109.0, 71.0, 40.0, 21.0, 14.0, 13.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.46875, -60.50439453125, -58.5400390625, -56.57568359375, -54.611328125, -52.64697265625, -50.6826171875, -48.71826171875, -46.75390625, -44.78955078125, -42.8251953125, -40.86083984375, -38.896484375, -36.93212890625, -34.9677734375, -33.00341796875, -31.0390625, -29.07470703125, -27.1103515625, -25.14599609375, -23.181640625, -21.21728515625, -19.2529296875, -17.28857421875, -15.32421875, -13.35986328125, -11.3955078125, -9.43115234375, -7.466796875, -5.50244140625, -3.5380859375, -1.57373046875, 0.390625, 2.35498046875, 4.3193359375, 6.28369140625, 8.248046875, 10.21240234375, 12.1767578125, 14.14111328125, 16.10546875, 18.06982421875, 20.0341796875, 21.99853515625, 23.962890625, 25.92724609375, 27.8916015625, 29.85595703125, 31.8203125, 33.78466796875, 35.7490234375, 37.71337890625, 39.677734375, 41.64208984375, 43.6064453125, 45.57080078125, 47.53515625, 49.49951171875, 51.4638671875, 53.42822265625, 55.392578125, 57.35693359375, 59.3212890625, 61.28564453125, 63.25]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 8.0, 8.0, 12.0, 33.0, 47.0, 53.0, 76.0, 86.0, 104.0, 104.0, 105.0, 91.0, 81.0, 58.0, 51.0, 34.0, 18.0, 17.0, 10.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.58395767211914, -24.022319793701172, -22.46068000793457, -20.8990421295166, -19.33740234375, -17.77576446533203, -16.214126586914062, -14.652487754821777, -13.090848922729492, -11.529210090637207, -9.967571258544922, -8.405933380126953, -6.844294548034668, -5.282655715942383, -3.721017837524414, -2.159379005432129, -0.5977401733398438, 0.9638984203338623, 2.5255370140075684, 4.087175369262695, 5.6488142013549805, 7.210453033447266, 8.772090911865234, 10.33372974395752, 11.895368576049805, 13.45700740814209, 15.018646240234375, 16.580284118652344, 18.141921997070312, 19.703561782836914, 21.265199661254883, 22.826839447021484, 24.38848114013672, 25.950119018554688, 27.51175880432129, 29.073396682739258, 30.63503646850586, 32.19667434692383, 33.7583122253418, 35.319950103759766, 36.881591796875, 38.44322967529297, 40.00486755371094, 41.566505432128906, 43.12814712524414, 44.68978500366211, 46.25142288208008, 47.81306076049805, 49.374698638916016, 50.936336517333984, 52.49797439575195, 54.05961608886719, 55.621253967285156, 57.182891845703125, 58.744529724121094, 60.30616760253906, 61.86780548095703, 63.429443359375, 64.99108123779297, 66.55271911621094, 68.1143569946289, 69.67599487304688, 71.23764038085938, 72.79927825927734, 74.36091613769531]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 4.0, 5.0, 12.0, 7.0, 9.0, 16.0, 14.0, 16.0, 19.0, 21.0, 18.0, 33.0, 24.0, 28.0, 22.0, 24.0, 37.0, 32.0, 35.0, 47.0, 41.0, 31.0, 40.0, 38.0, 53.0, 28.0, 36.0, 41.0, 38.0, 22.0, 34.0, 29.0, 16.0, 13.0, 25.0, 15.0, 16.0, 8.0, 11.0, 10.0, 5.0, 11.0, 3.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0], "bins": [-32.1839599609375, -31.28742218017578, -30.39088249206543, -29.49434471130371, -28.59780502319336, -27.70126724243164, -26.804729461669922, -25.908191680908203, -25.01165199279785, -24.115114212036133, -23.21857452392578, -22.322036743164062, -21.425498962402344, -20.528959274291992, -19.632421493530273, -18.735881805419922, -17.839344024658203, -16.942806243896484, -16.046266555786133, -15.149728775024414, -14.253190040588379, -13.356651306152344, -12.460113525390625, -11.56357479095459, -10.667036056518555, -9.77049732208252, -8.873958587646484, -7.977420806884766, -7.0808820724487305, -6.184343338012695, -5.287805080413818, -4.391266822814941, -3.4947280883789062, -2.59818959236145, -1.7016510963439941, -0.8051126003265381, 0.09142589569091797, 0.9879646301269531, 1.88450288772583, 2.781041145324707, 3.677579879760742, 4.574118614196777, 5.470656871795654, 6.367195129394531, 7.263733863830566, 8.160272598266602, 9.05681037902832, 9.953349113464355, 10.84988784790039, 11.746426582336426, 12.642965316772461, 13.53950309753418, 14.436041831970215, 15.33258056640625, 16.22911834716797, 17.125656127929688, 18.02219581604004, 18.918733596801758, 19.81527328491211, 20.711811065673828, 21.608348846435547, 22.5048885345459, 23.401426315307617, 24.29796600341797, 25.194503784179688]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 11.0, 4.0, 15.0, 17.0, 18.0, 27.0, 18.0, 25.0, 16.0, 31.0, 35.0, 40.0, 36.0, 53.0, 62.0, 31.0, 46.0, 54.0, 53.0, 39.0, 35.0, 45.0, 65.0, 34.0, 36.0, 31.0, 28.0, 16.0, 17.0, 15.0, 17.0, 8.0, 7.0, 3.0, 7.0, 1.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.41015625, -6.2171630859375, -6.024169921875, -5.8311767578125, -5.63818359375, -5.4451904296875, -5.252197265625, -5.0592041015625, -4.8662109375, -4.6732177734375, -4.480224609375, -4.2872314453125, -4.09423828125, -3.9012451171875, -3.708251953125, -3.5152587890625, -3.322265625, -3.1292724609375, -2.936279296875, -2.7432861328125, -2.55029296875, -2.3572998046875, -2.164306640625, -1.9713134765625, -1.7783203125, -1.5853271484375, -1.392333984375, -1.1993408203125, -1.00634765625, -0.8133544921875, -0.620361328125, -0.4273681640625, -0.234375, -0.0413818359375, 0.151611328125, 0.3446044921875, 0.53759765625, 0.7305908203125, 0.923583984375, 1.1165771484375, 1.3095703125, 1.5025634765625, 1.695556640625, 1.8885498046875, 2.08154296875, 2.2745361328125, 2.467529296875, 2.6605224609375, 2.853515625, 3.0465087890625, 3.239501953125, 3.4324951171875, 3.62548828125, 3.8184814453125, 4.011474609375, 4.2044677734375, 4.3974609375, 4.5904541015625, 4.783447265625, 4.9764404296875, 5.16943359375, 5.3624267578125, 5.555419921875, 5.7484130859375, 5.94140625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 8.0, 4.0, 20.0, 16.0, 25.0, 21.0, 46.0, 59.0, 74.0, 105.0, 160.0, 243.0, 354.0, 564.0, 870.0, 1364.0, 2132.0, 3290.0, 5104.0, 7958.0, 12370.0, 19817.0, 32412.0, 56015.0, 103102.0, 222950.0, 279343.0, 130764.0, 67057.0, 38907.0, 23339.0, 14363.0, 9181.0, 5743.0, 3710.0, 2440.0, 1556.0, 1024.0, 679.0, 438.0, 298.0, 188.0, 150.0, 102.0, 59.0, 44.0, 29.0, 19.0, 17.0, 13.0, 5.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.19580078125, -0.18951797485351562, -0.18323516845703125, -0.17695236206054688, -0.1706695556640625, -0.16438674926757812, -0.15810394287109375, -0.15182113647460938, -0.145538330078125, -0.13925552368164062, -0.13297271728515625, -0.12668991088867188, -0.1204071044921875, -0.11412429809570312, -0.10784149169921875, -0.10155868530273438, -0.09527587890625, -0.08899307250976562, -0.08271026611328125, -0.07642745971679688, -0.0701446533203125, -0.06386184692382812, -0.05757904052734375, -0.051296234130859375, -0.045013427734375, -0.038730621337890625, -0.03244781494140625, -0.026165008544921875, -0.0198822021484375, -0.013599395751953125, -0.00731658935546875, -0.001033782958984375, 0.0052490234375, 0.011531829833984375, 0.01781463623046875, 0.024097442626953125, 0.0303802490234375, 0.036663055419921875, 0.04294586181640625, 0.049228668212890625, 0.055511474609375, 0.061794281005859375, 0.06807708740234375, 0.07435989379882812, 0.0806427001953125, 0.08692550659179688, 0.09320831298828125, 0.09949111938476562, 0.10577392578125, 0.11205673217773438, 0.11833953857421875, 0.12462234497070312, 0.1309051513671875, 0.13718795776367188, 0.14347076416015625, 0.14975357055664062, 0.156036376953125, 0.16231918334960938, 0.16860198974609375, 0.17488479614257812, 0.1811676025390625, 0.18745040893554688, 0.19373321533203125, 0.20001602172851562, 0.206298828125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 9.0, 7.0, 10.0, 9.0, 14.0, 19.0, 18.0, 13.0, 30.0, 15.0, 19.0, 23.0, 22.0, 38.0, 38.0, 24.0, 38.0, 31.0, 32.0, 43.0, 1065.0, 39.0, 47.0, 36.0, 46.0, 36.0, 36.0, 30.0, 29.0, 34.0, 33.0, 29.0, 19.0, 17.0, 10.0, 13.0, 9.0, 5.0, 8.0, 5.0, 2.0, 8.0, 4.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.048828125, -2.94244384765625, -2.8360595703125, -2.72967529296875, -2.623291015625, -2.51690673828125, -2.4105224609375, -2.30413818359375, -2.19775390625, -2.09136962890625, -1.9849853515625, -1.87860107421875, -1.772216796875, -1.66583251953125, -1.5594482421875, -1.45306396484375, -1.3466796875, -1.24029541015625, -1.1339111328125, -1.02752685546875, -0.921142578125, -0.81475830078125, -0.7083740234375, -0.60198974609375, -0.49560546875, -0.38922119140625, -0.2828369140625, -0.17645263671875, -0.070068359375, 0.03631591796875, 0.1427001953125, 0.24908447265625, 0.35546875, 0.46185302734375, 0.5682373046875, 0.67462158203125, 0.781005859375, 0.88739013671875, 0.9937744140625, 1.10015869140625, 1.20654296875, 1.31292724609375, 1.4193115234375, 1.52569580078125, 1.632080078125, 1.73846435546875, 1.8448486328125, 1.95123291015625, 2.0576171875, 2.16400146484375, 2.2703857421875, 2.37677001953125, 2.483154296875, 2.58953857421875, 2.6959228515625, 2.80230712890625, 2.90869140625, 3.01507568359375, 3.1214599609375, 3.22784423828125, 3.334228515625, 3.44061279296875, 3.5469970703125, 3.65338134765625, 3.759765625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 6.0, 6.0, 16.0, 23.0, 34.0, 33.0, 55.0, 78.0, 122.0, 204.0, 275.0, 433.0, 619.0, 955.0, 1504.0, 2331.0, 3644.0, 5687.0, 9077.0, 14692.0, 24026.0, 40341.0, 69012.0, 136226.0, 1331862.0, 216871.0, 100309.0, 54878.0, 31869.0, 19474.0, 11848.0, 7359.0, 4601.0, 3052.0, 1896.0, 1295.0, 797.0, 540.0, 375.0, 215.0, 159.0, 115.0, 68.0, 43.0, 36.0, 31.0, 11.0, 11.0, 4.0, 8.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.10986328125, -0.10604667663574219, -0.10223007202148438, -0.09841346740722656, -0.09459686279296875, -0.09078025817871094, -0.08696365356445312, -0.08314704895019531, -0.0793304443359375, -0.07551383972167969, -0.07169723510742188, -0.06788063049316406, -0.06406402587890625, -0.06024742126464844, -0.056430816650390625, -0.05261421203613281, -0.048797607421875, -0.04498100280761719, -0.041164398193359375, -0.03734779357910156, -0.03353118896484375, -0.029714584350585938, -0.025897979736328125, -0.022081375122070312, -0.0182647705078125, -0.014448165893554688, -0.010631561279296875, -0.0068149566650390625, -0.00299835205078125, 0.0008182525634765625, 0.004634857177734375, 0.008451461791992188, 0.01226806640625, 0.016084671020507812, 0.019901275634765625, 0.023717880249023438, 0.02753448486328125, 0.03135108947753906, 0.035167694091796875, 0.03898429870605469, 0.0428009033203125, 0.04661750793457031, 0.050434112548828125, 0.05425071716308594, 0.05806732177734375, 0.06188392639160156, 0.06570053100585938, 0.06951713562011719, 0.073333740234375, 0.07715034484863281, 0.08096694946289062, 0.08478355407714844, 0.08860015869140625, 0.09241676330566406, 0.09623336791992188, 0.10004997253417969, 0.1038665771484375, 0.10768318176269531, 0.11149978637695312, 0.11531639099121094, 0.11913299560546875, 0.12294960021972656, 0.12676620483398438, 0.1305828094482422, 0.1343994140625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 8.0, 5.0, 8.0, 17.0, 10.0, 20.0, 17.0, 26.0, 27.0, 35.0, 39.0, 42.0, 57.0, 64.0, 56.0, 60.0, 62.0, 54.0, 61.0, 52.0, 40.0, 37.0, 25.0, 30.0, 26.0, 14.0, 21.0, 18.0, 14.0, 8.0, 9.0, 6.0, 7.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2809715270996094e-05, -5.112495273351669e-05, -4.944019019603729e-05, -4.775542765855789e-05, -4.607066512107849e-05, -4.438590258359909e-05, -4.270114004611969e-05, -4.101637750864029e-05, -3.933161497116089e-05, -3.764685243368149e-05, -3.596208989620209e-05, -3.427732735872269e-05, -3.2592564821243286e-05, -3.0907802283763885e-05, -2.9223039746284485e-05, -2.7538277208805084e-05, -2.5853514671325684e-05, -2.4168752133846283e-05, -2.2483989596366882e-05, -2.079922705888748e-05, -1.911446452140808e-05, -1.742970198392868e-05, -1.574493944644928e-05, -1.4060176908969879e-05, -1.2375414371490479e-05, -1.0690651834011078e-05, -9.005889296531677e-06, -7.321126759052277e-06, -5.636364221572876e-06, -3.951601684093475e-06, -2.2668391466140747e-06, -5.820766091346741e-07, 1.1026859283447266e-06, 2.787448465824127e-06, 4.472211003303528e-06, 6.1569735407829285e-06, 7.841736078262329e-06, 9.52649861574173e-06, 1.121126115322113e-05, 1.2896023690700531e-05, 1.4580786228179932e-05, 1.6265548765659332e-05, 1.7950311303138733e-05, 1.9635073840618134e-05, 2.1319836378097534e-05, 2.3004598915576935e-05, 2.4689361453056335e-05, 2.6374123990535736e-05, 2.8058886528015137e-05, 2.9743649065494537e-05, 3.142841160297394e-05, 3.311317414045334e-05, 3.479793667793274e-05, 3.648269921541214e-05, 3.816746175289154e-05, 3.985222429037094e-05, 4.153698682785034e-05, 4.322174936532974e-05, 4.490651190280914e-05, 4.6591274440288544e-05, 4.8276036977767944e-05, 4.9960799515247345e-05, 5.1645562052726746e-05, 5.3330324590206146e-05, 5.501508712768555e-05]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 4.0, 3.0, 10.0, 11.0, 10.0, 20.0, 14.0, 21.0, 24.0, 32.0, 52.0, 55.0, 83.0, 169.0, 447.0, 3642.0, 321325.0, 711237.0, 10046.0, 705.0, 230.0, 112.0, 66.0, 49.0, 36.0, 30.0, 30.0, 10.0, 17.0, 13.0, 8.0, 10.0, 5.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.001094818115234375, -0.0010607391595840454, -0.0010266602039337158, -0.0009925812482833862, -0.0009585022926330566, -0.000924423336982727, -0.0008903443813323975, -0.0008562654256820679, -0.0008221864700317383, -0.0007881075143814087, -0.0007540285587310791, -0.0007199496030807495, -0.0006858706474304199, -0.0006517916917800903, -0.0006177127361297607, -0.0005836337804794312, -0.0005495548248291016, -0.000515475869178772, -0.0004813969135284424, -0.0004473179578781128, -0.0004132390022277832, -0.0003791600465774536, -0.000345081090927124, -0.00031100213527679443, -0.00027692317962646484, -0.00024284422397613525, -0.00020876526832580566, -0.00017468631267547607, -0.00014060735702514648, -0.0001065284013748169, -7.24494457244873e-05, -3.8370490074157715e-05, -4.291534423828125e-06, 2.9787421226501465e-05, 6.386637687683105e-05, 9.794533252716064e-05, 0.00013202428817749023, 0.00016610324382781982, 0.00020018219947814941, 0.000234261155128479, 0.0002683401107788086, 0.0003024190664291382, 0.0003364980220794678, 0.00037057697772979736, 0.00040465593338012695, 0.00043873488903045654, 0.00047281384468078613, 0.0005068928003311157, 0.0005409717559814453, 0.0005750507116317749, 0.0006091296672821045, 0.0006432086229324341, 0.0006772875785827637, 0.0007113665342330933, 0.0007454454898834229, 0.0007795244455337524, 0.000813603401184082, 0.0008476823568344116, 0.0008817613124847412, 0.0009158402681350708, 0.0009499192237854004, 0.00098399817943573, 0.0010180771350860596, 0.0010521560907363892, 0.0010862350463867188]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 59.0, 707.0, 237.0, 9.0], "bins": [-0.001038096728734672, -0.0010212758788838983, -0.0010044550290331244, -0.0009876341791823506, -0.0009708133875392377, -0.0009539925376884639, -0.000937171746045351, -0.0009203508961945772, -0.0009035300463438034, -0.0008867091964930296, -0.0008698883466422558, -0.0008530675549991429, -0.0008362467051483691, -0.0008194258552975953, -0.0008026050636544824, -0.0007857842138037086, -0.0007689633639529347, -0.0007521425141021609, -0.0007353216642513871, -0.0007185008726082742, -0.0007016800227575004, -0.0006848591729067266, -0.0006680383812636137, -0.0006512175314128399, -0.0006343966815620661, -0.0006175758317112923, -0.0006007549818605185, -0.0005839341902174056, -0.0005671133403666317, -0.0005502924905158579, -0.000533471698872745, -0.0005166508490219712, -0.0004998300573788583, -0.0004830092075280845, -0.00046618838678114116, -0.0004493675660341978, -0.000432546716183424, -0.0004157258663326502, -0.00039890504558570683, -0.0003820842248387635, -0.00036526337498798966, -0.00034844252513721585, -0.0003316217043902725, -0.00031480088364332914, -0.00029798003379255533, -0.0002811591839417815, -0.00026433836319483817, -0.0002475175424478948, -0.000230696692597121, -0.00021387585729826242, -0.00019705502199940383, -0.00018023418670054525, -0.00016341335140168667, -0.00014659251610282809, -0.0001297716808039695, -0.00011295084550511092, -9.613000293029472e-05, -7.930916763143614e-05, -6.248833233257756e-05, -4.5667497033718973e-05, -2.884666173486039e-05, -1.2025826436001807e-05, 4.7950088628567755e-06, 2.161584416171536e-05, 3.843667946057394e-05]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 2.0, 7.0, 8.0, 10.0, 17.0, 19.0, 17.0, 25.0, 32.0, 36.0, 46.0, 48.0, 50.0, 45.0, 41.0, 55.0, 67.0, 45.0, 46.0, 50.0, 55.0, 43.0, 38.0, 39.0, 24.0, 30.0, 13.0, 19.0, 15.0, 13.0, 8.0, 12.0, 5.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.248453140258789e-05, -3.120489418506622e-05, -2.9925256967544556e-05, -2.8645619750022888e-05, -2.736598253250122e-05, -2.6086345314979553e-05, -2.4806708097457886e-05, -2.3527070879936218e-05, -2.224743366241455e-05, -2.0967796444892883e-05, -1.9688159227371216e-05, -1.840852200984955e-05, -1.712888479232788e-05, -1.5849247574806213e-05, -1.4569610357284546e-05, -1.3289973139762878e-05, -1.2010335922241211e-05, -1.0730698704719543e-05, -9.451061487197876e-06, -8.171424269676208e-06, -6.891787052154541e-06, -5.6121498346328735e-06, -4.332512617111206e-06, -3.0528753995895386e-06, -1.773238182067871e-06, -4.936009645462036e-07, 7.860362529754639e-07, 2.0656734704971313e-06, 3.345310688018799e-06, 4.624947905540466e-06, 5.904585123062134e-06, 7.184222340583801e-06, 8.463859558105469e-06, 9.743496775627136e-06, 1.1023133993148804e-05, 1.2302771210670471e-05, 1.3582408428192139e-05, 1.4862045645713806e-05, 1.6141682863235474e-05, 1.742132008075714e-05, 1.870095729827881e-05, 1.9980594515800476e-05, 2.1260231733322144e-05, 2.253986895084381e-05, 2.381950616836548e-05, 2.5099143385887146e-05, 2.6378780603408813e-05, 2.765841782093048e-05, 2.893805503845215e-05, 3.0217692255973816e-05, 3.1497329473495483e-05, 3.277696669101715e-05, 3.405660390853882e-05, 3.5336241126060486e-05, 3.661587834358215e-05, 3.789551556110382e-05, 3.917515277862549e-05, 4.0454789996147156e-05, 4.173442721366882e-05, 4.301406443119049e-05, 4.429370164871216e-05, 4.5573338866233826e-05, 4.685297608375549e-05, 4.813261330127716e-05, 4.941225051879883e-05]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 11.0, 4.0, 15.0, 17.0, 18.0, 27.0, 18.0, 25.0, 16.0, 31.0, 35.0, 40.0, 36.0, 53.0, 62.0, 31.0, 46.0, 54.0, 53.0, 39.0, 35.0, 45.0, 65.0, 34.0, 36.0, 31.0, 28.0, 16.0, 17.0, 15.0, 17.0, 8.0, 7.0, 3.0, 7.0, 1.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.41015625, -6.2171630859375, -6.024169921875, -5.8311767578125, -5.63818359375, -5.4451904296875, -5.252197265625, -5.0592041015625, -4.8662109375, -4.6732177734375, -4.480224609375, -4.2872314453125, -4.09423828125, -3.9012451171875, -3.708251953125, -3.5152587890625, -3.322265625, -3.1292724609375, -2.936279296875, -2.7432861328125, -2.55029296875, -2.3572998046875, -2.164306640625, -1.9713134765625, -1.7783203125, -1.5853271484375, -1.392333984375, -1.1993408203125, -1.00634765625, -0.8133544921875, -0.620361328125, -0.4273681640625, -0.234375, -0.0413818359375, 0.151611328125, 0.3446044921875, 0.53759765625, 0.7305908203125, 0.923583984375, 1.1165771484375, 1.3095703125, 1.5025634765625, 1.695556640625, 1.8885498046875, 2.08154296875, 2.2745361328125, 2.467529296875, 2.6605224609375, 2.853515625, 3.0465087890625, 3.239501953125, 3.4324951171875, 3.62548828125, 3.8184814453125, 4.011474609375, 4.2044677734375, 4.3974609375, 4.5904541015625, 4.783447265625, 4.9764404296875, 5.16943359375, 5.3624267578125, 5.555419921875, 5.7484130859375, 5.94140625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 3.0, 16.0, 18.0, 19.0, 19.0, 32.0, 58.0, 90.0, 114.0, 183.0, 260.0, 415.0, 632.0, 1038.0, 1603.0, 2628.0, 4370.0, 7534.0, 13183.0, 24845.0, 52493.0, 147979.0, 474564.0, 189787.0, 62795.0, 28320.0, 14600.0, 8364.0, 4775.0, 2859.0, 1746.0, 1118.0, 720.0, 477.0, 288.0, 184.0, 149.0, 85.0, 49.0, 45.0, 30.0, 13.0, 20.0, 11.0, 9.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0], "bins": [-7.0546875, -6.8382568359375, -6.621826171875, -6.4053955078125, -6.18896484375, -5.9725341796875, -5.756103515625, -5.5396728515625, -5.3232421875, -5.1068115234375, -4.890380859375, -4.6739501953125, -4.45751953125, -4.2410888671875, -4.024658203125, -3.8082275390625, -3.591796875, -3.3753662109375, -3.158935546875, -2.9425048828125, -2.72607421875, -2.5096435546875, -2.293212890625, -2.0767822265625, -1.8603515625, -1.6439208984375, -1.427490234375, -1.2110595703125, -0.99462890625, -0.7781982421875, -0.561767578125, -0.3453369140625, -0.12890625, 0.0875244140625, 0.303955078125, 0.5203857421875, 0.73681640625, 0.9532470703125, 1.169677734375, 1.3861083984375, 1.6025390625, 1.8189697265625, 2.035400390625, 2.2518310546875, 2.46826171875, 2.6846923828125, 2.901123046875, 3.1175537109375, 3.333984375, 3.5504150390625, 3.766845703125, 3.9832763671875, 4.19970703125, 4.4161376953125, 4.632568359375, 4.8489990234375, 5.0654296875, 5.2818603515625, 5.498291015625, 5.7147216796875, 5.93115234375, 6.1475830078125, 6.364013671875, 6.5804443359375, 6.796875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 3.0, 3.0, 5.0, 12.0, 10.0, 14.0, 15.0, 25.0, 16.0, 33.0, 35.0, 36.0, 26.0, 41.0, 43.0, 48.0, 66.0, 91.0, 217.0, 1598.0, 194.0, 77.0, 53.0, 56.0, 58.0, 34.0, 39.0, 33.0, 34.0, 24.0, 18.0, 21.0, 18.0, 5.0, 6.0, 12.0, 8.0, 10.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9765625, -15.4342041015625, -14.891845703125, -14.3494873046875, -13.80712890625, -13.2647705078125, -12.722412109375, -12.1800537109375, -11.6376953125, -11.0953369140625, -10.552978515625, -10.0106201171875, -9.46826171875, -8.9259033203125, -8.383544921875, -7.8411865234375, -7.298828125, -6.7564697265625, -6.214111328125, -5.6717529296875, -5.12939453125, -4.5870361328125, -4.044677734375, -3.5023193359375, -2.9599609375, -2.4176025390625, -1.875244140625, -1.3328857421875, -0.79052734375, -0.2481689453125, 0.294189453125, 0.8365478515625, 1.37890625, 1.9212646484375, 2.463623046875, 3.0059814453125, 3.54833984375, 4.0906982421875, 4.633056640625, 5.1754150390625, 5.7177734375, 6.2601318359375, 6.802490234375, 7.3448486328125, 7.88720703125, 8.4295654296875, 8.971923828125, 9.5142822265625, 10.056640625, 10.5989990234375, 11.141357421875, 11.6837158203125, 12.22607421875, 12.7684326171875, 13.310791015625, 13.8531494140625, 14.3955078125, 14.9378662109375, 15.480224609375, 16.0225830078125, 16.56494140625, 17.1072998046875, 17.649658203125, 18.1920166015625, 18.734375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 2.0, 5.0, 8.0, 9.0, 17.0, 19.0, 21.0, 27.0, 38.0, 46.0, 61.0, 103.0, 132.0, 179.0, 279.0, 731.0, 2669.0, 18577.0, 402439.0, 2669565.0, 43405.0, 5174.0, 1043.0, 390.0, 203.0, 146.0, 96.0, 83.0, 62.0, 47.0, 38.0, 13.0, 22.0, 19.0, 9.0, 5.0, 4.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.21875, -30.24853515625, -29.2783203125, -28.30810546875, -27.337890625, -26.36767578125, -25.3974609375, -24.42724609375, -23.45703125, -22.48681640625, -21.5166015625, -20.54638671875, -19.576171875, -18.60595703125, -17.6357421875, -16.66552734375, -15.6953125, -14.72509765625, -13.7548828125, -12.78466796875, -11.814453125, -10.84423828125, -9.8740234375, -8.90380859375, -7.93359375, -6.96337890625, -5.9931640625, -5.02294921875, -4.052734375, -3.08251953125, -2.1123046875, -1.14208984375, -0.171875, 0.79833984375, 1.7685546875, 2.73876953125, 3.708984375, 4.67919921875, 5.6494140625, 6.61962890625, 7.58984375, 8.56005859375, 9.5302734375, 10.50048828125, 11.470703125, 12.44091796875, 13.4111328125, 14.38134765625, 15.3515625, 16.32177734375, 17.2919921875, 18.26220703125, 19.232421875, 20.20263671875, 21.1728515625, 22.14306640625, 23.11328125, 24.08349609375, 25.0537109375, 26.02392578125, 26.994140625, 27.96435546875, 28.9345703125, 29.90478515625, 30.875]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [574.0, 442.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.160618782043457, -0.012415885925292969, 14.135787010192871, 28.283992767333984, 42.432193756103516, 56.58039474487305, 70.72859954833984, 84.87680053710938, 99.0250015258789, 113.17320251464844, 127.3214111328125, 141.4696044921875, 155.61781311035156, 169.76602172851562, 183.91421508789062, 198.0624237060547, 212.21063232421875, 226.3588409423828, 240.5070343017578, 254.65524291992188, 268.8034362792969, 282.95166015625, 297.099853515625, 311.248046875, 325.396240234375, 339.54443359375, 353.6926574707031, 367.8408508300781, 381.9890441894531, 396.13726806640625, 410.28546142578125, 424.43365478515625, 438.58184814453125, 452.73004150390625, 466.8782653808594, 481.0264587402344, 495.1746520996094, 509.3228759765625, 523.4710693359375, 537.6192626953125, 551.7674560546875, 565.9156494140625, 580.0638427734375, 594.2120361328125, 608.3602905273438, 622.5084838867188, 636.6566772460938, 650.8048706054688, 664.953125, 679.101318359375, 693.24951171875, 707.397705078125, 721.5459594726562, 735.6941528320312, 749.8423461914062, 763.9905395507812, 778.1387329101562, 792.2869262695312, 806.4351196289062, 820.5833740234375, 834.7315673828125, 848.8797607421875, 863.0279541015625, 877.1761474609375, 891.3243408203125]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 5.0, 2.0, 1.0, 5.0, 5.0, 7.0, 8.0, 10.0, 10.0, 9.0, 11.0, 14.0, 19.0, 18.0, 22.0, 35.0, 29.0, 38.0, 36.0, 39.0, 33.0, 34.0, 41.0, 37.0, 38.0, 38.0, 46.0, 45.0, 39.0, 25.0, 39.0, 35.0, 31.0, 32.0, 29.0, 24.0, 21.0, 14.0, 13.0, 12.0, 6.0, 16.0, 11.0, 5.0, 8.0, 2.0, 2.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.54676818847656, -42.063377380371094, -40.579986572265625, -39.096595764160156, -37.61320495605469, -36.12981414794922, -34.64642333984375, -33.16303253173828, -31.679643630981445, -30.196252822875977, -28.712862014770508, -27.229473114013672, -25.746082305908203, -24.262691497802734, -22.779300689697266, -21.295909881591797, -19.812519073486328, -18.32912826538086, -16.84573745727539, -15.362347602844238, -13.87895679473877, -12.3955659866333, -10.912176132202148, -9.42878532409668, -7.945394515991211, -6.462003707885742, -4.978613376617432, -3.495223045349121, -2.0118322372436523, -0.5284414291381836, 0.9549484252929688, 2.4383392333984375, 3.921733856201172, 5.405124664306641, 6.888514995574951, 8.371905326843262, 9.85529613494873, 11.3386869430542, 12.822076797485352, 14.30546760559082, 15.788858413696289, 17.272249221801758, 18.755640029907227, 20.239028930664062, 21.72241973876953, 23.205810546875, 24.68920135498047, 26.172592163085938, 27.655982971191406, 29.139373779296875, 30.622764587402344, 32.10615539550781, 33.58954620361328, 35.07293701171875, 36.55632781982422, 38.03971862792969, 39.523109436035156, 41.006500244140625, 42.489891052246094, 43.97328186035156, 45.45667266845703, 46.9400634765625, 48.42345428466797, 49.90684509277344, 51.39023208618164]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 10.0, 5.0, 4.0, 17.0, 12.0, 23.0, 28.0, 18.0, 17.0, 23.0, 29.0, 27.0, 36.0, 42.0, 45.0, 51.0, 40.0, 36.0, 45.0, 56.0, 47.0, 44.0, 34.0, 49.0, 41.0, 31.0, 39.0, 30.0, 21.0, 25.0, 17.0, 15.0, 15.0, 7.0, 7.0, 4.0, 1.0, 2.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.82421875, -5.63446044921875, -5.4447021484375, -5.25494384765625, -5.065185546875, -4.87542724609375, -4.6856689453125, -4.49591064453125, -4.30615234375, -4.11639404296875, -3.9266357421875, -3.73687744140625, -3.547119140625, -3.35736083984375, -3.1676025390625, -2.97784423828125, -2.7880859375, -2.59832763671875, -2.4085693359375, -2.21881103515625, -2.029052734375, -1.83929443359375, -1.6495361328125, -1.45977783203125, -1.27001953125, -1.08026123046875, -0.8905029296875, -0.70074462890625, -0.510986328125, -0.32122802734375, -0.1314697265625, 0.05828857421875, 0.248046875, 0.43780517578125, 0.6275634765625, 0.81732177734375, 1.007080078125, 1.19683837890625, 1.3865966796875, 1.57635498046875, 1.76611328125, 1.95587158203125, 2.1456298828125, 2.33538818359375, 2.525146484375, 2.71490478515625, 2.9046630859375, 3.09442138671875, 3.2841796875, 3.47393798828125, 3.6636962890625, 3.85345458984375, 4.043212890625, 4.23297119140625, 4.4227294921875, 4.61248779296875, 4.80224609375, 4.99200439453125, 5.1817626953125, 5.37152099609375, 5.561279296875, 5.75103759765625, 5.9407958984375, 6.13055419921875, 6.3203125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 9.0, 8.0, 14.0, 19.0, 19.0, 32.0, 39.0, 41.0, 73.0, 127.0, 180.0, 391.0, 776.0, 1708.0, 3727.0, 9705.0, 28538.0, 118618.0, 1085742.0, 2609576.0, 260456.0, 49050.0, 15028.0, 5533.0, 2434.0, 1106.0, 516.0, 293.0, 184.0, 120.0, 63.0, 39.0, 24.0, 15.0, 13.0, 19.0, 7.0, 5.0, 7.0, 9.0, 4.0, 1.0, 2.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.859375, -12.4337158203125, -12.008056640625, -11.5823974609375, -11.15673828125, -10.7310791015625, -10.305419921875, -9.8797607421875, -9.4541015625, -9.0284423828125, -8.602783203125, -8.1771240234375, -7.75146484375, -7.3258056640625, -6.900146484375, -6.4744873046875, -6.048828125, -5.6231689453125, -5.197509765625, -4.7718505859375, -4.34619140625, -3.9205322265625, -3.494873046875, -3.0692138671875, -2.6435546875, -2.2178955078125, -1.792236328125, -1.3665771484375, -0.94091796875, -0.5152587890625, -0.089599609375, 0.3360595703125, 0.76171875, 1.1873779296875, 1.613037109375, 2.0386962890625, 2.46435546875, 2.8900146484375, 3.315673828125, 3.7413330078125, 4.1669921875, 4.5926513671875, 5.018310546875, 5.4439697265625, 5.86962890625, 6.2952880859375, 6.720947265625, 7.1466064453125, 7.572265625, 7.9979248046875, 8.423583984375, 8.8492431640625, 9.27490234375, 9.7005615234375, 10.126220703125, 10.5518798828125, 10.9775390625, 11.4031982421875, 11.828857421875, 12.2545166015625, 12.68017578125, 13.1058349609375, 13.531494140625, 13.9571533203125, 14.3828125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 1.0, 5.0, 6.0, 6.0, 8.0, 11.0, 21.0, 25.0, 46.0, 60.0, 74.0, 107.0, 162.0, 248.0, 419.0, 642.0, 701.0, 504.0, 328.0, 196.0, 128.0, 99.0, 85.0, 56.0, 39.0, 24.0, 18.0, 12.0, 12.0, 7.0, 7.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7109375, -7.3646240234375, -7.018310546875, -6.6719970703125, -6.32568359375, -5.9793701171875, -5.633056640625, -5.2867431640625, -4.9404296875, -4.5941162109375, -4.247802734375, -3.9014892578125, -3.55517578125, -3.2088623046875, -2.862548828125, -2.5162353515625, -2.169921875, -1.8236083984375, -1.477294921875, -1.1309814453125, -0.78466796875, -0.4383544921875, -0.092041015625, 0.2542724609375, 0.6005859375, 0.9468994140625, 1.293212890625, 1.6395263671875, 1.98583984375, 2.3321533203125, 2.678466796875, 3.0247802734375, 3.37109375, 3.7174072265625, 4.063720703125, 4.4100341796875, 4.75634765625, 5.1026611328125, 5.448974609375, 5.7952880859375, 6.1416015625, 6.4879150390625, 6.834228515625, 7.1805419921875, 7.52685546875, 7.8731689453125, 8.219482421875, 8.5657958984375, 8.912109375, 9.2584228515625, 9.604736328125, 9.9510498046875, 10.29736328125, 10.6436767578125, 10.989990234375, 11.3363037109375, 11.6826171875, 12.0289306640625, 12.375244140625, 12.7215576171875, 13.06787109375, 13.4141845703125, 13.760498046875, 14.1068115234375, 14.453125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 9.0, 14.0, 25.0, 22.0, 49.0, 50.0, 101.0, 108.0, 176.0, 378.0, 1234.0, 13285.0, 1184023.0, 2971085.0, 21091.0, 1606.0, 417.0, 203.0, 119.0, 73.0, 55.0, 46.0, 31.0, 16.0, 13.0, 7.0, 8.0, 4.0, 2.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-66.5625, -64.9013671875, -63.240234375, -61.5791015625, -59.91796875, -58.2568359375, -56.595703125, -54.9345703125, -53.2734375, -51.6123046875, -49.951171875, -48.2900390625, -46.62890625, -44.9677734375, -43.306640625, -41.6455078125, -39.984375, -38.3232421875, -36.662109375, -35.0009765625, -33.33984375, -31.6787109375, -30.017578125, -28.3564453125, -26.6953125, -25.0341796875, -23.373046875, -21.7119140625, -20.05078125, -18.3896484375, -16.728515625, -15.0673828125, -13.40625, -11.7451171875, -10.083984375, -8.4228515625, -6.76171875, -5.1005859375, -3.439453125, -1.7783203125, -0.1171875, 1.5439453125, 3.205078125, 4.8662109375, 6.52734375, 8.1884765625, 9.849609375, 11.5107421875, 13.171875, 14.8330078125, 16.494140625, 18.1552734375, 19.81640625, 21.4775390625, 23.138671875, 24.7998046875, 26.4609375, 28.1220703125, 29.783203125, 31.4443359375, 33.10546875, 34.7666015625, 36.427734375, 38.0888671875, 39.75]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 8.0, 16.0, 17.0, 18.0, 33.0, 43.0, 64.0, 59.0, 80.0, 74.0, 83.0, 76.0, 77.0, 67.0, 65.0, 54.0, 54.0, 22.0, 24.0, 16.0, 14.0, 6.0, 6.0, 7.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.069292068481445, -24.909761428833008, -23.750228881835938, -22.5906982421875, -21.431167602539062, -20.271636962890625, -19.112104415893555, -17.952573776245117, -16.793041229248047, -15.633509635925293, -14.473978996276855, -13.314447402954102, -12.154916763305664, -10.99538516998291, -9.835853576660156, -8.676322937011719, -7.516792297363281, -6.3572611808776855, -5.19773006439209, -4.038198471069336, -2.8786673545837402, -1.7191362380981445, -0.5596046447753906, 0.5999259948730469, 1.7594575881958008, 2.9189887046813965, 4.078519821166992, 5.238051414489746, 6.397582530975342, 7.5571136474609375, 8.716645240783691, 9.876175880432129, 11.035709381103516, 12.19524097442627, 13.354771614074707, 14.514303207397461, 15.673833847045898, 16.83336639404297, 17.992897033691406, 19.152427673339844, 20.31195831298828, 21.47148895263672, 22.63102149963379, 23.790552139282227, 24.950082778930664, 26.109615325927734, 27.269145965576172, 28.42867660522461, 29.58820915222168, 30.747739791870117, 31.907272338867188, 33.066802978515625, 34.22633361816406, 35.3858642578125, 36.54539489746094, 37.704925537109375, 38.86445999145508, 40.023990631103516, 41.18352127075195, 42.343055725097656, 43.502586364746094, 44.66211700439453, 45.82164764404297, 46.981178283691406, 48.140708923339844]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 7.0, 6.0, 7.0, 12.0, 8.0, 12.0, 17.0, 15.0, 19.0, 20.0, 26.0, 40.0, 36.0, 31.0, 36.0, 38.0, 40.0, 53.0, 33.0, 41.0, 37.0, 32.0, 47.0, 38.0, 29.0, 33.0, 35.0, 28.0, 15.0, 22.0, 28.0, 16.0, 23.0, 15.0, 17.0, 19.0, 14.0, 9.0, 11.0, 8.0, 3.0, 4.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.185523986816406, -32.191131591796875, -31.196735382080078, -30.202341079711914, -29.20794677734375, -28.213552474975586, -27.219158172607422, -26.22476577758789, -25.230369567871094, -24.23597526550293, -23.241580963134766, -22.2471866607666, -21.252792358398438, -20.258398056030273, -19.26400375366211, -18.269611358642578, -17.275217056274414, -16.28082275390625, -15.286428451538086, -14.292034149169922, -13.297639846801758, -12.303245544433594, -11.308852195739746, -10.314457893371582, -9.320063591003418, -8.325669288635254, -7.33127498626709, -6.336881160736084, -5.34248685836792, -4.348092555999756, -3.35369873046875, -2.359304428100586, -1.3649101257324219, -0.37051594257354736, 0.6238782405853271, 1.618272304534912, 2.612666606903076, 3.6070609092712402, 4.601454734802246, 5.59584903717041, 6.590243339538574, 7.584637641906738, 8.579031944274902, 9.57342529296875, 10.567819595336914, 11.562213897705078, 12.556608200073242, 13.551002502441406, 14.54539680480957, 15.539791107177734, 16.5341854095459, 17.528579711914062, 18.522974014282227, 19.51736831665039, 20.511760711669922, 21.50615692138672, 22.50054931640625, 23.494943618774414, 24.489337921142578, 25.483732223510742, 26.478126525878906, 27.47252082824707, 28.466915130615234, 29.461307525634766, 30.455703735351562]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 3.0, 5.0, 5.0, 8.0, 18.0, 19.0, 26.0, 25.0, 37.0, 24.0, 21.0, 35.0, 29.0, 54.0, 40.0, 46.0, 56.0, 52.0, 45.0, 58.0, 40.0, 53.0, 45.0, 43.0, 37.0, 26.0, 24.0, 26.0, 26.0, 16.0, 18.0, 7.0, 10.0, 12.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9609375, -5.75567626953125, -5.5504150390625, -5.34515380859375, -5.139892578125, -4.93463134765625, -4.7293701171875, -4.52410888671875, -4.31884765625, -4.11358642578125, -3.9083251953125, -3.70306396484375, -3.497802734375, -3.29254150390625, -3.0872802734375, -2.88201904296875, -2.6767578125, -2.47149658203125, -2.2662353515625, -2.06097412109375, -1.855712890625, -1.65045166015625, -1.4451904296875, -1.23992919921875, -1.03466796875, -0.82940673828125, -0.6241455078125, -0.41888427734375, -0.213623046875, -0.00836181640625, 0.1968994140625, 0.40216064453125, 0.607421875, 0.81268310546875, 1.0179443359375, 1.22320556640625, 1.428466796875, 1.63372802734375, 1.8389892578125, 2.04425048828125, 2.24951171875, 2.45477294921875, 2.6600341796875, 2.86529541015625, 3.070556640625, 3.27581787109375, 3.4810791015625, 3.68634033203125, 3.8916015625, 4.09686279296875, 4.3021240234375, 4.50738525390625, 4.712646484375, 4.91790771484375, 5.1231689453125, 5.32843017578125, 5.53369140625, 5.73895263671875, 5.9442138671875, 6.14947509765625, 6.354736328125, 6.55999755859375, 6.7652587890625, 6.97052001953125, 7.17578125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 5.0, 2.0, 4.0, 7.0, 10.0, 10.0, 15.0, 37.0, 38.0, 57.0, 84.0, 147.0, 215.0, 342.0, 526.0, 873.0, 1371.0, 2401.0, 4000.0, 6682.0, 11968.0, 20550.0, 36957.0, 69461.0, 147133.0, 344529.0, 206650.0, 88648.0, 45498.0, 25144.0, 14722.0, 8423.0, 4811.0, 2794.0, 1676.0, 1015.0, 623.0, 417.0, 240.0, 151.0, 109.0, 66.0, 56.0, 31.0, 18.0, 12.0, 14.0, 9.0, 4.0, 2.0, 8.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2254638671875, -0.2178668975830078, -0.21026992797851562, -0.20267295837402344, -0.19507598876953125, -0.18747901916503906, -0.17988204956054688, -0.1722850799560547, -0.1646881103515625, -0.1570911407470703, -0.14949417114257812, -0.14189720153808594, -0.13430023193359375, -0.12670326232910156, -0.11910629272460938, -0.11150932312011719, -0.103912353515625, -0.09631538391113281, -0.08871841430664062, -0.08112144470214844, -0.07352447509765625, -0.06592750549316406, -0.058330535888671875, -0.05073356628417969, -0.0431365966796875, -0.03553962707519531, -0.027942657470703125, -0.020345687866210938, -0.01274871826171875, -0.0051517486572265625, 0.002445220947265625, 0.010042190551757812, 0.01763916015625, 0.025236129760742188, 0.032833099365234375, 0.04043006896972656, 0.04802703857421875, 0.05562400817871094, 0.06322097778320312, 0.07081794738769531, 0.0784149169921875, 0.08601188659667969, 0.09360885620117188, 0.10120582580566406, 0.10880279541015625, 0.11639976501464844, 0.12399673461914062, 0.1315937042236328, 0.139190673828125, 0.1467876434326172, 0.15438461303710938, 0.16198158264160156, 0.16957855224609375, 0.17717552185058594, 0.18477249145507812, 0.1923694610595703, 0.1999664306640625, 0.2075634002685547, 0.21516036987304688, 0.22275733947753906, 0.23035430908203125, 0.23795127868652344, 0.24554824829101562, 0.2531452178955078, 0.2607421875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 7.0, 6.0, 8.0, 14.0, 16.0, 21.0, 18.0, 24.0, 25.0, 25.0, 30.0, 17.0, 38.0, 28.0, 38.0, 39.0, 29.0, 41.0, 42.0, 1068.0, 39.0, 40.0, 44.0, 32.0, 33.0, 36.0, 31.0, 15.0, 35.0, 33.0, 21.0, 24.0, 14.0, 14.0, 12.0, 12.0, 10.0, 11.0, 5.0, 4.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.701171875, -3.5859375, -3.470703125, -3.35546875, -3.240234375, -3.125, -3.009765625, -2.89453125, -2.779296875, -2.6640625, -2.548828125, -2.43359375, -2.318359375, -2.203125, -2.087890625, -1.97265625, -1.857421875, -1.7421875, -1.626953125, -1.51171875, -1.396484375, -1.28125, -1.166015625, -1.05078125, -0.935546875, -0.8203125, -0.705078125, -0.58984375, -0.474609375, -0.359375, -0.244140625, -0.12890625, -0.013671875, 0.1015625, 0.216796875, 0.33203125, 0.447265625, 0.5625, 0.677734375, 0.79296875, 0.908203125, 1.0234375, 1.138671875, 1.25390625, 1.369140625, 1.484375, 1.599609375, 1.71484375, 1.830078125, 1.9453125, 2.060546875, 2.17578125, 2.291015625, 2.40625, 2.521484375, 2.63671875, 2.751953125, 2.8671875, 2.982421875, 3.09765625, 3.212890625, 3.328125, 3.443359375, 3.55859375, 3.673828125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 8.0, 14.0, 25.0, 30.0, 52.0, 78.0, 133.0, 200.0, 301.0, 447.0, 757.0, 1103.0, 1737.0, 2756.0, 4438.0, 7434.0, 11731.0, 19602.0, 32392.0, 55331.0, 102932.0, 233014.0, 1333315.0, 127369.0, 65556.0, 37734.0, 22767.0, 13719.0, 8332.0, 5095.0, 3189.0, 2020.0, 1254.0, 813.0, 515.0, 318.0, 213.0, 134.0, 86.0, 62.0, 48.0, 29.0, 12.0, 12.0, 7.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13671875, -0.13246536254882812, -0.12821197509765625, -0.12395858764648438, -0.1197052001953125, -0.11545181274414062, -0.11119842529296875, -0.10694503784179688, -0.102691650390625, -0.09843826293945312, -0.09418487548828125, -0.08993148803710938, -0.0856781005859375, -0.08142471313476562, -0.07717132568359375, -0.07291793823242188, -0.06866455078125, -0.06441116333007812, -0.06015777587890625, -0.055904388427734375, -0.0516510009765625, -0.047397613525390625, -0.04314422607421875, -0.038890838623046875, -0.034637451171875, -0.030384063720703125, -0.02613067626953125, -0.021877288818359375, -0.0176239013671875, -0.013370513916015625, -0.00911712646484375, -0.004863739013671875, -0.0006103515625, 0.003643035888671875, 0.00789642333984375, 0.012149810791015625, 0.0164031982421875, 0.020656585693359375, 0.02490997314453125, 0.029163360595703125, 0.033416748046875, 0.037670135498046875, 0.04192352294921875, 0.046176910400390625, 0.0504302978515625, 0.054683685302734375, 0.05893707275390625, 0.06319046020507812, 0.06744384765625, 0.07169723510742188, 0.07595062255859375, 0.08020401000976562, 0.0844573974609375, 0.08871078491210938, 0.09296417236328125, 0.09721755981445312, 0.101470947265625, 0.10572433471679688, 0.10997772216796875, 0.11423110961914062, 0.1184844970703125, 0.12273788452148438, 0.12699127197265625, 0.13124465942382812, 0.135498046875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 4.0, 3.0, 8.0, 7.0, 11.0, 16.0, 28.0, 20.0, 23.0, 26.0, 19.0, 28.0, 39.0, 22.0, 36.0, 38.0, 41.0, 37.0, 46.0, 62.0, 51.0, 34.0, 39.0, 41.0, 33.0, 37.0, 34.0, 27.0, 36.0, 22.0, 15.0, 16.0, 12.0, 14.0, 15.0, 8.0, 13.0, 7.0, 3.0, 4.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-3.999471664428711e-05, -3.8691796362400055e-05, -3.7388876080513e-05, -3.6085955798625946e-05, -3.478303551673889e-05, -3.348011523485184e-05, -3.217719495296478e-05, -3.087427467107773e-05, -2.9571354389190674e-05, -2.826843410730362e-05, -2.6965513825416565e-05, -2.566259354352951e-05, -2.4359673261642456e-05, -2.30567529797554e-05, -2.1753832697868347e-05, -2.0450912415981293e-05, -1.9147992134094238e-05, -1.7845071852207184e-05, -1.654215157032013e-05, -1.5239231288433075e-05, -1.393631100654602e-05, -1.2633390724658966e-05, -1.1330470442771912e-05, -1.0027550160884857e-05, -8.724629878997803e-06, -7.421709597110748e-06, -6.118789315223694e-06, -4.815869033336639e-06, -3.512948751449585e-06, -2.2100284695625305e-06, -9.071081876754761e-07, 3.9581209421157837e-07, 1.6987323760986328e-06, 3.0016526579856873e-06, 4.304572939872742e-06, 5.607493221759796e-06, 6.910413503646851e-06, 8.213333785533905e-06, 9.51625406742096e-06, 1.0819174349308014e-05, 1.2122094631195068e-05, 1.3425014913082123e-05, 1.4727935194969177e-05, 1.603085547685623e-05, 1.7333775758743286e-05, 1.863669604063034e-05, 1.9939616322517395e-05, 2.124253660440445e-05, 2.2545456886291504e-05, 2.384837716817856e-05, 2.5151297450065613e-05, 2.6454217731952667e-05, 2.775713801383972e-05, 2.9060058295726776e-05, 3.036297857761383e-05, 3.1665898859500885e-05, 3.296881914138794e-05, 3.4271739423274994e-05, 3.557465970516205e-05, 3.68775799870491e-05, 3.818050026893616e-05, 3.948342055082321e-05, 4.0786340832710266e-05, 4.208926111459732e-05, 4.3392181396484375e-05]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 7.0, 8.0, 10.0, 11.0, 16.0, 18.0, 17.0, 18.0, 39.0, 38.0, 41.0, 70.0, 86.0, 155.0, 328.0, 1371.0, 49279.0, 918038.0, 76309.0, 1727.0, 397.0, 155.0, 85.0, 61.0, 46.0, 26.0, 31.0, 26.0, 25.0, 15.0, 23.0, 15.0, 8.0, 6.0, 13.0, 6.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008473396301269531, -0.0008196011185646057, -0.0007918626070022583, -0.0007641240954399109, -0.0007363855838775635, -0.0007086470723152161, -0.0006809085607528687, -0.0006531700491905212, -0.0006254315376281738, -0.0005976930260658264, -0.000569954514503479, -0.0005422160029411316, -0.0005144774913787842, -0.00048673897981643677, -0.00045900046825408936, -0.00043126195669174194, -0.00040352344512939453, -0.0003757849335670471, -0.0003480464220046997, -0.0003203079104423523, -0.0002925693988800049, -0.00026483088731765747, -0.00023709237575531006, -0.00020935386419296265, -0.00018161535263061523, -0.00015387684106826782, -0.0001261383295059204, -9.8399817943573e-05, -7.066130638122559e-05, -4.2922794818878174e-05, -1.5184283256530762e-05, 1.255422830581665e-05, 4.029273986816406e-05, 6.803125143051147e-05, 9.576976299285889e-05, 0.0001235082745552063, 0.0001512467861175537, 0.00017898529767990112, 0.00020672380924224854, 0.00023446232080459595, 0.00026220083236694336, 0.00028993934392929077, 0.0003176778554916382, 0.0003454163670539856, 0.000373154878616333, 0.0004008933901786804, 0.00042863190174102783, 0.00045637041330337524, 0.00048410892486572266, 0.0005118474364280701, 0.0005395859479904175, 0.0005673244595527649, 0.0005950629711151123, 0.0006228014826774597, 0.0006505399942398071, 0.0006782785058021545, 0.000706017017364502, 0.0007337555289268494, 0.0007614940404891968, 0.0007892325520515442, 0.0008169710636138916, 0.000844709575176239, 0.0008724480867385864, 0.0009001865983009338, 0.0009279251098632812]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 44.0, 670.0, 294.0, 8.0, 2.0], "bins": [-0.0008232136606238782, -0.0008096713572740555, -0.0007961291121318936, -0.0007825868087820709, -0.000769044563639909, -0.0007555022602900863, -0.0007419599569402635, -0.0007284177117981017, -0.0007148754084482789, -0.0007013331050984561, -0.0006877908599562943, -0.0006742485566064715, -0.0006607063114643097, -0.0006471640081144869, -0.0006336217047646642, -0.0006200794596225023, -0.0006065371562726796, -0.0005929948529228568, -0.000579452607780695, -0.0005659103044308722, -0.0005523680592887104, -0.0005388257559388876, -0.0005252834525890648, -0.000511741207446903, -0.0004981989040970802, -0.00048465662985108793, -0.0004711143556050956, -0.00045757205225527287, -0.00044402977800928056, -0.00043048750376328826, -0.00041694522951729596, -0.00040340295527130365, -0.00038986068102531135, -0.00037631840677931905, -0.00036277613253332675, -0.000349233829183504, -0.0003356915549375117, -0.0003221492806915194, -0.0003086070064455271, -0.0002950647030957043, -0.000281522428849712, -0.0002679801546037197, -0.0002544378803577274, -0.00024089559155981988, -0.00022735330276191235, -0.00021381102851592004, -0.00020026875426992774, -0.0001867264654720202, -0.0001731841912260279, -0.0001596419169800356, -0.00014609962818212807, -0.00013255735393613577, -0.00011901506513822824, -0.00010547279089223593, -9.193050937028602e-05, -7.83882278483361e-05, -6.484594632638618e-05, -5.1303664804436266e-05, -3.776138328248635e-05, -2.421910539851524e-05, -1.0676823876565322e-05, 2.8654540074057877e-06, 1.6407735529355705e-05, 2.9950017051305622e-05, 4.349229857325554e-05]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 1.0, 8.0, 9.0, 12.0, 14.0, 16.0, 9.0, 18.0, 28.0, 22.0, 25.0, 33.0, 37.0, 32.0, 39.0, 48.0, 58.0, 42.0, 49.0, 49.0, 32.0, 42.0, 49.0, 42.0, 34.0, 37.0, 32.0, 31.0, 21.0, 16.0, 24.0, 20.0, 14.0, 15.0, 13.0, 6.0, 4.0, 11.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6404857635498047e-05, -2.5389716029167175e-05, -2.4374574422836304e-05, -2.3359432816505432e-05, -2.234429121017456e-05, -2.132914960384369e-05, -2.0314007997512817e-05, -1.9298866391181946e-05, -1.8283724784851074e-05, -1.7268583178520203e-05, -1.625344157218933e-05, -1.523829996585846e-05, -1.4223158359527588e-05, -1.3208016753196716e-05, -1.2192875146865845e-05, -1.1177733540534973e-05, -1.0162591934204102e-05, -9.14745032787323e-06, -8.132308721542358e-06, -7.117167115211487e-06, -6.102025508880615e-06, -5.086883902549744e-06, -4.071742296218872e-06, -3.0566006898880005e-06, -2.041459083557129e-06, -1.0263174772262573e-06, -1.1175870895385742e-08, 1.0039657354354858e-06, 2.0191073417663574e-06, 3.034248948097229e-06, 4.049390554428101e-06, 5.064532160758972e-06, 6.079673767089844e-06, 7.094815373420715e-06, 8.109956979751587e-06, 9.125098586082458e-06, 1.014024019241333e-05, 1.1155381798744202e-05, 1.2170523405075073e-05, 1.3185665011405945e-05, 1.4200806617736816e-05, 1.5215948224067688e-05, 1.623108983039856e-05, 1.724623143672943e-05, 1.8261373043060303e-05, 1.9276514649391174e-05, 2.0291656255722046e-05, 2.1306797862052917e-05, 2.232193946838379e-05, 2.333708107471466e-05, 2.4352222681045532e-05, 2.5367364287376404e-05, 2.6382505893707275e-05, 2.7397647500038147e-05, 2.841278910636902e-05, 2.942793071269989e-05, 3.0443072319030762e-05, 3.145821392536163e-05, 3.2473355531692505e-05, 3.3488497138023376e-05, 3.450363874435425e-05, 3.551878035068512e-05, 3.653392195701599e-05, 3.754906356334686e-05, 3.8564205169677734e-05]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 3.0, 5.0, 5.0, 8.0, 18.0, 19.0, 26.0, 25.0, 37.0, 24.0, 21.0, 35.0, 29.0, 54.0, 40.0, 46.0, 56.0, 52.0, 45.0, 58.0, 40.0, 53.0, 45.0, 43.0, 37.0, 26.0, 24.0, 26.0, 26.0, 16.0, 18.0, 7.0, 10.0, 12.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9609375, -5.75567626953125, -5.5504150390625, -5.34515380859375, -5.139892578125, -4.93463134765625, -4.7293701171875, -4.52410888671875, -4.31884765625, -4.11358642578125, -3.9083251953125, -3.70306396484375, -3.497802734375, -3.29254150390625, -3.0872802734375, -2.88201904296875, -2.6767578125, -2.47149658203125, -2.2662353515625, -2.06097412109375, -1.855712890625, -1.65045166015625, -1.4451904296875, -1.23992919921875, -1.03466796875, -0.82940673828125, -0.6241455078125, -0.41888427734375, -0.213623046875, -0.00836181640625, 0.1968994140625, 0.40216064453125, 0.607421875, 0.81268310546875, 1.0179443359375, 1.22320556640625, 1.428466796875, 1.63372802734375, 1.8389892578125, 2.04425048828125, 2.24951171875, 2.45477294921875, 2.6600341796875, 2.86529541015625, 3.070556640625, 3.27581787109375, 3.4810791015625, 3.68634033203125, 3.8916015625, 4.09686279296875, 4.3021240234375, 4.50738525390625, 4.712646484375, 4.91790771484375, 5.1231689453125, 5.32843017578125, 5.53369140625, 5.73895263671875, 5.9442138671875, 6.14947509765625, 6.354736328125, 6.55999755859375, 6.7652587890625, 6.97052001953125, 7.17578125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 10.0, 6.0, 7.0, 15.0, 16.0, 26.0, 29.0, 61.0, 94.0, 137.0, 206.0, 312.0, 572.0, 947.0, 1672.0, 3156.0, 6304.0, 12954.0, 27927.0, 70615.0, 294583.0, 467539.0, 94738.0, 35093.0, 15562.0, 7557.0, 3767.0, 2007.0, 1064.0, 551.0, 372.0, 228.0, 153.0, 82.0, 68.0, 48.0, 18.0, 20.0, 17.0, 6.0, 12.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.87890625, -7.62579345703125, -7.3726806640625, -7.11956787109375, -6.866455078125, -6.61334228515625, -6.3602294921875, -6.10711669921875, -5.85400390625, -5.60089111328125, -5.3477783203125, -5.09466552734375, -4.841552734375, -4.58843994140625, -4.3353271484375, -4.08221435546875, -3.8291015625, -3.57598876953125, -3.3228759765625, -3.06976318359375, -2.816650390625, -2.56353759765625, -2.3104248046875, -2.05731201171875, -1.80419921875, -1.55108642578125, -1.2979736328125, -1.04486083984375, -0.791748046875, -0.53863525390625, -0.2855224609375, -0.03240966796875, 0.220703125, 0.47381591796875, 0.7269287109375, 0.98004150390625, 1.233154296875, 1.48626708984375, 1.7393798828125, 1.99249267578125, 2.24560546875, 2.49871826171875, 2.7518310546875, 3.00494384765625, 3.258056640625, 3.51116943359375, 3.7642822265625, 4.01739501953125, 4.2705078125, 4.52362060546875, 4.7767333984375, 5.02984619140625, 5.282958984375, 5.53607177734375, 5.7891845703125, 6.04229736328125, 6.29541015625, 6.54852294921875, 6.8016357421875, 7.05474853515625, 7.307861328125, 7.56097412109375, 7.8140869140625, 8.06719970703125, 8.3203125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 5.0, 6.0, 7.0, 14.0, 11.0, 7.0, 14.0, 18.0, 16.0, 23.0, 30.0, 31.0, 33.0, 34.0, 46.0, 50.0, 59.0, 62.0, 103.0, 168.0, 1547.0, 191.0, 90.0, 60.0, 50.0, 44.0, 40.0, 32.0, 42.0, 26.0, 28.0, 35.0, 21.0, 18.0, 14.0, 23.0, 9.0, 7.0, 8.0, 3.0, 9.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.75, -15.2509765625, -14.751953125, -14.2529296875, -13.75390625, -13.2548828125, -12.755859375, -12.2568359375, -11.7578125, -11.2587890625, -10.759765625, -10.2607421875, -9.76171875, -9.2626953125, -8.763671875, -8.2646484375, -7.765625, -7.2666015625, -6.767578125, -6.2685546875, -5.76953125, -5.2705078125, -4.771484375, -4.2724609375, -3.7734375, -3.2744140625, -2.775390625, -2.2763671875, -1.77734375, -1.2783203125, -0.779296875, -0.2802734375, 0.21875, 0.7177734375, 1.216796875, 1.7158203125, 2.21484375, 2.7138671875, 3.212890625, 3.7119140625, 4.2109375, 4.7099609375, 5.208984375, 5.7080078125, 6.20703125, 6.7060546875, 7.205078125, 7.7041015625, 8.203125, 8.7021484375, 9.201171875, 9.7001953125, 10.19921875, 10.6982421875, 11.197265625, 11.6962890625, 12.1953125, 12.6943359375, 13.193359375, 13.6923828125, 14.19140625, 14.6904296875, 15.189453125, 15.6884765625, 16.1875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 7.0, 9.0, 3.0, 7.0, 4.0, 13.0, 17.0, 26.0, 32.0, 24.0, 37.0, 44.0, 61.0, 90.0, 160.0, 249.0, 467.0, 1195.0, 4681.0, 34134.0, 1949709.0, 1118518.0, 29754.0, 4143.0, 1115.0, 457.0, 248.0, 150.0, 91.0, 51.0, 46.0, 29.0, 31.0, 14.0, 19.0, 13.0, 7.0, 16.0, 13.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-33.53125, -32.51416015625, -31.4970703125, -30.47998046875, -29.462890625, -28.44580078125, -27.4287109375, -26.41162109375, -25.39453125, -24.37744140625, -23.3603515625, -22.34326171875, -21.326171875, -20.30908203125, -19.2919921875, -18.27490234375, -17.2578125, -16.24072265625, -15.2236328125, -14.20654296875, -13.189453125, -12.17236328125, -11.1552734375, -10.13818359375, -9.12109375, -8.10400390625, -7.0869140625, -6.06982421875, -5.052734375, -4.03564453125, -3.0185546875, -2.00146484375, -0.984375, 0.03271484375, 1.0498046875, 2.06689453125, 3.083984375, 4.10107421875, 5.1181640625, 6.13525390625, 7.15234375, 8.16943359375, 9.1865234375, 10.20361328125, 11.220703125, 12.23779296875, 13.2548828125, 14.27197265625, 15.2890625, 16.30615234375, 17.3232421875, 18.34033203125, 19.357421875, 20.37451171875, 21.3916015625, 22.40869140625, 23.42578125, 24.44287109375, 25.4599609375, 26.47705078125, 27.494140625, 28.51123046875, 29.5283203125, 30.54541015625, 31.5625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 45.0, 262.0, 470.0, 198.0, 31.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.696006774902344, -39.95793914794922, -35.21986770629883, -30.481800079345703, -25.743730545043945, -21.005661010742188, -16.267593383789062, -11.529521942138672, -6.791454315185547, -2.0533852577209473, 2.6846837997436523, 7.422752380371094, 12.160821914672852, 16.89889144897461, 21.636959075927734, 26.375030517578125, 31.11309814453125, 35.851165771484375, 40.589237213134766, 45.32730484008789, 50.06537628173828, 54.803443908691406, 59.54151153564453, 64.27958679199219, 69.01765441894531, 73.75572204589844, 78.49378967285156, 83.23185729980469, 87.96993255615234, 92.70800018310547, 97.4460678100586, 102.18414306640625, 106.92219543457031, 111.66026306152344, 116.39833068847656, 121.13639831542969, 125.87447357177734, 130.612548828125, 135.35061645507812, 140.08868408203125, 144.82675170898438, 149.5648193359375, 154.30288696289062, 159.04095458984375, 163.77902221679688, 168.51708984375, 173.25515747070312, 177.9932403564453, 182.73129272460938, 187.4693603515625, 192.20742797851562, 196.94549560546875, 201.68356323242188, 206.421630859375, 211.15969848632812, 215.8977813720703, 220.63584899902344, 225.37391662597656, 230.1119842529297, 234.8500518798828, 239.58811950683594, 244.32620239257812, 249.06427001953125, 253.80233764648438, 258.5404052734375]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 4.0, 3.0, 12.0, 4.0, 9.0, 19.0, 12.0, 17.0, 26.0, 16.0, 18.0, 34.0, 16.0, 22.0, 29.0, 40.0, 34.0, 40.0, 35.0, 39.0, 31.0, 31.0, 43.0, 44.0, 47.0, 31.0, 38.0, 37.0, 29.0, 36.0, 29.0, 24.0, 21.0, 22.0, 16.0, 14.0, 13.0, 5.0, 8.0, 9.0, 5.0, 11.0, 5.0, 6.0, 6.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-47.423702239990234, -46.028743743896484, -44.6337890625, -43.23883056640625, -41.8438720703125, -40.44891357421875, -39.053958892822266, -37.659000396728516, -36.26404571533203, -34.86908721923828, -33.4741325378418, -32.07917404174805, -30.684215545654297, -29.28925895690918, -27.894302368164062, -26.499343872070312, -25.104385375976562, -23.709428787231445, -22.314470291137695, -20.919513702392578, -19.524555206298828, -18.12959861755371, -16.734642028808594, -15.33968448638916, -13.944726943969727, -12.549769401550293, -11.15481185913086, -9.759855270385742, -8.364897727966309, -6.969940185546875, -5.574983596801758, -4.180026054382324, -2.7850723266601562, -1.3901150226593018, 0.004842281341552734, 1.3997993469238281, 2.7947568893432617, 4.189714431762695, 5.5846710205078125, 6.979628562927246, 8.37458610534668, 9.769543647766113, 11.164501190185547, 12.559457778930664, 13.954415321350098, 15.349372863769531, 16.74432945251465, 18.139286041259766, 19.534244537353516, 20.929201126098633, 22.324159622192383, 23.7191162109375, 25.11407470703125, 26.509031295776367, 27.903987884521484, 29.298946380615234, 30.69390296936035, 32.08885955810547, 33.48381805419922, 34.87877655029297, 36.27373123168945, 37.6686897277832, 39.06364440917969, 40.45860290527344, 41.85356140136719]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 13.0, 10.0, 11.0, 19.0, 21.0, 24.0, 28.0, 26.0, 20.0, 21.0, 33.0, 40.0, 32.0, 41.0, 41.0, 51.0, 58.0, 39.0, 43.0, 44.0, 34.0, 50.0, 48.0, 40.0, 31.0, 35.0, 14.0, 23.0, 21.0, 12.0, 16.0, 17.0, 13.0, 9.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.36328125, -5.1676025390625, -4.971923828125, -4.7762451171875, -4.58056640625, -4.3848876953125, -4.189208984375, -3.9935302734375, -3.7978515625, -3.6021728515625, -3.406494140625, -3.2108154296875, -3.01513671875, -2.8194580078125, -2.623779296875, -2.4281005859375, -2.232421875, -2.0367431640625, -1.841064453125, -1.6453857421875, -1.44970703125, -1.2540283203125, -1.058349609375, -0.8626708984375, -0.6669921875, -0.4713134765625, -0.275634765625, -0.0799560546875, 0.11572265625, 0.3114013671875, 0.507080078125, 0.7027587890625, 0.8984375, 1.0941162109375, 1.289794921875, 1.4854736328125, 1.68115234375, 1.8768310546875, 2.072509765625, 2.2681884765625, 2.4638671875, 2.6595458984375, 2.855224609375, 3.0509033203125, 3.24658203125, 3.4422607421875, 3.637939453125, 3.8336181640625, 4.029296875, 4.2249755859375, 4.420654296875, 4.6163330078125, 4.81201171875, 5.0076904296875, 5.203369140625, 5.3990478515625, 5.5947265625, 5.7904052734375, 5.986083984375, 6.1817626953125, 6.37744140625, 6.5731201171875, 6.768798828125, 6.9644775390625, 7.16015625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 3.0, 5.0, 4.0, 15.0, 22.0, 19.0, 31.0, 47.0, 66.0, 118.0, 185.0, 314.0, 659.0, 1438.0, 3670.0, 10012.0, 33119.0, 141522.0, 1105203.0, 2479573.0, 329356.0, 61210.0, 17317.0, 5825.0, 2278.0, 1012.0, 511.0, 289.0, 148.0, 96.0, 72.0, 42.0, 34.0, 21.0, 15.0, 11.0, 6.0, 11.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.96875, -13.521484375, -13.07421875, -12.626953125, -12.1796875, -11.732421875, -11.28515625, -10.837890625, -10.390625, -9.943359375, -9.49609375, -9.048828125, -8.6015625, -8.154296875, -7.70703125, -7.259765625, -6.8125, -6.365234375, -5.91796875, -5.470703125, -5.0234375, -4.576171875, -4.12890625, -3.681640625, -3.234375, -2.787109375, -2.33984375, -1.892578125, -1.4453125, -0.998046875, -0.55078125, -0.103515625, 0.34375, 0.791015625, 1.23828125, 1.685546875, 2.1328125, 2.580078125, 3.02734375, 3.474609375, 3.921875, 4.369140625, 4.81640625, 5.263671875, 5.7109375, 6.158203125, 6.60546875, 7.052734375, 7.5, 7.947265625, 8.39453125, 8.841796875, 9.2890625, 9.736328125, 10.18359375, 10.630859375, 11.078125, 11.525390625, 11.97265625, 12.419921875, 12.8671875, 13.314453125, 13.76171875, 14.208984375, 14.65625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 13.0, 19.0, 18.0, 16.0, 32.0, 49.0, 66.0, 91.0, 124.0, 134.0, 204.0, 280.0, 408.0, 540.0, 519.0, 411.0, 293.0, 228.0, 147.0, 115.0, 74.0, 70.0, 50.0, 52.0, 25.0, 19.0, 8.0, 17.0, 12.0, 4.0, 7.0, 9.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-10.828125, -10.518798828125, -10.20947265625, -9.900146484375, -9.5908203125, -9.281494140625, -8.97216796875, -8.662841796875, -8.353515625, -8.044189453125, -7.73486328125, -7.425537109375, -7.1162109375, -6.806884765625, -6.49755859375, -6.188232421875, -5.87890625, -5.569580078125, -5.26025390625, -4.950927734375, -4.6416015625, -4.332275390625, -4.02294921875, -3.713623046875, -3.404296875, -3.094970703125, -2.78564453125, -2.476318359375, -2.1669921875, -1.857666015625, -1.54833984375, -1.239013671875, -0.9296875, -0.620361328125, -0.31103515625, -0.001708984375, 0.3076171875, 0.616943359375, 0.92626953125, 1.235595703125, 1.544921875, 1.854248046875, 2.16357421875, 2.472900390625, 2.7822265625, 3.091552734375, 3.40087890625, 3.710205078125, 4.01953125, 4.328857421875, 4.63818359375, 4.947509765625, 5.2568359375, 5.566162109375, 5.87548828125, 6.184814453125, 6.494140625, 6.803466796875, 7.11279296875, 7.422119140625, 7.7314453125, 8.040771484375, 8.35009765625, 8.659423828125, 8.96875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 4.0, 5.0, 9.0, 10.0, 7.0, 8.0, 31.0, 30.0, 44.0, 73.0, 98.0, 152.0, 226.0, 376.0, 945.0, 3978.0, 36400.0, 991730.0, 3065506.0, 85090.0, 6937.0, 1342.0, 517.0, 262.0, 180.0, 105.0, 66.0, 45.0, 28.0, 23.0, 20.0, 8.0, 13.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-39.0625, -37.951171875, -36.83984375, -35.728515625, -34.6171875, -33.505859375, -32.39453125, -31.283203125, -30.171875, -29.060546875, -27.94921875, -26.837890625, -25.7265625, -24.615234375, -23.50390625, -22.392578125, -21.28125, -20.169921875, -19.05859375, -17.947265625, -16.8359375, -15.724609375, -14.61328125, -13.501953125, -12.390625, -11.279296875, -10.16796875, -9.056640625, -7.9453125, -6.833984375, -5.72265625, -4.611328125, -3.5, -2.388671875, -1.27734375, -0.166015625, 0.9453125, 2.056640625, 3.16796875, 4.279296875, 5.390625, 6.501953125, 7.61328125, 8.724609375, 9.8359375, 10.947265625, 12.05859375, 13.169921875, 14.28125, 15.392578125, 16.50390625, 17.615234375, 18.7265625, 19.837890625, 20.94921875, 22.060546875, 23.171875, 24.283203125, 25.39453125, 26.505859375, 27.6171875, 28.728515625, 29.83984375, 30.951171875, 32.0625]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 14.0, 40.0, 101.0, 152.0, 282.0, 197.0, 135.0, 53.0, 31.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.33702087402344, -94.77400207519531, -91.21097564697266, -87.64795684814453, -84.08493041992188, -80.52191162109375, -76.95889282226562, -73.3958740234375, -69.83284759521484, -66.26982879638672, -62.70680236816406, -59.14378356933594, -55.58076095581055, -52.017738342285156, -48.45471954345703, -44.89169692993164, -41.32867431640625, -37.76565170288086, -34.20262908935547, -30.639610290527344, -27.076587677001953, -23.513565063476562, -19.950544357299805, -16.387523651123047, -12.824501037597656, -9.261479377746582, -5.698457717895508, -2.1354360580444336, 1.4275856018066406, 4.990608215332031, 8.553628921508789, 12.116649627685547, 15.679672241210938, 19.242694854736328, 22.805715560913086, 26.368736267089844, 29.931758880615234, 33.494781494140625, 37.05780029296875, 40.62082290649414, 44.18384552001953, 47.74686813354492, 51.30989074707031, 54.87290954589844, 58.43593215942383, 61.99895477294922, 65.56197357177734, 69.125, 72.68801879882812, 76.25103759765625, 79.8140640258789, 83.37708282470703, 86.94010925292969, 90.50312805175781, 94.06614685058594, 97.62916564941406, 101.19219207763672, 104.75521087646484, 108.3182373046875, 111.88125610351562, 115.44427490234375, 119.0073013305664, 122.57032012939453, 126.13334655761719, 129.6963653564453]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 6.0, 10.0, 8.0, 11.0, 12.0, 18.0, 15.0, 24.0, 26.0, 23.0, 20.0, 32.0, 38.0, 37.0, 41.0, 20.0, 41.0, 46.0, 45.0, 49.0, 48.0, 38.0, 34.0, 36.0, 41.0, 28.0, 39.0, 26.0, 20.0, 25.0, 24.0, 22.0, 16.0, 19.0, 10.0, 7.0, 11.0, 7.0, 6.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0], "bins": [-35.319610595703125, -34.29916000366211, -33.278709411621094, -32.258262634277344, -31.237812042236328, -30.217361450195312, -29.19691276550293, -28.176464080810547, -27.15601348876953, -26.135562896728516, -25.115114212036133, -24.09466552734375, -23.074214935302734, -22.05376434326172, -21.033315658569336, -20.012866973876953, -18.992416381835938, -17.971965789794922, -16.95151710510254, -15.93106746673584, -14.91061782836914, -13.890168190002441, -12.869718551635742, -11.849268913269043, -10.828819274902344, -9.808369636535645, -8.787919998168945, -7.767470359802246, -6.747020721435547, -5.726571083068848, -4.706121444702148, -3.685671806335449, -2.6652259826660156, -1.6447763442993164, -0.6243267059326172, 0.39612293243408203, 1.4165725708007812, 2.4370222091674805, 3.4574718475341797, 4.477921485900879, 5.498371124267578, 6.518820762634277, 7.539270401000977, 8.559720039367676, 9.580169677734375, 10.600619316101074, 11.621068954467773, 12.641518592834473, 13.661968231201172, 14.682417869567871, 15.70286750793457, 16.723316192626953, 17.74376678466797, 18.764217376708984, 19.784666061401367, 20.80511474609375, 21.825565338134766, 22.84601593017578, 23.866464614868164, 24.886913299560547, 25.907363891601562, 26.927814483642578, 27.94826316833496, 28.968711853027344, 29.98916244506836]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 10.0, 7.0, 13.0, 14.0, 23.0, 19.0, 18.0, 22.0, 30.0, 23.0, 37.0, 31.0, 26.0, 32.0, 45.0, 52.0, 43.0, 52.0, 45.0, 41.0, 41.0, 42.0, 41.0, 42.0, 37.0, 25.0, 40.0, 19.0, 18.0, 23.0, 17.0, 15.0, 17.0, 8.0, 8.0, 7.0, 8.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.4296875, -5.23675537109375, -5.0438232421875, -4.85089111328125, -4.657958984375, -4.46502685546875, -4.2720947265625, -4.07916259765625, -3.88623046875, -3.69329833984375, -3.5003662109375, -3.30743408203125, -3.114501953125, -2.92156982421875, -2.7286376953125, -2.53570556640625, -2.3427734375, -2.14984130859375, -1.9569091796875, -1.76397705078125, -1.571044921875, -1.37811279296875, -1.1851806640625, -0.99224853515625, -0.79931640625, -0.60638427734375, -0.4134521484375, -0.22052001953125, -0.027587890625, 0.16534423828125, 0.3582763671875, 0.55120849609375, 0.744140625, 0.93707275390625, 1.1300048828125, 1.32293701171875, 1.515869140625, 1.70880126953125, 1.9017333984375, 2.09466552734375, 2.28759765625, 2.48052978515625, 2.6734619140625, 2.86639404296875, 3.059326171875, 3.25225830078125, 3.4451904296875, 3.63812255859375, 3.8310546875, 4.02398681640625, 4.2169189453125, 4.40985107421875, 4.602783203125, 4.79571533203125, 4.9886474609375, 5.18157958984375, 5.37451171875, 5.56744384765625, 5.7603759765625, 5.95330810546875, 6.146240234375, 6.33917236328125, 6.5321044921875, 6.72503662109375, 6.91796875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 7.0, 3.0, 6.0, 5.0, 15.0, 27.0, 31.0, 51.0, 66.0, 96.0, 119.0, 187.0, 286.0, 439.0, 673.0, 1087.0, 1650.0, 2581.0, 3904.0, 5964.0, 9315.0, 14110.0, 22431.0, 35531.0, 58344.0, 105823.0, 239030.0, 263185.0, 116101.0, 62805.0, 37825.0, 23643.0, 15304.0, 9777.0, 6360.0, 4152.0, 2733.0, 1644.0, 1147.0, 678.0, 459.0, 300.0, 215.0, 143.0, 90.0, 56.0, 51.0, 28.0, 22.0, 25.0, 15.0, 7.0, 7.0, 2.0, 7.0, 2.0, 0.0, 2.0], "bins": [-0.2100830078125, -0.20372962951660156, -0.19737625122070312, -0.1910228729248047, -0.18466949462890625, -0.1783161163330078, -0.17196273803710938, -0.16560935974121094, -0.1592559814453125, -0.15290260314941406, -0.14654922485351562, -0.1401958465576172, -0.13384246826171875, -0.1274890899658203, -0.12113571166992188, -0.11478233337402344, -0.108428955078125, -0.10207557678222656, -0.09572219848632812, -0.08936882019042969, -0.08301544189453125, -0.07666206359863281, -0.07030868530273438, -0.06395530700683594, -0.0576019287109375, -0.05124855041503906, -0.044895172119140625, -0.03854179382324219, -0.03218841552734375, -0.025835037231445312, -0.019481658935546875, -0.013128280639648438, -0.00677490234375, -0.0004215240478515625, 0.005931854248046875, 0.012285232543945312, 0.01863861083984375, 0.024991989135742188, 0.031345367431640625, 0.03769874572753906, 0.0440521240234375, 0.05040550231933594, 0.056758880615234375, 0.06311225891113281, 0.06946563720703125, 0.07581901550292969, 0.08217239379882812, 0.08852577209472656, 0.094879150390625, 0.10123252868652344, 0.10758590698242188, 0.11393928527832031, 0.12029266357421875, 0.1266460418701172, 0.13299942016601562, 0.13935279846191406, 0.1457061767578125, 0.15205955505371094, 0.15841293334960938, 0.1647663116455078, 0.17111968994140625, 0.1774730682373047, 0.18382644653320312, 0.19017982482910156, 0.196533203125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 5.0, 10.0, 7.0, 11.0, 8.0, 13.0, 14.0, 23.0, 15.0, 26.0, 25.0, 23.0, 28.0, 21.0, 31.0, 28.0, 35.0, 36.0, 39.0, 35.0, 46.0, 1076.0, 41.0, 39.0, 33.0, 33.0, 39.0, 22.0, 33.0, 32.0, 29.0, 20.0, 18.0, 31.0, 16.0, 18.0, 15.0, 13.0, 13.0, 5.0, 6.0, 3.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.88671875, -3.766082763671875, -3.64544677734375, -3.524810791015625, -3.4041748046875, -3.283538818359375, -3.16290283203125, -3.042266845703125, -2.921630859375, -2.800994873046875, -2.68035888671875, -2.559722900390625, -2.4390869140625, -2.318450927734375, -2.19781494140625, -2.077178955078125, -1.95654296875, -1.835906982421875, -1.71527099609375, -1.594635009765625, -1.4739990234375, -1.353363037109375, -1.23272705078125, -1.112091064453125, -0.991455078125, -0.870819091796875, -0.75018310546875, -0.629547119140625, -0.5089111328125, -0.388275146484375, -0.26763916015625, -0.147003173828125, -0.0263671875, 0.094268798828125, 0.21490478515625, 0.335540771484375, 0.4561767578125, 0.576812744140625, 0.69744873046875, 0.818084716796875, 0.938720703125, 1.059356689453125, 1.17999267578125, 1.300628662109375, 1.4212646484375, 1.541900634765625, 1.66253662109375, 1.783172607421875, 1.90380859375, 2.024444580078125, 2.14508056640625, 2.265716552734375, 2.3863525390625, 2.506988525390625, 2.62762451171875, 2.748260498046875, 2.868896484375, 2.989532470703125, 3.11016845703125, 3.230804443359375, 3.3514404296875, 3.472076416015625, 3.59271240234375, 3.713348388671875, 3.833984375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 10.0, 15.0, 25.0, 36.0, 70.0, 63.0, 140.0, 218.0, 330.0, 489.0, 827.0, 1295.0, 2098.0, 3396.0, 5356.0, 8880.0, 14409.0, 23675.0, 38553.0, 65439.0, 124524.0, 1329420.0, 231153.0, 102731.0, 56466.0, 33784.0, 20606.0, 12660.0, 7706.0, 4803.0, 2962.0, 1840.0, 1132.0, 720.0, 469.0, 294.0, 206.0, 120.0, 67.0, 56.0, 31.0, 15.0, 13.0, 9.0, 5.0, 9.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1436767578125, -0.13930511474609375, -0.1349334716796875, -0.13056182861328125, -0.126190185546875, -0.12181854248046875, -0.1174468994140625, -0.11307525634765625, -0.10870361328125, -0.10433197021484375, -0.0999603271484375, -0.09558868408203125, -0.091217041015625, -0.08684539794921875, -0.0824737548828125, -0.07810211181640625, -0.07373046875, -0.06935882568359375, -0.0649871826171875, -0.06061553955078125, -0.056243896484375, -0.05187225341796875, -0.0475006103515625, -0.04312896728515625, -0.03875732421875, -0.03438568115234375, -0.0300140380859375, -0.02564239501953125, -0.021270751953125, -0.01689910888671875, -0.0125274658203125, -0.00815582275390625, -0.0037841796875, 0.00058746337890625, 0.0049591064453125, 0.00933074951171875, 0.013702392578125, 0.01807403564453125, 0.0224456787109375, 0.02681732177734375, 0.03118896484375, 0.03556060791015625, 0.0399322509765625, 0.04430389404296875, 0.048675537109375, 0.05304718017578125, 0.0574188232421875, 0.06179046630859375, 0.066162109375, 0.07053375244140625, 0.0749053955078125, 0.07927703857421875, 0.083648681640625, 0.08802032470703125, 0.0923919677734375, 0.09676361083984375, 0.10113525390625, 0.10550689697265625, 0.1098785400390625, 0.11425018310546875, 0.118621826171875, 0.12299346923828125, 0.1273651123046875, 0.13173675537109375, 0.1361083984375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 6.0, 5.0, 11.0, 4.0, 7.0, 14.0, 12.0, 14.0, 18.0, 22.0, 33.0, 31.0, 40.0, 35.0, 57.0, 51.0, 56.0, 50.0, 44.0, 49.0, 48.0, 47.0, 53.0, 35.0, 50.0, 37.0, 26.0, 27.0, 12.0, 17.0, 8.0, 13.0, 16.0, 6.0, 14.0, 6.0, 4.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.225969314575195e-05, -4.070345312356949e-05, -3.9147213101387024e-05, -3.759097307920456e-05, -3.6034733057022095e-05, -3.447849303483963e-05, -3.2922253012657166e-05, -3.13660129904747e-05, -2.9809772968292236e-05, -2.8253532946109772e-05, -2.6697292923927307e-05, -2.5141052901744843e-05, -2.3584812879562378e-05, -2.2028572857379913e-05, -2.047233283519745e-05, -1.8916092813014984e-05, -1.735985279083252e-05, -1.5803612768650055e-05, -1.424737274646759e-05, -1.2691132724285126e-05, -1.1134892702102661e-05, -9.578652679920197e-06, -8.022412657737732e-06, -6.466172635555267e-06, -4.909932613372803e-06, -3.353692591190338e-06, -1.7974525690078735e-06, -2.4121254682540894e-07, 1.3150274753570557e-06, 2.8712674975395203e-06, 4.427507519721985e-06, 5.9837475419044495e-06, 7.539987564086914e-06, 9.096227586269379e-06, 1.0652467608451843e-05, 1.2208707630634308e-05, 1.3764947652816772e-05, 1.5321187674999237e-05, 1.68774276971817e-05, 1.8433667719364166e-05, 1.998990774154663e-05, 2.1546147763729095e-05, 2.310238778591156e-05, 2.4658627808094025e-05, 2.621486783027649e-05, 2.7771107852458954e-05, 2.932734787464142e-05, 3.088358789682388e-05, 3.243982791900635e-05, 3.399606794118881e-05, 3.555230796337128e-05, 3.710854798555374e-05, 3.8664788007736206e-05, 4.022102802991867e-05, 4.1777268052101135e-05, 4.33335080742836e-05, 4.4889748096466064e-05, 4.644598811864853e-05, 4.8002228140830994e-05, 4.955846816301346e-05, 5.111470818519592e-05, 5.267094820737839e-05, 5.422718822956085e-05, 5.578342825174332e-05, 5.733966827392578e-05]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 5.0, 5.0, 7.0, 12.0, 12.0, 12.0, 7.0, 9.0, 19.0, 19.0, 24.0, 28.0, 49.0, 59.0, 92.0, 183.0, 360.0, 2174.0, 259703.0, 777016.0, 7486.0, 565.0, 260.0, 109.0, 88.0, 53.0, 43.0, 23.0, 25.0, 23.0, 21.0, 14.0, 3.0, 8.0, 13.0, 5.0, 9.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0], "bins": [-0.001285552978515625, -0.0012527257204055786, -0.0012198984622955322, -0.0011870712041854858, -0.0011542439460754395, -0.001121416687965393, -0.0010885894298553467, -0.0010557621717453003, -0.001022934913635254, -0.0009901076555252075, -0.0009572803974151611, -0.0009244531393051147, -0.0008916258811950684, -0.000858798623085022, -0.0008259713649749756, -0.0007931441068649292, -0.0007603168487548828, -0.0007274895906448364, -0.00069466233253479, -0.0006618350744247437, -0.0006290078163146973, -0.0005961805582046509, -0.0005633533000946045, -0.0005305260419845581, -0.0004976987838745117, -0.00046487152576446533, -0.00043204426765441895, -0.00039921700954437256, -0.00036638975143432617, -0.0003335624933242798, -0.0003007352352142334, -0.000267907977104187, -0.00023508071899414062, -0.00020225346088409424, -0.00016942620277404785, -0.00013659894466400146, -0.00010377168655395508, -7.094442844390869e-05, -3.8117170333862305e-05, -5.289912223815918e-06, 2.753734588623047e-05, 6.0364603996276855e-05, 9.319186210632324e-05, 0.00012601912021636963, 0.00015884637832641602, 0.0001916736364364624, 0.0002245008945465088, 0.0002573281526565552, 0.00029015541076660156, 0.00032298266887664795, 0.00035580992698669434, 0.0003886371850967407, 0.0004214644432067871, 0.0004542917013168335, 0.0004871189594268799, 0.0005199462175369263, 0.0005527734756469727, 0.000585600733757019, 0.0006184279918670654, 0.0006512552499771118, 0.0006840825080871582, 0.0007169097661972046, 0.000749737024307251, 0.0007825642824172974, 0.0008153915405273438]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 11.0, 24.0, 82.0, 234.0, 344.0, 214.0, 76.0, 26.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002615794073790312, -0.0002567744813859463, -0.00025196955539286137, -0.000247164600295946, -0.0002423596743028611, -0.0002375547483097762, -0.00023274982231669128, -0.00022794489632360637, -0.00022313995577860624, -0.00021833502978552133, -0.0002135300892405212, -0.00020872516324743629, -0.00020392023725435138, -0.00019911529670935124, -0.00019431037071626633, -0.0001895054301712662, -0.0001847005041781813, -0.00017989557818509638, -0.00017509063764009625, -0.00017028571164701134, -0.0001654807711020112, -0.0001606758451089263, -0.0001558709191158414, -0.00015106599312275648, -0.00014626105257775635, -0.00014145612658467144, -0.0001366511860396713, -0.0001318462600465864, -0.0001270413340535015, -0.00012223639350850135, -0.00011743146751541644, -0.00011262653424637392, -0.0001078216009773314, -0.00010301666770828888, -9.821173443924636e-05, -9.340680844616145e-05, -8.860187517711893e-05, -8.37969419080764e-05, -7.89920159149915e-05, -7.418708264594898e-05, -6.938214937690645e-05, -6.457721610786393e-05, -5.977228647680022e-05, -5.4967356845736504e-05, -5.016242357669398e-05, -4.535749030765146e-05, -4.0552560676587746e-05, -3.574763104552403e-05, -3.0942701414460316e-05, -2.6137769964407198e-05, -2.133283851435408e-05, -1.6527907064300962e-05, -1.1722975614247844e-05, -6.9180441641947255e-06, -2.1131127141416073e-06, 2.6918169169221073e-06, 7.496750185964629e-06, 1.2301681636017747e-05, 1.7106613086070865e-05, 2.1911544536123984e-05, 2.6716475986177102e-05, 3.1521405617240816e-05, 3.632633888628334e-05, 4.113126851734705e-05, 4.5936201786389574e-05]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 2.0, 11.0, 12.0, 10.0, 9.0, 18.0, 14.0, 17.0, 21.0, 41.0, 29.0, 29.0, 39.0, 39.0, 38.0, 41.0, 37.0, 42.0, 46.0, 37.0, 45.0, 46.0, 42.0, 42.0, 36.0, 34.0, 32.0, 32.0, 23.0, 24.0, 24.0, 18.0, 16.0, 12.0, 5.0, 10.0, 7.0, 7.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.664327621459961e-05, -2.568308264017105e-05, -2.4722889065742493e-05, -2.3762695491313934e-05, -2.2802501916885376e-05, -2.1842308342456818e-05, -2.088211476802826e-05, -1.99219211935997e-05, -1.8961727619171143e-05, -1.8001534044742584e-05, -1.7041340470314026e-05, -1.6081146895885468e-05, -1.512095332145691e-05, -1.416075974702835e-05, -1.3200566172599792e-05, -1.2240372598171234e-05, -1.1280179023742676e-05, -1.0319985449314117e-05, -9.359791874885559e-06, -8.399598300457e-06, -7.439404726028442e-06, -6.479211151599884e-06, -5.519017577171326e-06, -4.558824002742767e-06, -3.598630428314209e-06, -2.6384368538856506e-06, -1.6782432794570923e-06, -7.180497050285339e-07, 2.421438694000244e-07, 1.2023374438285828e-06, 2.162531018257141e-06, 3.1227245926856995e-06, 4.082918167114258e-06, 5.043111741542816e-06, 6.0033053159713745e-06, 6.963498890399933e-06, 7.923692464828491e-06, 8.88388603925705e-06, 9.844079613685608e-06, 1.0804273188114166e-05, 1.1764466762542725e-05, 1.2724660336971283e-05, 1.3684853911399841e-05, 1.46450474858284e-05, 1.5605241060256958e-05, 1.6565434634685516e-05, 1.7525628209114075e-05, 1.8485821783542633e-05, 1.944601535797119e-05, 2.040620893239975e-05, 2.1366402506828308e-05, 2.2326596081256866e-05, 2.3286789655685425e-05, 2.4246983230113983e-05, 2.520717680454254e-05, 2.61673703789711e-05, 2.7127563953399658e-05, 2.8087757527828217e-05, 2.9047951102256775e-05, 3.0008144676685333e-05, 3.096833825111389e-05, 3.192853182554245e-05, 3.288872539997101e-05, 3.384891897439957e-05, 3.4809112548828125e-05]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 10.0, 7.0, 13.0, 14.0, 23.0, 19.0, 18.0, 22.0, 30.0, 23.0, 37.0, 31.0, 26.0, 32.0, 45.0, 52.0, 43.0, 52.0, 45.0, 41.0, 41.0, 42.0, 41.0, 42.0, 37.0, 25.0, 40.0, 19.0, 18.0, 23.0, 17.0, 15.0, 17.0, 8.0, 8.0, 7.0, 8.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.4296875, -5.23675537109375, -5.0438232421875, -4.85089111328125, -4.657958984375, -4.46502685546875, -4.2720947265625, -4.07916259765625, -3.88623046875, -3.69329833984375, -3.5003662109375, -3.30743408203125, -3.114501953125, -2.92156982421875, -2.7286376953125, -2.53570556640625, -2.3427734375, -2.14984130859375, -1.9569091796875, -1.76397705078125, -1.571044921875, -1.37811279296875, -1.1851806640625, -0.99224853515625, -0.79931640625, -0.60638427734375, -0.4134521484375, -0.22052001953125, -0.027587890625, 0.16534423828125, 0.3582763671875, 0.55120849609375, 0.744140625, 0.93707275390625, 1.1300048828125, 1.32293701171875, 1.515869140625, 1.70880126953125, 1.9017333984375, 2.09466552734375, 2.28759765625, 2.48052978515625, 2.6734619140625, 2.86639404296875, 3.059326171875, 3.25225830078125, 3.4451904296875, 3.63812255859375, 3.8310546875, 4.02398681640625, 4.2169189453125, 4.40985107421875, 4.602783203125, 4.79571533203125, 4.9886474609375, 5.18157958984375, 5.37451171875, 5.56744384765625, 5.7603759765625, 5.95330810546875, 6.146240234375, 6.33917236328125, 6.5321044921875, 6.72503662109375, 6.91796875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 11.0, 19.0, 17.0, 30.0, 52.0, 75.0, 141.0, 200.0, 345.0, 550.0, 1069.0, 1801.0, 3208.0, 5818.0, 10762.0, 21900.0, 47235.0, 114491.0, 337005.0, 310039.0, 105959.0, 44110.0, 20613.0, 10302.0, 5497.0, 3049.0, 1735.0, 1024.0, 600.0, 362.0, 172.0, 136.0, 80.0, 40.0, 41.0, 17.0, 13.0, 8.0, 8.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.71875, -8.427734375, -8.13671875, -7.845703125, -7.5546875, -7.263671875, -6.97265625, -6.681640625, -6.390625, -6.099609375, -5.80859375, -5.517578125, -5.2265625, -4.935546875, -4.64453125, -4.353515625, -4.0625, -3.771484375, -3.48046875, -3.189453125, -2.8984375, -2.607421875, -2.31640625, -2.025390625, -1.734375, -1.443359375, -1.15234375, -0.861328125, -0.5703125, -0.279296875, 0.01171875, 0.302734375, 0.59375, 0.884765625, 1.17578125, 1.466796875, 1.7578125, 2.048828125, 2.33984375, 2.630859375, 2.921875, 3.212890625, 3.50390625, 3.794921875, 4.0859375, 4.376953125, 4.66796875, 4.958984375, 5.25, 5.541015625, 5.83203125, 6.123046875, 6.4140625, 6.705078125, 6.99609375, 7.287109375, 7.578125, 7.869140625, 8.16015625, 8.451171875, 8.7421875, 9.033203125, 9.32421875, 9.615234375, 9.90625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 7.0, 1.0, 3.0, 10.0, 7.0, 13.0, 9.0, 12.0, 18.0, 22.0, 14.0, 22.0, 27.0, 35.0, 40.0, 33.0, 57.0, 76.0, 93.0, 135.0, 293.0, 1328.0, 195.0, 121.0, 81.0, 62.0, 53.0, 43.0, 33.0, 33.0, 34.0, 19.0, 25.0, 17.0, 14.0, 11.0, 9.0, 10.0, 6.0, 6.0, 8.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4140625, -14.8858642578125, -14.357666015625, -13.8294677734375, -13.30126953125, -12.7730712890625, -12.244873046875, -11.7166748046875, -11.1884765625, -10.6602783203125, -10.132080078125, -9.6038818359375, -9.07568359375, -8.5474853515625, -8.019287109375, -7.4910888671875, -6.962890625, -6.4346923828125, -5.906494140625, -5.3782958984375, -4.85009765625, -4.3218994140625, -3.793701171875, -3.2655029296875, -2.7373046875, -2.2091064453125, -1.680908203125, -1.1527099609375, -0.62451171875, -0.0963134765625, 0.431884765625, 0.9600830078125, 1.48828125, 2.0164794921875, 2.544677734375, 3.0728759765625, 3.60107421875, 4.1292724609375, 4.657470703125, 5.1856689453125, 5.7138671875, 6.2420654296875, 6.770263671875, 7.2984619140625, 7.82666015625, 8.3548583984375, 8.883056640625, 9.4112548828125, 9.939453125, 10.4676513671875, 10.995849609375, 11.5240478515625, 12.05224609375, 12.5804443359375, 13.108642578125, 13.6368408203125, 14.1650390625, 14.6932373046875, 15.221435546875, 15.7496337890625, 16.27783203125, 16.8060302734375, 17.334228515625, 17.8624267578125, 18.390625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 11.0, 7.0, 9.0, 8.0, 18.0, 19.0, 38.0, 32.0, 44.0, 101.0, 111.0, 189.0, 378.0, 602.0, 1264.0, 3251.0, 10519.0, 46742.0, 328392.0, 2394440.0, 300277.0, 43420.0, 10002.0, 3155.0, 1171.0, 577.0, 334.0, 192.0, 108.0, 81.0, 49.0, 44.0, 24.0, 17.0, 18.0, 12.0, 12.0, 11.0, 5.0, 5.0, 6.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 3.0], "bins": [-22.21875, -21.592529296875, -20.96630859375, -20.340087890625, -19.7138671875, -19.087646484375, -18.46142578125, -17.835205078125, -17.208984375, -16.582763671875, -15.95654296875, -15.330322265625, -14.7041015625, -14.077880859375, -13.45166015625, -12.825439453125, -12.19921875, -11.572998046875, -10.94677734375, -10.320556640625, -9.6943359375, -9.068115234375, -8.44189453125, -7.815673828125, -7.189453125, -6.563232421875, -5.93701171875, -5.310791015625, -4.6845703125, -4.058349609375, -3.43212890625, -2.805908203125, -2.1796875, -1.553466796875, -0.92724609375, -0.301025390625, 0.3251953125, 0.951416015625, 1.57763671875, 2.203857421875, 2.830078125, 3.456298828125, 4.08251953125, 4.708740234375, 5.3349609375, 5.961181640625, 6.58740234375, 7.213623046875, 7.83984375, 8.466064453125, 9.09228515625, 9.718505859375, 10.3447265625, 10.970947265625, 11.59716796875, 12.223388671875, 12.849609375, 13.475830078125, 14.10205078125, 14.728271484375, 15.3544921875, 15.980712890625, 16.60693359375, 17.233154296875, 17.859375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [8.0, 235.0, 659.0, 109.0, 8.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.266681671142578, -12.285698890686035, -3.304716110229492, 5.676265716552734, 14.657249450683594, 23.638233184814453, 32.61921310424805, 41.600196838378906, 50.581180572509766, 59.562164306640625, 68.54314422607422, 77.52412414550781, 86.50511169433594, 95.48609924316406, 104.46707153320312, 113.44805908203125, 122.42904663085938, 131.4100341796875, 140.39100646972656, 149.3719940185547, 158.3529815673828, 167.33395385742188, 176.31494140625, 185.29592895507812, 194.2769012451172, 203.2578887939453, 212.23886108398438, 221.2198486328125, 230.20083618164062, 239.18182373046875, 248.1627960205078, 257.1437683105469, 266.1247863769531, 275.10577392578125, 284.0867614746094, 293.0677490234375, 302.0487060546875, 311.0296936035156, 320.01068115234375, 328.9916687011719, 337.97265625, 346.9536437988281, 355.93463134765625, 364.91558837890625, 373.8965759277344, 382.8775634765625, 391.8585510253906, 400.83953857421875, 409.82049560546875, 418.8014831542969, 427.782470703125, 436.763427734375, 445.7444152832031, 454.72540283203125, 463.7063903808594, 472.6873779296875, 481.6683654785156, 490.64935302734375, 499.6303405761719, 508.611328125, 517.59228515625, 526.5733032226562, 535.5542602539062, 544.5352172851562, 553.5162353515625]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 6.0, 2.0, 7.0, 4.0, 4.0, 5.0, 10.0, 14.0, 17.0, 25.0, 19.0, 33.0, 27.0, 39.0, 36.0, 36.0, 51.0, 44.0, 36.0, 56.0, 40.0, 42.0, 46.0, 45.0, 39.0, 45.0, 37.0, 42.0, 28.0, 26.0, 26.0, 21.0, 16.0, 15.0, 11.0, 15.0, 15.0, 5.0, 7.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.654327392578125, -45.12055206298828, -43.58677673339844, -42.053001403808594, -40.519229888916016, -38.98545455932617, -37.45167922973633, -35.917903900146484, -34.38412857055664, -32.8503532409668, -31.316579818725586, -29.782804489135742, -28.2490291595459, -26.715255737304688, -25.181480407714844, -23.647705078125, -22.11393165588379, -20.580156326293945, -19.046382904052734, -17.51260757446289, -15.978832244873047, -14.44505786895752, -12.911283493041992, -11.377508163452148, -9.843733787536621, -8.309959411621094, -6.77618408203125, -5.242409706115723, -3.708634853363037, -2.1748600006103516, -0.6410856246948242, 0.8926897048950195, 2.426464080810547, 3.9602389335632324, 5.494013786315918, 7.027788162231445, 8.561563491821289, 10.095337867736816, 11.629112243652344, 13.162887573242188, 14.696661949157715, 16.230436325073242, 17.764211654663086, 19.297985076904297, 20.83176040649414, 22.365535736083984, 23.899311065673828, 25.433086395263672, 26.966859817504883, 28.500635147094727, 30.034408569335938, 31.56818389892578, 33.101959228515625, 34.63573455810547, 36.16950988769531, 37.703285217285156, 39.237056732177734, 40.77083206176758, 42.30460739135742, 43.83837890625, 45.372154235839844, 46.90592956542969, 48.43970489501953, 49.973480224609375, 51.50725555419922]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 3.0, 7.0, 4.0, 10.0, 13.0, 18.0, 18.0, 15.0, 23.0, 32.0, 18.0, 39.0, 28.0, 39.0, 31.0, 17.0, 49.0, 35.0, 51.0, 33.0, 38.0, 52.0, 46.0, 41.0, 42.0, 39.0, 36.0, 28.0, 25.0, 31.0, 21.0, 30.0, 17.0, 10.0, 14.0, 12.0, 9.0, 10.0, 5.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.43359375, -5.24163818359375, -5.0496826171875, -4.85772705078125, -4.665771484375, -4.47381591796875, -4.2818603515625, -4.08990478515625, -3.89794921875, -3.70599365234375, -3.5140380859375, -3.32208251953125, -3.130126953125, -2.93817138671875, -2.7462158203125, -2.55426025390625, -2.3623046875, -2.17034912109375, -1.9783935546875, -1.78643798828125, -1.594482421875, -1.40252685546875, -1.2105712890625, -1.01861572265625, -0.82666015625, -0.63470458984375, -0.4427490234375, -0.25079345703125, -0.058837890625, 0.13311767578125, 0.3250732421875, 0.51702880859375, 0.708984375, 0.90093994140625, 1.0928955078125, 1.28485107421875, 1.476806640625, 1.66876220703125, 1.8607177734375, 2.05267333984375, 2.24462890625, 2.43658447265625, 2.6285400390625, 2.82049560546875, 3.012451171875, 3.20440673828125, 3.3963623046875, 3.58831787109375, 3.7802734375, 3.97222900390625, 4.1641845703125, 4.35614013671875, 4.548095703125, 4.74005126953125, 4.9320068359375, 5.12396240234375, 5.31591796875, 5.50787353515625, 5.6998291015625, 5.89178466796875, 6.083740234375, 6.27569580078125, 6.4676513671875, 6.65960693359375, 6.8515625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 9.0, 12.0, 11.0, 21.0, 40.0, 53.0, 74.0, 128.0, 188.0, 331.0, 593.0, 1020.0, 1842.0, 3488.0, 7367.0, 17299.0, 47944.0, 166699.0, 1088243.0, 2378135.0, 351307.0, 80456.0, 27354.0, 10951.0, 4921.0, 2483.0, 1326.0, 753.0, 438.0, 251.0, 176.0, 120.0, 73.0, 43.0, 34.0, 29.0, 25.0, 12.0, 7.0, 7.0, 5.0, 0.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.46875, -10.097900390625, -9.72705078125, -9.356201171875, -8.9853515625, -8.614501953125, -8.24365234375, -7.872802734375, -7.501953125, -7.131103515625, -6.76025390625, -6.389404296875, -6.0185546875, -5.647705078125, -5.27685546875, -4.906005859375, -4.53515625, -4.164306640625, -3.79345703125, -3.422607421875, -3.0517578125, -2.680908203125, -2.31005859375, -1.939208984375, -1.568359375, -1.197509765625, -0.82666015625, -0.455810546875, -0.0849609375, 0.285888671875, 0.65673828125, 1.027587890625, 1.3984375, 1.769287109375, 2.14013671875, 2.510986328125, 2.8818359375, 3.252685546875, 3.62353515625, 3.994384765625, 4.365234375, 4.736083984375, 5.10693359375, 5.477783203125, 5.8486328125, 6.219482421875, 6.59033203125, 6.961181640625, 7.33203125, 7.702880859375, 8.07373046875, 8.444580078125, 8.8154296875, 9.186279296875, 9.55712890625, 9.927978515625, 10.298828125, 10.669677734375, 11.04052734375, 11.411376953125, 11.7822265625, 12.153076171875, 12.52392578125, 12.894775390625, 13.265625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 13.0, 13.0, 13.0, 20.0, 36.0, 47.0, 60.0, 92.0, 119.0, 183.0, 247.0, 368.0, 568.0, 692.0, 486.0, 357.0, 207.0, 140.0, 106.0, 77.0, 57.0, 44.0, 20.0, 21.0, 20.0, 18.0, 12.0, 8.0, 4.0, 7.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.5859375, -12.2296142578125, -11.873291015625, -11.5169677734375, -11.16064453125, -10.8043212890625, -10.447998046875, -10.0916748046875, -9.7353515625, -9.3790283203125, -9.022705078125, -8.6663818359375, -8.31005859375, -7.9537353515625, -7.597412109375, -7.2410888671875, -6.884765625, -6.5284423828125, -6.172119140625, -5.8157958984375, -5.45947265625, -5.1031494140625, -4.746826171875, -4.3905029296875, -4.0341796875, -3.6778564453125, -3.321533203125, -2.9652099609375, -2.60888671875, -2.2525634765625, -1.896240234375, -1.5399169921875, -1.18359375, -0.8272705078125, -0.470947265625, -0.1146240234375, 0.24169921875, 0.5980224609375, 0.954345703125, 1.3106689453125, 1.6669921875, 2.0233154296875, 2.379638671875, 2.7359619140625, 3.09228515625, 3.4486083984375, 3.804931640625, 4.1612548828125, 4.517578125, 4.8739013671875, 5.230224609375, 5.5865478515625, 5.94287109375, 6.2991943359375, 6.655517578125, 7.0118408203125, 7.3681640625, 7.7244873046875, 8.080810546875, 8.4371337890625, 8.79345703125, 9.1497802734375, 9.506103515625, 9.8624267578125, 10.21875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 6.0, 8.0, 9.0, 17.0, 21.0, 29.0, 21.0, 48.0, 68.0, 100.0, 184.0, 270.0, 471.0, 1021.0, 2808.0, 10903.0, 69510.0, 1245209.0, 2730438.0, 111842.0, 15060.0, 3601.0, 1211.0, 554.0, 310.0, 180.0, 135.0, 65.0, 47.0, 44.0, 28.0, 17.0, 14.0, 5.0, 6.0, 7.0, 6.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.875, -29.88232421875, -28.8896484375, -27.89697265625, -26.904296875, -25.91162109375, -24.9189453125, -23.92626953125, -22.93359375, -21.94091796875, -20.9482421875, -19.95556640625, -18.962890625, -17.97021484375, -16.9775390625, -15.98486328125, -14.9921875, -13.99951171875, -13.0068359375, -12.01416015625, -11.021484375, -10.02880859375, -9.0361328125, -8.04345703125, -7.05078125, -6.05810546875, -5.0654296875, -4.07275390625, -3.080078125, -2.08740234375, -1.0947265625, -0.10205078125, 0.890625, 1.88330078125, 2.8759765625, 3.86865234375, 4.861328125, 5.85400390625, 6.8466796875, 7.83935546875, 8.83203125, 9.82470703125, 10.8173828125, 11.81005859375, 12.802734375, 13.79541015625, 14.7880859375, 15.78076171875, 16.7734375, 17.76611328125, 18.7587890625, 19.75146484375, 20.744140625, 21.73681640625, 22.7294921875, 23.72216796875, 24.71484375, 25.70751953125, 26.7001953125, 27.69287109375, 28.685546875, 29.67822265625, 30.6708984375, 31.66357421875, 32.65625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 7.0, 8.0, 20.0, 26.0, 42.0, 57.0, 87.0, 100.0, 114.0, 111.0, 95.0, 94.0, 66.0, 56.0, 47.0, 34.0, 19.0, 14.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.049339294433594, -50.26707458496094, -48.484806060791016, -46.702537536621094, -44.92027282714844, -43.13800811767578, -41.35573959350586, -39.57347106933594, -37.79120635986328, -36.008941650390625, -34.2266731262207, -32.44440460205078, -30.662139892578125, -28.879873275756836, -27.097606658935547, -25.315340042114258, -23.53307342529297, -21.75080680847168, -19.96854019165039, -18.1862735748291, -16.404006958007812, -14.621740341186523, -12.839473724365234, -11.057207107543945, -9.274940490722656, -7.492673873901367, -5.710407257080078, -3.928140640258789, -2.1458740234375, -0.36360740661621094, 1.4186592102050781, 3.200925827026367, 4.983188629150391, 6.76545524597168, 8.547721862792969, 10.329988479614258, 12.112255096435547, 13.894521713256836, 15.676788330078125, 17.459054946899414, 19.241321563720703, 21.023588180541992, 22.80585479736328, 24.58812141418457, 26.37038803100586, 28.15265464782715, 29.934921264648438, 31.717187881469727, 33.499454498291016, 35.28172302246094, 37.063987731933594, 38.84625244140625, 40.62852096557617, 42.410789489746094, 44.19305419921875, 45.975318908691406, 47.75758743286133, 49.53985595703125, 51.322120666503906, 53.10438537597656, 54.886653900146484, 56.668922424316406, 58.45118713378906, 60.23345184326172, 62.01572036743164]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 6.0, 6.0, 5.0, 8.0, 7.0, 8.0, 7.0, 11.0, 15.0, 20.0, 23.0, 24.0, 21.0, 26.0, 31.0, 30.0, 34.0, 29.0, 30.0, 32.0, 35.0, 45.0, 40.0, 40.0, 52.0, 39.0, 38.0, 36.0, 34.0, 27.0, 32.0, 26.0, 30.0, 25.0, 30.0, 18.0, 18.0, 24.0, 9.0, 6.0, 6.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.224472045898438, -28.254533767700195, -27.284595489501953, -26.31465721130371, -25.34471893310547, -24.374780654907227, -23.404842376708984, -22.434904098510742, -21.4649658203125, -20.495027542114258, -19.525089263916016, -18.555150985717773, -17.58521270751953, -16.61527442932129, -15.645336151123047, -14.675397872924805, -13.705459594726562, -12.73552131652832, -11.765583038330078, -10.795644760131836, -9.825706481933594, -8.855768203735352, -7.885829925537109, -6.915891647338867, -5.945953369140625, -4.976015090942383, -4.006076812744141, -3.0361385345458984, -2.0662002563476562, -1.096261978149414, -0.12632369995117188, 0.8436145782470703, 1.8135528564453125, 2.7834911346435547, 3.753429412841797, 4.723367691040039, 5.693305969238281, 6.663244247436523, 7.633182525634766, 8.603120803833008, 9.57305908203125, 10.542997360229492, 11.512935638427734, 12.482873916625977, 13.452812194824219, 14.422750473022461, 15.392688751220703, 16.362627029418945, 17.332565307617188, 18.30250358581543, 19.272441864013672, 20.242380142211914, 21.212318420410156, 22.1822566986084, 23.15219497680664, 24.122133255004883, 25.092071533203125, 26.062009811401367, 27.03194808959961, 28.00188636779785, 28.971824645996094, 29.941762924194336, 30.911701202392578, 31.88163948059082, 32.85157775878906]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 0.0, 5.0, 4.0, 4.0, 3.0, 3.0, 6.0, 10.0, 19.0, 15.0, 23.0, 23.0, 24.0, 33.0, 20.0, 23.0, 25.0, 41.0, 36.0, 31.0, 37.0, 37.0, 37.0, 39.0, 39.0, 43.0, 46.0, 33.0, 39.0, 35.0, 35.0, 29.0, 33.0, 27.0, 22.0, 23.0, 17.0, 11.0, 18.0, 18.0, 8.0, 11.0, 5.0, 10.0, 2.0, 2.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.2578125, -5.07037353515625, -4.8829345703125, -4.69549560546875, -4.508056640625, -4.32061767578125, -4.1331787109375, -3.94573974609375, -3.75830078125, -3.57086181640625, -3.3834228515625, -3.19598388671875, -3.008544921875, -2.82110595703125, -2.6336669921875, -2.44622802734375, -2.2587890625, -2.07135009765625, -1.8839111328125, -1.69647216796875, -1.509033203125, -1.32159423828125, -1.1341552734375, -0.94671630859375, -0.75927734375, -0.57183837890625, -0.3843994140625, -0.19696044921875, -0.009521484375, 0.17791748046875, 0.3653564453125, 0.55279541015625, 0.740234375, 0.92767333984375, 1.1151123046875, 1.30255126953125, 1.489990234375, 1.67742919921875, 1.8648681640625, 2.05230712890625, 2.23974609375, 2.42718505859375, 2.6146240234375, 2.80206298828125, 2.989501953125, 3.17694091796875, 3.3643798828125, 3.55181884765625, 3.7392578125, 3.92669677734375, 4.1141357421875, 4.30157470703125, 4.489013671875, 4.67645263671875, 4.8638916015625, 5.05133056640625, 5.23876953125, 5.42620849609375, 5.6136474609375, 5.80108642578125, 5.988525390625, 6.17596435546875, 6.3634033203125, 6.55084228515625, 6.73828125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 0.0, 6.0, 5.0, 8.0, 15.0, 16.0, 32.0, 44.0, 69.0, 70.0, 136.0, 210.0, 313.0, 457.0, 739.0, 1063.0, 1671.0, 2559.0, 4021.0, 6148.0, 9967.0, 15950.0, 26346.0, 42854.0, 74810.0, 145971.0, 304855.0, 189906.0, 89230.0, 50894.0, 30107.0, 18416.0, 11470.0, 7206.0, 4618.0, 2890.0, 1848.0, 1249.0, 817.0, 560.0, 306.0, 247.0, 157.0, 91.0, 71.0, 56.0, 27.0, 23.0, 17.0, 10.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.208740234375, -0.20170021057128906, -0.19466018676757812, -0.1876201629638672, -0.18058013916015625, -0.1735401153564453, -0.16650009155273438, -0.15946006774902344, -0.1524200439453125, -0.14538002014160156, -0.13833999633789062, -0.1312999725341797, -0.12425994873046875, -0.11721992492675781, -0.11017990112304688, -0.10313987731933594, -0.096099853515625, -0.08905982971191406, -0.08201980590820312, -0.07497978210449219, -0.06793975830078125, -0.06089973449707031, -0.053859710693359375, -0.04681968688964844, -0.0397796630859375, -0.03273963928222656, -0.025699615478515625, -0.018659591674804688, -0.01161956787109375, -0.0045795440673828125, 0.002460479736328125, 0.009500503540039062, 0.01654052734375, 0.023580551147460938, 0.030620574951171875, 0.03766059875488281, 0.04470062255859375, 0.05174064636230469, 0.058780670166015625, 0.06582069396972656, 0.0728607177734375, 0.07990074157714844, 0.08694076538085938, 0.09398078918457031, 0.10102081298828125, 0.10806083679199219, 0.11510086059570312, 0.12214088439941406, 0.129180908203125, 0.13622093200683594, 0.14326095581054688, 0.1503009796142578, 0.15734100341796875, 0.1643810272216797, 0.17142105102539062, 0.17846107482910156, 0.1855010986328125, 0.19254112243652344, 0.19958114624023438, 0.2066211700439453, 0.21366119384765625, 0.2207012176513672, 0.22774124145507812, 0.23478126525878906, 0.2418212890625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 3.0, 5.0, 4.0, 12.0, 17.0, 9.0, 10.0, 9.0, 20.0, 11.0, 19.0, 18.0, 28.0, 29.0, 34.0, 33.0, 23.0, 43.0, 47.0, 38.0, 39.0, 1070.0, 43.0, 50.0, 46.0, 30.0, 37.0, 42.0, 40.0, 31.0, 29.0, 32.0, 19.0, 17.0, 9.0, 16.0, 9.0, 11.0, 7.0, 12.0, 5.0, 4.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.390625, -4.256591796875, -4.12255859375, -3.988525390625, -3.8544921875, -3.720458984375, -3.58642578125, -3.452392578125, -3.318359375, -3.184326171875, -3.05029296875, -2.916259765625, -2.7822265625, -2.648193359375, -2.51416015625, -2.380126953125, -2.24609375, -2.112060546875, -1.97802734375, -1.843994140625, -1.7099609375, -1.575927734375, -1.44189453125, -1.307861328125, -1.173828125, -1.039794921875, -0.90576171875, -0.771728515625, -0.6376953125, -0.503662109375, -0.36962890625, -0.235595703125, -0.1015625, 0.032470703125, 0.16650390625, 0.300537109375, 0.4345703125, 0.568603515625, 0.70263671875, 0.836669921875, 0.970703125, 1.104736328125, 1.23876953125, 1.372802734375, 1.5068359375, 1.640869140625, 1.77490234375, 1.908935546875, 2.04296875, 2.177001953125, 2.31103515625, 2.445068359375, 2.5791015625, 2.713134765625, 2.84716796875, 2.981201171875, 3.115234375, 3.249267578125, 3.38330078125, 3.517333984375, 3.6513671875, 3.785400390625, 3.91943359375, 4.053466796875, 4.1875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 2.0, 8.0, 13.0, 23.0, 34.0, 44.0, 60.0, 110.0, 164.0, 226.0, 392.0, 582.0, 863.0, 1437.0, 2193.0, 3319.0, 5393.0, 8502.0, 13968.0, 23009.0, 39773.0, 72502.0, 151884.0, 1370721.0, 196925.0, 88658.0, 47159.0, 26432.0, 16147.0, 9860.0, 6045.0, 3837.0, 2399.0, 1607.0, 1013.0, 634.0, 412.0, 287.0, 164.0, 113.0, 74.0, 59.0, 28.0, 17.0, 11.0, 15.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.168701171875, -0.1638317108154297, -0.15896224975585938, -0.15409278869628906, -0.14922332763671875, -0.14435386657714844, -0.13948440551757812, -0.1346149444580078, -0.1297454833984375, -0.12487602233886719, -0.12000656127929688, -0.11513710021972656, -0.11026763916015625, -0.10539817810058594, -0.10052871704101562, -0.09565925598144531, -0.090789794921875, -0.08592033386230469, -0.08105087280273438, -0.07618141174316406, -0.07131195068359375, -0.06644248962402344, -0.061573028564453125, -0.05670356750488281, -0.0518341064453125, -0.04696464538574219, -0.042095184326171875, -0.03722572326660156, -0.03235626220703125, -0.027486801147460938, -0.022617340087890625, -0.017747879028320312, -0.01287841796875, -0.008008956909179688, -0.003139495849609375, 0.0017299652099609375, 0.00659942626953125, 0.011468887329101562, 0.016338348388671875, 0.021207809448242188, 0.0260772705078125, 0.030946731567382812, 0.035816192626953125, 0.04068565368652344, 0.04555511474609375, 0.05042457580566406, 0.055294036865234375, 0.06016349792480469, 0.065032958984375, 0.06990242004394531, 0.07477188110351562, 0.07964134216308594, 0.08451080322265625, 0.08938026428222656, 0.09424972534179688, 0.09911918640136719, 0.1039886474609375, 0.10885810852050781, 0.11372756958007812, 0.11859703063964844, 0.12346649169921875, 0.12833595275878906, 0.13320541381835938, 0.1380748748779297, 0.1429443359375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 5.0, 6.0, 7.0, 18.0, 16.0, 13.0, 26.0, 24.0, 32.0, 29.0, 29.0, 53.0, 39.0, 40.0, 43.0, 55.0, 46.0, 54.0, 47.0, 56.0, 47.0, 38.0, 32.0, 34.0, 31.0, 24.0, 30.0, 23.0, 15.0, 13.0, 12.0, 8.0, 8.0, 6.0, 5.0, 5.0, 8.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.2869319915771484e-05, -5.1233917474746704e-05, -4.9598515033721924e-05, -4.7963112592697144e-05, -4.632771015167236e-05, -4.469230771064758e-05, -4.30569052696228e-05, -4.142150282859802e-05, -3.978610038757324e-05, -3.815069794654846e-05, -3.651529550552368e-05, -3.48798930644989e-05, -3.324449062347412e-05, -3.160908818244934e-05, -2.997368574142456e-05, -2.833828330039978e-05, -2.6702880859375e-05, -2.506747841835022e-05, -2.343207597732544e-05, -2.179667353630066e-05, -2.016127109527588e-05, -1.85258686542511e-05, -1.689046621322632e-05, -1.5255063772201538e-05, -1.3619661331176758e-05, -1.1984258890151978e-05, -1.0348856449127197e-05, -8.713454008102417e-06, -7.078051567077637e-06, -5.4426491260528564e-06, -3.807246685028076e-06, -2.171844244003296e-06, -5.364418029785156e-07, 1.0989606380462646e-06, 2.734363079071045e-06, 4.369765520095825e-06, 6.0051679611206055e-06, 7.640570402145386e-06, 9.275972843170166e-06, 1.0911375284194946e-05, 1.2546777725219727e-05, 1.4182180166244507e-05, 1.5817582607269287e-05, 1.7452985048294067e-05, 1.9088387489318848e-05, 2.0723789930343628e-05, 2.2359192371368408e-05, 2.399459481239319e-05, 2.562999725341797e-05, 2.726539969444275e-05, 2.890080213546753e-05, 3.053620457649231e-05, 3.217160701751709e-05, 3.380700945854187e-05, 3.544241189956665e-05, 3.707781434059143e-05, 3.871321678161621e-05, 4.034861922264099e-05, 4.198402166366577e-05, 4.361942410469055e-05, 4.525482654571533e-05, 4.689022898674011e-05, 4.852563142776489e-05, 5.016103386878967e-05, 5.179643630981445e-05]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 4.0, 5.0, 3.0, 9.0, 8.0, 15.0, 8.0, 21.0, 36.0, 24.0, 34.0, 58.0, 54.0, 85.0, 154.0, 337.0, 1856.0, 299612.0, 740652.0, 4455.0, 447.0, 213.0, 105.0, 75.0, 59.0, 43.0, 33.0, 30.0, 27.0, 15.0, 14.0, 14.0, 9.0, 4.0, 9.0, 5.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.00118255615234375, -0.0011457353830337524, -0.0011089146137237549, -0.0010720938444137573, -0.0010352730751037598, -0.0009984523057937622, -0.0009616315364837646, -0.0009248107671737671, -0.0008879899978637695, -0.000851169228553772, -0.0008143484592437744, -0.0007775276899337769, -0.0007407069206237793, -0.0007038861513137817, -0.0006670653820037842, -0.0006302446126937866, -0.0005934238433837891, -0.0005566030740737915, -0.0005197823047637939, -0.0004829615354537964, -0.00044614076614379883, -0.00040931999683380127, -0.0003724992275238037, -0.00033567845821380615, -0.0002988576889038086, -0.00026203691959381104, -0.00022521615028381348, -0.00018839538097381592, -0.00015157461166381836, -0.0001147538423538208, -7.793307304382324e-05, -4.1112303733825684e-05, -4.291534423828125e-06, 3.2529234886169434e-05, 6.935000419616699e-05, 0.00010617077350616455, 0.0001429915428161621, 0.00017981231212615967, 0.00021663308143615723, 0.0002534538507461548, 0.00029027462005615234, 0.0003270953893661499, 0.00036391615867614746, 0.000400736927986145, 0.0004375576972961426, 0.00047437846660614014, 0.0005111992359161377, 0.0005480200052261353, 0.0005848407745361328, 0.0006216615438461304, 0.0006584823131561279, 0.0006953030824661255, 0.000732123851776123, 0.0007689446210861206, 0.0008057653903961182, 0.0008425861597061157, 0.0008794069290161133, 0.0009162276983261108, 0.0009530484676361084, 0.000989869236946106, 0.0010266900062561035, 0.001063510775566101, 0.0011003315448760986, 0.0011371523141860962, 0.0011739730834960938]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 19.0, 334.0, 607.0, 55.0, 2.0], "bins": [-0.0007627009763382375, -0.0007502383668906987, -0.0007377757574431598, -0.000725313147995621, -0.0007128505385480821, -0.0007003879291005433, -0.0006879253196530044, -0.0006754627102054656, -0.0006630001007579267, -0.0006505374913103878, -0.000638074881862849, -0.0006256122724153101, -0.0006131496629677713, -0.0006006870535202324, -0.0005882244440726936, -0.0005757618346251547, -0.0005632992251776159, -0.000550836615730077, -0.0005383740062825382, -0.0005259113968349993, -0.0005134487873874605, -0.0005009861779399216, -0.0004885235684923828, -0.0004760609590448439, -0.0004635983204934746, -0.00045113571104593575, -0.0004386731015983969, -0.00042621049215085804, -0.0004137478827033192, -0.00040128527325578034, -0.0003888226638082415, -0.00037636005436070263, -0.00036389747401699424, -0.0003514348645694554, -0.00033897225512191653, -0.0003265096456743777, -0.00031404703622683883, -0.0003015844267793, -0.0002891218173317611, -0.00027665920788422227, -0.00026419656933285296, -0.0002517339598853141, -0.00023927135043777525, -0.0002268087409902364, -0.00021434613154269755, -0.0002018835220951587, -0.00018942091264761984, -0.000176958303200081, -0.00016449569375254214, -0.00015203308430500329, -0.00013957047485746443, -0.00012710786540992558, -0.00011464525596238673, -0.00010218263923889026, -8.972002979135141e-05, -7.725742034381256e-05, -6.479481817223132e-05, -5.2332208724692464e-05, -3.986959927715361e-05, -2.740698619163595e-05, -1.4944376744097099e-05, -2.481763658579439e-06, 9.980845788959414e-06, 2.2443455236498266e-05, 3.4906068322015926e-05]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 5.0, 7.0, 5.0, 12.0, 10.0, 12.0, 18.0, 17.0, 22.0, 8.0, 25.0, 35.0, 33.0, 40.0, 45.0, 45.0, 44.0, 44.0, 41.0, 56.0, 51.0, 45.0, 50.0, 35.0, 34.0, 35.0, 32.0, 33.0, 27.0, 22.0, 19.0, 22.0, 16.0, 9.0, 12.0, 15.0, 7.0, 7.0, 2.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.24249267578125e-05, -3.1334348022937775e-05, -3.024376928806305e-05, -2.9153190553188324e-05, -2.80626118183136e-05, -2.6972033083438873e-05, -2.5881454348564148e-05, -2.4790875613689423e-05, -2.3700296878814697e-05, -2.2609718143939972e-05, -2.1519139409065247e-05, -2.042856067419052e-05, -1.9337981939315796e-05, -1.824740320444107e-05, -1.7156824469566345e-05, -1.606624573469162e-05, -1.4975666999816895e-05, -1.388508826494217e-05, -1.2794509530067444e-05, -1.1703930795192719e-05, -1.0613352060317993e-05, -9.522773325443268e-06, -8.432194590568542e-06, -7.341615855693817e-06, -6.251037120819092e-06, -5.1604583859443665e-06, -4.069879651069641e-06, -2.9793009161949158e-06, -1.8887221813201904e-06, -7.981434464454651e-07, 2.9243528842926025e-07, 1.3830140233039856e-06, 2.473592758178711e-06, 3.5641714930534363e-06, 4.654750227928162e-06, 5.745328962802887e-06, 6.835907697677612e-06, 7.926486432552338e-06, 9.017065167427063e-06, 1.0107643902301788e-05, 1.1198222637176514e-05, 1.2288801372051239e-05, 1.3379380106925964e-05, 1.446995884180069e-05, 1.5560537576675415e-05, 1.665111631155014e-05, 1.7741695046424866e-05, 1.883227378129959e-05, 1.9922852516174316e-05, 2.1013431251049042e-05, 2.2104009985923767e-05, 2.3194588720798492e-05, 2.4285167455673218e-05, 2.5375746190547943e-05, 2.646632492542267e-05, 2.7556903660297394e-05, 2.864748239517212e-05, 2.9738061130046844e-05, 3.082863986492157e-05, 3.1919218599796295e-05, 3.300979733467102e-05, 3.4100376069545746e-05, 3.519095480442047e-05, 3.6281533539295197e-05, 3.737211227416992e-05]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 0.0, 5.0, 4.0, 4.0, 3.0, 3.0, 6.0, 10.0, 19.0, 15.0, 23.0, 23.0, 24.0, 33.0, 20.0, 23.0, 25.0, 41.0, 36.0, 31.0, 37.0, 37.0, 37.0, 39.0, 39.0, 43.0, 46.0, 33.0, 39.0, 35.0, 35.0, 29.0, 33.0, 27.0, 22.0, 23.0, 17.0, 11.0, 18.0, 18.0, 8.0, 11.0, 5.0, 10.0, 2.0, 2.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.2578125, -5.07037353515625, -4.8829345703125, -4.69549560546875, -4.508056640625, -4.32061767578125, -4.1331787109375, -3.94573974609375, -3.75830078125, -3.57086181640625, -3.3834228515625, -3.19598388671875, -3.008544921875, -2.82110595703125, -2.6336669921875, -2.44622802734375, -2.2587890625, -2.07135009765625, -1.8839111328125, -1.69647216796875, -1.509033203125, -1.32159423828125, -1.1341552734375, -0.94671630859375, -0.75927734375, -0.57183837890625, -0.3843994140625, -0.19696044921875, -0.009521484375, 0.17791748046875, 0.3653564453125, 0.55279541015625, 0.740234375, 0.92767333984375, 1.1151123046875, 1.30255126953125, 1.489990234375, 1.67742919921875, 1.8648681640625, 2.05230712890625, 2.23974609375, 2.42718505859375, 2.6146240234375, 2.80206298828125, 2.989501953125, 3.17694091796875, 3.3643798828125, 3.55181884765625, 3.7392578125, 3.92669677734375, 4.1141357421875, 4.30157470703125, 4.489013671875, 4.67645263671875, 4.8638916015625, 5.05133056640625, 5.23876953125, 5.42620849609375, 5.6136474609375, 5.80108642578125, 5.988525390625, 6.17596435546875, 6.3634033203125, 6.55084228515625, 6.73828125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 8.0, 8.0, 9.0, 13.0, 18.0, 17.0, 33.0, 39.0, 54.0, 76.0, 110.0, 166.0, 261.0, 368.0, 555.0, 772.0, 1172.0, 1785.0, 2892.0, 4721.0, 7981.0, 13964.0, 25811.0, 50440.0, 108201.0, 327890.0, 295337.0, 100258.0, 47561.0, 24384.0, 13505.0, 7536.0, 4455.0, 2893.0, 1754.0, 1169.0, 740.0, 492.0, 344.0, 233.0, 164.0, 109.0, 91.0, 56.0, 24.0, 31.0, 19.0, 12.0, 9.0, 15.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-8.140625, -7.8594970703125, -7.578369140625, -7.2972412109375, -7.01611328125, -6.7349853515625, -6.453857421875, -6.1727294921875, -5.8916015625, -5.6104736328125, -5.329345703125, -5.0482177734375, -4.76708984375, -4.4859619140625, -4.204833984375, -3.9237060546875, -3.642578125, -3.3614501953125, -3.080322265625, -2.7991943359375, -2.51806640625, -2.2369384765625, -1.955810546875, -1.6746826171875, -1.3935546875, -1.1124267578125, -0.831298828125, -0.5501708984375, -0.26904296875, 0.0120849609375, 0.293212890625, 0.5743408203125, 0.85546875, 1.1365966796875, 1.417724609375, 1.6988525390625, 1.97998046875, 2.2611083984375, 2.542236328125, 2.8233642578125, 3.1044921875, 3.3856201171875, 3.666748046875, 3.9478759765625, 4.22900390625, 4.5101318359375, 4.791259765625, 5.0723876953125, 5.353515625, 5.6346435546875, 5.915771484375, 6.1968994140625, 6.47802734375, 6.7591552734375, 7.040283203125, 7.3214111328125, 7.6025390625, 7.8836669921875, 8.164794921875, 8.4459228515625, 8.72705078125, 9.0081787109375, 9.289306640625, 9.5704345703125, 9.8515625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 6.0, 5.0, 1.0, 7.0, 10.0, 12.0, 14.0, 25.0, 21.0, 23.0, 35.0, 41.0, 34.0, 58.0, 70.0, 75.0, 104.0, 352.0, 1528.0, 190.0, 82.0, 70.0, 40.0, 55.0, 39.0, 42.0, 25.0, 24.0, 21.0, 15.0, 14.0, 5.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.40625, -19.656494140625, -18.90673828125, -18.156982421875, -17.4072265625, -16.657470703125, -15.90771484375, -15.157958984375, -14.408203125, -13.658447265625, -12.90869140625, -12.158935546875, -11.4091796875, -10.659423828125, -9.90966796875, -9.159912109375, -8.41015625, -7.660400390625, -6.91064453125, -6.160888671875, -5.4111328125, -4.661376953125, -3.91162109375, -3.161865234375, -2.412109375, -1.662353515625, -0.91259765625, -0.162841796875, 0.5869140625, 1.336669921875, 2.08642578125, 2.836181640625, 3.5859375, 4.335693359375, 5.08544921875, 5.835205078125, 6.5849609375, 7.334716796875, 8.08447265625, 8.834228515625, 9.583984375, 10.333740234375, 11.08349609375, 11.833251953125, 12.5830078125, 13.332763671875, 14.08251953125, 14.832275390625, 15.58203125, 16.331787109375, 17.08154296875, 17.831298828125, 18.5810546875, 19.330810546875, 20.08056640625, 20.830322265625, 21.580078125, 22.329833984375, 23.07958984375, 23.829345703125, 24.5791015625, 25.328857421875, 26.07861328125, 26.828369140625, 27.578125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 9.0, 3.0, 7.0, 11.0, 26.0, 19.0, 29.0, 43.0, 57.0, 86.0, 156.0, 315.0, 885.0, 3637.0, 22046.0, 271274.0, 2696200.0, 133002.0, 13977.0, 2526.0, 715.0, 239.0, 111.0, 106.0, 65.0, 41.0, 35.0, 22.0, 16.0, 14.0, 11.0, 6.0, 6.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.75, -33.7392578125, -32.728515625, -31.7177734375, -30.70703125, -29.6962890625, -28.685546875, -27.6748046875, -26.6640625, -25.6533203125, -24.642578125, -23.6318359375, -22.62109375, -21.6103515625, -20.599609375, -19.5888671875, -18.578125, -17.5673828125, -16.556640625, -15.5458984375, -14.53515625, -13.5244140625, -12.513671875, -11.5029296875, -10.4921875, -9.4814453125, -8.470703125, -7.4599609375, -6.44921875, -5.4384765625, -4.427734375, -3.4169921875, -2.40625, -1.3955078125, -0.384765625, 0.6259765625, 1.63671875, 2.6474609375, 3.658203125, 4.6689453125, 5.6796875, 6.6904296875, 7.701171875, 8.7119140625, 9.72265625, 10.7333984375, 11.744140625, 12.7548828125, 13.765625, 14.7763671875, 15.787109375, 16.7978515625, 17.80859375, 18.8193359375, 19.830078125, 20.8408203125, 21.8515625, 22.8623046875, 23.873046875, 24.8837890625, 25.89453125, 26.9052734375, 27.916015625, 28.9267578125, 29.9375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 22.0, 31.0, 44.0, 83.0, 117.0, 171.0, 145.0, 130.0, 100.0, 68.0, 40.0, 26.0, 10.0, 7.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.14958190917969, -41.562477111816406, -39.975372314453125, -38.388267517089844, -36.80116271972656, -35.21405792236328, -33.626953125, -32.03984832763672, -30.45274543762207, -28.86564064025879, -27.278535842895508, -25.69143295288086, -24.104328155517578, -22.517223358154297, -20.930118560791016, -19.343013763427734, -17.755908966064453, -16.168804168701172, -14.58169937133789, -12.994595527648926, -11.407490730285645, -9.820385932922363, -8.233282089233398, -6.646177291870117, -5.059072494506836, -3.471967935562134, -1.8848633766174316, -0.2977590560913086, 1.2893457412719727, 2.876450538635254, 4.463554382324219, 6.0506591796875, 7.637767791748047, 9.224872589111328, 10.81197738647461, 12.399081230163574, 13.986186027526855, 15.573290824890137, 17.1603946685791, 18.747499465942383, 20.334604263305664, 21.921709060668945, 23.508813858032227, 25.095916748046875, 26.683021545410156, 28.270126342773438, 29.85723114013672, 31.4443359375, 33.03144073486328, 34.61854553222656, 36.205650329589844, 37.792755126953125, 39.379859924316406, 40.96696472167969, 42.55406951904297, 44.14117431640625, 45.72827911376953, 47.31538391113281, 48.902488708496094, 50.489593505859375, 52.076698303222656, 53.66380310058594, 55.25090789794922, 56.8380126953125, 58.425113677978516]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 0.0, 7.0, 5.0, 3.0, 3.0, 9.0, 5.0, 10.0, 7.0, 4.0, 11.0, 16.0, 21.0, 21.0, 28.0, 23.0, 27.0, 26.0, 40.0, 42.0, 47.0, 51.0, 44.0, 41.0, 57.0, 45.0, 32.0, 37.0, 32.0, 27.0, 39.0, 34.0, 32.0, 21.0, 24.0, 12.0, 31.0, 18.0, 13.0, 17.0, 13.0, 4.0, 5.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.379905700683594, -43.79947280883789, -42.21903991699219, -40.638607025146484, -39.05817413330078, -37.47774124145508, -35.897308349609375, -34.316871643066406, -32.73644256591797, -31.156009674072266, -29.575576782226562, -27.99514389038086, -26.414710998535156, -24.834278106689453, -23.253843307495117, -21.673410415649414, -20.092975616455078, -18.512542724609375, -16.932109832763672, -15.351675987243652, -13.77124309539795, -12.190810203552246, -10.610376358032227, -9.029943466186523, -7.44951057434082, -5.869077682495117, -4.288644313812256, -2.7082109451293945, -1.1277780532836914, 0.4526548385620117, 2.0330886840820312, 3.6135215759277344, 5.193950653076172, 6.774383544921875, 8.354816436767578, 9.935250282287598, 11.5156831741333, 13.096116065979004, 14.676549911499023, 16.256982803344727, 17.83741569519043, 19.417848587036133, 20.998281478881836, 22.578716278076172, 24.159149169921875, 25.739582061767578, 27.32001495361328, 28.900447845458984, 30.480880737304688, 32.06131362915039, 33.641746520996094, 35.2221794128418, 36.8026123046875, 38.3830451965332, 39.963478088378906, 41.543914794921875, 43.12434387207031, 44.704776763916016, 46.28520965576172, 47.86564254760742, 49.446075439453125, 51.02650833129883, 52.60694122314453, 54.1873779296875, 55.7678108215332]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 5.0, 2.0, 7.0, 6.0, 10.0, 13.0, 9.0, 23.0, 19.0, 24.0, 31.0, 17.0, 22.0, 29.0, 36.0, 30.0, 28.0, 36.0, 47.0, 36.0, 36.0, 41.0, 38.0, 44.0, 43.0, 40.0, 40.0, 27.0, 27.0, 34.0, 26.0, 32.0, 22.0, 27.0, 15.0, 7.0, 9.0, 16.0, 14.0, 10.0, 7.0, 3.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.44921875, -5.260009765625, -5.07080078125, -4.881591796875, -4.6923828125, -4.503173828125, -4.31396484375, -4.124755859375, -3.935546875, -3.746337890625, -3.55712890625, -3.367919921875, -3.1787109375, -2.989501953125, -2.80029296875, -2.611083984375, -2.421875, -2.232666015625, -2.04345703125, -1.854248046875, -1.6650390625, -1.475830078125, -1.28662109375, -1.097412109375, -0.908203125, -0.718994140625, -0.52978515625, -0.340576171875, -0.1513671875, 0.037841796875, 0.22705078125, 0.416259765625, 0.60546875, 0.794677734375, 0.98388671875, 1.173095703125, 1.3623046875, 1.551513671875, 1.74072265625, 1.929931640625, 2.119140625, 2.308349609375, 2.49755859375, 2.686767578125, 2.8759765625, 3.065185546875, 3.25439453125, 3.443603515625, 3.6328125, 3.822021484375, 4.01123046875, 4.200439453125, 4.3896484375, 4.578857421875, 4.76806640625, 4.957275390625, 5.146484375, 5.335693359375, 5.52490234375, 5.714111328125, 5.9033203125, 6.092529296875, 6.28173828125, 6.470947265625, 6.66015625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 11.0, 16.0, 15.0, 25.0, 38.0, 63.0, 85.0, 163.0, 234.0, 439.0, 815.0, 1418.0, 3012.0, 6802.0, 16768.0, 47568.0, 173548.0, 1195427.0, 2320913.0, 310676.0, 73974.0, 24724.0, 9354.0, 3984.0, 1946.0, 927.0, 477.0, 337.0, 166.0, 120.0, 88.0, 48.0, 19.0, 26.0, 15.0, 11.0, 10.0, 8.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4453125, -13.9820556640625, -13.518798828125, -13.0555419921875, -12.59228515625, -12.1290283203125, -11.665771484375, -11.2025146484375, -10.7392578125, -10.2760009765625, -9.812744140625, -9.3494873046875, -8.88623046875, -8.4229736328125, -7.959716796875, -7.4964599609375, -7.033203125, -6.5699462890625, -6.106689453125, -5.6434326171875, -5.18017578125, -4.7169189453125, -4.253662109375, -3.7904052734375, -3.3271484375, -2.8638916015625, -2.400634765625, -1.9373779296875, -1.47412109375, -1.0108642578125, -0.547607421875, -0.0843505859375, 0.37890625, 0.8421630859375, 1.305419921875, 1.7686767578125, 2.23193359375, 2.6951904296875, 3.158447265625, 3.6217041015625, 4.0849609375, 4.5482177734375, 5.011474609375, 5.4747314453125, 5.93798828125, 6.4012451171875, 6.864501953125, 7.3277587890625, 7.791015625, 8.2542724609375, 8.717529296875, 9.1807861328125, 9.64404296875, 10.1072998046875, 10.570556640625, 11.0338134765625, 11.4970703125, 11.9603271484375, 12.423583984375, 12.8868408203125, 13.35009765625, 13.8133544921875, 14.276611328125, 14.7398681640625, 15.203125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 10.0, 18.0, 17.0, 24.0, 41.0, 49.0, 77.0, 89.0, 171.0, 255.0, 350.0, 526.0, 685.0, 558.0, 360.0, 258.0, 180.0, 121.0, 69.0, 55.0, 46.0, 33.0, 28.0, 13.0, 17.0, 5.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.9765625, -13.572265625, -13.16796875, -12.763671875, -12.359375, -11.955078125, -11.55078125, -11.146484375, -10.7421875, -10.337890625, -9.93359375, -9.529296875, -9.125, -8.720703125, -8.31640625, -7.912109375, -7.5078125, -7.103515625, -6.69921875, -6.294921875, -5.890625, -5.486328125, -5.08203125, -4.677734375, -4.2734375, -3.869140625, -3.46484375, -3.060546875, -2.65625, -2.251953125, -1.84765625, -1.443359375, -1.0390625, -0.634765625, -0.23046875, 0.173828125, 0.578125, 0.982421875, 1.38671875, 1.791015625, 2.1953125, 2.599609375, 3.00390625, 3.408203125, 3.8125, 4.216796875, 4.62109375, 5.025390625, 5.4296875, 5.833984375, 6.23828125, 6.642578125, 7.046875, 7.451171875, 7.85546875, 8.259765625, 8.6640625, 9.068359375, 9.47265625, 9.876953125, 10.28125, 10.685546875, 11.08984375, 11.494140625, 11.8984375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 7.0, 9.0, 14.0, 23.0, 25.0, 40.0, 100.0, 132.0, 258.0, 520.0, 1384.0, 4404.0, 22311.0, 193966.0, 3230392.0, 675253.0, 53498.0, 8270.0, 2113.0, 761.0, 367.0, 180.0, 96.0, 70.0, 34.0, 21.0, 15.0, 10.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.6875, -28.65380859375, -27.6201171875, -26.58642578125, -25.552734375, -24.51904296875, -23.4853515625, -22.45166015625, -21.41796875, -20.38427734375, -19.3505859375, -18.31689453125, -17.283203125, -16.24951171875, -15.2158203125, -14.18212890625, -13.1484375, -12.11474609375, -11.0810546875, -10.04736328125, -9.013671875, -7.97998046875, -6.9462890625, -5.91259765625, -4.87890625, -3.84521484375, -2.8115234375, -1.77783203125, -0.744140625, 0.28955078125, 1.3232421875, 2.35693359375, 3.390625, 4.42431640625, 5.4580078125, 6.49169921875, 7.525390625, 8.55908203125, 9.5927734375, 10.62646484375, 11.66015625, 12.69384765625, 13.7275390625, 14.76123046875, 15.794921875, 16.82861328125, 17.8623046875, 18.89599609375, 19.9296875, 20.96337890625, 21.9970703125, 23.03076171875, 24.064453125, 25.09814453125, 26.1318359375, 27.16552734375, 28.19921875, 29.23291015625, 30.2666015625, 31.30029296875, 32.333984375, 33.36767578125, 34.4013671875, 35.43505859375, 36.46875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 20.0, 58.0, 101.0, 162.0, 222.0, 217.0, 138.0, 63.0, 19.0, 12.0], "bins": [-218.2934112548828, -214.56678771972656, -210.8401641845703, -207.11354064941406, -203.3869171142578, -199.66029357910156, -195.9336700439453, -192.20704650878906, -188.4804229736328, -184.75379943847656, -181.0271759033203, -177.30055236816406, -173.5739288330078, -169.84730529785156, -166.1206817626953, -162.39405822753906, -158.6674346923828, -154.94081115722656, -151.2141876220703, -147.48756408691406, -143.7609405517578, -140.03431701660156, -136.3076934814453, -132.58106994628906, -128.8544464111328, -125.12782287597656, -121.40119934082031, -117.67457580566406, -113.94795227050781, -110.22132873535156, -106.49470520019531, -102.76808166503906, -99.04144287109375, -95.3148193359375, -91.58819580078125, -87.861572265625, -84.13494873046875, -80.4083251953125, -76.68170166015625, -72.955078125, -69.22845458984375, -65.5018310546875, -61.77520751953125, -58.048583984375, -54.32196044921875, -50.5953369140625, -46.86871337890625, -43.14208984375, -39.41546630859375, -35.6888427734375, -31.96221923828125, -28.235595703125, -24.50897216796875, -20.782346725463867, -17.055723190307617, -13.329099655151367, -9.602474212646484, -5.875850677490234, -2.149226665496826, 1.577397346496582, 5.304020881652832, 9.030645370483398, 12.757268905639648, 16.4838924407959, 20.21051597595215]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 0.0, 6.0, 4.0, 2.0, 3.0, 6.0, 8.0, 8.0, 18.0, 13.0, 14.0, 24.0, 17.0, 21.0, 19.0, 23.0, 35.0, 25.0, 31.0, 42.0, 37.0, 44.0, 53.0, 45.0, 45.0, 41.0, 52.0, 43.0, 39.0, 36.0, 36.0, 25.0, 32.0, 23.0, 21.0, 13.0, 15.0, 14.0, 10.0, 14.0, 6.0, 13.0, 8.0, 3.0, 7.0, 2.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-35.807167053222656, -34.7009391784668, -33.59470748901367, -32.48847961425781, -31.382247924804688, -30.276018142700195, -29.169788360595703, -28.063560485839844, -26.95732879638672, -25.851099014282227, -24.744869232177734, -23.638639450073242, -22.53240966796875, -21.426179885864258, -20.319950103759766, -19.213722229003906, -18.107492446899414, -17.001262664794922, -15.89503288269043, -14.788803100585938, -13.682573318481445, -12.576343536376953, -11.470114707946777, -10.363884925842285, -9.257655143737793, -8.1514253616333, -7.045195579528809, -5.938966274261475, -4.832736492156982, -3.7265067100524902, -2.6202774047851562, -1.514047622680664, -0.4078178405761719, 0.6984118223190308, 1.8046414852142334, 2.9108710289001465, 4.017100811004639, 5.123330593109131, 6.229559898376465, 7.335789680480957, 8.44201946258545, 9.548249244689941, 10.654479026794434, 11.76070785522461, 12.866937637329102, 13.973167419433594, 15.079397201538086, 16.185626983642578, 17.29185676574707, 18.398086547851562, 19.504316329956055, 20.610546112060547, 21.71677589416504, 22.82300567626953, 23.92923355102539, 25.035465240478516, 26.141693115234375, 27.247922897338867, 28.35415267944336, 29.46038246154785, 30.566612243652344, 31.672842025756836, 32.77907180786133, 33.88529968261719, 34.99153137207031]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 9.0, 7.0, 15.0, 15.0, 14.0, 11.0, 16.0, 19.0, 23.0, 25.0, 27.0, 23.0, 34.0, 35.0, 26.0, 34.0, 38.0, 36.0, 40.0, 46.0, 42.0, 32.0, 45.0, 28.0, 36.0, 44.0, 29.0, 27.0, 35.0, 19.0, 22.0, 23.0, 25.0, 11.0, 13.0, 16.0, 9.0, 9.0, 10.0, 5.0, 4.0, 8.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.31640625, -5.1279296875, -4.939453125, -4.7509765625, -4.5625, -4.3740234375, -4.185546875, -3.9970703125, -3.80859375, -3.6201171875, -3.431640625, -3.2431640625, -3.0546875, -2.8662109375, -2.677734375, -2.4892578125, -2.30078125, -2.1123046875, -1.923828125, -1.7353515625, -1.546875, -1.3583984375, -1.169921875, -0.9814453125, -0.79296875, -0.6044921875, -0.416015625, -0.2275390625, -0.0390625, 0.1494140625, 0.337890625, 0.5263671875, 0.71484375, 0.9033203125, 1.091796875, 1.2802734375, 1.46875, 1.6572265625, 1.845703125, 2.0341796875, 2.22265625, 2.4111328125, 2.599609375, 2.7880859375, 2.9765625, 3.1650390625, 3.353515625, 3.5419921875, 3.73046875, 3.9189453125, 4.107421875, 4.2958984375, 4.484375, 4.6728515625, 4.861328125, 5.0498046875, 5.23828125, 5.4267578125, 5.615234375, 5.8037109375, 5.9921875, 6.1806640625, 6.369140625, 6.5576171875, 6.74609375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 8.0, 15.0, 26.0, 32.0, 45.0, 60.0, 76.0, 154.0, 183.0, 315.0, 442.0, 619.0, 933.0, 1347.0, 2019.0, 2893.0, 4281.0, 6506.0, 9490.0, 14367.0, 21497.0, 33335.0, 53327.0, 94287.0, 200397.0, 276131.0, 133993.0, 69998.0, 41471.0, 26887.0, 17498.0, 11701.0, 7843.0, 5225.0, 3578.0, 2404.0, 1625.0, 1121.0, 798.0, 486.0, 361.0, 251.0, 169.0, 108.0, 94.0, 58.0, 30.0, 27.0, 13.0, 11.0, 12.0, 3.0, 5.0, 3.0, 4.0], "bins": [-0.214599609375, -0.20833396911621094, -0.20206832885742188, -0.1958026885986328, -0.18953704833984375, -0.1832714080810547, -0.17700576782226562, -0.17074012756347656, -0.1644744873046875, -0.15820884704589844, -0.15194320678710938, -0.1456775665283203, -0.13941192626953125, -0.1331462860107422, -0.12688064575195312, -0.12061500549316406, -0.114349365234375, -0.10808372497558594, -0.10181808471679688, -0.09555244445800781, -0.08928680419921875, -0.08302116394042969, -0.07675552368164062, -0.07048988342285156, -0.0642242431640625, -0.05795860290527344, -0.051692962646484375, -0.04542732238769531, -0.03916168212890625, -0.03289604187011719, -0.026630401611328125, -0.020364761352539062, -0.01409912109375, -0.007833480834960938, -0.001567840576171875, 0.0046977996826171875, 0.01096343994140625, 0.017229080200195312, 0.023494720458984375, 0.029760360717773438, 0.0360260009765625, 0.04229164123535156, 0.048557281494140625, 0.05482292175292969, 0.06108856201171875, 0.06735420227050781, 0.07361984252929688, 0.07988548278808594, 0.086151123046875, 0.09241676330566406, 0.09868240356445312, 0.10494804382324219, 0.11121368408203125, 0.11747932434082031, 0.12374496459960938, 0.13001060485839844, 0.1362762451171875, 0.14254188537597656, 0.14880752563476562, 0.1550731658935547, 0.16133880615234375, 0.1676044464111328, 0.17387008666992188, 0.18013572692871094, 0.1864013671875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 6.0, 9.0, 8.0, 12.0, 6.0, 13.0, 17.0, 16.0, 20.0, 20.0, 30.0, 34.0, 36.0, 24.0, 34.0, 32.0, 30.0, 36.0, 41.0, 32.0, 1057.0, 39.0, 41.0, 38.0, 41.0, 36.0, 47.0, 24.0, 29.0, 24.0, 28.0, 22.0, 22.0, 17.0, 20.0, 18.0, 14.0, 7.0, 2.0, 8.0, 4.0, 11.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.09765625, -3.970703125, -3.84375, -3.716796875, -3.58984375, -3.462890625, -3.3359375, -3.208984375, -3.08203125, -2.955078125, -2.828125, -2.701171875, -2.57421875, -2.447265625, -2.3203125, -2.193359375, -2.06640625, -1.939453125, -1.8125, -1.685546875, -1.55859375, -1.431640625, -1.3046875, -1.177734375, -1.05078125, -0.923828125, -0.796875, -0.669921875, -0.54296875, -0.416015625, -0.2890625, -0.162109375, -0.03515625, 0.091796875, 0.21875, 0.345703125, 0.47265625, 0.599609375, 0.7265625, 0.853515625, 0.98046875, 1.107421875, 1.234375, 1.361328125, 1.48828125, 1.615234375, 1.7421875, 1.869140625, 1.99609375, 2.123046875, 2.25, 2.376953125, 2.50390625, 2.630859375, 2.7578125, 2.884765625, 3.01171875, 3.138671875, 3.265625, 3.392578125, 3.51953125, 3.646484375, 3.7734375, 3.900390625, 4.02734375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 13.0, 19.0, 21.0, 32.0, 54.0, 75.0, 106.0, 180.0, 273.0, 380.0, 577.0, 868.0, 1267.0, 2083.0, 2963.0, 4737.0, 7473.0, 11573.0, 18551.0, 30282.0, 51008.0, 90144.0, 182335.0, 1330315.0, 159265.0, 80853.0, 46468.0, 27882.0, 17106.0, 10708.0, 6880.0, 4310.0, 2865.0, 1813.0, 1213.0, 829.0, 521.0, 355.0, 249.0, 160.0, 108.0, 64.0, 48.0, 40.0, 23.0, 13.0, 14.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1451416015625, -0.14066314697265625, -0.1361846923828125, -0.13170623779296875, -0.127227783203125, -0.12274932861328125, -0.1182708740234375, -0.11379241943359375, -0.10931396484375, -0.10483551025390625, -0.1003570556640625, -0.09587860107421875, -0.091400146484375, -0.08692169189453125, -0.0824432373046875, -0.07796478271484375, -0.073486328125, -0.06900787353515625, -0.0645294189453125, -0.06005096435546875, -0.055572509765625, -0.05109405517578125, -0.0466156005859375, -0.04213714599609375, -0.03765869140625, -0.03318023681640625, -0.0287017822265625, -0.02422332763671875, -0.019744873046875, -0.01526641845703125, -0.0107879638671875, -0.00630950927734375, -0.0018310546875, 0.00264739990234375, 0.0071258544921875, 0.01160430908203125, 0.016082763671875, 0.02056121826171875, 0.0250396728515625, 0.02951812744140625, 0.03399658203125, 0.03847503662109375, 0.0429534912109375, 0.04743194580078125, 0.051910400390625, 0.05638885498046875, 0.0608673095703125, 0.06534576416015625, 0.06982421875, 0.07430267333984375, 0.0787811279296875, 0.08325958251953125, 0.087738037109375, 0.09221649169921875, 0.0966949462890625, 0.10117340087890625, 0.10565185546875, 0.11013031005859375, 0.1146087646484375, 0.11908721923828125, 0.123565673828125, 0.12804412841796875, 0.1325225830078125, 0.13700103759765625, 0.1414794921875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 7.0, 3.0, 8.0, 10.0, 14.0, 13.0, 24.0, 12.0, 30.0, 19.0, 46.0, 36.0, 24.0, 53.0, 42.0, 56.0, 59.0, 49.0, 50.0, 47.0, 44.0, 50.0, 39.0, 35.0, 34.0, 31.0, 26.0, 27.0, 25.0, 9.0, 19.0, 14.0, 8.0, 5.0, 8.0, 7.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.488229751586914e-05, -4.3081119656562805e-05, -4.127994179725647e-05, -3.9478763937950134e-05, -3.76775860786438e-05, -3.587640821933746e-05, -3.407523036003113e-05, -3.227405250072479e-05, -3.0472874641418457e-05, -2.867169678211212e-05, -2.6870518922805786e-05, -2.506934106349945e-05, -2.3268163204193115e-05, -2.146698534488678e-05, -1.9665807485580444e-05, -1.786462962627411e-05, -1.6063451766967773e-05, -1.4262273907661438e-05, -1.2461096048355103e-05, -1.0659918189048767e-05, -8.858740329742432e-06, -7.057562470436096e-06, -5.256384611129761e-06, -3.4552067518234253e-06, -1.6540288925170898e-06, 1.471489667892456e-07, 1.948326826095581e-06, 3.7495046854019165e-06, 5.550682544708252e-06, 7.351860404014587e-06, 9.153038263320923e-06, 1.0954216122627258e-05, 1.2755393981933594e-05, 1.455657184123993e-05, 1.6357749700546265e-05, 1.81589275598526e-05, 1.9960105419158936e-05, 2.176128327846527e-05, 2.3562461137771606e-05, 2.5363638997077942e-05, 2.7164816856384277e-05, 2.8965994715690613e-05, 3.076717257499695e-05, 3.2568350434303284e-05, 3.436952829360962e-05, 3.6170706152915955e-05, 3.797188401222229e-05, 3.9773061871528625e-05, 4.157423973083496e-05, 4.3375417590141296e-05, 4.517659544944763e-05, 4.697777330875397e-05, 4.87789511680603e-05, 5.058012902736664e-05, 5.2381306886672974e-05, 5.418248474597931e-05, 5.5983662605285645e-05, 5.778484046459198e-05, 5.9586018323898315e-05, 6.138719618320465e-05, 6.318837404251099e-05, 6.498955190181732e-05, 6.679072976112366e-05, 6.859190762042999e-05, 7.039308547973633e-05]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 6.0, 8.0, 12.0, 8.0, 15.0, 19.0, 23.0, 26.0, 33.0, 52.0, 47.0, 83.0, 123.0, 224.0, 535.0, 5574.0, 596546.0, 439872.0, 4214.0, 519.0, 186.0, 113.0, 73.0, 62.0, 51.0, 35.0, 19.0, 20.0, 18.0, 14.0, 8.0, 3.0, 7.0, 5.0, 1.0, 5.0, 0.0, 1.0, 1.0], "bins": [-0.001674652099609375, -0.001634739339351654, -0.001594826579093933, -0.0015549138188362122, -0.0015150010585784912, -0.0014750882983207703, -0.0014351755380630493, -0.0013952627778053284, -0.0013553500175476074, -0.0013154372572898865, -0.0012755244970321655, -0.0012356117367744446, -0.0011956989765167236, -0.0011557862162590027, -0.0011158734560012817, -0.0010759606957435608, -0.0010360479354858398, -0.000996135175228119, -0.000956222414970398, -0.000916309654712677, -0.0008763968944549561, -0.0008364841341972351, -0.0007965713739395142, -0.0007566586136817932, -0.0007167458534240723, -0.0006768330931663513, -0.0006369203329086304, -0.0005970075726509094, -0.0005570948123931885, -0.0005171820521354675, -0.0004772692918777466, -0.00043735653162002563, -0.0003974437713623047, -0.00035753101110458374, -0.0003176182508468628, -0.00027770549058914185, -0.0002377927303314209, -0.00019787997007369995, -0.000157967209815979, -0.00011805444955825806, -7.814168930053711e-05, -3.822892904281616e-05, 1.6838312149047852e-06, 4.159659147262573e-05, 8.150935173034668e-05, 0.00012142211198806763, 0.00016133487224578857, 0.00020124763250350952, 0.00024116039276123047, 0.0002810731530189514, 0.00032098591327667236, 0.0003608986735343933, 0.00040081143379211426, 0.0004407241940498352, 0.00048063695430755615, 0.0005205497145652771, 0.000560462474822998, 0.000600375235080719, 0.0006402879953384399, 0.0006802007555961609, 0.0007201135158538818, 0.0007600262761116028, 0.0007999390363693237, 0.0008398517966270447, 0.0008797645568847656]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 31.0, 116.0, 266.0, 330.0, 169.0, 59.0, 27.0, 9.0, 0.0, 2.0], "bins": [-0.0003462833119556308, -0.00034024176420643926, -0.0003342002455610782, -0.00032815869781188667, -0.00032211715006269515, -0.0003160756314173341, -0.00031003408366814256, -0.00030399253591895103, -0.00029795101727358997, -0.00029190946952439845, -0.0002858679508790374, -0.00027982640312984586, -0.00027378485538065434, -0.00026774333673529327, -0.00026170178898610175, -0.0002556602412369102, -0.00024961872259154916, -0.00024357718939427286, -0.00023753564164508134, -0.00023149410844780505, -0.00022545257525052875, -0.00021941104205325246, -0.00021336949430406094, -0.00020732796110678464, -0.0002012863988056779, -0.0001952448656084016, -0.00018920331785921007, -0.00018316178466193378, -0.00017712025146465749, -0.0001710787182673812, -0.00016503717051818967, -0.00015899563732091337, -0.00015295410412363708, -0.00014691257092636079, -0.00014087102317716926, -0.00013482948997989297, -0.00012878795678261667, -0.00012274642358534038, -0.00011670487583614886, -0.00011066334263887256, -0.00010462180216563866, -9.858026169240475e-05, -9.253872849512845e-05, -8.649718802189454e-05, -8.045564754866064e-05, -7.441411435138434e-05, -6.837257387815043e-05, -6.233103340491652e-05, -5.628950020764023e-05, -5.024796337238513e-05, -4.420642653713003e-05, -3.816488606389612e-05, -3.212334922864102e-05, -2.6081812393385917e-05, -2.004027192015201e-05, -1.3998735084896907e-05, -7.957198249641806e-06, -1.915660504892003e-06, 4.1258772398578e-06, 1.0167415894102305e-05, 1.6208952729357406e-05, 2.2250489564612508e-05, 2.8292030037846416e-05, 3.433356687310152e-05, 4.037510370835662e-05]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 8.0, 3.0, 3.0, 2.0, 5.0, 14.0, 2.0, 15.0, 9.0, 12.0, 10.0, 17.0, 23.0, 15.0, 19.0, 30.0, 39.0, 35.0, 29.0, 32.0, 32.0, 34.0, 48.0, 34.0, 32.0, 33.0, 39.0, 47.0, 42.0, 38.0, 23.0, 27.0, 36.0, 30.0, 24.0, 21.0, 27.0, 30.0, 15.0, 12.0, 13.0, 7.0, 15.0, 12.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.123283386230469e-05, -3.0227936804294586e-05, -2.9223039746284485e-05, -2.8218142688274384e-05, -2.7213245630264282e-05, -2.620834857225418e-05, -2.520345151424408e-05, -2.4198554456233978e-05, -2.3193657398223877e-05, -2.2188760340213776e-05, -2.1183863282203674e-05, -2.0178966224193573e-05, -1.917406916618347e-05, -1.816917210817337e-05, -1.716427505016327e-05, -1.6159377992153168e-05, -1.5154480934143066e-05, -1.4149583876132965e-05, -1.3144686818122864e-05, -1.2139789760112762e-05, -1.1134892702102661e-05, -1.012999564409256e-05, -9.125098586082458e-06, -8.120201528072357e-06, -7.115304470062256e-06, -6.1104074120521545e-06, -5.105510354042053e-06, -4.100613296031952e-06, -3.0957162380218506e-06, -2.0908191800117493e-06, -1.085922122001648e-06, -8.102506399154663e-08, 9.238719940185547e-07, 1.928769052028656e-06, 2.9336661100387573e-06, 3.938563168048859e-06, 4.94346022605896e-06, 5.948357284069061e-06, 6.953254342079163e-06, 7.958151400089264e-06, 8.963048458099365e-06, 9.967945516109467e-06, 1.0972842574119568e-05, 1.197773963212967e-05, 1.298263669013977e-05, 1.3987533748149872e-05, 1.4992430806159973e-05, 1.5997327864170074e-05, 1.7002224922180176e-05, 1.8007121980190277e-05, 1.901201903820038e-05, 2.001691609621048e-05, 2.102181315422058e-05, 2.2026710212230682e-05, 2.3031607270240784e-05, 2.4036504328250885e-05, 2.5041401386260986e-05, 2.6046298444271088e-05, 2.705119550228119e-05, 2.805609256029129e-05, 2.906098961830139e-05, 3.0065886676311493e-05, 3.1070783734321594e-05, 3.2075680792331696e-05, 3.30805778503418e-05]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 9.0, 7.0, 15.0, 15.0, 14.0, 11.0, 16.0, 19.0, 23.0, 25.0, 27.0, 23.0, 34.0, 35.0, 26.0, 34.0, 38.0, 36.0, 40.0, 46.0, 42.0, 32.0, 45.0, 28.0, 36.0, 44.0, 29.0, 27.0, 35.0, 19.0, 22.0, 23.0, 25.0, 11.0, 13.0, 16.0, 9.0, 9.0, 10.0, 5.0, 4.0, 8.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.31640625, -5.1279296875, -4.939453125, -4.7509765625, -4.5625, -4.3740234375, -4.185546875, -3.9970703125, -3.80859375, -3.6201171875, -3.431640625, -3.2431640625, -3.0546875, -2.8662109375, -2.677734375, -2.4892578125, -2.30078125, -2.1123046875, -1.923828125, -1.7353515625, -1.546875, -1.3583984375, -1.169921875, -0.9814453125, -0.79296875, -0.6044921875, -0.416015625, -0.2275390625, -0.0390625, 0.1494140625, 0.337890625, 0.5263671875, 0.71484375, 0.9033203125, 1.091796875, 1.2802734375, 1.46875, 1.6572265625, 1.845703125, 2.0341796875, 2.22265625, 2.4111328125, 2.599609375, 2.7880859375, 2.9765625, 3.1650390625, 3.353515625, 3.5419921875, 3.73046875, 3.9189453125, 4.107421875, 4.2958984375, 4.484375, 4.6728515625, 4.861328125, 5.0498046875, 5.23828125, 5.4267578125, 5.615234375, 5.8037109375, 5.9921875, 6.1806640625, 6.369140625, 6.5576171875, 6.74609375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 11.0, 10.0, 24.0, 31.0, 47.0, 59.0, 82.0, 146.0, 192.0, 348.0, 511.0, 812.0, 1390.0, 2547.0, 4562.0, 8250.0, 15384.0, 29496.0, 60762.0, 166926.0, 490329.0, 149346.0, 56381.0, 28167.0, 14545.0, 7897.0, 4276.0, 2478.0, 1369.0, 806.0, 486.0, 273.0, 190.0, 135.0, 87.0, 69.0, 44.0, 21.0, 23.0, 14.0, 6.0, 7.0, 4.0, 7.0, 2.0, 0.0, 1.0], "bins": [-13.4609375, -13.1015625, -12.7421875, -12.3828125, -12.0234375, -11.6640625, -11.3046875, -10.9453125, -10.5859375, -10.2265625, -9.8671875, -9.5078125, -9.1484375, -8.7890625, -8.4296875, -8.0703125, -7.7109375, -7.3515625, -6.9921875, -6.6328125, -6.2734375, -5.9140625, -5.5546875, -5.1953125, -4.8359375, -4.4765625, -4.1171875, -3.7578125, -3.3984375, -3.0390625, -2.6796875, -2.3203125, -1.9609375, -1.6015625, -1.2421875, -0.8828125, -0.5234375, -0.1640625, 0.1953125, 0.5546875, 0.9140625, 1.2734375, 1.6328125, 1.9921875, 2.3515625, 2.7109375, 3.0703125, 3.4296875, 3.7890625, 4.1484375, 4.5078125, 4.8671875, 5.2265625, 5.5859375, 5.9453125, 6.3046875, 6.6640625, 7.0234375, 7.3828125, 7.7421875, 8.1015625, 8.4609375, 8.8203125, 9.1796875, 9.5390625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 5.0, 4.0, 1.0, 4.0, 2.0, 5.0, 8.0, 12.0, 8.0, 15.0, 11.0, 13.0, 14.0, 19.0, 25.0, 30.0, 26.0, 29.0, 40.0, 39.0, 49.0, 58.0, 87.0, 119.0, 220.0, 1452.0, 175.0, 118.0, 70.0, 61.0, 43.0, 39.0, 43.0, 27.0, 26.0, 23.0, 23.0, 22.0, 17.0, 13.0, 8.0, 9.0, 16.0, 10.0, 6.0, 4.0, 6.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.9765625, -14.4493408203125, -13.922119140625, -13.3948974609375, -12.86767578125, -12.3404541015625, -11.813232421875, -11.2860107421875, -10.7587890625, -10.2315673828125, -9.704345703125, -9.1771240234375, -8.64990234375, -8.1226806640625, -7.595458984375, -7.0682373046875, -6.541015625, -6.0137939453125, -5.486572265625, -4.9593505859375, -4.43212890625, -3.9049072265625, -3.377685546875, -2.8504638671875, -2.3232421875, -1.7960205078125, -1.268798828125, -0.7415771484375, -0.21435546875, 0.3128662109375, 0.840087890625, 1.3673095703125, 1.89453125, 2.4217529296875, 2.948974609375, 3.4761962890625, 4.00341796875, 4.5306396484375, 5.057861328125, 5.5850830078125, 6.1123046875, 6.6395263671875, 7.166748046875, 7.6939697265625, 8.22119140625, 8.7484130859375, 9.275634765625, 9.8028564453125, 10.330078125, 10.8572998046875, 11.384521484375, 11.9117431640625, 12.43896484375, 12.9661865234375, 13.493408203125, 14.0206298828125, 14.5478515625, 15.0750732421875, 15.602294921875, 16.1295166015625, 16.65673828125, 17.1839599609375, 17.711181640625, 18.2384033203125, 18.765625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 12.0, 2.0, 13.0, 6.0, 14.0, 14.0, 26.0, 30.0, 35.0, 50.0, 75.0, 100.0, 189.0, 321.0, 718.0, 1665.0, 4831.0, 16433.0, 69603.0, 628206.0, 2244087.0, 139200.0, 28051.0, 7522.0, 2428.0, 985.0, 424.0, 225.0, 130.0, 80.0, 49.0, 41.0, 27.0, 34.0, 18.0, 19.0, 12.0, 9.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-24.25, -23.47265625, -22.6953125, -21.91796875, -21.140625, -20.36328125, -19.5859375, -18.80859375, -18.03125, -17.25390625, -16.4765625, -15.69921875, -14.921875, -14.14453125, -13.3671875, -12.58984375, -11.8125, -11.03515625, -10.2578125, -9.48046875, -8.703125, -7.92578125, -7.1484375, -6.37109375, -5.59375, -4.81640625, -4.0390625, -3.26171875, -2.484375, -1.70703125, -0.9296875, -0.15234375, 0.625, 1.40234375, 2.1796875, 2.95703125, 3.734375, 4.51171875, 5.2890625, 6.06640625, 6.84375, 7.62109375, 8.3984375, 9.17578125, 9.953125, 10.73046875, 11.5078125, 12.28515625, 13.0625, 13.83984375, 14.6171875, 15.39453125, 16.171875, 16.94921875, 17.7265625, 18.50390625, 19.28125, 20.05859375, 20.8359375, 21.61328125, 22.390625, 23.16796875, 23.9453125, 24.72265625, 25.5]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 7.0, 7.0, 21.0, 15.0, 25.0, 42.0, 59.0, 75.0, 94.0, 92.0, 98.0, 102.0, 96.0, 69.0, 61.0, 41.0, 28.0, 26.0, 15.0, 15.0, 6.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.96511459350586, -46.81098556518555, -45.656856536865234, -44.50272750854492, -43.34859848022461, -42.1944694519043, -41.040340423583984, -39.886207580566406, -38.732078552246094, -37.57794952392578, -36.42382049560547, -35.269691467285156, -34.115562438964844, -32.96143341064453, -31.807302474975586, -30.653173446655273, -29.499046325683594, -28.34491729736328, -27.19078826904297, -26.036659240722656, -24.882530212402344, -23.72840118408203, -22.574270248413086, -21.420141220092773, -20.26601219177246, -19.11188316345215, -17.957754135131836, -16.803625106811523, -15.649495124816895, -14.495366096496582, -13.341236114501953, -12.18710708618164, -11.032976150512695, -9.878847122192383, -8.72471809387207, -7.570588111877441, -6.416459083557129, -5.262330055236816, -4.108200550079346, -2.954071044921875, -1.7999420166015625, -0.6458127498626709, 0.5083165168762207, 1.6624457836151123, 2.816575050354004, 3.9707040786743164, 5.124833583831787, 6.278963088989258, 7.43309211730957, 8.587221145629883, 9.741350173950195, 10.895480155944824, 12.049609184265137, 13.20373821258545, 14.357868194580078, 15.51199722290039, 16.666126251220703, 17.820255279541016, 18.974384307861328, 20.12851333618164, 21.282642364501953, 22.436771392822266, 23.59090232849121, 24.745031356811523, 25.899160385131836]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 2.0, 9.0, 6.0, 14.0, 9.0, 9.0, 13.0, 16.0, 23.0, 19.0, 21.0, 32.0, 38.0, 38.0, 38.0, 46.0, 28.0, 48.0, 45.0, 28.0, 41.0, 31.0, 36.0, 45.0, 46.0, 37.0, 43.0, 28.0, 30.0, 21.0, 21.0, 29.0, 18.0, 18.0, 20.0, 11.0, 9.0, 12.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-57.57184600830078, -55.94717025756836, -54.32249069213867, -52.69781494140625, -51.07313919067383, -49.448463439941406, -47.82378387451172, -46.1991081237793, -44.574432373046875, -42.94975662231445, -41.325077056884766, -39.700401306152344, -38.07572555541992, -36.4510498046875, -34.82637023925781, -33.20169448852539, -31.577014923095703, -29.95233726501465, -28.327661514282227, -26.702983856201172, -25.07830810546875, -23.453630447387695, -21.82895278930664, -20.20427703857422, -18.579599380493164, -16.95492172241211, -15.330245971679688, -13.705568313598633, -12.080891609191895, -10.456214904785156, -8.831537246704102, -7.206860542297363, -5.582180023193359, -3.957503080368042, -2.3328261375427246, -0.7081489562988281, 0.9165277481079102, 2.5412044525146484, 4.165882110595703, 5.790558815002441, 7.41523551940918, 9.039912223815918, 10.664588928222656, 12.289266586303711, 13.91394329071045, 15.538619995117188, 17.163297653198242, 18.787975311279297, 20.41265106201172, 22.037328720092773, 23.662004470825195, 25.28668212890625, 26.911357879638672, 28.536035537719727, 30.16071319580078, 31.785388946533203, 33.410064697265625, 35.03474044799805, 36.659420013427734, 38.284095764160156, 39.90877151489258, 41.533447265625, 43.15812683105469, 44.78280258178711, 46.4074821472168]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 4.0, 5.0, 1.0, 2.0, 6.0, 7.0, 13.0, 8.0, 10.0, 15.0, 21.0, 23.0, 19.0, 21.0, 26.0, 20.0, 29.0, 33.0, 28.0, 38.0, 31.0, 36.0, 35.0, 26.0, 42.0, 38.0, 33.0, 48.0, 32.0, 38.0, 26.0, 37.0, 28.0, 37.0, 23.0, 21.0, 19.0, 12.0, 18.0, 20.0, 8.0, 13.0, 17.0, 9.0, 6.0, 4.0, 10.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.5831298828125, -5.396728515625, -5.2103271484375, -5.02392578125, -4.8375244140625, -4.651123046875, -4.4647216796875, -4.2783203125, -4.0919189453125, -3.905517578125, -3.7191162109375, -3.53271484375, -3.3463134765625, -3.159912109375, -2.9735107421875, -2.787109375, -2.6007080078125, -2.414306640625, -2.2279052734375, -2.04150390625, -1.8551025390625, -1.668701171875, -1.4822998046875, -1.2958984375, -1.1094970703125, -0.923095703125, -0.7366943359375, -0.55029296875, -0.3638916015625, -0.177490234375, 0.0089111328125, 0.1953125, 0.3817138671875, 0.568115234375, 0.7545166015625, 0.94091796875, 1.1273193359375, 1.313720703125, 1.5001220703125, 1.6865234375, 1.8729248046875, 2.059326171875, 2.2457275390625, 2.43212890625, 2.6185302734375, 2.804931640625, 2.9913330078125, 3.177734375, 3.3641357421875, 3.550537109375, 3.7369384765625, 3.92333984375, 4.1097412109375, 4.296142578125, 4.4825439453125, 4.6689453125, 4.8553466796875, 5.041748046875, 5.2281494140625, 5.41455078125, 5.6009521484375, 5.787353515625, 5.9737548828125, 6.16015625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 4.0, 5.0, 3.0, 0.0, 6.0, 11.0, 24.0, 29.0, 41.0, 60.0, 79.0, 113.0, 176.0, 266.0, 380.0, 579.0, 889.0, 1327.0, 2187.0, 3607.0, 6066.0, 10934.0, 20320.0, 41541.0, 98172.0, 303813.0, 1300935.0, 1745760.0, 426051.0, 124050.0, 50946.0, 24526.0, 12871.0, 7165.0, 4210.0, 2501.0, 1611.0, 1062.0, 645.0, 446.0, 277.0, 181.0, 141.0, 90.0, 60.0, 34.0, 27.0, 27.0, 13.0, 7.0, 4.0, 12.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0], "bins": [-9.4296875, -9.14501953125, -8.8603515625, -8.57568359375, -8.291015625, -8.00634765625, -7.7216796875, -7.43701171875, -7.15234375, -6.86767578125, -6.5830078125, -6.29833984375, -6.013671875, -5.72900390625, -5.4443359375, -5.15966796875, -4.875, -4.59033203125, -4.3056640625, -4.02099609375, -3.736328125, -3.45166015625, -3.1669921875, -2.88232421875, -2.59765625, -2.31298828125, -2.0283203125, -1.74365234375, -1.458984375, -1.17431640625, -0.8896484375, -0.60498046875, -0.3203125, -0.03564453125, 0.2490234375, 0.53369140625, 0.818359375, 1.10302734375, 1.3876953125, 1.67236328125, 1.95703125, 2.24169921875, 2.5263671875, 2.81103515625, 3.095703125, 3.38037109375, 3.6650390625, 3.94970703125, 4.234375, 4.51904296875, 4.8037109375, 5.08837890625, 5.373046875, 5.65771484375, 5.9423828125, 6.22705078125, 6.51171875, 6.79638671875, 7.0810546875, 7.36572265625, 7.650390625, 7.93505859375, 8.2197265625, 8.50439453125, 8.7890625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 8.0, 8.0, 8.0, 11.0, 16.0, 23.0, 31.0, 48.0, 71.0, 75.0, 92.0, 145.0, 177.0, 258.0, 432.0, 650.0, 600.0, 448.0, 286.0, 179.0, 150.0, 99.0, 66.0, 53.0, 32.0, 27.0, 19.0, 8.0, 16.0, 7.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.359375, -11.9847412109375, -11.610107421875, -11.2354736328125, -10.86083984375, -10.4862060546875, -10.111572265625, -9.7369384765625, -9.3623046875, -8.9876708984375, -8.613037109375, -8.2384033203125, -7.86376953125, -7.4891357421875, -7.114501953125, -6.7398681640625, -6.365234375, -5.9906005859375, -5.615966796875, -5.2413330078125, -4.86669921875, -4.4920654296875, -4.117431640625, -3.7427978515625, -3.3681640625, -2.9935302734375, -2.618896484375, -2.2442626953125, -1.86962890625, -1.4949951171875, -1.120361328125, -0.7457275390625, -0.37109375, 0.0035400390625, 0.378173828125, 0.7528076171875, 1.12744140625, 1.5020751953125, 1.876708984375, 2.2513427734375, 2.6259765625, 3.0006103515625, 3.375244140625, 3.7498779296875, 4.12451171875, 4.4991455078125, 4.873779296875, 5.2484130859375, 5.623046875, 5.9976806640625, 6.372314453125, 6.7469482421875, 7.12158203125, 7.4962158203125, 7.870849609375, 8.2454833984375, 8.6201171875, 8.9947509765625, 9.369384765625, 9.7440185546875, 10.11865234375, 10.4932861328125, 10.867919921875, 11.2425537109375, 11.6171875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 7.0, 6.0, 11.0, 21.0, 24.0, 31.0, 85.0, 113.0, 197.0, 394.0, 1018.0, 3080.0, 13432.0, 88986.0, 1531169.0, 2419669.0, 114139.0, 16066.0, 3646.0, 1160.0, 432.0, 212.0, 125.0, 77.0, 43.0, 46.0, 23.0, 15.0, 14.0, 15.0, 6.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.234375, -28.228271484375, -27.22216796875, -26.216064453125, -25.2099609375, -24.203857421875, -23.19775390625, -22.191650390625, -21.185546875, -20.179443359375, -19.17333984375, -18.167236328125, -17.1611328125, -16.155029296875, -15.14892578125, -14.142822265625, -13.13671875, -12.130615234375, -11.12451171875, -10.118408203125, -9.1123046875, -8.106201171875, -7.10009765625, -6.093994140625, -5.087890625, -4.081787109375, -3.07568359375, -2.069580078125, -1.0634765625, -0.057373046875, 0.94873046875, 1.954833984375, 2.9609375, 3.967041015625, 4.97314453125, 5.979248046875, 6.9853515625, 7.991455078125, 8.99755859375, 10.003662109375, 11.009765625, 12.015869140625, 13.02197265625, 14.028076171875, 15.0341796875, 16.040283203125, 17.04638671875, 18.052490234375, 19.05859375, 20.064697265625, 21.07080078125, 22.076904296875, 23.0830078125, 24.089111328125, 25.09521484375, 26.101318359375, 27.107421875, 28.113525390625, 29.11962890625, 30.125732421875, 31.1318359375, 32.137939453125, 33.14404296875, 34.150146484375, 35.15625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 10.0, 27.0, 35.0, 68.0, 121.0, 151.0, 163.0, 139.0, 92.0, 85.0, 54.0, 32.0, 16.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.89708709716797, -92.38953399658203, -89.88197326660156, -87.37442016601562, -84.86686706542969, -82.35930633544922, -79.85175323486328, -77.34419250488281, -74.83663940429688, -72.32908630371094, -69.82152557373047, -67.31397247314453, -64.80641174316406, -62.298858642578125, -59.79130554199219, -57.283748626708984, -54.77619171142578, -52.26863479614258, -49.761077880859375, -47.25352478027344, -44.745967864990234, -42.23841094970703, -39.730857849121094, -37.22330093383789, -34.71574401855469, -32.208187103271484, -29.700632095336914, -27.193077087402344, -24.68552017211914, -22.177963256835938, -19.670408248901367, -17.162853240966797, -14.655303955078125, -12.147747993469238, -9.640192031860352, -7.132636070251465, -4.625080108642578, -2.1175241470336914, 0.3900318145751953, 2.8975868225097656, 5.405143737792969, 7.9126996994018555, 10.420255661010742, 12.927811622619629, 15.435367584228516, 17.94292449951172, 20.45047950744629, 22.95803451538086, 25.465591430664062, 27.973148345947266, 30.480703353881836, 32.988258361816406, 35.49581527709961, 38.00337219238281, 40.51092529296875, 43.01848220825195, 45.526039123535156, 48.03359603881836, 50.54115295410156, 53.0487060546875, 55.5562629699707, 58.063819885253906, 60.571372985839844, 63.07892990112305, 65.58648681640625]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 2.0, 6.0, 1.0, 12.0, 16.0, 10.0, 11.0, 16.0, 8.0, 19.0, 21.0, 21.0, 31.0, 26.0, 32.0, 37.0, 29.0, 33.0, 38.0, 33.0, 44.0, 40.0, 35.0, 56.0, 33.0, 22.0, 34.0, 39.0, 28.0, 30.0, 38.0, 21.0, 24.0, 18.0, 18.0, 19.0, 18.0, 21.0, 6.0, 13.0, 9.0, 8.0, 6.0, 3.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-35.9652099609375, -34.81837844848633, -33.671546936035156, -32.52471160888672, -31.377880096435547, -30.231048583984375, -29.08421516418457, -27.937381744384766, -26.790550231933594, -25.643718719482422, -24.496885299682617, -23.350051879882812, -22.20322036743164, -21.05638885498047, -19.909555435180664, -18.76272201538086, -17.615890502929688, -16.469058990478516, -15.322225570678711, -14.175393104553223, -13.028560638427734, -11.881728172302246, -10.734895706176758, -9.58806324005127, -8.441230773925781, -7.294398307800293, -6.147565841674805, -5.000733375549316, -3.853900909423828, -2.70706844329834, -1.5602359771728516, -0.4134035110473633, 0.733428955078125, 1.8802614212036133, 3.0270938873291016, 4.17392635345459, 5.320758819580078, 6.467591285705566, 7.614423751831055, 8.761256217956543, 9.908088684082031, 11.05492115020752, 12.201753616333008, 13.348586082458496, 14.495418548583984, 15.642251014709473, 16.78908348083496, 17.935916900634766, 19.082748413085938, 20.22957992553711, 21.376413345336914, 22.52324676513672, 23.67007827758789, 24.816909790039062, 25.963743209838867, 27.110576629638672, 28.257408142089844, 29.404239654541016, 30.55107307434082, 31.697906494140625, 32.8447380065918, 33.99156951904297, 35.138404846191406, 36.28523635864258, 37.43206787109375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 6.0, 4.0, 8.0, 9.0, 10.0, 15.0, 19.0, 23.0, 27.0, 26.0, 21.0, 43.0, 38.0, 31.0, 34.0, 42.0, 39.0, 40.0, 45.0, 40.0, 45.0, 49.0, 42.0, 45.0, 35.0, 24.0, 30.0, 34.0, 34.0, 23.0, 26.0, 17.0, 10.0, 17.0, 9.0, 9.0, 8.0, 3.0, 5.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.63671875, -7.4132080078125, -7.189697265625, -6.9661865234375, -6.74267578125, -6.5191650390625, -6.295654296875, -6.0721435546875, -5.8486328125, -5.6251220703125, -5.401611328125, -5.1781005859375, -4.95458984375, -4.7310791015625, -4.507568359375, -4.2840576171875, -4.060546875, -3.8370361328125, -3.613525390625, -3.3900146484375, -3.16650390625, -2.9429931640625, -2.719482421875, -2.4959716796875, -2.2724609375, -2.0489501953125, -1.825439453125, -1.6019287109375, -1.37841796875, -1.1549072265625, -0.931396484375, -0.7078857421875, -0.484375, -0.2608642578125, -0.037353515625, 0.1861572265625, 0.40966796875, 0.6331787109375, 0.856689453125, 1.0802001953125, 1.3037109375, 1.5272216796875, 1.750732421875, 1.9742431640625, 2.19775390625, 2.4212646484375, 2.644775390625, 2.8682861328125, 3.091796875, 3.3153076171875, 3.538818359375, 3.7623291015625, 3.98583984375, 4.2093505859375, 4.432861328125, 4.6563720703125, 4.8798828125, 5.1033935546875, 5.326904296875, 5.5504150390625, 5.77392578125, 5.9974365234375, 6.220947265625, 6.4444580078125, 6.66796875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 15.0, 10.0, 7.0, 18.0, 26.0, 45.0, 77.0, 110.0, 120.0, 204.0, 292.0, 471.0, 655.0, 950.0, 1454.0, 2295.0, 3546.0, 5384.0, 8525.0, 13944.0, 22662.0, 38719.0, 70989.0, 148424.0, 322628.0, 200610.0, 88161.0, 47003.0, 26759.0, 16444.0, 10006.0, 6281.0, 3920.0, 2644.0, 1722.0, 1122.0, 721.0, 492.0, 313.0, 275.0, 173.0, 118.0, 78.0, 45.0, 23.0, 22.0, 24.0, 9.0, 12.0, 8.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.262939453125, -0.2551288604736328, -0.24731826782226562, -0.23950767517089844, -0.23169708251953125, -0.22388648986816406, -0.21607589721679688, -0.2082653045654297, -0.2004547119140625, -0.1926441192626953, -0.18483352661132812, -0.17702293395996094, -0.16921234130859375, -0.16140174865722656, -0.15359115600585938, -0.1457805633544922, -0.137969970703125, -0.1301593780517578, -0.12234878540039062, -0.11453819274902344, -0.10672760009765625, -0.09891700744628906, -0.09110641479492188, -0.08329582214355469, -0.0754852294921875, -0.06767463684082031, -0.059864044189453125, -0.05205345153808594, -0.04424285888671875, -0.03643226623535156, -0.028621673583984375, -0.020811080932617188, -0.01300048828125, -0.0051898956298828125, 0.002620697021484375, 0.010431289672851562, 0.01824188232421875, 0.026052474975585938, 0.033863067626953125, 0.04167366027832031, 0.0494842529296875, 0.05729484558105469, 0.06510543823242188, 0.07291603088378906, 0.08072662353515625, 0.08853721618652344, 0.09634780883789062, 0.10415840148925781, 0.111968994140625, 0.11977958679199219, 0.12759017944335938, 0.13540077209472656, 0.14321136474609375, 0.15102195739746094, 0.15883255004882812, 0.1666431427001953, 0.1744537353515625, 0.1822643280029297, 0.19007492065429688, 0.19788551330566406, 0.20569610595703125, 0.21350669860839844, 0.22131729125976562, 0.2291278839111328, 0.2369384765625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 7.0, 2.0, 1.0, 4.0, 1.0, 2.0, 9.0, 6.0, 10.0, 5.0, 10.0, 5.0, 13.0, 12.0, 16.0, 18.0, 21.0, 9.0, 14.0, 17.0, 31.0, 26.0, 34.0, 38.0, 39.0, 35.0, 37.0, 44.0, 49.0, 1056.0, 34.0, 33.0, 28.0, 33.0, 25.0, 30.0, 39.0, 36.0, 19.0, 21.0, 20.0, 18.0, 18.0, 9.0, 15.0, 16.0, 11.0, 14.0, 9.0, 6.0, 10.0, 5.0, 6.0, 4.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.23046875, -4.09588623046875, -3.9613037109375, -3.82672119140625, -3.692138671875, -3.55755615234375, -3.4229736328125, -3.28839111328125, -3.15380859375, -3.01922607421875, -2.8846435546875, -2.75006103515625, -2.615478515625, -2.48089599609375, -2.3463134765625, -2.21173095703125, -2.0771484375, -1.94256591796875, -1.8079833984375, -1.67340087890625, -1.538818359375, -1.40423583984375, -1.2696533203125, -1.13507080078125, -1.00048828125, -0.86590576171875, -0.7313232421875, -0.59674072265625, -0.462158203125, -0.32757568359375, -0.1929931640625, -0.05841064453125, 0.076171875, 0.21075439453125, 0.3453369140625, 0.47991943359375, 0.614501953125, 0.74908447265625, 0.8836669921875, 1.01824951171875, 1.15283203125, 1.28741455078125, 1.4219970703125, 1.55657958984375, 1.691162109375, 1.82574462890625, 1.9603271484375, 2.09490966796875, 2.2294921875, 2.36407470703125, 2.4986572265625, 2.63323974609375, 2.767822265625, 2.90240478515625, 3.0369873046875, 3.17156982421875, 3.30615234375, 3.44073486328125, 3.5753173828125, 3.70989990234375, 3.844482421875, 3.97906494140625, 4.1136474609375, 4.24822998046875, 4.3828125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 5.0, 1.0, 4.0, 3.0, 6.0, 16.0, 25.0, 22.0, 33.0, 45.0, 95.0, 150.0, 210.0, 307.0, 457.0, 668.0, 1004.0, 1515.0, 2150.0, 3197.0, 4749.0, 7188.0, 10604.0, 15794.0, 24037.0, 38520.0, 65894.0, 122053.0, 1297617.0, 227464.0, 109466.0, 59878.0, 35577.0, 23099.0, 14835.0, 9859.0, 6729.0, 4551.0, 3020.0, 2060.0, 1358.0, 935.0, 652.0, 452.0, 275.0, 170.0, 135.0, 96.0, 62.0, 36.0, 22.0, 15.0, 11.0, 3.0, 9.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1514892578125, -0.1467437744140625, -0.141998291015625, -0.1372528076171875, -0.13250732421875, -0.1277618408203125, -0.123016357421875, -0.1182708740234375, -0.113525390625, -0.1087799072265625, -0.104034423828125, -0.0992889404296875, -0.09454345703125, -0.0897979736328125, -0.085052490234375, -0.0803070068359375, -0.0755615234375, -0.0708160400390625, -0.066070556640625, -0.0613250732421875, -0.05657958984375, -0.0518341064453125, -0.047088623046875, -0.0423431396484375, -0.03759765625, -0.0328521728515625, -0.028106689453125, -0.0233612060546875, -0.01861572265625, -0.0138702392578125, -0.009124755859375, -0.0043792724609375, 0.0003662109375, 0.0051116943359375, 0.009857177734375, 0.0146026611328125, 0.01934814453125, 0.0240936279296875, 0.028839111328125, 0.0335845947265625, 0.038330078125, 0.0430755615234375, 0.047821044921875, 0.0525665283203125, 0.05731201171875, 0.0620574951171875, 0.066802978515625, 0.0715484619140625, 0.0762939453125, 0.0810394287109375, 0.085784912109375, 0.0905303955078125, 0.09527587890625, 0.1000213623046875, 0.104766845703125, 0.1095123291015625, 0.1142578125, 0.1190032958984375, 0.123748779296875, 0.1284942626953125, 0.13323974609375, 0.1379852294921875, 0.142730712890625, 0.1474761962890625, 0.1522216796875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 8.0, 10.0, 11.0, 7.0, 6.0, 13.0, 17.0, 22.0, 25.0, 28.0, 26.0, 42.0, 43.0, 44.0, 49.0, 59.0, 50.0, 64.0, 56.0, 50.0, 61.0, 53.0, 43.0, 36.0, 34.0, 33.0, 21.0, 22.0, 13.0, 14.0, 8.0, 7.0, 5.0, 4.0, 4.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.003545761108398e-05, -6.7858025431633e-05, -6.568059325218201e-05, -6.350316107273102e-05, -6.132572889328003e-05, -5.914829671382904e-05, -5.697086453437805e-05, -5.479343235492706e-05, -5.2616000175476074e-05, -5.0438567996025085e-05, -4.82611358165741e-05, -4.608370363712311e-05, -4.390627145767212e-05, -4.172883927822113e-05, -3.955140709877014e-05, -3.737397491931915e-05, -3.5196542739868164e-05, -3.3019110560417175e-05, -3.0841678380966187e-05, -2.8664246201515198e-05, -2.648681402206421e-05, -2.430938184261322e-05, -2.213194966316223e-05, -1.9954517483711243e-05, -1.7777085304260254e-05, -1.5599653124809265e-05, -1.3422220945358276e-05, -1.1244788765907288e-05, -9.067356586456299e-06, -6.88992440700531e-06, -4.712492227554321e-06, -2.5350600481033325e-06, -3.5762786865234375e-07, 1.819804310798645e-06, 3.997236490249634e-06, 6.1746686697006226e-06, 8.352100849151611e-06, 1.05295330286026e-05, 1.2706965208053589e-05, 1.4884397387504578e-05, 1.7061829566955566e-05, 1.9239261746406555e-05, 2.1416693925857544e-05, 2.3594126105308533e-05, 2.577155828475952e-05, 2.794899046421051e-05, 3.01264226436615e-05, 3.230385482311249e-05, 3.4481287002563477e-05, 3.6658719182014465e-05, 3.8836151361465454e-05, 4.101358354091644e-05, 4.319101572036743e-05, 4.536844789981842e-05, 4.754588007926941e-05, 4.97233122587204e-05, 5.190074443817139e-05, 5.4078176617622375e-05, 5.6255608797073364e-05, 5.843304097652435e-05, 6.061047315597534e-05, 6.278790533542633e-05, 6.496533751487732e-05, 6.714276969432831e-05, 6.93202018737793e-05]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 4.0, 5.0, 8.0, 3.0, 7.0, 10.0, 12.0, 14.0, 27.0, 24.0, 40.0, 47.0, 55.0, 57.0, 131.0, 209.0, 428.0, 2539.0, 712881.0, 329694.0, 1444.0, 356.0, 198.0, 81.0, 60.0, 42.0, 29.0, 26.0, 28.0, 20.0, 21.0, 9.0, 8.0, 9.0, 10.0, 8.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0016145706176757812, -0.001566961407661438, -0.0015193521976470947, -0.0014717429876327515, -0.0014241337776184082, -0.001376524567604065, -0.0013289153575897217, -0.0012813061475753784, -0.0012336969375610352, -0.001186087727546692, -0.0011384785175323486, -0.0010908693075180054, -0.0010432600975036621, -0.0009956508874893188, -0.0009480416774749756, -0.0009004324674606323, -0.0008528232574462891, -0.0008052140474319458, -0.0007576048374176025, -0.0007099956274032593, -0.000662386417388916, -0.0006147772073745728, -0.0005671679973602295, -0.0005195587873458862, -0.00047194957733154297, -0.0004243403673171997, -0.00037673115730285645, -0.0003291219472885132, -0.0002815127372741699, -0.00023390352725982666, -0.0001862943172454834, -0.00013868510723114014, -9.107589721679688e-05, -4.346668720245361e-05, 4.1425228118896484e-06, 5.175173282623291e-05, 9.936094284057617e-05, 0.00014697015285491943, 0.0001945793628692627, 0.00024218857288360596, 0.0002897977828979492, 0.0003374069929122925, 0.00038501620292663574, 0.000432625412940979, 0.00048023462295532227, 0.0005278438329696655, 0.0005754530429840088, 0.000623062252998352, 0.0006706714630126953, 0.0007182806730270386, 0.0007658898830413818, 0.0008134990930557251, 0.0008611083030700684, 0.0009087175130844116, 0.0009563267230987549, 0.0010039359331130981, 0.0010515451431274414, 0.0010991543531417847, 0.001146763563156128, 0.0011943727731704712, 0.0012419819831848145, 0.0012895911931991577, 0.001337200403213501, 0.0013848096132278442, 0.0014324188232421875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 46.0, 300.0, 522.0, 135.0, 11.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005373908788897097, -0.0005276696756482124, -0.0005179484724067152, -0.0005082272691652179, -0.0004985061241313815, -0.0004887849208898842, -0.00047906371764838696, -0.0004693425144068897, -0.0004596213111653924, -0.0004499001079238951, -0.00044017890468239784, -0.000430457730544731, -0.00042073652730323374, -0.00041101532406173646, -0.00040129414992406964, -0.00039157294668257236, -0.0003818517434410751, -0.0003721305401995778, -0.00036240933695808053, -0.0003526881628204137, -0.00034296695957891643, -0.00033324575633741915, -0.00032352458219975233, -0.00031380337895825505, -0.0003040821757167578, -0.0002943609724752605, -0.0002846397692337632, -0.0002749185950960964, -0.0002651973918545991, -0.00025547618861310184, -0.000245755014475435, -0.00023603381123393774, -0.00022631263709627092, -0.00021659143385477364, -0.0002068702451651916, -0.00019714905647560954, -0.00018742785323411226, -0.00017770664999261498, -0.00016798546130303293, -0.00015826427261345088, -0.0001485430693719536, -0.00013882186613045633, -0.00012910067744087428, -0.00011937948147533461, -0.00010965828550979495, -9.993708954425529e-05, -9.021589357871562e-05, -8.049469761317596e-05, -7.077349437167868e-05, -6.105229840613902e-05, -5.133110244059935e-05, -4.160990647505969e-05, -3.1888710509520024e-05, -2.216751454398036e-05, -1.2446318578440696e-05, -2.725122612901032e-06, 6.996073352638632e-06, 1.6717269318178296e-05, 2.643846528371796e-05, 3.6159661249257624e-05, 4.588085721479729e-05, 5.560205318033695e-05, 6.532324914587662e-05, 7.504444511141628e-05, 8.476564107695594e-05]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 9.0, 3.0, 7.0, 6.0, 10.0, 7.0, 11.0, 10.0, 10.0, 11.0, 17.0, 14.0, 26.0, 25.0, 36.0, 30.0, 32.0, 41.0, 51.0, 42.0, 36.0, 34.0, 44.0, 37.0, 40.0, 43.0, 41.0, 49.0, 38.0, 31.0, 28.0, 18.0, 32.0, 26.0, 21.0, 20.0, 17.0, 13.0, 5.0, 7.0, 3.0, 7.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6835670471191406e-05, -3.565941005945206e-05, -3.448314964771271e-05, -3.330688923597336e-05, -3.213062882423401e-05, -3.095436841249466e-05, -2.977810800075531e-05, -2.860184758901596e-05, -2.742558717727661e-05, -2.6249326765537262e-05, -2.5073066353797913e-05, -2.3896805942058563e-05, -2.2720545530319214e-05, -2.1544285118579865e-05, -2.0368024706840515e-05, -1.9191764295101166e-05, -1.8015503883361816e-05, -1.6839243471622467e-05, -1.5662983059883118e-05, -1.4486722648143768e-05, -1.3310462236404419e-05, -1.213420182466507e-05, -1.095794141292572e-05, -9.781681001186371e-06, -8.605420589447021e-06, -7.429160177707672e-06, -6.252899765968323e-06, -5.076639354228973e-06, -3.900378942489624e-06, -2.7241185307502747e-06, -1.5478581190109253e-06, -3.7159770727157593e-07, 8.046627044677734e-07, 1.980923116207123e-06, 3.157183527946472e-06, 4.3334439396858215e-06, 5.509704351425171e-06, 6.68596476316452e-06, 7.86222517490387e-06, 9.038485586643219e-06, 1.0214745998382568e-05, 1.1391006410121918e-05, 1.2567266821861267e-05, 1.3743527233600616e-05, 1.4919787645339966e-05, 1.6096048057079315e-05, 1.7272308468818665e-05, 1.8448568880558014e-05, 1.9624829292297363e-05, 2.0801089704036713e-05, 2.1977350115776062e-05, 2.315361052751541e-05, 2.432987093925476e-05, 2.550613135099411e-05, 2.668239176273346e-05, 2.785865217447281e-05, 2.9034912586212158e-05, 3.0211172997951508e-05, 3.138743340969086e-05, 3.2563693821430206e-05, 3.3739954233169556e-05, 3.4916214644908905e-05, 3.6092475056648254e-05, 3.7268735468387604e-05, 3.844499588012695e-05]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 6.0, 4.0, 8.0, 9.0, 10.0, 15.0, 19.0, 23.0, 27.0, 26.0, 21.0, 43.0, 38.0, 31.0, 34.0, 42.0, 39.0, 40.0, 45.0, 40.0, 45.0, 49.0, 42.0, 45.0, 35.0, 24.0, 30.0, 34.0, 34.0, 23.0, 26.0, 17.0, 10.0, 17.0, 9.0, 9.0, 8.0, 3.0, 5.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.63671875, -7.4132080078125, -7.189697265625, -6.9661865234375, -6.74267578125, -6.5191650390625, -6.295654296875, -6.0721435546875, -5.8486328125, -5.6251220703125, -5.401611328125, -5.1781005859375, -4.95458984375, -4.7310791015625, -4.507568359375, -4.2840576171875, -4.060546875, -3.8370361328125, -3.613525390625, -3.3900146484375, -3.16650390625, -2.9429931640625, -2.719482421875, -2.4959716796875, -2.2724609375, -2.0489501953125, -1.825439453125, -1.6019287109375, -1.37841796875, -1.1549072265625, -0.931396484375, -0.7078857421875, -0.484375, -0.2608642578125, -0.037353515625, 0.1861572265625, 0.40966796875, 0.6331787109375, 0.856689453125, 1.0802001953125, 1.3037109375, 1.5272216796875, 1.750732421875, 1.9742431640625, 2.19775390625, 2.4212646484375, 2.644775390625, 2.8682861328125, 3.091796875, 3.3153076171875, 3.538818359375, 3.7623291015625, 3.98583984375, 4.2093505859375, 4.432861328125, 4.6563720703125, 4.8798828125, 5.1033935546875, 5.326904296875, 5.5504150390625, 5.77392578125, 5.9974365234375, 6.220947265625, 6.4444580078125, 6.66796875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 5.0, 8.0, 19.0, 22.0, 28.0, 41.0, 48.0, 68.0, 113.0, 151.0, 262.0, 402.0, 585.0, 962.0, 1475.0, 2414.0, 3771.0, 6272.0, 10268.0, 17498.0, 30147.0, 54146.0, 102209.0, 195024.0, 259322.0, 165801.0, 86185.0, 46280.0, 26268.0, 15129.0, 9021.0, 5453.0, 3287.0, 2024.0, 1326.0, 859.0, 594.0, 364.0, 216.0, 174.0, 93.0, 71.0, 53.0, 39.0, 25.0, 12.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.046875, -8.7757568359375, -8.504638671875, -8.2335205078125, -7.96240234375, -7.6912841796875, -7.420166015625, -7.1490478515625, -6.8779296875, -6.6068115234375, -6.335693359375, -6.0645751953125, -5.79345703125, -5.5223388671875, -5.251220703125, -4.9801025390625, -4.708984375, -4.4378662109375, -4.166748046875, -3.8956298828125, -3.62451171875, -3.3533935546875, -3.082275390625, -2.8111572265625, -2.5400390625, -2.2689208984375, -1.997802734375, -1.7266845703125, -1.45556640625, -1.1844482421875, -0.913330078125, -0.6422119140625, -0.37109375, -0.0999755859375, 0.171142578125, 0.4422607421875, 0.71337890625, 0.9844970703125, 1.255615234375, 1.5267333984375, 1.7978515625, 2.0689697265625, 2.340087890625, 2.6112060546875, 2.88232421875, 3.1534423828125, 3.424560546875, 3.6956787109375, 3.966796875, 4.2379150390625, 4.509033203125, 4.7801513671875, 5.05126953125, 5.3223876953125, 5.593505859375, 5.8646240234375, 6.1357421875, 6.4068603515625, 6.677978515625, 6.9490966796875, 7.22021484375, 7.4913330078125, 7.762451171875, 8.0335693359375, 8.3046875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 3.0, 9.0, 6.0, 7.0, 10.0, 11.0, 11.0, 23.0, 13.0, 18.0, 30.0, 40.0, 39.0, 40.0, 55.0, 61.0, 82.0, 149.0, 219.0, 1329.0, 230.0, 151.0, 85.0, 68.0, 45.0, 50.0, 46.0, 35.0, 29.0, 28.0, 18.0, 20.0, 15.0, 17.0, 8.0, 5.0, 10.0, 8.0, 11.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0, -17.43017578125, -16.8603515625, -16.29052734375, -15.720703125, -15.15087890625, -14.5810546875, -14.01123046875, -13.44140625, -12.87158203125, -12.3017578125, -11.73193359375, -11.162109375, -10.59228515625, -10.0224609375, -9.45263671875, -8.8828125, -8.31298828125, -7.7431640625, -7.17333984375, -6.603515625, -6.03369140625, -5.4638671875, -4.89404296875, -4.32421875, -3.75439453125, -3.1845703125, -2.61474609375, -2.044921875, -1.47509765625, -0.9052734375, -0.33544921875, 0.234375, 0.80419921875, 1.3740234375, 1.94384765625, 2.513671875, 3.08349609375, 3.6533203125, 4.22314453125, 4.79296875, 5.36279296875, 5.9326171875, 6.50244140625, 7.072265625, 7.64208984375, 8.2119140625, 8.78173828125, 9.3515625, 9.92138671875, 10.4912109375, 11.06103515625, 11.630859375, 12.20068359375, 12.7705078125, 13.34033203125, 13.91015625, 14.47998046875, 15.0498046875, 15.61962890625, 16.189453125, 16.75927734375, 17.3291015625, 17.89892578125, 18.46875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 15.0, 12.0, 15.0, 31.0, 32.0, 36.0, 60.0, 82.0, 174.0, 332.0, 704.0, 1517.0, 3610.0, 9476.0, 27499.0, 93658.0, 554221.0, 2009286.0, 341705.0, 68983.0, 21281.0, 7517.0, 2842.0, 1290.0, 584.0, 288.0, 144.0, 78.0, 54.0, 38.0, 31.0, 31.0, 18.0, 9.0, 9.0, 6.0, 7.0, 5.0, 2.0, 2.0, 0.0, 4.0, 5.0, 2.0], "bins": [-21.125, -20.5599365234375, -19.994873046875, -19.4298095703125, -18.86474609375, -18.2996826171875, -17.734619140625, -17.1695556640625, -16.6044921875, -16.0394287109375, -15.474365234375, -14.9093017578125, -14.34423828125, -13.7791748046875, -13.214111328125, -12.6490478515625, -12.083984375, -11.5189208984375, -10.953857421875, -10.3887939453125, -9.82373046875, -9.2586669921875, -8.693603515625, -8.1285400390625, -7.5634765625, -6.9984130859375, -6.433349609375, -5.8682861328125, -5.30322265625, -4.7381591796875, -4.173095703125, -3.6080322265625, -3.04296875, -2.4779052734375, -1.912841796875, -1.3477783203125, -0.78271484375, -0.2176513671875, 0.347412109375, 0.9124755859375, 1.4775390625, 2.0426025390625, 2.607666015625, 3.1727294921875, 3.73779296875, 4.3028564453125, 4.867919921875, 5.4329833984375, 5.998046875, 6.5631103515625, 7.128173828125, 7.6932373046875, 8.25830078125, 8.8233642578125, 9.388427734375, 9.9534912109375, 10.5185546875, 11.0836181640625, 11.648681640625, 12.2137451171875, 12.77880859375, 13.3438720703125, 13.908935546875, 14.4739990234375, 15.0390625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 23.0, 36.0, 83.0, 140.0, 211.0, 195.0, 140.0, 85.0, 48.0, 22.0, 9.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.17153549194336, -41.76957702636719, -38.36761474609375, -34.96565246582031, -31.56369400024414, -28.161733627319336, -24.75977325439453, -21.357812881469727, -17.955852508544922, -14.553892135620117, -11.151931762695312, -7.749971389770508, -4.348011016845703, -0.9460506439208984, 2.4559097290039062, 5.857870101928711, 9.259830474853516, 12.66179084777832, 16.063751220703125, 19.46571159362793, 22.867671966552734, 26.26963233947754, 29.671592712402344, 33.07355499267578, 36.47551345825195, 39.877471923828125, 43.27943420410156, 46.681396484375, 50.08335494995117, 53.485313415527344, 56.88727569580078, 60.28923797607422, 63.691192626953125, 67.09315490722656, 70.4951171875, 73.8970718383789, 77.29903411865234, 80.70099639892578, 84.10295104980469, 87.50491333007812, 90.90687561035156, 94.308837890625, 97.71080017089844, 101.11275482177734, 104.51471710205078, 107.91667938232422, 111.31863403320312, 114.72059631347656, 118.12255859375, 121.52452087402344, 124.92648315429688, 128.3284454345703, 131.73040771484375, 135.13235473632812, 138.53431701660156, 141.936279296875, 145.33824157714844, 148.74020385742188, 152.1421661376953, 155.54412841796875, 158.94607543945312, 162.34803771972656, 165.75, 169.15196228027344, 172.55392456054688]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 5.0, 7.0, 4.0, 4.0, 7.0, 11.0, 8.0, 10.0, 12.0, 8.0, 17.0, 16.0, 24.0, 18.0, 26.0, 27.0, 34.0, 26.0, 39.0, 30.0, 41.0, 34.0, 39.0, 36.0, 47.0, 42.0, 42.0, 33.0, 32.0, 33.0, 43.0, 40.0, 23.0, 28.0, 23.0, 25.0, 25.0, 16.0, 14.0, 9.0, 12.0, 9.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-54.364418029785156, -52.8651123046875, -51.36580276489258, -49.86649703979492, -48.367191314697266, -46.86788558959961, -45.36857604980469, -43.86927032470703, -42.369964599609375, -40.87065887451172, -39.3713493347168, -37.87204360961914, -36.372737884521484, -34.87343215942383, -33.374122619628906, -31.87481689453125, -30.37550926208496, -28.876201629638672, -27.376895904541016, -25.877588272094727, -24.37828254699707, -22.87897491455078, -21.379669189453125, -19.880361557006836, -18.381053924560547, -16.881746292114258, -15.382440567016602, -13.883132934570312, -12.383827209472656, -10.884519577026367, -9.385212898254395, -7.885906219482422, -6.386600494384766, -4.887293815612793, -3.387986898422241, -1.8886799812316895, -0.3893733024597168, 1.1099333763122559, 2.6092405319213867, 4.108547210693359, 5.607853889465332, 7.107160568237305, 8.606467247009277, 10.10577392578125, 11.605081558227539, 13.104387283325195, 14.603694915771484, 16.10300064086914, 17.60230827331543, 19.10161590576172, 20.600921630859375, 22.100229263305664, 23.59953498840332, 25.09884262084961, 26.598148345947266, 28.097455978393555, 29.596763610839844, 31.096071243286133, 32.59537887573242, 34.09468460083008, 35.593990325927734, 37.09329605102539, 38.59260559082031, 40.09191131591797, 41.591217041015625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 7.0, 8.0, 6.0, 6.0, 12.0, 18.0, 15.0, 18.0, 22.0, 23.0, 26.0, 33.0, 38.0, 45.0, 44.0, 43.0, 42.0, 55.0, 42.0, 44.0, 35.0, 44.0, 35.0, 50.0, 46.0, 32.0, 39.0, 25.0, 25.0, 25.0, 23.0, 13.0, 15.0, 13.0, 4.0, 8.0, 8.0, 8.0, 6.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.8046875, -8.552978515625, -8.30126953125, -8.049560546875, -7.7978515625, -7.546142578125, -7.29443359375, -7.042724609375, -6.791015625, -6.539306640625, -6.28759765625, -6.035888671875, -5.7841796875, -5.532470703125, -5.28076171875, -5.029052734375, -4.77734375, -4.525634765625, -4.27392578125, -4.022216796875, -3.7705078125, -3.518798828125, -3.26708984375, -3.015380859375, -2.763671875, -2.511962890625, -2.26025390625, -2.008544921875, -1.7568359375, -1.505126953125, -1.25341796875, -1.001708984375, -0.75, -0.498291015625, -0.24658203125, 0.005126953125, 0.2568359375, 0.508544921875, 0.76025390625, 1.011962890625, 1.263671875, 1.515380859375, 1.76708984375, 2.018798828125, 2.2705078125, 2.522216796875, 2.77392578125, 3.025634765625, 3.27734375, 3.529052734375, 3.78076171875, 4.032470703125, 4.2841796875, 4.535888671875, 4.78759765625, 5.039306640625, 5.291015625, 5.542724609375, 5.79443359375, 6.046142578125, 6.2978515625, 6.549560546875, 6.80126953125, 7.052978515625, 7.3046875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 8.0, 13.0, 18.0, 19.0, 26.0, 46.0, 70.0, 88.0, 148.0, 248.0, 465.0, 829.0, 1570.0, 3143.0, 6497.0, 14203.0, 33535.0, 91593.0, 348818.0, 2202948.0, 1181129.0, 201690.0, 62137.0, 24357.0, 10648.0, 4862.0, 2408.0, 1150.0, 648.0, 352.0, 226.0, 132.0, 69.0, 55.0, 39.0, 32.0, 31.0, 9.0, 4.0, 10.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.9140625, -14.4595947265625, -14.005126953125, -13.5506591796875, -13.09619140625, -12.6417236328125, -12.187255859375, -11.7327880859375, -11.2783203125, -10.8238525390625, -10.369384765625, -9.9149169921875, -9.46044921875, -9.0059814453125, -8.551513671875, -8.0970458984375, -7.642578125, -7.1881103515625, -6.733642578125, -6.2791748046875, -5.82470703125, -5.3702392578125, -4.915771484375, -4.4613037109375, -4.0068359375, -3.5523681640625, -3.097900390625, -2.6434326171875, -2.18896484375, -1.7344970703125, -1.280029296875, -0.8255615234375, -0.37109375, 0.0833740234375, 0.537841796875, 0.9923095703125, 1.44677734375, 1.9012451171875, 2.355712890625, 2.8101806640625, 3.2646484375, 3.7191162109375, 4.173583984375, 4.6280517578125, 5.08251953125, 5.5369873046875, 5.991455078125, 6.4459228515625, 6.900390625, 7.3548583984375, 7.809326171875, 8.2637939453125, 8.71826171875, 9.1727294921875, 9.627197265625, 10.0816650390625, 10.5361328125, 10.9906005859375, 11.445068359375, 11.8995361328125, 12.35400390625, 12.8084716796875, 13.262939453125, 13.7174072265625, 14.171875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 7.0, 9.0, 9.0, 17.0, 15.0, 28.0, 37.0, 54.0, 45.0, 91.0, 111.0, 154.0, 240.0, 350.0, 529.0, 616.0, 550.0, 328.0, 207.0, 150.0, 119.0, 78.0, 78.0, 47.0, 43.0, 31.0, 30.0, 16.0, 18.0, 12.0, 6.0, 9.0, 5.0, 3.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-14.3515625, -13.9688720703125, -13.586181640625, -13.2034912109375, -12.82080078125, -12.4381103515625, -12.055419921875, -11.6727294921875, -11.2900390625, -10.9073486328125, -10.524658203125, -10.1419677734375, -9.75927734375, -9.3765869140625, -8.993896484375, -8.6112060546875, -8.228515625, -7.8458251953125, -7.463134765625, -7.0804443359375, -6.69775390625, -6.3150634765625, -5.932373046875, -5.5496826171875, -5.1669921875, -4.7843017578125, -4.401611328125, -4.0189208984375, -3.63623046875, -3.2535400390625, -2.870849609375, -2.4881591796875, -2.10546875, -1.7227783203125, -1.340087890625, -0.9573974609375, -0.57470703125, -0.1920166015625, 0.190673828125, 0.5733642578125, 0.9560546875, 1.3387451171875, 1.721435546875, 2.1041259765625, 2.48681640625, 2.8695068359375, 3.252197265625, 3.6348876953125, 4.017578125, 4.4002685546875, 4.782958984375, 5.1656494140625, 5.54833984375, 5.9310302734375, 6.313720703125, 6.6964111328125, 7.0791015625, 7.4617919921875, 7.844482421875, 8.2271728515625, 8.60986328125, 8.9925537109375, 9.375244140625, 9.7579345703125, 10.140625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 8.0, 11.0, 15.0, 15.0, 32.0, 44.0, 87.0, 149.0, 253.0, 474.0, 1010.0, 2222.0, 5108.0, 13772.0, 43993.0, 183175.0, 1470719.0, 2162596.0, 230208.0, 53366.0, 16401.0, 5902.0, 2404.0, 1101.0, 555.0, 301.0, 142.0, 83.0, 45.0, 30.0, 22.0, 14.0, 7.0, 3.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.265625, -16.54833984375, -15.8310546875, -15.11376953125, -14.396484375, -13.67919921875, -12.9619140625, -12.24462890625, -11.52734375, -10.81005859375, -10.0927734375, -9.37548828125, -8.658203125, -7.94091796875, -7.2236328125, -6.50634765625, -5.7890625, -5.07177734375, -4.3544921875, -3.63720703125, -2.919921875, -2.20263671875, -1.4853515625, -0.76806640625, -0.05078125, 0.66650390625, 1.3837890625, 2.10107421875, 2.818359375, 3.53564453125, 4.2529296875, 4.97021484375, 5.6875, 6.40478515625, 7.1220703125, 7.83935546875, 8.556640625, 9.27392578125, 9.9912109375, 10.70849609375, 11.42578125, 12.14306640625, 12.8603515625, 13.57763671875, 14.294921875, 15.01220703125, 15.7294921875, 16.44677734375, 17.1640625, 17.88134765625, 18.5986328125, 19.31591796875, 20.033203125, 20.75048828125, 21.4677734375, 22.18505859375, 22.90234375, 23.61962890625, 24.3369140625, 25.05419921875, 25.771484375, 26.48876953125, 27.2060546875, 27.92333984375, 28.640625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 9.0, 12.0, 23.0, 22.0, 36.0, 58.0, 59.0, 50.0, 75.0, 112.0, 99.0, 74.0, 82.0, 87.0, 51.0, 41.0, 37.0, 29.0, 16.0, 15.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.692049026489258, -27.03499984741211, -25.377948760986328, -23.720897674560547, -22.0638484954834, -20.40679931640625, -18.74974822998047, -17.092697143554688, -15.435647964477539, -13.778597831726074, -12.12154769897461, -10.464497566223145, -8.80744743347168, -7.150397300720215, -5.49334716796875, -3.836297035217285, -2.1792469024658203, -0.5221967697143555, 1.1348533630371094, 2.791903495788574, 4.448953628540039, 6.106003761291504, 7.763053894042969, 9.420104026794434, 11.077154159545898, 12.734204292297363, 14.391254425048828, 16.04830551147461, 17.705354690551758, 19.362403869628906, 21.019454956054688, 22.67650604248047, 24.33355712890625, 25.99060821533203, 27.64765739440918, 29.304706573486328, 30.96175765991211, 32.61880874633789, 34.275856018066406, 35.93290710449219, 37.58995819091797, 39.24700927734375, 40.90406036376953, 42.56110763549805, 44.21815872192383, 45.87520980834961, 47.532257080078125, 49.189308166503906, 50.84635925292969, 52.50341033935547, 54.16046142578125, 55.817508697509766, 57.47455978393555, 59.13161087036133, 60.788658142089844, 62.445709228515625, 64.1027603149414, 65.75981140136719, 67.41686248779297, 69.07391357421875, 70.73095703125, 72.38800811767578, 74.04505920410156, 75.70211029052734, 77.35916137695312]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1.0, 2.0, 7.0, 9.0, 5.0, 5.0, 9.0, 11.0, 13.0, 13.0, 23.0, 26.0, 20.0, 21.0, 23.0, 31.0, 37.0, 32.0, 35.0, 36.0, 42.0, 40.0, 38.0, 54.0, 34.0, 50.0, 30.0, 37.0, 37.0, 31.0, 24.0, 28.0, 24.0, 35.0, 13.0, 21.0, 19.0, 18.0, 13.0, 8.0, 19.0, 5.0, 8.0, 8.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-43.9974365234375, -42.66325759887695, -41.329078674316406, -39.994895935058594, -38.66071701049805, -37.3265380859375, -35.99235916137695, -34.658180236816406, -33.323997497558594, -31.989818572998047, -30.655637741088867, -29.32145881652832, -27.98727798461914, -26.653099060058594, -25.318920135498047, -23.9847412109375, -22.650562286376953, -21.316383361816406, -19.982202529907227, -18.64802360534668, -17.3138427734375, -15.979663848876953, -14.645484924316406, -13.311305046081543, -11.97712516784668, -10.642945289611816, -9.308765411376953, -7.974586486816406, -6.640406608581543, -5.30622673034668, -3.972047805786133, -2.6378679275512695, -1.3036880493164062, 0.03049159049987793, 1.364671230316162, 2.698850631713867, 4.0330305099487305, 5.367210388183594, 6.701389312744141, 8.035569190979004, 9.369749069213867, 10.70392894744873, 12.038108825683594, 13.37228775024414, 14.706467628479004, 16.040647506713867, 17.374826431274414, 18.709007263183594, 20.04318618774414, 21.377365112304688, 22.711545944213867, 24.045724868774414, 25.379905700683594, 26.71408462524414, 28.048263549804688, 29.382442474365234, 30.716623306274414, 32.050804138183594, 33.38498306274414, 34.71916198730469, 36.053340911865234, 37.38751983642578, 38.721702575683594, 40.05588150024414, 41.39006042480469]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 4.0, 9.0, 4.0, 12.0, 18.0, 17.0, 18.0, 16.0, 26.0, 23.0, 22.0, 27.0, 21.0, 29.0, 45.0, 46.0, 37.0, 31.0, 49.0, 40.0, 32.0, 39.0, 31.0, 48.0, 37.0, 33.0, 39.0, 34.0, 29.0, 20.0, 15.0, 25.0, 14.0, 18.0, 14.0, 11.0, 5.0, 15.0, 12.0, 6.0, 3.0, 6.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0], "bins": [-7.87109375, -7.6510009765625, -7.430908203125, -7.2108154296875, -6.99072265625, -6.7706298828125, -6.550537109375, -6.3304443359375, -6.1103515625, -5.8902587890625, -5.670166015625, -5.4500732421875, -5.22998046875, -5.0098876953125, -4.789794921875, -4.5697021484375, -4.349609375, -4.1295166015625, -3.909423828125, -3.6893310546875, -3.46923828125, -3.2491455078125, -3.029052734375, -2.8089599609375, -2.5888671875, -2.3687744140625, -2.148681640625, -1.9285888671875, -1.70849609375, -1.4884033203125, -1.268310546875, -1.0482177734375, -0.828125, -0.6080322265625, -0.387939453125, -0.1678466796875, 0.05224609375, 0.2723388671875, 0.492431640625, 0.7125244140625, 0.9326171875, 1.1527099609375, 1.372802734375, 1.5928955078125, 1.81298828125, 2.0330810546875, 2.253173828125, 2.4732666015625, 2.693359375, 2.9134521484375, 3.133544921875, 3.3536376953125, 3.57373046875, 3.7938232421875, 4.013916015625, 4.2340087890625, 4.4541015625, 4.6741943359375, 4.894287109375, 5.1143798828125, 5.33447265625, 5.5545654296875, 5.774658203125, 5.9947509765625, 6.21484375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 2.0, 4.0, 5.0, 11.0, 14.0, 18.0, 28.0, 47.0, 70.0, 103.0, 178.0, 237.0, 377.0, 583.0, 920.0, 1464.0, 2268.0, 3516.0, 5710.0, 9024.0, 14905.0, 25265.0, 44085.0, 85910.0, 195849.0, 322873.0, 163084.0, 74325.0, 39176.0, 22462.0, 13675.0, 8219.0, 5235.0, 3196.0, 2037.0, 1250.0, 866.0, 523.0, 346.0, 224.0, 152.0, 114.0, 64.0, 48.0, 26.0, 25.0, 18.0, 10.0, 7.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.251220703125, -0.24237442016601562, -0.23352813720703125, -0.22468185424804688, -0.2158355712890625, -0.20698928833007812, -0.19814300537109375, -0.18929672241210938, -0.180450439453125, -0.17160415649414062, -0.16275787353515625, -0.15391159057617188, -0.1450653076171875, -0.13621902465820312, -0.12737274169921875, -0.11852645874023438, -0.10968017578125, -0.10083389282226562, -0.09198760986328125, -0.08314132690429688, -0.0742950439453125, -0.06544876098632812, -0.05660247802734375, -0.047756195068359375, -0.038909912109375, -0.030063629150390625, -0.02121734619140625, -0.012371063232421875, -0.0035247802734375, 0.005321502685546875, 0.01416778564453125, 0.023014068603515625, 0.0318603515625, 0.040706634521484375, 0.04955291748046875, 0.058399200439453125, 0.0672454833984375, 0.07609176635742188, 0.08493804931640625, 0.09378433227539062, 0.102630615234375, 0.11147689819335938, 0.12032318115234375, 0.12916946411132812, 0.1380157470703125, 0.14686203002929688, 0.15570831298828125, 0.16455459594726562, 0.17340087890625, 0.18224716186523438, 0.19109344482421875, 0.19993972778320312, 0.2087860107421875, 0.21763229370117188, 0.22647857666015625, 0.23532485961914062, 0.244171142578125, 0.2530174255371094, 0.26186370849609375, 0.2707099914550781, 0.2795562744140625, 0.2884025573730469, 0.29724884033203125, 0.3060951232910156, 0.31494140625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 3.0, 8.0, 8.0, 11.0, 13.0, 12.0, 14.0, 15.0, 22.0, 25.0, 30.0, 28.0, 32.0, 34.0, 36.0, 30.0, 36.0, 33.0, 34.0, 45.0, 1065.0, 41.0, 36.0, 33.0, 35.0, 39.0, 40.0, 27.0, 28.0, 34.0, 28.0, 23.0, 17.0, 18.0, 20.0, 10.0, 16.0, 6.0, 6.0, 6.0, 8.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9296875, -4.7691650390625, -4.608642578125, -4.4481201171875, -4.28759765625, -4.1270751953125, -3.966552734375, -3.8060302734375, -3.6455078125, -3.4849853515625, -3.324462890625, -3.1639404296875, -3.00341796875, -2.8428955078125, -2.682373046875, -2.5218505859375, -2.361328125, -2.2008056640625, -2.040283203125, -1.8797607421875, -1.71923828125, -1.5587158203125, -1.398193359375, -1.2376708984375, -1.0771484375, -0.9166259765625, -0.756103515625, -0.5955810546875, -0.43505859375, -0.2745361328125, -0.114013671875, 0.0465087890625, 0.20703125, 0.3675537109375, 0.528076171875, 0.6885986328125, 0.84912109375, 1.0096435546875, 1.170166015625, 1.3306884765625, 1.4912109375, 1.6517333984375, 1.812255859375, 1.9727783203125, 2.13330078125, 2.2938232421875, 2.454345703125, 2.6148681640625, 2.775390625, 2.9359130859375, 3.096435546875, 3.2569580078125, 3.41748046875, 3.5780029296875, 3.738525390625, 3.8990478515625, 4.0595703125, 4.2200927734375, 4.380615234375, 4.5411376953125, 4.70166015625, 4.8621826171875, 5.022705078125, 5.1832275390625, 5.34375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 11.0, 13.0, 18.0, 34.0, 58.0, 79.0, 131.0, 212.0, 300.0, 443.0, 707.0, 1067.0, 1638.0, 2648.0, 4129.0, 6581.0, 10825.0, 17460.0, 28806.0, 48697.0, 86936.0, 178170.0, 1339075.0, 167540.0, 82809.0, 46827.0, 27644.0, 16779.0, 10061.0, 6320.0, 4050.0, 2481.0, 1617.0, 1029.0, 687.0, 427.0, 271.0, 200.0, 118.0, 71.0, 55.0, 41.0, 23.0, 15.0, 6.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1739501953125, -0.16823959350585938, -0.16252899169921875, -0.15681838989257812, -0.1511077880859375, -0.14539718627929688, -0.13968658447265625, -0.13397598266601562, -0.128265380859375, -0.12255477905273438, -0.11684417724609375, -0.11113357543945312, -0.1054229736328125, -0.09971237182617188, -0.09400177001953125, -0.08829116821289062, -0.08258056640625, -0.07686996459960938, -0.07115936279296875, -0.06544876098632812, -0.0597381591796875, -0.054027557373046875, -0.04831695556640625, -0.042606353759765625, -0.036895751953125, -0.031185150146484375, -0.02547454833984375, -0.019763946533203125, -0.0140533447265625, -0.008342742919921875, -0.00263214111328125, 0.003078460693359375, 0.0087890625, 0.014499664306640625, 0.02021026611328125, 0.025920867919921875, 0.0316314697265625, 0.037342071533203125, 0.04305267333984375, 0.048763275146484375, 0.054473876953125, 0.060184478759765625, 0.06589508056640625, 0.07160568237304688, 0.0773162841796875, 0.08302688598632812, 0.08873748779296875, 0.09444808959960938, 0.10015869140625, 0.10586929321289062, 0.11157989501953125, 0.11729049682617188, 0.1230010986328125, 0.12871170043945312, 0.13442230224609375, 0.14013290405273438, 0.145843505859375, 0.15155410766601562, 0.15726470947265625, 0.16297531127929688, 0.1686859130859375, 0.17439651489257812, 0.18010711669921875, 0.18581771850585938, 0.1915283203125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 8.0, 11.0, 9.0, 12.0, 19.0, 10.0, 21.0, 12.0, 32.0, 31.0, 31.0, 25.0, 39.0, 44.0, 39.0, 47.0, 56.0, 49.0, 57.0, 40.0, 40.0, 39.0, 44.0, 34.0, 28.0, 33.0, 19.0, 25.0, 28.0, 19.0, 17.0, 17.0, 11.0, 11.0, 11.0, 11.0, 3.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-7.027387619018555e-05, -6.82976096868515e-05, -6.632134318351746e-05, -6.434507668018341e-05, -6.236881017684937e-05, -6.039254367351532e-05, -5.8416277170181274e-05, -5.644001066684723e-05, -5.4463744163513184e-05, -5.248747766017914e-05, -5.051121115684509e-05, -4.853494465351105e-05, -4.6558678150177e-05, -4.4582411646842957e-05, -4.260614514350891e-05, -4.0629878640174866e-05, -3.865361213684082e-05, -3.6677345633506775e-05, -3.470107913017273e-05, -3.2724812626838684e-05, -3.074854612350464e-05, -2.8772279620170593e-05, -2.6796013116836548e-05, -2.4819746613502502e-05, -2.2843480110168457e-05, -2.086721360683441e-05, -1.8890947103500366e-05, -1.691468060016632e-05, -1.4938414096832275e-05, -1.296214759349823e-05, -1.0985881090164185e-05, -9.00961458683014e-06, -7.033348083496094e-06, -5.057081580162048e-06, -3.080815076828003e-06, -1.1045485734939575e-06, 8.717179298400879e-07, 2.8479844331741333e-06, 4.824250936508179e-06, 6.800517439842224e-06, 8.77678394317627e-06, 1.0753050446510315e-05, 1.272931694984436e-05, 1.4705583453178406e-05, 1.668184995651245e-05, 1.8658116459846497e-05, 2.0634382963180542e-05, 2.2610649466514587e-05, 2.4586915969848633e-05, 2.6563182473182678e-05, 2.8539448976516724e-05, 3.051571547985077e-05, 3.2491981983184814e-05, 3.446824848651886e-05, 3.6444514989852905e-05, 3.842078149318695e-05, 4.0397047996520996e-05, 4.237331449985504e-05, 4.434958100318909e-05, 4.632584750652313e-05, 4.830211400985718e-05, 5.027838051319122e-05, 5.225464701652527e-05, 5.4230913519859314e-05, 5.620718002319336e-05]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 6.0, 6.0, 9.0, 10.0, 12.0, 18.0, 19.0, 17.0, 31.0, 28.0, 36.0, 44.0, 71.0, 108.0, 180.0, 361.0, 1071.0, 46895.0, 974337.0, 23466.0, 877.0, 293.0, 192.0, 117.0, 72.0, 48.0, 40.0, 40.0, 26.0, 27.0, 12.0, 12.0, 18.0, 7.0, 8.0, 16.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013151168823242188, -0.0012704432010650635, -0.0012257695198059082, -0.001181095838546753, -0.0011364221572875977, -0.0010917484760284424, -0.0010470747947692871, -0.0010024011135101318, -0.0009577274322509766, -0.0009130537509918213, -0.000868380069732666, -0.0008237063884735107, -0.0007790327072143555, -0.0007343590259552002, -0.0006896853446960449, -0.0006450116634368896, -0.0006003379821777344, -0.0005556643009185791, -0.0005109906196594238, -0.00046631693840026855, -0.0004216432571411133, -0.000376969575881958, -0.00033229589462280273, -0.00028762221336364746, -0.0002429485321044922, -0.00019827485084533691, -0.00015360116958618164, -0.00010892748832702637, -6.42538070678711e-05, -1.958012580871582e-05, 2.5093555450439453e-05, 6.976723670959473e-05, 0.00011444091796875, 0.00015911459922790527, 0.00020378828048706055, 0.0002484619617462158, 0.0002931356430053711, 0.00033780932426452637, 0.00038248300552368164, 0.0004271566867828369, 0.0004718303680419922, 0.0005165040493011475, 0.0005611777305603027, 0.000605851411819458, 0.0006505250930786133, 0.0006951987743377686, 0.0007398724555969238, 0.0007845461368560791, 0.0008292198181152344, 0.0008738934993743896, 0.0009185671806335449, 0.0009632408618927002, 0.0010079145431518555, 0.0010525882244110107, 0.001097261905670166, 0.0011419355869293213, 0.0011866092681884766, 0.0012312829494476318, 0.0012759566307067871, 0.0013206303119659424, 0.0013653039932250977, 0.001409977674484253, 0.0014546513557434082, 0.0014993250370025635, 0.0015439987182617188]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 10.0, 38.0, 120.0, 298.0, 321.0, 156.0, 47.0, 11.0, 10.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.975300569436513e-05, -3.3293083106400445e-05, -2.683316051843576e-05, -2.0373237930471078e-05, -1.3913315342506394e-05, -7.45339275454171e-06, -9.934701665770262e-07, 5.4664524213876575e-06, 1.1926375009352341e-05, 1.8386297597317025e-05, 2.484622018528171e-05, 3.130614277324639e-05, 3.7766065361211076e-05, 4.422598794917576e-05, 5.0685910537140444e-05, 5.714583312510513e-05, 6.3605752075091e-05, 7.006567466305569e-05, 7.652559725102037e-05, 8.298551983898506e-05, 8.944544242694974e-05, 9.590536501491442e-05, 0.00010236528760287911, 0.00010882521019084379, 0.00011528513277880847, 0.00012174505536677316, 0.00012820497795473784, 0.00013466490781866014, 0.0001411248231306672, 0.00014758473844267428, 0.00015404466830659658, 0.00016050459817051888, 0.00016696451348252594, 0.00017342442879453301, 0.0001798843586584553, 0.0001863442885223776, 0.00019280420383438468, 0.00019926411914639175, 0.00020572404901031405, 0.00021218397887423635, 0.00021864389418624341, 0.00022510380949825048, 0.00023156373936217278, 0.00023802366922609508, 0.00024448358453810215, 0.0002509434998501092, 0.0002574034151621163, 0.0002638633595779538, 0.0002703232748899609, 0.00027678319020196795, 0.0002832431346178055, 0.00028970304992981255, 0.0002961629652418196, 0.0003026228805538267, 0.00030908279586583376, 0.0003155427402816713, 0.00032200265559367836, 0.0003284625709056854, 0.00033492251532152295, 0.00034138243063353, 0.0003478423459455371, 0.00035430226125754416, 0.00036076217656955123, 0.00036722212098538876, 0.0003736820362973958]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 7.0, 7.0, 3.0, 7.0, 4.0, 6.0, 7.0, 11.0, 6.0, 14.0, 19.0, 22.0, 14.0, 21.0, 24.0, 26.0, 32.0, 27.0, 24.0, 32.0, 36.0, 38.0, 37.0, 24.0, 39.0, 41.0, 35.0, 34.0, 32.0, 21.0, 29.0, 32.0, 27.0, 26.0, 19.0, 24.0, 34.0, 27.0, 20.0, 11.0, 13.0, 13.0, 15.0, 11.0, 12.0, 10.0, 10.0, 3.0, 6.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1948089599609375e-05, -3.0836090445518494e-05, -2.9724091291427612e-05, -2.861209213733673e-05, -2.750009298324585e-05, -2.6388093829154968e-05, -2.5276094675064087e-05, -2.4164095520973206e-05, -2.3052096366882324e-05, -2.1940097212791443e-05, -2.082809805870056e-05, -1.971609890460968e-05, -1.86040997505188e-05, -1.7492100596427917e-05, -1.6380101442337036e-05, -1.5268102288246155e-05, -1.4156103134155273e-05, -1.3044103980064392e-05, -1.193210482597351e-05, -1.082010567188263e-05, -9.708106517791748e-06, -8.596107363700867e-06, -7.484108209609985e-06, -6.372109055519104e-06, -5.260109901428223e-06, -4.148110747337341e-06, -3.03611159324646e-06, -1.9241124391555786e-06, -8.121132850646973e-07, 2.998858690261841e-07, 1.4118850231170654e-06, 2.5238841772079468e-06, 3.635883331298828e-06, 4.7478824853897095e-06, 5.859881639480591e-06, 6.971880793571472e-06, 8.083879947662354e-06, 9.195879101753235e-06, 1.0307878255844116e-05, 1.1419877409934998e-05, 1.2531876564025879e-05, 1.364387571811676e-05, 1.4755874872207642e-05, 1.5867874026298523e-05, 1.6979873180389404e-05, 1.8091872334480286e-05, 1.9203871488571167e-05, 2.031587064266205e-05, 2.142786979675293e-05, 2.253986895084381e-05, 2.3651868104934692e-05, 2.4763867259025574e-05, 2.5875866413116455e-05, 2.6987865567207336e-05, 2.8099864721298218e-05, 2.92118638753891e-05, 3.032386302947998e-05, 3.143586218357086e-05, 3.254786133766174e-05, 3.3659860491752625e-05, 3.4771859645843506e-05, 3.588385879993439e-05, 3.699585795402527e-05, 3.810785710811615e-05, 3.921985626220703e-05]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 4.0, 9.0, 4.0, 12.0, 18.0, 17.0, 18.0, 16.0, 26.0, 23.0, 22.0, 27.0, 21.0, 29.0, 45.0, 46.0, 37.0, 31.0, 49.0, 40.0, 32.0, 39.0, 31.0, 48.0, 37.0, 33.0, 39.0, 34.0, 29.0, 20.0, 15.0, 25.0, 14.0, 18.0, 14.0, 11.0, 5.0, 15.0, 12.0, 6.0, 3.0, 6.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0], "bins": [-7.87109375, -7.6510009765625, -7.430908203125, -7.2108154296875, -6.99072265625, -6.7706298828125, -6.550537109375, -6.3304443359375, -6.1103515625, -5.8902587890625, -5.670166015625, -5.4500732421875, -5.22998046875, -5.0098876953125, -4.789794921875, -4.5697021484375, -4.349609375, -4.1295166015625, -3.909423828125, -3.6893310546875, -3.46923828125, -3.2491455078125, -3.029052734375, -2.8089599609375, -2.5888671875, -2.3687744140625, -2.148681640625, -1.9285888671875, -1.70849609375, -1.4884033203125, -1.268310546875, -1.0482177734375, -0.828125, -0.6080322265625, -0.387939453125, -0.1678466796875, 0.05224609375, 0.2723388671875, 0.492431640625, 0.7125244140625, 0.9326171875, 1.1527099609375, 1.372802734375, 1.5928955078125, 1.81298828125, 2.0330810546875, 2.253173828125, 2.4732666015625, 2.693359375, 2.9134521484375, 3.133544921875, 3.3536376953125, 3.57373046875, 3.7938232421875, 4.013916015625, 4.2340087890625, 4.4541015625, 4.6741943359375, 4.894287109375, 5.1143798828125, 5.33447265625, 5.5545654296875, 5.774658203125, 5.9947509765625, 6.21484375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 10.0, 22.0, 16.0, 37.0, 48.0, 72.0, 109.0, 154.0, 218.0, 374.0, 550.0, 827.0, 1227.0, 2037.0, 3353.0, 5429.0, 9182.0, 14835.0, 24523.0, 40723.0, 71037.0, 136257.0, 279249.0, 215459.0, 102574.0, 56007.0, 32868.0, 19626.0, 12125.0, 7376.0, 4507.0, 2882.0, 1733.0, 1081.0, 671.0, 394.0, 306.0, 186.0, 124.0, 102.0, 67.0, 37.0, 38.0, 21.0, 25.0, 14.0, 9.0, 5.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0], "bins": [-9.671875, -9.376953125, -9.08203125, -8.787109375, -8.4921875, -8.197265625, -7.90234375, -7.607421875, -7.3125, -7.017578125, -6.72265625, -6.427734375, -6.1328125, -5.837890625, -5.54296875, -5.248046875, -4.953125, -4.658203125, -4.36328125, -4.068359375, -3.7734375, -3.478515625, -3.18359375, -2.888671875, -2.59375, -2.298828125, -2.00390625, -1.708984375, -1.4140625, -1.119140625, -0.82421875, -0.529296875, -0.234375, 0.060546875, 0.35546875, 0.650390625, 0.9453125, 1.240234375, 1.53515625, 1.830078125, 2.125, 2.419921875, 2.71484375, 3.009765625, 3.3046875, 3.599609375, 3.89453125, 4.189453125, 4.484375, 4.779296875, 5.07421875, 5.369140625, 5.6640625, 5.958984375, 6.25390625, 6.548828125, 6.84375, 7.138671875, 7.43359375, 7.728515625, 8.0234375, 8.318359375, 8.61328125, 8.908203125, 9.203125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 0.0, 5.0, 6.0, 7.0, 8.0, 11.0, 15.0, 9.0, 14.0, 21.0, 26.0, 30.0, 20.0, 34.0, 37.0, 45.0, 61.0, 50.0, 62.0, 81.0, 153.0, 190.0, 1278.0, 200.0, 133.0, 98.0, 71.0, 64.0, 48.0, 38.0, 35.0, 29.0, 18.0, 28.0, 20.0, 20.0, 11.0, 12.0, 13.0, 13.0, 4.0, 8.0, 7.0, 7.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-18.453125, -17.903564453125, -17.35400390625, -16.804443359375, -16.2548828125, -15.705322265625, -15.15576171875, -14.606201171875, -14.056640625, -13.507080078125, -12.95751953125, -12.407958984375, -11.8583984375, -11.308837890625, -10.75927734375, -10.209716796875, -9.66015625, -9.110595703125, -8.56103515625, -8.011474609375, -7.4619140625, -6.912353515625, -6.36279296875, -5.813232421875, -5.263671875, -4.714111328125, -4.16455078125, -3.614990234375, -3.0654296875, -2.515869140625, -1.96630859375, -1.416748046875, -0.8671875, -0.317626953125, 0.23193359375, 0.781494140625, 1.3310546875, 1.880615234375, 2.43017578125, 2.979736328125, 3.529296875, 4.078857421875, 4.62841796875, 5.177978515625, 5.7275390625, 6.277099609375, 6.82666015625, 7.376220703125, 7.92578125, 8.475341796875, 9.02490234375, 9.574462890625, 10.1240234375, 10.673583984375, 11.22314453125, 11.772705078125, 12.322265625, 12.871826171875, 13.42138671875, 13.970947265625, 14.5205078125, 15.070068359375, 15.61962890625, 16.169189453125, 16.71875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 5.0, 6.0, 5.0, 18.0, 15.0, 13.0, 25.0, 15.0, 36.0, 37.0, 68.0, 85.0, 167.0, 283.0, 585.0, 1369.0, 3808.0, 11319.0, 37795.0, 165770.0, 1550133.0, 1182805.0, 141472.0, 33537.0, 10238.0, 3469.0, 1270.0, 547.0, 282.0, 168.0, 109.0, 60.0, 45.0, 26.0, 32.0, 14.0, 15.0, 9.0, 10.0, 9.0, 5.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.671875, -19.01513671875, -18.3583984375, -17.70166015625, -17.044921875, -16.38818359375, -15.7314453125, -15.07470703125, -14.41796875, -13.76123046875, -13.1044921875, -12.44775390625, -11.791015625, -11.13427734375, -10.4775390625, -9.82080078125, -9.1640625, -8.50732421875, -7.8505859375, -7.19384765625, -6.537109375, -5.88037109375, -5.2236328125, -4.56689453125, -3.91015625, -3.25341796875, -2.5966796875, -1.93994140625, -1.283203125, -0.62646484375, 0.0302734375, 0.68701171875, 1.34375, 2.00048828125, 2.6572265625, 3.31396484375, 3.970703125, 4.62744140625, 5.2841796875, 5.94091796875, 6.59765625, 7.25439453125, 7.9111328125, 8.56787109375, 9.224609375, 9.88134765625, 10.5380859375, 11.19482421875, 11.8515625, 12.50830078125, 13.1650390625, 13.82177734375, 14.478515625, 15.13525390625, 15.7919921875, 16.44873046875, 17.10546875, 17.76220703125, 18.4189453125, 19.07568359375, 19.732421875, 20.38916015625, 21.0458984375, 21.70263671875, 22.359375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [2.0, 14.0, 57.0, 151.0, 270.0, 319.0, 129.0, 51.0, 13.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.686716079711914, -22.20356559753418, -16.720415115356445, -11.237264633178711, -5.754114151000977, -0.2709636688232422, 5.212186813354492, 10.695337295532227, 16.17848777770996, 21.661638259887695, 27.14478874206543, 32.62793731689453, 38.11109161376953, 43.59423828125, 49.077392578125, 54.56053924560547, 60.04369354248047, 65.52684020996094, 71.00999450683594, 76.49314880371094, 81.9762954711914, 87.45944213867188, 92.94259643554688, 98.42575073242188, 103.90889739990234, 109.39204406738281, 114.87519836425781, 120.35835266113281, 125.84149932861328, 131.32464599609375, 136.80780029296875, 142.29095458984375, 147.77410888671875, 153.25726318359375, 158.74041748046875, 164.2235565185547, 169.7067108154297, 175.1898651123047, 180.67300415039062, 186.15615844726562, 191.63931274414062, 197.12246704101562, 202.60562133789062, 208.08876037597656, 213.57191467285156, 219.05506896972656, 224.5382080078125, 230.0213623046875, 235.5045166015625, 240.9876708984375, 246.4708251953125, 251.95396423339844, 257.4371337890625, 262.9202575683594, 268.4034118652344, 273.8865661621094, 279.3697204589844, 284.8528747558594, 290.3360290527344, 295.8191833496094, 301.30230712890625, 306.78546142578125, 312.26861572265625, 317.75177001953125, 323.23492431640625]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 1.0, 4.0, 3.0, 2.0, 6.0, 13.0, 11.0, 14.0, 22.0, 18.0, 17.0, 25.0, 21.0, 37.0, 36.0, 40.0, 39.0, 22.0, 44.0, 48.0, 33.0, 41.0, 33.0, 37.0, 37.0, 44.0, 39.0, 32.0, 34.0, 32.0, 35.0, 29.0, 22.0, 21.0, 19.0, 17.0, 12.0, 12.0, 10.0, 4.0, 9.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.54527282714844, -43.94932556152344, -42.35337829589844, -40.75743103027344, -39.16148376464844, -37.56553268432617, -35.96958541870117, -34.37363815307617, -32.77769088745117, -31.181743621826172, -29.585796356201172, -27.98984718322754, -26.39389991760254, -24.79795265197754, -23.202003479003906, -21.606056213378906, -20.010108947753906, -18.414161682128906, -16.818214416503906, -15.222265243530273, -13.626317977905273, -12.030370712280273, -10.434422492980957, -8.83847427368164, -7.242527008056641, -5.646579265594482, -4.050631523132324, -2.454683780670166, -0.8587360382080078, 0.7372117042541504, 2.3331594467163086, 3.929107666015625, 5.525054931640625, 7.121002674102783, 8.716950416564941, 10.312898635864258, 11.908845901489258, 13.504793167114258, 15.100741386413574, 16.69668960571289, 18.29263687133789, 19.88858413696289, 21.48453140258789, 23.080480575561523, 24.676427841186523, 26.272375106811523, 27.868324279785156, 29.464271545410156, 31.060218811035156, 32.656166076660156, 34.252113342285156, 35.848060607910156, 37.444007873535156, 39.03995895385742, 40.63590621948242, 42.23185348510742, 43.82780075073242, 45.42374801635742, 47.01969528198242, 48.61564254760742, 50.21159362792969, 51.80754089355469, 53.40348815917969, 54.99943542480469, 56.59538269042969]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 7.0, 8.0, 6.0, 6.0, 11.0, 17.0, 19.0, 17.0, 20.0, 23.0, 29.0, 32.0, 36.0, 34.0, 35.0, 46.0, 48.0, 42.0, 38.0, 52.0, 46.0, 43.0, 49.0, 30.0, 32.0, 40.0, 37.0, 30.0, 20.0, 23.0, 18.0, 14.0, 14.0, 12.0, 16.0, 12.0, 6.0, 11.0, 9.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.453125, -8.1912841796875, -7.929443359375, -7.6676025390625, -7.40576171875, -7.1439208984375, -6.882080078125, -6.6202392578125, -6.3583984375, -6.0965576171875, -5.834716796875, -5.5728759765625, -5.31103515625, -5.0491943359375, -4.787353515625, -4.5255126953125, -4.263671875, -4.0018310546875, -3.739990234375, -3.4781494140625, -3.21630859375, -2.9544677734375, -2.692626953125, -2.4307861328125, -2.1689453125, -1.9071044921875, -1.645263671875, -1.3834228515625, -1.12158203125, -0.8597412109375, -0.597900390625, -0.3360595703125, -0.07421875, 0.1876220703125, 0.449462890625, 0.7113037109375, 0.97314453125, 1.2349853515625, 1.496826171875, 1.7586669921875, 2.0205078125, 2.2823486328125, 2.544189453125, 2.8060302734375, 3.06787109375, 3.3297119140625, 3.591552734375, 3.8533935546875, 4.115234375, 4.3770751953125, 4.638916015625, 4.9007568359375, 5.16259765625, 5.4244384765625, 5.686279296875, 5.9481201171875, 6.2099609375, 6.4718017578125, 6.733642578125, 6.9954833984375, 7.25732421875, 7.5191650390625, 7.781005859375, 8.0428466796875, 8.3046875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 4.0, 8.0, 3.0, 13.0, 6.0, 13.0, 22.0, 26.0, 25.0, 28.0, 31.0, 37.0, 67.0, 75.0, 89.0, 137.0, 207.0, 276.0, 474.0, 2628.0, 217296.0, 3959431.0, 11344.0, 784.0, 329.0, 242.0, 174.0, 98.0, 75.0, 79.0, 45.0, 40.0, 24.0, 26.0, 27.0, 25.0, 10.0, 18.0, 10.0, 3.0, 6.0, 7.0, 8.0, 2.0, 7.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.5625, -83.4951171875, -80.427734375, -77.3603515625, -74.29296875, -71.2255859375, -68.158203125, -65.0908203125, -62.0234375, -58.9560546875, -55.888671875, -52.8212890625, -49.75390625, -46.6865234375, -43.619140625, -40.5517578125, -37.484375, -34.4169921875, -31.349609375, -28.2822265625, -25.21484375, -22.1474609375, -19.080078125, -16.0126953125, -12.9453125, -9.8779296875, -6.810546875, -3.7431640625, -0.67578125, 2.3916015625, 5.458984375, 8.5263671875, 11.59375, 14.6611328125, 17.728515625, 20.7958984375, 23.86328125, 26.9306640625, 29.998046875, 33.0654296875, 36.1328125, 39.2001953125, 42.267578125, 45.3349609375, 48.40234375, 51.4697265625, 54.537109375, 57.6044921875, 60.671875, 63.7392578125, 66.806640625, 69.8740234375, 72.94140625, 76.0087890625, 79.076171875, 82.1435546875, 85.2109375, 88.2783203125, 91.345703125, 94.4130859375, 97.48046875, 100.5478515625, 103.615234375, 106.6826171875, 109.75]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 9.0, 6.0, 13.0, 23.0, 34.0, 43.0, 82.0, 107.0, 161.0, 277.0, 631.0, 1131.0, 626.0, 340.0, 187.0, 122.0, 69.0, 61.0, 45.0, 22.0, 33.0, 24.0, 13.0, 3.0, 2.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9375, -13.34423828125, -12.7509765625, -12.15771484375, -11.564453125, -10.97119140625, -10.3779296875, -9.78466796875, -9.19140625, -8.59814453125, -8.0048828125, -7.41162109375, -6.818359375, -6.22509765625, -5.6318359375, -5.03857421875, -4.4453125, -3.85205078125, -3.2587890625, -2.66552734375, -2.072265625, -1.47900390625, -0.8857421875, -0.29248046875, 0.30078125, 0.89404296875, 1.4873046875, 2.08056640625, 2.673828125, 3.26708984375, 3.8603515625, 4.45361328125, 5.046875, 5.64013671875, 6.2333984375, 6.82666015625, 7.419921875, 8.01318359375, 8.6064453125, 9.19970703125, 9.79296875, 10.38623046875, 10.9794921875, 11.57275390625, 12.166015625, 12.75927734375, 13.3525390625, 13.94580078125, 14.5390625, 15.13232421875, 15.7255859375, 16.31884765625, 16.912109375, 17.50537109375, 18.0986328125, 18.69189453125, 19.28515625, 19.87841796875, 20.4716796875, 21.06494140625, 21.658203125, 22.25146484375, 22.8447265625, 23.43798828125, 24.03125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 12.0, 18.0, 20.0, 26.0, 44.0, 81.0, 120.0, 230.0, 491.0, 1931.0, 15550.0, 304799.0, 3738065.0, 122020.0, 8756.0, 1311.0, 401.0, 157.0, 74.0, 44.0, 35.0, 25.0, 20.0, 13.0, 11.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-63.96875, -62.34375, -60.71875, -59.09375, -57.46875, -55.84375, -54.21875, -52.59375, -50.96875, -49.34375, -47.71875, -46.09375, -44.46875, -42.84375, -41.21875, -39.59375, -37.96875, -36.34375, -34.71875, -33.09375, -31.46875, -29.84375, -28.21875, -26.59375, -24.96875, -23.34375, -21.71875, -20.09375, -18.46875, -16.84375, -15.21875, -13.59375, -11.96875, -10.34375, -8.71875, -7.09375, -5.46875, -3.84375, -2.21875, -0.59375, 1.03125, 2.65625, 4.28125, 5.90625, 7.53125, 9.15625, 10.78125, 12.40625, 14.03125, 15.65625, 17.28125, 18.90625, 20.53125, 22.15625, 23.78125, 25.40625, 27.03125, 28.65625, 30.28125, 31.90625, 33.53125, 35.15625, 36.78125, 38.40625, 40.03125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 63.0, 391.0, 428.0, 115.0, 10.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-235.8079376220703, -224.05015563964844, -212.2923583984375, -200.53457641601562, -188.77679443359375, -177.01901245117188, -165.26123046875, -153.50343322753906, -141.7456512451172, -129.9878692626953, -118.2300796508789, -106.4722900390625, -94.71450805664062, -82.95672607421875, -71.19893646240234, -59.44114685058594, -47.68336486816406, -35.92557907104492, -24.16779327392578, -12.41000747680664, -0.6522216796875, 11.10556411743164, 22.86334991455078, 34.62113952636719, 46.37892150878906, 58.1367073059082, 69.89449310302734, 81.65228271484375, 93.41006469726562, 105.1678466796875, 116.9256362915039, 128.6834259033203, 140.44122314453125, 152.19900512695312, 163.956787109375, 175.71458435058594, 187.4723663330078, 199.2301483154297, 210.98794555664062, 222.7457275390625, 234.50350952148438, 246.26129150390625, 258.0190734863281, 269.77685546875, 281.53466796875, 293.2924499511719, 305.05023193359375, 316.8080139160156, 328.5657958984375, 340.3235778808594, 352.08135986328125, 363.8391418457031, 375.596923828125, 387.354736328125, 399.1125183105469, 410.87030029296875, 422.6280822753906, 434.3858642578125, 446.1436462402344, 457.90142822265625, 469.65924072265625, 481.4170227050781, 493.1748046875, 504.9325866699219, 516.6903686523438]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 4.0, 5.0, 8.0, 17.0, 16.0, 23.0, 15.0, 21.0, 20.0, 26.0, 23.0, 31.0, 34.0, 46.0, 40.0, 52.0, 45.0, 44.0, 50.0, 51.0, 52.0, 34.0, 42.0, 40.0, 28.0, 44.0, 29.0, 20.0, 24.0, 22.0, 16.0, 12.0, 23.0, 11.0, 10.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.05975341796875, -58.14244842529297, -56.22514343261719, -54.307838439941406, -52.390533447265625, -50.473228454589844, -48.5559196472168, -46.638614654541016, -44.721309661865234, -42.80400466918945, -40.88669967651367, -38.96939468383789, -37.052085876464844, -35.13478088378906, -33.21747589111328, -31.3001708984375, -29.38286590576172, -27.465560913085938, -25.548255920410156, -23.630949020385742, -21.71364402770996, -19.79633903503418, -17.879032135009766, -15.961727142333984, -14.044422149658203, -12.127117156982422, -10.209811210632324, -8.292505264282227, -6.375200271606445, -4.457895278930664, -2.5405893325805664, -0.6232833862304688, 1.2940254211425781, 3.2113308906555176, 5.128636360168457, 7.0459418296813965, 8.963247299194336, 10.880552291870117, 12.797858238220215, 14.715164184570312, 16.632469177246094, 18.549774169921875, 20.467079162597656, 22.38438606262207, 24.30169105529785, 26.218996047973633, 28.136302947998047, 30.053607940673828, 31.97091293334961, 33.88821792602539, 35.80552291870117, 37.72282791137695, 39.64013671875, 41.55744171142578, 43.47474670410156, 45.392051696777344, 47.309356689453125, 49.226661682128906, 51.14396667480469, 53.06127166748047, 54.97857666015625, 56.89588165283203, 58.81319046020508, 60.73049545288086, 62.64780044555664]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 10.0, 7.0, 4.0, 11.0, 23.0, 13.0, 16.0, 26.0, 18.0, 27.0, 35.0, 26.0, 36.0, 33.0, 28.0, 37.0, 45.0, 46.0, 40.0, 41.0, 44.0, 39.0, 38.0, 44.0, 34.0, 40.0, 37.0, 29.0, 19.0, 22.0, 15.0, 14.0, 19.0, 11.0, 12.0, 10.0, 9.0, 2.0, 6.0, 10.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-8.7265625, -8.47564697265625, -8.2247314453125, -7.97381591796875, -7.722900390625, -7.47198486328125, -7.2210693359375, -6.97015380859375, -6.71923828125, -6.46832275390625, -6.2174072265625, -5.96649169921875, -5.715576171875, -5.46466064453125, -5.2137451171875, -4.96282958984375, -4.7119140625, -4.46099853515625, -4.2100830078125, -3.95916748046875, -3.708251953125, -3.45733642578125, -3.2064208984375, -2.95550537109375, -2.70458984375, -2.45367431640625, -2.2027587890625, -1.95184326171875, -1.700927734375, -1.45001220703125, -1.1990966796875, -0.94818115234375, -0.697265625, -0.44635009765625, -0.1954345703125, 0.05548095703125, 0.306396484375, 0.55731201171875, 0.8082275390625, 1.05914306640625, 1.31005859375, 1.56097412109375, 1.8118896484375, 2.06280517578125, 2.313720703125, 2.56463623046875, 2.8155517578125, 3.06646728515625, 3.3173828125, 3.56829833984375, 3.8192138671875, 4.07012939453125, 4.321044921875, 4.57196044921875, 4.8228759765625, 5.07379150390625, 5.32470703125, 5.57562255859375, 5.8265380859375, 6.07745361328125, 6.328369140625, 6.57928466796875, 6.8302001953125, 7.08111572265625, 7.33203125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 8.0, 4.0, 18.0, 24.0, 43.0, 33.0, 60.0, 110.0, 117.0, 180.0, 244.0, 371.0, 487.0, 704.0, 953.0, 1406.0, 1966.0, 2841.0, 4048.0, 6003.0, 8869.0, 13263.0, 20760.0, 32380.0, 52109.0, 89495.0, 175147.0, 273393.0, 150118.0, 79626.0, 47219.0, 29158.0, 18684.0, 12243.0, 8169.0, 5659.0, 3836.0, 2648.0, 1783.0, 1263.0, 919.0, 643.0, 413.0, 327.0, 234.0, 172.0, 118.0, 78.0, 67.0, 37.0, 40.0, 23.0, 22.0, 9.0, 7.0, 3.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.2418212890625, -0.2335948944091797, -0.22536849975585938, -0.21714210510253906, -0.20891571044921875, -0.20068931579589844, -0.19246292114257812, -0.1842365264892578, -0.1760101318359375, -0.1677837371826172, -0.15955734252929688, -0.15133094787597656, -0.14310455322265625, -0.13487815856933594, -0.12665176391601562, -0.11842536926269531, -0.110198974609375, -0.10197257995605469, -0.09374618530273438, -0.08551979064941406, -0.07729339599609375, -0.06906700134277344, -0.060840606689453125, -0.05261421203613281, -0.0443878173828125, -0.03616142272949219, -0.027935028076171875, -0.019708633422851562, -0.01148223876953125, -0.0032558441162109375, 0.004970550537109375, 0.013196945190429688, 0.02142333984375, 0.029649734497070312, 0.037876129150390625, 0.04610252380371094, 0.05432891845703125, 0.06255531311035156, 0.07078170776367188, 0.07900810241699219, 0.0872344970703125, 0.09546089172363281, 0.10368728637695312, 0.11191368103027344, 0.12014007568359375, 0.12836647033691406, 0.13659286499023438, 0.1448192596435547, 0.153045654296875, 0.1612720489501953, 0.16949844360351562, 0.17772483825683594, 0.18595123291015625, 0.19417762756347656, 0.20240402221679688, 0.2106304168701172, 0.2188568115234375, 0.2270832061767578, 0.23530960083007812, 0.24353599548339844, 0.25176239013671875, 0.25998878479003906, 0.2682151794433594, 0.2764415740966797, 0.28466796875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 5.0, 5.0, 12.0, 11.0, 8.0, 10.0, 25.0, 19.0, 19.0, 24.0, 40.0, 37.0, 33.0, 39.0, 37.0, 34.0, 41.0, 38.0, 36.0, 1078.0, 26.0, 39.0, 42.0, 43.0, 33.0, 32.0, 31.0, 35.0, 25.0, 26.0, 19.0, 21.0, 17.0, 18.0, 12.0, 14.0, 8.0, 5.0, 6.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.34375, -6.14056396484375, -5.9373779296875, -5.73419189453125, -5.531005859375, -5.32781982421875, -5.1246337890625, -4.92144775390625, -4.71826171875, -4.51507568359375, -4.3118896484375, -4.10870361328125, -3.905517578125, -3.70233154296875, -3.4991455078125, -3.29595947265625, -3.0927734375, -2.88958740234375, -2.6864013671875, -2.48321533203125, -2.280029296875, -2.07684326171875, -1.8736572265625, -1.67047119140625, -1.46728515625, -1.26409912109375, -1.0609130859375, -0.85772705078125, -0.654541015625, -0.45135498046875, -0.2481689453125, -0.04498291015625, 0.158203125, 0.36138916015625, 0.5645751953125, 0.76776123046875, 0.970947265625, 1.17413330078125, 1.3773193359375, 1.58050537109375, 1.78369140625, 1.98687744140625, 2.1900634765625, 2.39324951171875, 2.596435546875, 2.79962158203125, 3.0028076171875, 3.20599365234375, 3.4091796875, 3.61236572265625, 3.8155517578125, 4.01873779296875, 4.221923828125, 4.42510986328125, 4.6282958984375, 4.83148193359375, 5.03466796875, 5.23785400390625, 5.4410400390625, 5.64422607421875, 5.847412109375, 6.05059814453125, 6.2537841796875, 6.45697021484375, 6.66015625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 11.0, 15.0, 32.0, 45.0, 50.0, 109.0, 142.0, 216.0, 337.0, 518.0, 819.0, 1241.0, 2074.0, 3126.0, 5058.0, 8264.0, 13488.0, 22867.0, 38750.0, 68336.0, 132265.0, 1332262.0, 225989.0, 103613.0, 55838.0, 32200.0, 19000.0, 11486.0, 7061.0, 4393.0, 2691.0, 1719.0, 1065.0, 701.0, 477.0, 293.0, 203.0, 130.0, 80.0, 67.0, 32.0, 23.0, 15.0, 9.0, 4.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.234375, -0.2272357940673828, -0.22009658813476562, -0.21295738220214844, -0.20581817626953125, -0.19867897033691406, -0.19153976440429688, -0.1844005584716797, -0.1772613525390625, -0.1701221466064453, -0.16298294067382812, -0.15584373474121094, -0.14870452880859375, -0.14156532287597656, -0.13442611694335938, -0.1272869110107422, -0.120147705078125, -0.11300849914550781, -0.10586929321289062, -0.09873008728027344, -0.09159088134765625, -0.08445167541503906, -0.07731246948242188, -0.07017326354980469, -0.0630340576171875, -0.05589485168457031, -0.048755645751953125, -0.04161643981933594, -0.03447723388671875, -0.027338027954101562, -0.020198822021484375, -0.013059616088867188, -0.00592041015625, 0.0012187957763671875, 0.008358001708984375, 0.015497207641601562, 0.02263641357421875, 0.029775619506835938, 0.036914825439453125, 0.04405403137207031, 0.0511932373046875, 0.05833244323730469, 0.06547164916992188, 0.07261085510253906, 0.07975006103515625, 0.08688926696777344, 0.09402847290039062, 0.10116767883300781, 0.108306884765625, 0.11544609069824219, 0.12258529663085938, 0.12972450256347656, 0.13686370849609375, 0.14400291442871094, 0.15114212036132812, 0.1582813262939453, 0.1654205322265625, 0.1725597381591797, 0.17969894409179688, 0.18683815002441406, 0.19397735595703125, 0.20111656188964844, 0.20825576782226562, 0.2153949737548828, 0.2225341796875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 11.0, 11.0, 12.0, 28.0, 25.0, 25.0, 47.0, 40.0, 46.0, 65.0, 74.0, 52.0, 63.0, 75.0, 64.0, 54.0, 60.0, 39.0, 49.0, 27.0, 28.0, 12.0, 20.0, 19.0, 14.0, 8.0, 5.0, 3.0, 2.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011748075485229492, -0.00011343415826559067, -0.00010938756167888641, -0.00010534096509218216, -0.0001012943685054779, -9.724777191877365e-05, -9.32011753320694e-05, -8.915457874536514e-05, -8.510798215866089e-05, -8.106138557195663e-05, -7.701478898525238e-05, -7.296819239854813e-05, -6.892159581184387e-05, -6.487499922513962e-05, -6.0828402638435364e-05, -5.678180605173111e-05, -5.2735209465026855e-05, -4.86886128783226e-05, -4.464201629161835e-05, -4.059541970491409e-05, -3.654882311820984e-05, -3.2502226531505585e-05, -2.845562994480133e-05, -2.4409033358097076e-05, -2.0362436771392822e-05, -1.6315840184688568e-05, -1.2269243597984314e-05, -8.22264701128006e-06, -4.176050424575806e-06, -1.2945383787155151e-07, 3.917142748832703e-06, 7.963739335536957e-06, 1.2010335922241211e-05, 1.6056932508945465e-05, 2.010352909564972e-05, 2.4150125682353973e-05, 2.8196722269058228e-05, 3.224331885576248e-05, 3.6289915442466736e-05, 4.033651202917099e-05, 4.4383108615875244e-05, 4.84297052025795e-05, 5.247630178928375e-05, 5.6522898375988007e-05, 6.056949496269226e-05, 6.461609154939651e-05, 6.866268813610077e-05, 7.270928472280502e-05, 7.675588130950928e-05, 8.080247789621353e-05, 8.484907448291779e-05, 8.889567106962204e-05, 9.29422676563263e-05, 9.698886424303055e-05, 0.0001010354608297348, 0.00010508205741643906, 0.00010912865400314331, 0.00011317525058984756, 0.00011722184717655182, 0.00012126844376325607, 0.00012531504034996033, 0.00012936163693666458, 0.00013340823352336884, 0.0001374548301100731, 0.00014150142669677734]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 2.0, 4.0, 6.0, 5.0, 11.0, 20.0, 24.0, 25.0, 32.0, 42.0, 78.0, 130.0, 228.0, 843.0, 104607.0, 937995.0, 3553.0, 432.0, 191.0, 87.0, 63.0, 51.0, 37.0, 31.0, 16.0, 9.0, 12.0, 4.0, 5.0, 5.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00336456298828125, -0.003266274929046631, -0.0031679868698120117, -0.0030696988105773926, -0.0029714107513427734, -0.0028731226921081543, -0.002774834632873535, -0.002676546573638916, -0.002578258514404297, -0.0024799704551696777, -0.0023816823959350586, -0.0022833943367004395, -0.0021851062774658203, -0.002086818218231201, -0.001988530158996582, -0.0018902420997619629, -0.0017919540405273438, -0.0016936659812927246, -0.0015953779220581055, -0.0014970898628234863, -0.0013988018035888672, -0.001300513744354248, -0.001202225685119629, -0.0011039376258850098, -0.0010056495666503906, -0.0009073615074157715, -0.0008090734481811523, -0.0007107853889465332, -0.0006124973297119141, -0.0005142092704772949, -0.0004159212112426758, -0.00031763315200805664, -0.0002193450927734375, -0.00012105703353881836, -2.276897430419922e-05, 7.551908493041992e-05, 0.00017380714416503906, 0.0002720952033996582, 0.00037038326263427734, 0.0004686713218688965, 0.0005669593811035156, 0.0006652474403381348, 0.0007635354995727539, 0.000861823558807373, 0.0009601116180419922, 0.0010583996772766113, 0.0011566877365112305, 0.0012549757957458496, 0.0013532638549804688, 0.0014515519142150879, 0.001549839973449707, 0.0016481280326843262, 0.0017464160919189453, 0.0018447041511535645, 0.0019429922103881836, 0.0020412802696228027, 0.002139568328857422, 0.002237856388092041, 0.00233614444732666, 0.0024344325065612793, 0.0025327205657958984, 0.0026310086250305176, 0.0027292966842651367, 0.002827584743499756, 0.002925872802734375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 22.0, 442.0, 527.0, 25.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014449161244556308, -0.0001088781573344022, -7.326470222324133e-05, -3.7651247112080455e-05, -2.0377920009195805e-06, 3.3575663110241294e-05, 6.918911822140217e-05, 0.00010480257333256304, 0.00014041602844372392, 0.0001760294835548848, 0.00021164293866604567, 0.00024725639377720654, 0.0002828698488883674, 0.0003184833039995283, 0.00035409675911068916, 0.00038971021422185004, 0.0004253236693330109, 0.0004609371244441718, 0.0004965505795553327, 0.0005321640055626631, 0.0005677774897776544, 0.0006033909739926457, 0.0006390043999999762, 0.0006746178260073066, 0.0007102313102222979, 0.0007458447944372892, 0.0007814582204446197, 0.0008170716464519501, 0.0008526851306669414, 0.0008882986148819327, 0.0009239120408892632, 0.0009595254668965936, 0.000995138892903924, 0.0010307523189112544, 0.0010663657449185848, 0.001101979287341237, 0.0011375927133485675, 0.001173206139355898, 0.0012088196817785501, 0.0012444331077858806, 0.001280046533793211, 0.0013156599598005414, 0.0013512733858078718, 0.001386886928230524, 0.0014225003542378545, 0.001458113780245185, 0.0014937273226678371, 0.0015293407486751676, 0.001564954174682498, 0.0016005676006898284, 0.0016361810266971588, 0.001671794569119811, 0.0017074079951271415, 0.001743021421134472, 0.0017786349635571241, 0.0018142483895644546, 0.001849861815571785, 0.0018854752415791154, 0.0019210886675864458, 0.001956702210009098, 0.0019923155196011066, 0.002027929062023759, 0.002063542604446411, 0.0020991559140384197, 0.002134769456461072]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 5.0, 3.0, 6.0, 1.0, 20.0, 10.0, 22.0, 21.0, 16.0, 20.0, 23.0, 35.0, 32.0, 32.0, 38.0, 46.0, 53.0, 46.0, 53.0, 64.0, 45.0, 45.0, 44.0, 53.0, 31.0, 30.0, 27.0, 29.0, 24.0, 24.0, 27.0, 17.0, 10.0, 15.0, 13.0, 6.0, 12.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.518861770629883e-05, -9.264517575502396e-05, -9.010173380374908e-05, -8.755829185247421e-05, -8.501484990119934e-05, -8.247140794992447e-05, -7.99279659986496e-05, -7.738452404737473e-05, -7.484108209609985e-05, -7.229764014482498e-05, -6.975419819355011e-05, -6.721075624227524e-05, -6.466731429100037e-05, -6.21238723397255e-05, -5.958043038845062e-05, -5.703698843717575e-05, -5.449354648590088e-05, -5.195010453462601e-05, -4.9406662583351135e-05, -4.6863220632076263e-05, -4.431977868080139e-05, -4.177633672952652e-05, -3.923289477825165e-05, -3.6689452826976776e-05, -3.4146010875701904e-05, -3.160256892442703e-05, -2.905912697315216e-05, -2.651568502187729e-05, -2.3972243070602417e-05, -2.1428801119327545e-05, -1.8885359168052673e-05, -1.63419172167778e-05, -1.379847526550293e-05, -1.1255033314228058e-05, -8.711591362953186e-06, -6.168149411678314e-06, -3.6247074604034424e-06, -1.0812655091285706e-06, 1.4621764421463013e-06, 4.005618393421173e-06, 6.549060344696045e-06, 9.092502295970917e-06, 1.1635944247245789e-05, 1.417938619852066e-05, 1.6722828149795532e-05, 1.9266270101070404e-05, 2.1809712052345276e-05, 2.4353154003620148e-05, 2.689659595489502e-05, 2.944003790616989e-05, 3.198347985744476e-05, 3.4526921808719635e-05, 3.707036375999451e-05, 3.961380571126938e-05, 4.215724766254425e-05, 4.470068961381912e-05, 4.7244131565093994e-05, 4.9787573516368866e-05, 5.233101546764374e-05, 5.487445741891861e-05, 5.741789937019348e-05, 5.996134132146835e-05, 6.250478327274323e-05, 6.50482252240181e-05, 6.759166717529297e-05]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 10.0, 7.0, 4.0, 11.0, 23.0, 13.0, 16.0, 26.0, 18.0, 27.0, 35.0, 26.0, 36.0, 33.0, 28.0, 37.0, 45.0, 46.0, 40.0, 41.0, 44.0, 39.0, 38.0, 44.0, 34.0, 40.0, 37.0, 29.0, 19.0, 22.0, 15.0, 14.0, 19.0, 11.0, 12.0, 10.0, 9.0, 2.0, 6.0, 10.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-8.7265625, -8.47564697265625, -8.2247314453125, -7.97381591796875, -7.722900390625, -7.47198486328125, -7.2210693359375, -6.97015380859375, -6.71923828125, -6.46832275390625, -6.2174072265625, -5.96649169921875, -5.715576171875, -5.46466064453125, -5.2137451171875, -4.96282958984375, -4.7119140625, -4.46099853515625, -4.2100830078125, -3.95916748046875, -3.708251953125, -3.45733642578125, -3.2064208984375, -2.95550537109375, -2.70458984375, -2.45367431640625, -2.2027587890625, -1.95184326171875, -1.700927734375, -1.45001220703125, -1.1990966796875, -0.94818115234375, -0.697265625, -0.44635009765625, -0.1954345703125, 0.05548095703125, 0.306396484375, 0.55731201171875, 0.8082275390625, 1.05914306640625, 1.31005859375, 1.56097412109375, 1.8118896484375, 2.06280517578125, 2.313720703125, 2.56463623046875, 2.8155517578125, 3.06646728515625, 3.3173828125, 3.56829833984375, 3.8192138671875, 4.07012939453125, 4.321044921875, 4.57196044921875, 4.8228759765625, 5.07379150390625, 5.32470703125, 5.57562255859375, 5.8265380859375, 6.07745361328125, 6.328369140625, 6.57928466796875, 6.8302001953125, 7.08111572265625, 7.33203125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 8.0, 7.0, 8.0, 24.0, 28.0, 45.0, 65.0, 121.0, 224.0, 345.0, 617.0, 1046.0, 2066.0, 3737.0, 6968.0, 13882.0, 28570.0, 61396.0, 131333.0, 249701.0, 265547.0, 148388.0, 69733.0, 32518.0, 15415.0, 7650.0, 4067.0, 2235.0, 1179.0, 665.0, 403.0, 220.0, 142.0, 84.0, 49.0, 23.0, 17.0, 15.0, 9.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.96875, -13.5333251953125, -13.097900390625, -12.6624755859375, -12.22705078125, -11.7916259765625, -11.356201171875, -10.9207763671875, -10.4853515625, -10.0499267578125, -9.614501953125, -9.1790771484375, -8.74365234375, -8.3082275390625, -7.872802734375, -7.4373779296875, -7.001953125, -6.5665283203125, -6.131103515625, -5.6956787109375, -5.26025390625, -4.8248291015625, -4.389404296875, -3.9539794921875, -3.5185546875, -3.0831298828125, -2.647705078125, -2.2122802734375, -1.77685546875, -1.3414306640625, -0.906005859375, -0.4705810546875, -0.03515625, 0.4002685546875, 0.835693359375, 1.2711181640625, 1.70654296875, 2.1419677734375, 2.577392578125, 3.0128173828125, 3.4482421875, 3.8836669921875, 4.319091796875, 4.7545166015625, 5.18994140625, 5.6253662109375, 6.060791015625, 6.4962158203125, 6.931640625, 7.3670654296875, 7.802490234375, 8.2379150390625, 8.67333984375, 9.1087646484375, 9.544189453125, 9.9796142578125, 10.4150390625, 10.8504638671875, 11.285888671875, 11.7213134765625, 12.15673828125, 12.5921630859375, 13.027587890625, 13.4630126953125, 13.8984375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 13.0, 10.0, 7.0, 22.0, 27.0, 48.0, 47.0, 50.0, 65.0, 86.0, 143.0, 245.0, 1414.0, 288.0, 189.0, 101.0, 66.0, 65.0, 46.0, 24.0, 16.0, 19.0, 15.0, 16.0, 4.0, 6.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.375, -36.29638671875, -35.2177734375, -34.13916015625, -33.060546875, -31.98193359375, -30.9033203125, -29.82470703125, -28.74609375, -27.66748046875, -26.5888671875, -25.51025390625, -24.431640625, -23.35302734375, -22.2744140625, -21.19580078125, -20.1171875, -19.03857421875, -17.9599609375, -16.88134765625, -15.802734375, -14.72412109375, -13.6455078125, -12.56689453125, -11.48828125, -10.40966796875, -9.3310546875, -8.25244140625, -7.173828125, -6.09521484375, -5.0166015625, -3.93798828125, -2.859375, -1.78076171875, -0.7021484375, 0.37646484375, 1.455078125, 2.53369140625, 3.6123046875, 4.69091796875, 5.76953125, 6.84814453125, 7.9267578125, 9.00537109375, 10.083984375, 11.16259765625, 12.2412109375, 13.31982421875, 14.3984375, 15.47705078125, 16.5556640625, 17.63427734375, 18.712890625, 19.79150390625, 20.8701171875, 21.94873046875, 23.02734375, 24.10595703125, 25.1845703125, 26.26318359375, 27.341796875, 28.42041015625, 29.4990234375, 30.57763671875, 31.65625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 4.0, 12.0, 10.0, 6.0, 15.0, 23.0, 39.0, 50.0, 103.0, 159.0, 233.0, 530.0, 1565.0, 10420.0, 504101.0, 2594181.0, 30091.0, 2580.0, 694.0, 361.0, 174.0, 105.0, 72.0, 42.0, 40.0, 21.0, 19.0, 15.0, 10.0, 5.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-62.34375, -60.5712890625, -58.798828125, -57.0263671875, -55.25390625, -53.4814453125, -51.708984375, -49.9365234375, -48.1640625, -46.3916015625, -44.619140625, -42.8466796875, -41.07421875, -39.3017578125, -37.529296875, -35.7568359375, -33.984375, -32.2119140625, -30.439453125, -28.6669921875, -26.89453125, -25.1220703125, -23.349609375, -21.5771484375, -19.8046875, -18.0322265625, -16.259765625, -14.4873046875, -12.71484375, -10.9423828125, -9.169921875, -7.3974609375, -5.625, -3.8525390625, -2.080078125, -0.3076171875, 1.46484375, 3.2373046875, 5.009765625, 6.7822265625, 8.5546875, 10.3271484375, 12.099609375, 13.8720703125, 15.64453125, 17.4169921875, 19.189453125, 20.9619140625, 22.734375, 24.5068359375, 26.279296875, 28.0517578125, 29.82421875, 31.5966796875, 33.369140625, 35.1416015625, 36.9140625, 38.6865234375, 40.458984375, 42.2314453125, 44.00390625, 45.7763671875, 47.548828125, 49.3212890625, 51.09375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 12.0, 52.0, 212.0, 363.0, 274.0, 80.0, 13.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-466.3736267089844, -456.9913635253906, -447.6091003417969, -438.2268371582031, -428.8445739746094, -419.4623107910156, -410.0800476074219, -400.6977844238281, -391.3155212402344, -381.9332580566406, -372.5509948730469, -363.1687316894531, -353.7864685058594, -344.4042053222656, -335.0219421386719, -325.6396789550781, -316.25738525390625, -306.8751220703125, -297.49285888671875, -288.110595703125, -278.72833251953125, -269.3460693359375, -259.96380615234375, -250.58154296875, -241.19927978515625, -231.8170166015625, -222.43475341796875, -213.052490234375, -203.67022705078125, -194.2879638671875, -184.90570068359375, -175.5234375, -166.1411895751953, -156.75892639160156, -147.3766632080078, -137.99440002441406, -128.6121368408203, -119.22987365722656, -109.84760284423828, -100.46533966064453, -91.08307647705078, -81.70081329345703, -72.31855010986328, -62.936283111572266, -53.554019927978516, -44.171756744384766, -34.78948974609375, -25.4072265625, -16.02496337890625, -6.642699241638184, 2.739564895629883, 12.121829986572266, 21.504093170166016, 30.886356353759766, 40.26862335205078, 49.65088653564453, 59.03314971923828, 68.41541290283203, 77.79767608642578, 87.17994689941406, 96.56221008300781, 105.94447326660156, 115.32673645019531, 124.70899963378906, 134.0912628173828]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 6.0, 9.0, 11.0, 15.0, 18.0, 23.0, 25.0, 20.0, 36.0, 42.0, 35.0, 42.0, 52.0, 55.0, 65.0, 73.0, 60.0, 55.0, 51.0, 56.0, 56.0, 31.0, 35.0, 24.0, 24.0, 20.0, 15.0, 12.0, 8.0, 7.0, 4.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.6611785888672, -129.1174774169922, -125.57376861572266, -122.03006744384766, -118.48636627197266, -114.94265747070312, -111.39895629882812, -107.85525512695312, -104.31155395507812, -100.76785278320312, -97.2241439819336, -93.6804428100586, -90.1367416381836, -86.59303283691406, -83.04933166503906, -79.50563049316406, -75.96192169189453, -72.41822052001953, -68.87451171875, -65.330810546875, -61.787109375, -58.243404388427734, -54.69969940185547, -51.15599822998047, -47.6122932434082, -44.06858825683594, -40.52488708496094, -36.98118209838867, -33.437477111816406, -29.893775939941406, -26.35007095336914, -22.806367874145508, -19.262657165527344, -15.718954086303711, -12.175250053405762, -8.631546020507812, -5.08784294128418, -1.5441398620605469, 1.9995651245117188, 5.543268203735352, 9.086971282958984, 12.630674362182617, 16.17437744140625, 19.718082427978516, 23.26178550720215, 26.80548858642578, 30.349193572998047, 33.89289855957031, 37.43659973144531, 40.98030471801758, 44.52400588989258, 48.067710876464844, 51.611412048339844, 55.15511703491211, 58.698822021484375, 62.242523193359375, 65.78622436523438, 69.32992553710938, 72.8736343383789, 76.4173355102539, 79.9610366821289, 83.50474548339844, 87.04844665527344, 90.59214782714844, 94.13585662841797]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 1.0, 5.0, 1.0, 3.0, 6.0, 5.0, 8.0, 9.0, 17.0, 9.0, 21.0, 17.0, 23.0, 29.0, 26.0, 37.0, 34.0, 32.0, 42.0, 44.0, 39.0, 44.0, 66.0, 53.0, 52.0, 50.0, 36.0, 41.0, 41.0, 35.0, 29.0, 25.0, 30.0, 14.0, 18.0, 15.0, 11.0, 5.0, 7.0, 3.0, 9.0, 3.0, 2.0, 2.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.2904052734375, -8.994873046875, -8.6993408203125, -8.40380859375, -8.1082763671875, -7.812744140625, -7.5172119140625, -7.2216796875, -6.9261474609375, -6.630615234375, -6.3350830078125, -6.03955078125, -5.7440185546875, -5.448486328125, -5.1529541015625, -4.857421875, -4.5618896484375, -4.266357421875, -3.9708251953125, -3.67529296875, -3.3797607421875, -3.084228515625, -2.7886962890625, -2.4931640625, -2.1976318359375, -1.902099609375, -1.6065673828125, -1.31103515625, -1.0155029296875, -0.719970703125, -0.4244384765625, -0.12890625, 0.1666259765625, 0.462158203125, 0.7576904296875, 1.05322265625, 1.3487548828125, 1.644287109375, 1.9398193359375, 2.2353515625, 2.5308837890625, 2.826416015625, 3.1219482421875, 3.41748046875, 3.7130126953125, 4.008544921875, 4.3040771484375, 4.599609375, 4.8951416015625, 5.190673828125, 5.4862060546875, 5.78173828125, 6.0772705078125, 6.372802734375, 6.6683349609375, 6.9638671875, 7.2593994140625, 7.554931640625, 7.8504638671875, 8.14599609375, 8.4415283203125, 8.737060546875, 9.0325927734375, 9.328125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 16.0, 33.0, 38.0, 77.0, 124.0, 250.0, 434.0, 920.0, 1910.0, 4420.0, 12461.0, 49181.0, 382984.0, 3144909.0, 515244.0, 58612.0, 14025.0, 4803.0, 2007.0, 898.0, 410.0, 219.0, 126.0, 60.0, 34.0, 28.0, 15.0, 6.0, 2.0, 8.0, 7.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-33.0, -32.044921875, -31.08984375, -30.134765625, -29.1796875, -28.224609375, -27.26953125, -26.314453125, -25.359375, -24.404296875, -23.44921875, -22.494140625, -21.5390625, -20.583984375, -19.62890625, -18.673828125, -17.71875, -16.763671875, -15.80859375, -14.853515625, -13.8984375, -12.943359375, -11.98828125, -11.033203125, -10.078125, -9.123046875, -8.16796875, -7.212890625, -6.2578125, -5.302734375, -4.34765625, -3.392578125, -2.4375, -1.482421875, -0.52734375, 0.427734375, 1.3828125, 2.337890625, 3.29296875, 4.248046875, 5.203125, 6.158203125, 7.11328125, 8.068359375, 9.0234375, 9.978515625, 10.93359375, 11.888671875, 12.84375, 13.798828125, 14.75390625, 15.708984375, 16.6640625, 17.619140625, 18.57421875, 19.529296875, 20.484375, 21.439453125, 22.39453125, 23.349609375, 24.3046875, 25.259765625, 26.21484375, 27.169921875, 28.125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 0.0, 13.0, 9.0, 26.0, 53.0, 88.0, 235.0, 464.0, 1065.0, 1085.0, 507.0, 244.0, 134.0, 75.0, 36.0, 21.0, 14.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.9375, -51.811279296875, -50.68505859375, -49.558837890625, -48.4326171875, -47.306396484375, -46.18017578125, -45.053955078125, -43.927734375, -42.801513671875, -41.67529296875, -40.549072265625, -39.4228515625, -38.296630859375, -37.17041015625, -36.044189453125, -34.91796875, -33.791748046875, -32.66552734375, -31.539306640625, -30.4130859375, -29.286865234375, -28.16064453125, -27.034423828125, -25.908203125, -24.781982421875, -23.65576171875, -22.529541015625, -21.4033203125, -20.277099609375, -19.15087890625, -18.024658203125, -16.8984375, -15.772216796875, -14.64599609375, -13.519775390625, -12.3935546875, -11.267333984375, -10.14111328125, -9.014892578125, -7.888671875, -6.762451171875, -5.63623046875, -4.510009765625, -3.3837890625, -2.257568359375, -1.13134765625, -0.005126953125, 1.12109375, 2.247314453125, 3.37353515625, 4.499755859375, 5.6259765625, 6.752197265625, 7.87841796875, 9.004638671875, 10.130859375, 11.257080078125, 12.38330078125, 13.509521484375, 14.6357421875, 15.761962890625, 16.88818359375, 18.014404296875, 19.140625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 12.0, 16.0, 15.0, 34.0, 68.0, 121.0, 256.0, 703.0, 2487.0, 18548.0, 527641.0, 3548602.0, 87777.0, 6023.0, 1148.0, 402.0, 203.0, 99.0, 50.0, 28.0, 22.0, 11.0, 12.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.46875, -57.62548828125, -55.7822265625, -53.93896484375, -52.095703125, -50.25244140625, -48.4091796875, -46.56591796875, -44.72265625, -42.87939453125, -41.0361328125, -39.19287109375, -37.349609375, -35.50634765625, -33.6630859375, -31.81982421875, -29.9765625, -28.13330078125, -26.2900390625, -24.44677734375, -22.603515625, -20.76025390625, -18.9169921875, -17.07373046875, -15.23046875, -13.38720703125, -11.5439453125, -9.70068359375, -7.857421875, -6.01416015625, -4.1708984375, -2.32763671875, -0.484375, 1.35888671875, 3.2021484375, 5.04541015625, 6.888671875, 8.73193359375, 10.5751953125, 12.41845703125, 14.26171875, 16.10498046875, 17.9482421875, 19.79150390625, 21.634765625, 23.47802734375, 25.3212890625, 27.16455078125, 29.0078125, 30.85107421875, 32.6943359375, 34.53759765625, 36.380859375, 38.22412109375, 40.0673828125, 41.91064453125, 43.75390625, 45.59716796875, 47.4404296875, 49.28369140625, 51.126953125, 52.97021484375, 54.8134765625, 56.65673828125, 58.5]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 8.0, 133.0, 649.0, 212.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-435.26348876953125, -417.5155334472656, -399.7675476074219, -382.01959228515625, -364.2716064453125, -346.5236511230469, -328.77569580078125, -311.0277099609375, -293.27972412109375, -275.5317687988281, -257.7837829589844, -240.03582763671875, -222.287841796875, -204.53988647460938, -186.7919158935547, -169.0439453125, -151.29598999023438, -133.5480194091797, -115.800048828125, -98.05208587646484, -80.30411529541016, -62.55614471435547, -44.80818176269531, -27.060211181640625, -9.312240600585938, 8.435728073120117, 26.183696746826172, 43.931663513183594, 61.67963409423828, 79.42760467529297, 97.17556762695312, 114.92353820800781, 132.6715087890625, 150.4194793701172, 168.16744995117188, 185.9154052734375, 203.66339111328125, 221.41134643554688, 239.15931701660156, 256.90728759765625, 274.6552734375, 292.4032287597656, 310.1512145996094, 327.899169921875, 345.64715576171875, 363.3951110839844, 381.14306640625, 398.89105224609375, 416.6390075683594, 434.386962890625, 452.13494873046875, 469.8829040527344, 487.6308898925781, 505.37884521484375, 523.1268310546875, 540.874755859375, 558.6227416992188, 576.3707275390625, 594.11865234375, 611.8666381835938, 629.6146240234375, 647.3626098632812, 665.1105346679688, 682.8585205078125, 700.6065063476562]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 6.0, 11.0, 13.0, 14.0, 23.0, 18.0, 31.0, 29.0, 30.0, 41.0, 46.0, 53.0, 57.0, 48.0, 58.0, 71.0, 56.0, 49.0, 45.0, 59.0, 48.0, 41.0, 29.0, 26.0, 22.0, 11.0, 22.0, 13.0, 9.0, 4.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-107.16656494140625, -104.37073516845703, -101.57489776611328, -98.77906799316406, -95.98323059082031, -93.1874008178711, -90.39157104492188, -87.59573364257812, -84.7999038696289, -82.00407409667969, -79.20823669433594, -76.41240692138672, -73.6165771484375, -70.82073974609375, -68.02490997314453, -65.22908020019531, -62.43324279785156, -59.63740921020508, -56.841575622558594, -54.045745849609375, -51.24991226196289, -48.454078674316406, -45.65824890136719, -42.8624153137207, -40.06658172607422, -37.270748138427734, -34.47491455078125, -31.67908477783203, -28.883251190185547, -26.087417602539062, -23.29158592224121, -20.49575424194336, -17.699920654296875, -14.904088020324707, -12.108255386352539, -9.312422752380371, -6.516590118408203, -3.720757484436035, -0.9249248504638672, 1.8709068298339844, 4.666740417480469, 7.462573051452637, 10.258405685424805, 13.054238319396973, 15.85007095336914, 18.645904541015625, 21.441736221313477, 24.237567901611328, 27.033401489257812, 29.829235076904297, 32.62506866455078, 35.4208984375, 38.216732025146484, 41.01256561279297, 43.80839538574219, 46.60422897338867, 49.400062561035156, 52.19589614868164, 54.991729736328125, 57.787559509277344, 60.58339309692383, 63.37922668457031, 66.17505645751953, 68.97088623046875, 71.7667236328125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 8.0, 10.0, 14.0, 15.0, 28.0, 15.0, 17.0, 35.0, 30.0, 44.0, 49.0, 48.0, 53.0, 50.0, 57.0, 69.0, 48.0, 55.0, 54.0, 49.0, 52.0, 43.0, 26.0, 24.0, 18.0, 22.0, 12.0, 10.0, 14.0, 9.0, 6.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2578125, -8.9281005859375, -8.598388671875, -8.2686767578125, -7.93896484375, -7.6092529296875, -7.279541015625, -6.9498291015625, -6.6201171875, -6.2904052734375, -5.960693359375, -5.6309814453125, -5.30126953125, -4.9715576171875, -4.641845703125, -4.3121337890625, -3.982421875, -3.6527099609375, -3.322998046875, -2.9932861328125, -2.66357421875, -2.3338623046875, -2.004150390625, -1.6744384765625, -1.3447265625, -1.0150146484375, -0.685302734375, -0.3555908203125, -0.02587890625, 0.3038330078125, 0.633544921875, 0.9632568359375, 1.29296875, 1.6226806640625, 1.952392578125, 2.2821044921875, 2.61181640625, 2.9415283203125, 3.271240234375, 3.6009521484375, 3.9306640625, 4.2603759765625, 4.590087890625, 4.9197998046875, 5.24951171875, 5.5792236328125, 5.908935546875, 6.2386474609375, 6.568359375, 6.8980712890625, 7.227783203125, 7.5574951171875, 7.88720703125, 8.2169189453125, 8.546630859375, 8.8763427734375, 9.2060546875, 9.5357666015625, 9.865478515625, 10.1951904296875, 10.52490234375, 10.8546142578125, 11.184326171875, 11.5140380859375, 11.84375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 6.0, 10.0, 8.0, 12.0, 21.0, 42.0, 52.0, 74.0, 128.0, 199.0, 312.0, 577.0, 932.0, 1767.0, 3142.0, 5882.0, 10862.0, 20660.0, 42201.0, 96741.0, 301245.0, 357247.0, 110139.0, 47332.0, 22794.0, 11933.0, 6331.0, 3444.0, 1914.0, 1022.0, 608.0, 351.0, 210.0, 141.0, 60.0, 55.0, 38.0, 23.0, 17.0, 8.0, 6.0, 8.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.463623046875, -0.4496040344238281, -0.43558502197265625, -0.4215660095214844, -0.4075469970703125, -0.3935279846191406, -0.37950897216796875, -0.3654899597167969, -0.351470947265625, -0.3374519348144531, -0.32343292236328125, -0.3094139099121094, -0.2953948974609375, -0.2813758850097656, -0.26735687255859375, -0.2533378601074219, -0.23931884765625, -0.22529983520507812, -0.21128082275390625, -0.19726181030273438, -0.1832427978515625, -0.16922378540039062, -0.15520477294921875, -0.14118576049804688, -0.127166748046875, -0.11314773559570312, -0.09912872314453125, -0.08510971069335938, -0.0710906982421875, -0.057071685791015625, -0.04305267333984375, -0.029033660888671875, -0.0150146484375, -0.000995635986328125, 0.01302337646484375, 0.027042388916015625, 0.0410614013671875, 0.055080413818359375, 0.06909942626953125, 0.08311843872070312, 0.097137451171875, 0.11115646362304688, 0.12517547607421875, 0.13919448852539062, 0.1532135009765625, 0.16723251342773438, 0.18125152587890625, 0.19527053833007812, 0.20928955078125, 0.22330856323242188, 0.23732757568359375, 0.2513465881347656, 0.2653656005859375, 0.2793846130371094, 0.29340362548828125, 0.3074226379394531, 0.321441650390625, 0.3354606628417969, 0.34947967529296875, 0.3634986877441406, 0.3775177001953125, 0.3915367126464844, 0.40555572509765625, 0.4195747375488281, 0.43359375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 3.0, 8.0, 6.0, 10.0, 13.0, 11.0, 27.0, 14.0, 13.0, 17.0, 26.0, 16.0, 27.0, 29.0, 22.0, 29.0, 37.0, 39.0, 32.0, 38.0, 37.0, 25.0, 1052.0, 35.0, 28.0, 33.0, 32.0, 39.0, 35.0, 28.0, 36.0, 24.0, 22.0, 22.0, 22.0, 16.0, 11.0, 18.0, 13.0, 11.0, 19.0, 12.0, 13.0, 6.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.3203125, -5.137939453125, -4.95556640625, -4.773193359375, -4.5908203125, -4.408447265625, -4.22607421875, -4.043701171875, -3.861328125, -3.678955078125, -3.49658203125, -3.314208984375, -3.1318359375, -2.949462890625, -2.76708984375, -2.584716796875, -2.40234375, -2.219970703125, -2.03759765625, -1.855224609375, -1.6728515625, -1.490478515625, -1.30810546875, -1.125732421875, -0.943359375, -0.760986328125, -0.57861328125, -0.396240234375, -0.2138671875, -0.031494140625, 0.15087890625, 0.333251953125, 0.515625, 0.697998046875, 0.88037109375, 1.062744140625, 1.2451171875, 1.427490234375, 1.60986328125, 1.792236328125, 1.974609375, 2.156982421875, 2.33935546875, 2.521728515625, 2.7041015625, 2.886474609375, 3.06884765625, 3.251220703125, 3.43359375, 3.615966796875, 3.79833984375, 3.980712890625, 4.1630859375, 4.345458984375, 4.52783203125, 4.710205078125, 4.892578125, 5.074951171875, 5.25732421875, 5.439697265625, 5.6220703125, 5.804443359375, 5.98681640625, 6.169189453125, 6.3515625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 4.0, 7.0, 10.0, 18.0, 23.0, 33.0, 48.0, 64.0, 119.0, 168.0, 231.0, 414.0, 652.0, 984.0, 1446.0, 2222.0, 3463.0, 5202.0, 7954.0, 12408.0, 19276.0, 29108.0, 46736.0, 79327.0, 150575.0, 1319005.0, 179441.0, 91903.0, 52767.0, 32761.0, 21268.0, 13705.0, 8932.0, 5820.0, 3817.0, 2475.0, 1723.0, 1055.0, 667.0, 472.0, 241.0, 211.0, 138.0, 89.0, 53.0, 37.0, 25.0, 16.0, 11.0, 8.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1893310546875, -0.1829395294189453, -0.17654800415039062, -0.17015647888183594, -0.16376495361328125, -0.15737342834472656, -0.15098190307617188, -0.1445903778076172, -0.1381988525390625, -0.1318073272705078, -0.12541580200195312, -0.11902427673339844, -0.11263275146484375, -0.10624122619628906, -0.09984970092773438, -0.09345817565917969, -0.087066650390625, -0.08067512512207031, -0.07428359985351562, -0.06789207458496094, -0.06150054931640625, -0.05510902404785156, -0.048717498779296875, -0.04232597351074219, -0.0359344482421875, -0.029542922973632812, -0.023151397705078125, -0.016759872436523438, -0.01036834716796875, -0.0039768218994140625, 0.002414703369140625, 0.008806228637695312, 0.01519775390625, 0.021589279174804688, 0.027980804443359375, 0.03437232971191406, 0.04076385498046875, 0.04715538024902344, 0.053546905517578125, 0.05993843078613281, 0.0663299560546875, 0.07272148132324219, 0.07911300659179688, 0.08550453186035156, 0.09189605712890625, 0.09828758239746094, 0.10467910766601562, 0.11107063293457031, 0.117462158203125, 0.12385368347167969, 0.13024520874023438, 0.13663673400878906, 0.14302825927734375, 0.14941978454589844, 0.15581130981445312, 0.1622028350830078, 0.1685943603515625, 0.1749858856201172, 0.18137741088867188, 0.18776893615722656, 0.19416046142578125, 0.20055198669433594, 0.20694351196289062, 0.2133350372314453, 0.2197265625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 9.0, 0.0, 3.0, 5.0, 8.0, 4.0, 7.0, 7.0, 10.0, 21.0, 16.0, 16.0, 15.0, 16.0, 31.0, 34.0, 33.0, 31.0, 32.0, 51.0, 38.0, 49.0, 53.0, 41.0, 47.0, 42.0, 41.0, 36.0, 48.0, 21.0, 33.0, 30.0, 32.0, 32.0, 20.0, 22.0, 14.0, 12.0, 10.0, 6.0, 6.0, 5.0, 9.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011259317398071289, -0.00010904483497142792, -0.00010549649596214294, -0.00010194815695285797, -9.8399817943573e-05, -9.485147893428802e-05, -9.130313992500305e-05, -8.775480091571808e-05, -8.42064619064331e-05, -8.065812289714813e-05, -7.710978388786316e-05, -7.356144487857819e-05, -7.001310586929321e-05, -6.646476686000824e-05, -6.291642785072327e-05, -5.9368088841438293e-05, -5.581974983215332e-05, -5.227141082286835e-05, -4.8723071813583374e-05, -4.51747328042984e-05, -4.162639379501343e-05, -3.8078054785728455e-05, -3.452971577644348e-05, -3.098137676715851e-05, -2.7433037757873535e-05, -2.3884698748588562e-05, -2.033635973930359e-05, -1.6788020730018616e-05, -1.3239681720733643e-05, -9.69134271144867e-06, -6.143003702163696e-06, -2.594664692878723e-06, 9.5367431640625e-07, 4.502013325691223e-06, 8.050352334976196e-06, 1.159869134426117e-05, 1.5147030353546143e-05, 1.8695369362831116e-05, 2.224370837211609e-05, 2.5792047381401062e-05, 2.9340386390686035e-05, 3.288872539997101e-05, 3.643706440925598e-05, 3.9985403418540955e-05, 4.353374242782593e-05, 4.70820814371109e-05, 5.0630420446395874e-05, 5.417875945568085e-05, 5.772709846496582e-05, 6.12754374742508e-05, 6.482377648353577e-05, 6.837211549282074e-05, 7.192045450210571e-05, 7.546879351139069e-05, 7.901713252067566e-05, 8.256547152996063e-05, 8.61138105392456e-05, 8.966214954853058e-05, 9.321048855781555e-05, 9.675882756710052e-05, 0.0001003071665763855, 0.00010385550558567047, 0.00010740384459495544, 0.00011095218360424042, 0.00011450052261352539]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 7.0, 5.0, 12.0, 3.0, 4.0, 9.0, 11.0, 14.0, 14.0, 26.0, 35.0, 41.0, 35.0, 46.0, 70.0, 87.0, 144.0, 194.0, 358.0, 1323.0, 28639.0, 860643.0, 152061.0, 3392.0, 524.0, 244.0, 143.0, 105.0, 71.0, 55.0, 49.0, 33.0, 22.0, 33.0, 17.0, 22.0, 15.0, 11.0, 10.0, 7.0, 7.0, 5.0, 3.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020847320556640625, -0.002016812562942505, -0.0019488930702209473, -0.0018809735774993896, -0.001813054084777832, -0.0017451345920562744, -0.0016772150993347168, -0.0016092956066131592, -0.0015413761138916016, -0.001473456621170044, -0.0014055371284484863, -0.0013376176357269287, -0.001269698143005371, -0.0012017786502838135, -0.0011338591575622559, -0.0010659396648406982, -0.0009980201721191406, -0.000930100679397583, -0.0008621811866760254, -0.0007942616939544678, -0.0007263422012329102, -0.0006584227085113525, -0.0005905032157897949, -0.0005225837230682373, -0.0004546642303466797, -0.00038674473762512207, -0.00031882524490356445, -0.00025090575218200684, -0.00018298625946044922, -0.0001150667667388916, -4.7147274017333984e-05, 2.0772218704223633e-05, 8.869171142578125e-05, 0.00015661120414733887, 0.00022453069686889648, 0.0002924501895904541, 0.0003603696823120117, 0.00042828917503356934, 0.000496208667755127, 0.0005641281604766846, 0.0006320476531982422, 0.0006999671459197998, 0.0007678866386413574, 0.000835806131362915, 0.0009037256240844727, 0.0009716451168060303, 0.0010395646095275879, 0.0011074841022491455, 0.0011754035949707031, 0.0012433230876922607, 0.0013112425804138184, 0.001379162073135376, 0.0014470815658569336, 0.0015150010585784912, 0.0015829205513000488, 0.0016508400440216064, 0.001718759536743164, 0.0017866790294647217, 0.0018545985221862793, 0.001922518014907837, 0.0019904375076293945, 0.002058357000350952, 0.0021262764930725098, 0.0021941959857940674, 0.002262115478515625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 10.0, 14.0, 51.0, 137.0, 276.0, 284.0, 153.0, 66.0, 16.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010223874414805323, -8.94940021680668e-05, -7.674926018808037e-05, -6.400451093213633e-05, -5.12597689521499e-05, -3.851502697216347e-05, -2.5770277716219425e-05, -1.3025535736232996e-05, -2.8079375624656677e-07, 1.2463950042729266e-05, 2.52086938417051e-05, 3.7953439459670335e-05, 5.0698181439656764e-05, 6.34429234196432e-05, 7.618767267558724e-05, 8.893241465557367e-05, 0.0001016771566355601, 0.00011442189861554652, 0.00012716664059553295, 0.0001399113971274346, 0.00015265613910742104, 0.00016540088108740747, 0.0001781456230673939, 0.00019089036504738033, 0.00020363510702736676, 0.0002163798490073532, 0.00022912459098733962, 0.00024186933296732605, 0.0002546140749473125, 0.0002673588169272989, 0.0002801035880111158, 0.0002928483299911022, 0.00030559307197108865, 0.0003183378139510751, 0.0003310825559310615, 0.00034382729791104794, 0.00035657203989103436, 0.0003693167818710208, 0.0003820615238510072, 0.00039480626583099365, 0.0004075510078109801, 0.0004202957497909665, 0.00043304049177095294, 0.00044578523375093937, 0.0004585299757309258, 0.00047127471771091223, 0.00048401945969089866, 0.0004967642016708851, 0.0005095090018585324, 0.0005222537438385189, 0.0005349984858185053, 0.0005477432277984917, 0.0005604879697784781, 0.0005732327117584646, 0.000585977453738451, 0.0005987221957184374, 0.0006114669376984239, 0.0006242116796784103, 0.0006369564216583967, 0.0006497011636383832, 0.0006624459056183696, 0.000675190647598356, 0.0006879353895783424, 0.0007006801315583289, 0.0007134248735383153]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 5.0, 5.0, 5.0, 9.0, 11.0, 12.0, 13.0, 14.0, 12.0, 17.0, 14.0, 25.0, 26.0, 35.0, 27.0, 34.0, 47.0, 32.0, 44.0, 39.0, 41.0, 46.0, 44.0, 29.0, 37.0, 31.0, 36.0, 33.0, 28.0, 28.0, 33.0, 25.0, 31.0, 20.0, 19.0, 18.0, 12.0, 10.0, 11.0, 13.0, 8.0, 5.0, 5.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.434057235717773e-05, -8.173007518053055e-05, -7.911957800388336e-05, -7.650908082723618e-05, -7.389858365058899e-05, -7.12880864739418e-05, -6.867758929729462e-05, -6.606709212064743e-05, -6.345659494400024e-05, -6.084609776735306e-05, -5.823560059070587e-05, -5.5625103414058685e-05, -5.30146062374115e-05, -5.040410906076431e-05, -4.7793611884117126e-05, -4.518311470746994e-05, -4.2572617530822754e-05, -3.996212035417557e-05, -3.735162317752838e-05, -3.4741126000881195e-05, -3.213062882423401e-05, -2.9520131647586823e-05, -2.6909634470939636e-05, -2.429913729429245e-05, -2.1688640117645264e-05, -1.9078142940998077e-05, -1.646764576435089e-05, -1.3857148587703705e-05, -1.1246651411056519e-05, -8.636154234409332e-06, -6.025657057762146e-06, -3.4151598811149597e-06, -8.046627044677734e-07, 1.8058344721794128e-06, 4.416331648826599e-06, 7.026828825473785e-06, 9.637326002120972e-06, 1.2247823178768158e-05, 1.4858320355415344e-05, 1.746881753206253e-05, 2.0079314708709717e-05, 2.2689811885356903e-05, 2.530030906200409e-05, 2.7910806238651276e-05, 3.052130341529846e-05, 3.313180059194565e-05, 3.5742297768592834e-05, 3.835279494524002e-05, 4.096329212188721e-05, 4.357378929853439e-05, 4.618428647518158e-05, 4.8794783651828766e-05, 5.140528082847595e-05, 5.401577800512314e-05, 5.6626275181770325e-05, 5.923677235841751e-05, 6.18472695350647e-05, 6.445776671171188e-05, 6.706826388835907e-05, 6.967876106500626e-05, 7.228925824165344e-05, 7.489975541830063e-05, 7.751025259494781e-05, 8.0120749771595e-05, 8.273124694824219e-05]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 8.0, 10.0, 14.0, 15.0, 28.0, 15.0, 17.0, 35.0, 30.0, 44.0, 49.0, 48.0, 53.0, 50.0, 57.0, 69.0, 48.0, 55.0, 54.0, 49.0, 52.0, 43.0, 26.0, 24.0, 18.0, 22.0, 12.0, 10.0, 14.0, 9.0, 6.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2578125, -8.9281005859375, -8.598388671875, -8.2686767578125, -7.93896484375, -7.6092529296875, -7.279541015625, -6.9498291015625, -6.6201171875, -6.2904052734375, -5.960693359375, -5.6309814453125, -5.30126953125, -4.9715576171875, -4.641845703125, -4.3121337890625, -3.982421875, -3.6527099609375, -3.322998046875, -2.9932861328125, -2.66357421875, -2.3338623046875, -2.004150390625, -1.6744384765625, -1.3447265625, -1.0150146484375, -0.685302734375, -0.3555908203125, -0.02587890625, 0.3038330078125, 0.633544921875, 0.9632568359375, 1.29296875, 1.6226806640625, 1.952392578125, 2.2821044921875, 2.61181640625, 2.9415283203125, 3.271240234375, 3.6009521484375, 3.9306640625, 4.2603759765625, 4.590087890625, 4.9197998046875, 5.24951171875, 5.5792236328125, 5.908935546875, 6.2386474609375, 6.568359375, 6.8980712890625, 7.227783203125, 7.5574951171875, 7.88720703125, 8.2169189453125, 8.546630859375, 8.8763427734375, 9.2060546875, 9.5357666015625, 9.865478515625, 10.1951904296875, 10.52490234375, 10.8546142578125, 11.184326171875, 11.5140380859375, 11.84375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 5.0, 3.0, 8.0, 14.0, 16.0, 24.0, 26.0, 49.0, 55.0, 87.0, 137.0, 224.0, 381.0, 704.0, 1312.0, 2578.0, 5296.0, 12659.0, 33760.0, 102700.0, 337400.0, 371573.0, 116290.0, 37618.0, 13814.0, 5699.0, 2848.0, 1439.0, 735.0, 364.0, 258.0, 168.0, 104.0, 60.0, 45.0, 30.0, 21.0, 10.0, 9.0, 13.0, 5.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.28125, -17.744384765625, -17.20751953125, -16.670654296875, -16.1337890625, -15.596923828125, -15.06005859375, -14.523193359375, -13.986328125, -13.449462890625, -12.91259765625, -12.375732421875, -11.8388671875, -11.302001953125, -10.76513671875, -10.228271484375, -9.69140625, -9.154541015625, -8.61767578125, -8.080810546875, -7.5439453125, -7.007080078125, -6.47021484375, -5.933349609375, -5.396484375, -4.859619140625, -4.32275390625, -3.785888671875, -3.2490234375, -2.712158203125, -2.17529296875, -1.638427734375, -1.1015625, -0.564697265625, -0.02783203125, 0.509033203125, 1.0458984375, 1.582763671875, 2.11962890625, 2.656494140625, 3.193359375, 3.730224609375, 4.26708984375, 4.803955078125, 5.3408203125, 5.877685546875, 6.41455078125, 6.951416015625, 7.48828125, 8.025146484375, 8.56201171875, 9.098876953125, 9.6357421875, 10.172607421875, 10.70947265625, 11.246337890625, 11.783203125, 12.320068359375, 12.85693359375, 13.393798828125, 13.9306640625, 14.467529296875, 15.00439453125, 15.541259765625, 16.078125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 6.0, 7.0, 6.0, 5.0, 10.0, 14.0, 21.0, 15.0, 21.0, 42.0, 37.0, 48.0, 64.0, 90.0, 135.0, 177.0, 1356.0, 268.0, 193.0, 138.0, 80.0, 67.0, 58.0, 36.0, 42.0, 29.0, 22.0, 19.0, 8.0, 9.0, 10.0, 8.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.4375, -23.58984375, -22.7421875, -21.89453125, -21.046875, -20.19921875, -19.3515625, -18.50390625, -17.65625, -16.80859375, -15.9609375, -15.11328125, -14.265625, -13.41796875, -12.5703125, -11.72265625, -10.875, -10.02734375, -9.1796875, -8.33203125, -7.484375, -6.63671875, -5.7890625, -4.94140625, -4.09375, -3.24609375, -2.3984375, -1.55078125, -0.703125, 0.14453125, 0.9921875, 1.83984375, 2.6875, 3.53515625, 4.3828125, 5.23046875, 6.078125, 6.92578125, 7.7734375, 8.62109375, 9.46875, 10.31640625, 11.1640625, 12.01171875, 12.859375, 13.70703125, 14.5546875, 15.40234375, 16.25, 17.09765625, 17.9453125, 18.79296875, 19.640625, 20.48828125, 21.3359375, 22.18359375, 23.03125, 23.87890625, 24.7265625, 25.57421875, 26.421875, 27.26953125, 28.1171875, 28.96484375, 29.8125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 5.0, 10.0, 16.0, 26.0, 69.0, 119.0, 291.0, 961.0, 11646.0, 3122732.0, 8496.0, 847.0, 260.0, 108.0, 49.0, 20.0, 14.0, 15.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.1875, -122.4169921875, -118.646484375, -114.8759765625, -111.10546875, -107.3349609375, -103.564453125, -99.7939453125, -96.0234375, -92.2529296875, -88.482421875, -84.7119140625, -80.94140625, -77.1708984375, -73.400390625, -69.6298828125, -65.859375, -62.0888671875, -58.318359375, -54.5478515625, -50.77734375, -47.0068359375, -43.236328125, -39.4658203125, -35.6953125, -31.9248046875, -28.154296875, -24.3837890625, -20.61328125, -16.8427734375, -13.072265625, -9.3017578125, -5.53125, -1.7607421875, 2.009765625, 5.7802734375, 9.55078125, 13.3212890625, 17.091796875, 20.8623046875, 24.6328125, 28.4033203125, 32.173828125, 35.9443359375, 39.71484375, 43.4853515625, 47.255859375, 51.0263671875, 54.796875, 58.5673828125, 62.337890625, 66.1083984375, 69.87890625, 73.6494140625, 77.419921875, 81.1904296875, 84.9609375, 88.7314453125, 92.501953125, 96.2724609375, 100.04296875, 103.8134765625, 107.583984375, 111.3544921875, 115.125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 13.0, 18.0, 29.0, 68.0, 133.0, 195.0, 215.0, 169.0, 89.0, 49.0, 19.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-191.60662841796875, -187.16661071777344, -182.72659301757812, -178.28659057617188, -173.84657287597656, -169.40655517578125, -164.96653747558594, -160.52651977539062, -156.08651733398438, -151.64649963378906, -147.20648193359375, -142.7664794921875, -138.3264617919922, -133.88644409179688, -129.44642639160156, -125.00640869140625, -120.56639099121094, -116.12637329101562, -111.68636322021484, -107.24634552001953, -102.80633544921875, -98.36631774902344, -93.92630004882812, -89.48628234863281, -85.04627227783203, -80.60625457763672, -76.16624450683594, -71.72622680664062, -67.28620910644531, -62.84619903564453, -58.40618133544922, -53.96616744995117, -49.52616882324219, -45.08615493774414, -40.646141052246094, -36.20612335205078, -31.766109466552734, -27.326095581054688, -22.886079788208008, -18.446063995361328, -14.006050109863281, -9.566035270690918, -5.126020431518555, -0.6860055923461914, 3.754009246826172, 8.194023132324219, 12.634038925170898, 17.074054718017578, 21.514068603515625, 25.954082489013672, 30.39409828186035, 34.83411407470703, 39.27412796020508, 43.714141845703125, 48.15415954589844, 52.594173431396484, 57.03418731689453, 61.47420120239258, 65.91421508789062, 70.35423278808594, 74.79425048828125, 79.23426055908203, 83.67427825927734, 88.11428833007812, 92.55430603027344]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 9.0, 10.0, 7.0, 6.0, 13.0, 10.0, 19.0, 12.0, 18.0, 16.0, 27.0, 23.0, 36.0, 24.0, 36.0, 35.0, 31.0, 38.0, 33.0, 44.0, 53.0, 39.0, 41.0, 30.0, 36.0, 36.0, 37.0, 29.0, 34.0, 30.0, 23.0, 16.0, 26.0, 17.0, 13.0, 14.0, 11.0, 14.0, 7.0, 10.0, 9.0, 3.0, 5.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.862159729003906, -51.848602294921875, -49.83504867553711, -47.82149124145508, -45.80793380737305, -43.79438018798828, -41.78082275390625, -39.76726531982422, -37.75370788574219, -35.740150451660156, -33.72659683227539, -31.71303939819336, -29.699481964111328, -27.68592643737793, -25.67237091064453, -23.6588134765625, -21.645259857177734, -19.631704330444336, -17.618146896362305, -15.604591369628906, -13.591034889221191, -11.577478408813477, -9.563922882080078, -7.550366401672363, -5.536809921264648, -3.5232536792755127, -1.509697437286377, 0.5038585662841797, 2.5174150466918945, 4.530971527099609, 6.544527053833008, 8.558083534240723, 10.571640014648438, 12.585196495056152, 14.598752975463867, 16.612308502197266, 18.625865936279297, 20.639421463012695, 22.652976989746094, 24.666534423828125, 26.680089950561523, 28.693645477294922, 30.707202911376953, 32.72075653076172, 34.73431396484375, 36.74787139892578, 38.76142883300781, 40.77498245239258, 42.78853988647461, 44.80209732055664, 46.815650939941406, 48.82920837402344, 50.84276580810547, 52.8563232421875, 54.869876861572266, 56.8834342956543, 58.89698791503906, 60.910545349121094, 62.92409896850586, 64.93765258789062, 66.95121002197266, 68.96476745605469, 70.97832489013672, 72.99188232421875, 75.00543975830078]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 10.0, 10.0, 16.0, 12.0, 24.0, 19.0, 26.0, 39.0, 39.0, 35.0, 37.0, 53.0, 46.0, 63.0, 50.0, 49.0, 59.0, 48.0, 59.0, 54.0, 39.0, 33.0, 36.0, 29.0, 25.0, 22.0, 19.0, 9.0, 11.0, 6.0, 5.0, 4.0, 5.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.125, -9.7874755859375, -9.449951171875, -9.1124267578125, -8.77490234375, -8.4373779296875, -8.099853515625, -7.7623291015625, -7.4248046875, -7.0872802734375, -6.749755859375, -6.4122314453125, -6.07470703125, -5.7371826171875, -5.399658203125, -5.0621337890625, -4.724609375, -4.3870849609375, -4.049560546875, -3.7120361328125, -3.37451171875, -3.0369873046875, -2.699462890625, -2.3619384765625, -2.0244140625, -1.6868896484375, -1.349365234375, -1.0118408203125, -0.67431640625, -0.3367919921875, 0.000732421875, 0.3382568359375, 0.67578125, 1.0133056640625, 1.350830078125, 1.6883544921875, 2.02587890625, 2.3634033203125, 2.700927734375, 3.0384521484375, 3.3759765625, 3.7135009765625, 4.051025390625, 4.3885498046875, 4.72607421875, 5.0635986328125, 5.401123046875, 5.7386474609375, 6.076171875, 6.4136962890625, 6.751220703125, 7.0887451171875, 7.42626953125, 7.7637939453125, 8.101318359375, 8.4388427734375, 8.7763671875, 9.1138916015625, 9.451416015625, 9.7889404296875, 10.12646484375, 10.4639892578125, 10.801513671875, 11.1390380859375, 11.4765625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 6.0, 11.0, 16.0, 32.0, 50.0, 115.0, 191.0, 356.0, 651.0, 1194.0, 2366.0, 4758.0, 10994.0, 30702.0, 154525.0, 2722802.0, 1149008.0, 79987.0, 20971.0, 8094.0, 3585.0, 1864.0, 973.0, 459.0, 268.0, 127.0, 84.0, 36.0, 22.0, 10.0, 8.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.3125, -35.27001953125, -34.2275390625, -33.18505859375, -32.142578125, -31.10009765625, -30.0576171875, -29.01513671875, -27.97265625, -26.93017578125, -25.8876953125, -24.84521484375, -23.802734375, -22.76025390625, -21.7177734375, -20.67529296875, -19.6328125, -18.59033203125, -17.5478515625, -16.50537109375, -15.462890625, -14.42041015625, -13.3779296875, -12.33544921875, -11.29296875, -10.25048828125, -9.2080078125, -8.16552734375, -7.123046875, -6.08056640625, -5.0380859375, -3.99560546875, -2.953125, -1.91064453125, -0.8681640625, 0.17431640625, 1.216796875, 2.25927734375, 3.3017578125, 4.34423828125, 5.38671875, 6.42919921875, 7.4716796875, 8.51416015625, 9.556640625, 10.59912109375, 11.6416015625, 12.68408203125, 13.7265625, 14.76904296875, 15.8115234375, 16.85400390625, 17.896484375, 18.93896484375, 19.9814453125, 21.02392578125, 22.06640625, 23.10888671875, 24.1513671875, 25.19384765625, 26.236328125, 27.27880859375, 28.3212890625, 29.36376953125, 30.40625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 5.0, 12.0, 9.0, 18.0, 41.0, 73.0, 116.0, 243.0, 440.0, 864.0, 1032.0, 575.0, 278.0, 140.0, 103.0, 43.0, 24.0, 19.0, 10.0, 4.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0], "bins": [-48.21875, -47.197509765625, -46.17626953125, -45.155029296875, -44.1337890625, -43.112548828125, -42.09130859375, -41.070068359375, -40.048828125, -39.027587890625, -38.00634765625, -36.985107421875, -35.9638671875, -34.942626953125, -33.92138671875, -32.900146484375, -31.87890625, -30.857666015625, -29.83642578125, -28.815185546875, -27.7939453125, -26.772705078125, -25.75146484375, -24.730224609375, -23.708984375, -22.687744140625, -21.66650390625, -20.645263671875, -19.6240234375, -18.602783203125, -17.58154296875, -16.560302734375, -15.5390625, -14.517822265625, -13.49658203125, -12.475341796875, -11.4541015625, -10.432861328125, -9.41162109375, -8.390380859375, -7.369140625, -6.347900390625, -5.32666015625, -4.305419921875, -3.2841796875, -2.262939453125, -1.24169921875, -0.220458984375, 0.80078125, 1.822021484375, 2.84326171875, 3.864501953125, 4.8857421875, 5.906982421875, 6.92822265625, 7.949462890625, 8.970703125, 9.991943359375, 11.01318359375, 12.034423828125, 13.0556640625, 14.076904296875, 15.09814453125, 16.119384765625, 17.140625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 8.0, 4.0, 10.0, 17.0, 23.0, 29.0, 52.0, 78.0, 145.0, 259.0, 593.0, 1542.0, 5972.0, 43770.0, 1539352.0, 2535884.0, 56284.0, 7240.0, 1725.0, 610.0, 289.0, 149.0, 91.0, 50.0, 31.0, 10.0, 20.0, 11.0, 7.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.625, -31.0751953125, -29.525390625, -27.9755859375, -26.42578125, -24.8759765625, -23.326171875, -21.7763671875, -20.2265625, -18.6767578125, -17.126953125, -15.5771484375, -14.02734375, -12.4775390625, -10.927734375, -9.3779296875, -7.828125, -6.2783203125, -4.728515625, -3.1787109375, -1.62890625, -0.0791015625, 1.470703125, 3.0205078125, 4.5703125, 6.1201171875, 7.669921875, 9.2197265625, 10.76953125, 12.3193359375, 13.869140625, 15.4189453125, 16.96875, 18.5185546875, 20.068359375, 21.6181640625, 23.16796875, 24.7177734375, 26.267578125, 27.8173828125, 29.3671875, 30.9169921875, 32.466796875, 34.0166015625, 35.56640625, 37.1162109375, 38.666015625, 40.2158203125, 41.765625, 43.3154296875, 44.865234375, 46.4150390625, 47.96484375, 49.5146484375, 51.064453125, 52.6142578125, 54.1640625, 55.7138671875, 57.263671875, 58.8134765625, 60.36328125, 61.9130859375, 63.462890625, 65.0126953125, 66.5625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 14.0, 90.0, 335.0, 405.0, 144.0, 24.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-406.2010498046875, -393.9336242675781, -381.66619873046875, -369.39874267578125, -357.1313171386719, -344.8638916015625, -332.5964660644531, -320.32904052734375, -308.06158447265625, -295.7941589355469, -283.5267333984375, -271.25927734375, -258.9918518066406, -246.72442626953125, -234.45700073242188, -222.1895751953125, -209.92214965820312, -197.65472412109375, -185.3872833251953, -173.11985778808594, -160.8524169921875, -148.58499145507812, -136.31756591796875, -124.05013275146484, -111.78269958496094, -99.51526641845703, -87.24783325195312, -74.98040771484375, -62.712974548339844, -50.44554138183594, -38.17811584472656, -25.910682678222656, -13.643280029296875, -1.3758487701416016, 10.891582489013672, 23.159011840820312, 35.42644500732422, 47.693878173828125, 59.9613037109375, 72.2287368774414, 84.49617004394531, 96.76360321044922, 109.03103637695312, 121.2984619140625, 133.56588745117188, 145.8333282470703, 158.1007537841797, 170.36819458007812, 182.6356201171875, 194.90304565429688, 207.1704864501953, 219.4379119873047, 231.70535278320312, 243.9727783203125, 256.2402038574219, 268.50762939453125, 280.77508544921875, 293.0425109863281, 305.3099365234375, 317.577392578125, 329.8448181152344, 342.11224365234375, 354.3796691894531, 366.6470947265625, 378.9145202636719]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 11.0, 18.0, 29.0, 46.0, 58.0, 46.0, 61.0, 89.0, 88.0, 94.0, 89.0, 78.0, 58.0, 63.0, 38.0, 42.0, 33.0, 16.0, 16.0, 14.0, 4.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.41453552246094, -121.85604858398438, -117.29756164550781, -112.73908233642578, -108.18059539794922, -103.62210845947266, -99.06362915039062, -94.50514221191406, -89.9466552734375, -85.38816833496094, -80.82968139648438, -76.27120208740234, -71.71271514892578, -67.15422821044922, -62.59574508666992, -58.037261962890625, -53.47877502441406, -48.9202880859375, -44.3618049621582, -39.803321838378906, -35.244834899902344, -30.686349868774414, -26.127864837646484, -21.569379806518555, -17.010894775390625, -12.452409744262695, -7.893924713134766, -3.335439682006836, 1.2230453491210938, 5.781530380249023, 10.340015411376953, 14.898500442504883, 19.457000732421875, 24.015485763549805, 28.573970794677734, 33.13245391845703, 37.690940856933594, 42.249427795410156, 46.80791091918945, 51.36639404296875, 55.92488098144531, 60.483367919921875, 65.04185485839844, 69.60033416748047, 74.15882110595703, 78.7173080444336, 83.27578735351562, 87.83427429199219, 92.39276123046875, 96.95124816894531, 101.50973510742188, 106.0682144165039, 110.62670135498047, 115.18518829345703, 119.74366760253906, 124.30215454101562, 128.8606414794922, 133.41912841796875, 137.9776153564453, 142.53610229492188, 147.09457397460938, 151.65306091308594, 156.2115478515625, 160.77003479003906, 165.32852172851562]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 5.0, 10.0, 12.0, 9.0, 22.0, 19.0, 19.0, 14.0, 25.0, 35.0, 34.0, 31.0, 27.0, 39.0, 33.0, 38.0, 45.0, 35.0, 39.0, 43.0, 43.0, 43.0, 43.0, 49.0, 42.0, 23.0, 28.0, 36.0, 24.0, 25.0, 22.0, 21.0, 8.0, 16.0, 3.0, 11.0, 6.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1796875, -7.893798828125, -7.60791015625, -7.322021484375, -7.0361328125, -6.750244140625, -6.46435546875, -6.178466796875, -5.892578125, -5.606689453125, -5.32080078125, -5.034912109375, -4.7490234375, -4.463134765625, -4.17724609375, -3.891357421875, -3.60546875, -3.319580078125, -3.03369140625, -2.747802734375, -2.4619140625, -2.176025390625, -1.89013671875, -1.604248046875, -1.318359375, -1.032470703125, -0.74658203125, -0.460693359375, -0.1748046875, 0.111083984375, 0.39697265625, 0.682861328125, 0.96875, 1.254638671875, 1.54052734375, 1.826416015625, 2.1123046875, 2.398193359375, 2.68408203125, 2.969970703125, 3.255859375, 3.541748046875, 3.82763671875, 4.113525390625, 4.3994140625, 4.685302734375, 4.97119140625, 5.257080078125, 5.54296875, 5.828857421875, 6.11474609375, 6.400634765625, 6.6865234375, 6.972412109375, 7.25830078125, 7.544189453125, 7.830078125, 8.115966796875, 8.40185546875, 8.687744140625, 8.9736328125, 9.259521484375, 9.54541015625, 9.831298828125, 10.1171875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 0.0, 10.0, 10.0, 7.0, 25.0, 12.0, 35.0, 60.0, 73.0, 126.0, 183.0, 261.0, 377.0, 589.0, 885.0, 1371.0, 2053.0, 3209.0, 4982.0, 7579.0, 11537.0, 18047.0, 28867.0, 45953.0, 75391.0, 139586.0, 281258.0, 184898.0, 92349.0, 54632.0, 33760.0, 21442.0, 13662.0, 8709.0, 5684.0, 3783.0, 2424.0, 1590.0, 1040.0, 693.0, 475.0, 298.0, 212.0, 122.0, 111.0, 62.0, 38.0, 30.0, 17.0, 14.0, 12.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0], "bins": [-0.376953125, -0.36576080322265625, -0.3545684814453125, -0.34337615966796875, -0.332183837890625, -0.32099151611328125, -0.3097991943359375, -0.29860687255859375, -0.28741455078125, -0.27622222900390625, -0.2650299072265625, -0.25383758544921875, -0.242645263671875, -0.23145294189453125, -0.2202606201171875, -0.20906829833984375, -0.1978759765625, -0.18668365478515625, -0.1754913330078125, -0.16429901123046875, -0.153106689453125, -0.14191436767578125, -0.1307220458984375, -0.11952972412109375, -0.10833740234375, -0.09714508056640625, -0.0859527587890625, -0.07476043701171875, -0.063568115234375, -0.05237579345703125, -0.0411834716796875, -0.02999114990234375, -0.018798828125, -0.00760650634765625, 0.0035858154296875, 0.01477813720703125, 0.025970458984375, 0.03716278076171875, 0.0483551025390625, 0.05954742431640625, 0.07073974609375, 0.08193206787109375, 0.0931243896484375, 0.10431671142578125, 0.115509033203125, 0.12670135498046875, 0.1378936767578125, 0.14908599853515625, 0.1602783203125, 0.17147064208984375, 0.1826629638671875, 0.19385528564453125, 0.205047607421875, 0.21623992919921875, 0.2274322509765625, 0.23862457275390625, 0.24981689453125, 0.26100921630859375, 0.2722015380859375, 0.28339385986328125, 0.294586181640625, 0.30577850341796875, 0.3169708251953125, 0.32816314697265625, 0.33935546875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 6.0, 1.0, 8.0, 5.0, 6.0, 7.0, 13.0, 12.0, 8.0, 13.0, 21.0, 9.0, 22.0, 28.0, 31.0, 25.0, 27.0, 24.0, 32.0, 29.0, 43.0, 30.0, 43.0, 32.0, 1049.0, 39.0, 37.0, 44.0, 36.0, 30.0, 33.0, 30.0, 34.0, 30.0, 27.0, 15.0, 22.0, 20.0, 14.0, 14.0, 17.0, 11.0, 13.0, 8.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0], "bins": [-6.43359375, -6.24078369140625, -6.0479736328125, -5.85516357421875, -5.662353515625, -5.46954345703125, -5.2767333984375, -5.08392333984375, -4.89111328125, -4.69830322265625, -4.5054931640625, -4.31268310546875, -4.119873046875, -3.92706298828125, -3.7342529296875, -3.54144287109375, -3.3486328125, -3.15582275390625, -2.9630126953125, -2.77020263671875, -2.577392578125, -2.38458251953125, -2.1917724609375, -1.99896240234375, -1.80615234375, -1.61334228515625, -1.4205322265625, -1.22772216796875, -1.034912109375, -0.84210205078125, -0.6492919921875, -0.45648193359375, -0.263671875, -0.07086181640625, 0.1219482421875, 0.31475830078125, 0.507568359375, 0.70037841796875, 0.8931884765625, 1.08599853515625, 1.27880859375, 1.47161865234375, 1.6644287109375, 1.85723876953125, 2.050048828125, 2.24285888671875, 2.4356689453125, 2.62847900390625, 2.8212890625, 3.01409912109375, 3.2069091796875, 3.39971923828125, 3.592529296875, 3.78533935546875, 3.9781494140625, 4.17095947265625, 4.36376953125, 4.55657958984375, 4.7493896484375, 4.94219970703125, 5.135009765625, 5.32781982421875, 5.5206298828125, 5.71343994140625, 5.90625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 12.0, 9.0, 14.0, 33.0, 45.0, 69.0, 115.0, 185.0, 298.0, 404.0, 651.0, 1028.0, 1575.0, 2378.0, 3702.0, 5887.0, 9381.0, 15122.0, 24297.0, 40727.0, 71490.0, 140912.0, 1331946.0, 211261.0, 98835.0, 53627.0, 31712.0, 18952.0, 11906.0, 7448.0, 4704.0, 2962.0, 1919.0, 1258.0, 776.0, 520.0, 330.0, 257.0, 137.0, 91.0, 63.0, 30.0, 26.0, 10.0, 7.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.23486328125, -0.22746658325195312, -0.22006988525390625, -0.21267318725585938, -0.2052764892578125, -0.19787979125976562, -0.19048309326171875, -0.18308639526367188, -0.175689697265625, -0.16829299926757812, -0.16089630126953125, -0.15349960327148438, -0.1461029052734375, -0.13870620727539062, -0.13130950927734375, -0.12391281127929688, -0.11651611328125, -0.10911941528320312, -0.10172271728515625, -0.09432601928710938, -0.0869293212890625, -0.07953262329101562, -0.07213592529296875, -0.06473922729492188, -0.057342529296875, -0.049945831298828125, -0.04254913330078125, -0.035152435302734375, -0.0277557373046875, -0.020359039306640625, -0.01296234130859375, -0.005565643310546875, 0.0018310546875, 0.009227752685546875, 0.01662445068359375, 0.024021148681640625, 0.0314178466796875, 0.038814544677734375, 0.04621124267578125, 0.053607940673828125, 0.061004638671875, 0.06840133666992188, 0.07579803466796875, 0.08319473266601562, 0.0905914306640625, 0.09798812866210938, 0.10538482666015625, 0.11278152465820312, 0.12017822265625, 0.12757492065429688, 0.13497161865234375, 0.14236831665039062, 0.1497650146484375, 0.15716171264648438, 0.16455841064453125, 0.17195510864257812, 0.179351806640625, 0.18674850463867188, 0.19414520263671875, 0.20154190063476562, 0.2089385986328125, 0.21633529663085938, 0.22373199462890625, 0.23112869262695312, 0.238525390625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 10.0, 4.0, 6.0, 11.0, 12.0, 11.0, 14.0, 19.0, 22.0, 21.0, 30.0, 32.0, 46.0, 49.0, 45.0, 32.0, 49.0, 48.0, 51.0, 47.0, 44.0, 35.0, 44.0, 41.0, 38.0, 41.0, 30.0, 28.0, 23.0, 24.0, 18.0, 15.0, 12.0, 7.0, 7.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00017964839935302734, -0.00017410330474376678, -0.00016855821013450623, -0.00016301311552524567, -0.0001574680209159851, -0.00015192292630672455, -0.000146377831697464, -0.00014083273708820343, -0.00013528764247894287, -0.0001297425478696823, -0.00012419745326042175, -0.0001186523586511612, -0.00011310726404190063, -0.00010756216943264008, -0.00010201707482337952, -9.647198021411896e-05, -9.09268856048584e-05, -8.538179099559784e-05, -7.983669638633728e-05, -7.429160177707672e-05, -6.874650716781616e-05, -6.32014125585556e-05, -5.7656317949295044e-05, -5.2111223340034485e-05, -4.6566128730773926e-05, -4.102103412151337e-05, -3.547593951225281e-05, -2.993084490299225e-05, -2.438575029373169e-05, -1.884065568447113e-05, -1.3295561075210571e-05, -7.750466465950012e-06, -2.205371856689453e-06, 3.339722752571106e-06, 8.884817361831665e-06, 1.4429911971092224e-05, 1.9975006580352783e-05, 2.5520101189613342e-05, 3.10651957988739e-05, 3.661029040813446e-05, 4.215538501739502e-05, 4.770047962665558e-05, 5.324557423591614e-05, 5.87906688451767e-05, 6.433576345443726e-05, 6.988085806369781e-05, 7.542595267295837e-05, 8.097104728221893e-05, 8.651614189147949e-05, 9.206123650074005e-05, 9.760633111000061e-05, 0.00010315142571926117, 0.00010869652032852173, 0.00011424161493778229, 0.00011978670954704285, 0.0001253318041563034, 0.00013087689876556396, 0.00013642199337482452, 0.00014196708798408508, 0.00014751218259334564, 0.0001530572772026062, 0.00015860237181186676, 0.00016414746642112732, 0.00016969256103038788, 0.00017523765563964844]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 4.0, 5.0, 3.0, 6.0, 9.0, 7.0, 5.0, 16.0, 15.0, 15.0, 25.0, 43.0, 44.0, 66.0, 63.0, 87.0, 120.0, 178.0, 204.0, 407.0, 779.0, 4518.0, 409969.0, 623287.0, 6450.0, 908.0, 383.0, 242.0, 183.0, 129.0, 87.0, 51.0, 50.0, 40.0, 33.0, 36.0, 17.0, 23.0, 12.0, 8.0, 4.0, 7.0, 3.0, 9.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0027618408203125, -0.0026668012142181396, -0.0025717616081237793, -0.002476722002029419, -0.0023816823959350586, -0.0022866427898406982, -0.002191603183746338, -0.0020965635776519775, -0.002001523971557617, -0.0019064843654632568, -0.0018114447593688965, -0.0017164051532745361, -0.0016213655471801758, -0.0015263259410858154, -0.001431286334991455, -0.0013362467288970947, -0.0012412071228027344, -0.001146167516708374, -0.0010511279106140137, -0.0009560883045196533, -0.000861048698425293, -0.0007660090923309326, -0.0006709694862365723, -0.0005759298801422119, -0.00048089027404785156, -0.0003858506679534912, -0.00029081106185913086, -0.0001957714557647705, -0.00010073184967041016, -5.692243576049805e-06, 8.934736251831055e-05, 0.0001843869686126709, 0.00027942657470703125, 0.0003744661808013916, 0.00046950578689575195, 0.0005645453929901123, 0.0006595849990844727, 0.000754624605178833, 0.0008496642112731934, 0.0009447038173675537, 0.001039743423461914, 0.0011347830295562744, 0.0012298226356506348, 0.0013248622417449951, 0.0014199018478393555, 0.0015149414539337158, 0.0016099810600280762, 0.0017050206661224365, 0.0018000602722167969, 0.0018950998783111572, 0.0019901394844055176, 0.002085179090499878, 0.0021802186965942383, 0.0022752583026885986, 0.002370297908782959, 0.0024653375148773193, 0.0025603771209716797, 0.00265541672706604, 0.0027504563331604004, 0.0028454959392547607, 0.002940535545349121, 0.0030355751514434814, 0.003130614757537842, 0.003225654363632202, 0.0033206939697265625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 33.0, 291.0, 538.0, 134.0, 13.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004836737643927336, -0.00044425265514291823, -0.0004048315458931029, -0.000365410465747118, -0.00032598935649730265, -0.0002865682472474873, -0.0002471471671015024, -0.00020772605785168707, -0.00016830494860187173, -0.00012888383935205638, -8.946274465415627e-05, -5.004164268029854e-05, -1.0620540706440806e-05, 2.880056854337454e-05, 6.822166324127465e-05, 0.00010764275793917477, 0.00014706386718899012, 0.00018648497643880546, 0.00022590607113670558, 0.0002653271658346057, 0.00030474827508442104, 0.0003441693843342364, 0.00038359046448022127, 0.0004230115737300366, 0.00046243268297985196, 0.0005018537631258368, 0.0005412749014794827, 0.0005806959816254675, 0.0006201170617714524, 0.0006595382001250982, 0.0006989592802710831, 0.000738380360417068, 0.0007778014987707138, 0.0008172225789166987, 0.0008566437172703445, 0.0008960647974163294, 0.0009354859357699752, 0.0009749070159159601, 0.001014328096061945, 0.0010537492344155908, 0.0010931703727692366, 0.0011325915111228824, 0.0011720125330612063, 0.0012114336714148521, 0.001250854809768498, 0.0012902759481221437, 0.0013296969700604677, 0.0013691181084141135, 0.0014085391303524375, 0.0014479602687060833, 0.0014873812906444073, 0.001526802428998053, 0.0015662235673516989, 0.0016056445892900229, 0.0016450657276436687, 0.0016844868659973145, 0.0017239078879356384, 0.0017633290262892842, 0.0018027500482276082, 0.001842171186581254, 0.0018815923249348998, 0.0019210134632885456, 0.0019604344852268696, 0.0019998555071651936, 0.002039276761934161]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 5.0, 3.0, 4.0, 9.0, 8.0, 10.0, 10.0, 18.0, 16.0, 13.0, 32.0, 38.0, 29.0, 45.0, 47.0, 56.0, 32.0, 52.0, 53.0, 50.0, 36.0, 47.0, 53.0, 52.0, 49.0, 45.0, 28.0, 40.0, 24.0, 16.0, 16.0, 20.0, 13.0, 13.0, 6.0, 5.0, 7.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013780593872070312, -0.0001315521076321602, -0.00012529827654361725, -0.00011904444545507431, -0.00011279061436653137, -0.00010653678327798843, -0.0001002829521894455, -9.402912110090256e-05, -8.777529001235962e-05, -8.152145892381668e-05, -7.526762783527374e-05, -6.90137967467308e-05, -6.275996565818787e-05, -5.650613456964493e-05, -5.025230348110199e-05, -4.399847239255905e-05, -3.774464130401611e-05, -3.1490810215473175e-05, -2.5236979126930237e-05, -1.89831480383873e-05, -1.272931694984436e-05, -6.475485861301422e-06, -2.2165477275848389e-07, 6.032176315784454e-06, 1.2286007404327393e-05, 1.853983849287033e-05, 2.479366958141327e-05, 3.104750066995621e-05, 3.7301331758499146e-05, 4.3555162847042084e-05, 4.980899393558502e-05, 5.606282502412796e-05, 6.23166561126709e-05, 6.857048720121384e-05, 7.482431828975677e-05, 8.107814937829971e-05, 8.733198046684265e-05, 9.358581155538559e-05, 9.983964264392853e-05, 0.00010609347373247147, 0.0001123473048210144, 0.00011860113590955734, 0.00012485496699810028, 0.00013110879808664322, 0.00013736262917518616, 0.0001436164602637291, 0.00014987029135227203, 0.00015612412244081497, 0.0001623779535293579, 0.00016863178461790085, 0.0001748856157064438, 0.00018113944679498672, 0.00018739327788352966, 0.0001936471089720726, 0.00019990094006061554, 0.00020615477114915848, 0.00021240860223770142, 0.00021866243332624435, 0.0002249162644147873, 0.00023117009550333023, 0.00023742392659187317, 0.0002436777576804161, 0.00024993158876895905, 0.000256185419857502, 0.0002624392509460449]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 5.0, 10.0, 12.0, 9.0, 22.0, 19.0, 19.0, 14.0, 25.0, 35.0, 34.0, 31.0, 27.0, 39.0, 33.0, 38.0, 45.0, 35.0, 39.0, 43.0, 43.0, 43.0, 43.0, 49.0, 42.0, 23.0, 28.0, 36.0, 24.0, 25.0, 22.0, 21.0, 8.0, 16.0, 3.0, 11.0, 6.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1796875, -7.893798828125, -7.60791015625, -7.322021484375, -7.0361328125, -6.750244140625, -6.46435546875, -6.178466796875, -5.892578125, -5.606689453125, -5.32080078125, -5.034912109375, -4.7490234375, -4.463134765625, -4.17724609375, -3.891357421875, -3.60546875, -3.319580078125, -3.03369140625, -2.747802734375, -2.4619140625, -2.176025390625, -1.89013671875, -1.604248046875, -1.318359375, -1.032470703125, -0.74658203125, -0.460693359375, -0.1748046875, 0.111083984375, 0.39697265625, 0.682861328125, 0.96875, 1.254638671875, 1.54052734375, 1.826416015625, 2.1123046875, 2.398193359375, 2.68408203125, 2.969970703125, 3.255859375, 3.541748046875, 3.82763671875, 4.113525390625, 4.3994140625, 4.685302734375, 4.97119140625, 5.257080078125, 5.54296875, 5.828857421875, 6.11474609375, 6.400634765625, 6.6865234375, 6.972412109375, 7.25830078125, 7.544189453125, 7.830078125, 8.115966796875, 8.40185546875, 8.687744140625, 8.9736328125, 9.259521484375, 9.54541015625, 9.831298828125, 10.1171875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 4.0, 9.0, 12.0, 14.0, 32.0, 34.0, 61.0, 75.0, 133.0, 184.0, 291.0, 382.0, 609.0, 902.0, 1459.0, 2154.0, 3440.0, 5791.0, 9540.0, 17295.0, 34955.0, 75477.0, 169334.0, 312366.0, 218262.0, 99314.0, 44848.0, 21780.0, 11795.0, 6748.0, 4025.0, 2467.0, 1622.0, 1031.0, 698.0, 446.0, 324.0, 212.0, 162.0, 95.0, 57.0, 40.0, 28.0, 17.0, 12.0, 9.0, 5.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1328125, -7.8388671875, -7.544921875, -7.2509765625, -6.95703125, -6.6630859375, -6.369140625, -6.0751953125, -5.78125, -5.4873046875, -5.193359375, -4.8994140625, -4.60546875, -4.3115234375, -4.017578125, -3.7236328125, -3.4296875, -3.1357421875, -2.841796875, -2.5478515625, -2.25390625, -1.9599609375, -1.666015625, -1.3720703125, -1.078125, -0.7841796875, -0.490234375, -0.1962890625, 0.09765625, 0.3916015625, 0.685546875, 0.9794921875, 1.2734375, 1.5673828125, 1.861328125, 2.1552734375, 2.44921875, 2.7431640625, 3.037109375, 3.3310546875, 3.625, 3.9189453125, 4.212890625, 4.5068359375, 4.80078125, 5.0947265625, 5.388671875, 5.6826171875, 5.9765625, 6.2705078125, 6.564453125, 6.8583984375, 7.15234375, 7.4462890625, 7.740234375, 8.0341796875, 8.328125, 8.6220703125, 8.916015625, 9.2099609375, 9.50390625, 9.7978515625, 10.091796875, 10.3857421875, 10.6796875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 5.0, 4.0, 7.0, 5.0, 7.0, 10.0, 7.0, 9.0, 14.0, 18.0, 18.0, 24.0, 20.0, 30.0, 31.0, 39.0, 49.0, 63.0, 85.0, 113.0, 241.0, 1474.0, 225.0, 116.0, 78.0, 64.0, 51.0, 36.0, 32.0, 31.0, 35.0, 25.0, 13.0, 15.0, 4.0, 8.0, 6.0, 3.0, 11.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.453125, -25.556884765625, -24.66064453125, -23.764404296875, -22.8681640625, -21.971923828125, -21.07568359375, -20.179443359375, -19.283203125, -18.386962890625, -17.49072265625, -16.594482421875, -15.6982421875, -14.802001953125, -13.90576171875, -13.009521484375, -12.11328125, -11.217041015625, -10.32080078125, -9.424560546875, -8.5283203125, -7.632080078125, -6.73583984375, -5.839599609375, -4.943359375, -4.047119140625, -3.15087890625, -2.254638671875, -1.3583984375, -0.462158203125, 0.43408203125, 1.330322265625, 2.2265625, 3.122802734375, 4.01904296875, 4.915283203125, 5.8115234375, 6.707763671875, 7.60400390625, 8.500244140625, 9.396484375, 10.292724609375, 11.18896484375, 12.085205078125, 12.9814453125, 13.877685546875, 14.77392578125, 15.670166015625, 16.56640625, 17.462646484375, 18.35888671875, 19.255126953125, 20.1513671875, 21.047607421875, 21.94384765625, 22.840087890625, 23.736328125, 24.632568359375, 25.52880859375, 26.425048828125, 27.3212890625, 28.217529296875, 29.11376953125, 30.010009765625, 30.90625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 0.0, 4.0, 8.0, 6.0, 10.0, 6.0, 12.0, 17.0, 28.0, 37.0, 46.0, 61.0, 95.0, 136.0, 243.0, 396.0, 1001.0, 7591.0, 2800823.0, 329780.0, 3591.0, 747.0, 340.0, 222.0, 141.0, 84.0, 72.0, 41.0, 31.0, 24.0, 26.0, 14.0, 16.0, 10.0, 9.0, 11.0, 5.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-64.8125, -62.84033203125, -60.8681640625, -58.89599609375, -56.923828125, -54.95166015625, -52.9794921875, -51.00732421875, -49.03515625, -47.06298828125, -45.0908203125, -43.11865234375, -41.146484375, -39.17431640625, -37.2021484375, -35.22998046875, -33.2578125, -31.28564453125, -29.3134765625, -27.34130859375, -25.369140625, -23.39697265625, -21.4248046875, -19.45263671875, -17.48046875, -15.50830078125, -13.5361328125, -11.56396484375, -9.591796875, -7.61962890625, -5.6474609375, -3.67529296875, -1.703125, 0.26904296875, 2.2412109375, 4.21337890625, 6.185546875, 8.15771484375, 10.1298828125, 12.10205078125, 14.07421875, 16.04638671875, 18.0185546875, 19.99072265625, 21.962890625, 23.93505859375, 25.9072265625, 27.87939453125, 29.8515625, 31.82373046875, 33.7958984375, 35.76806640625, 37.740234375, 39.71240234375, 41.6845703125, 43.65673828125, 45.62890625, 47.60107421875, 49.5732421875, 51.54541015625, 53.517578125, 55.48974609375, 57.4619140625, 59.43408203125, 61.40625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 22.0, 215.0, 513.0, 222.0, 33.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.35731506347656, -183.7769317626953, -175.19656372070312, -166.61618041992188, -158.03579711914062, -149.45541381835938, -140.8750457763672, -132.29466247558594, -123.71428680419922, -115.1339111328125, -106.55352783203125, -97.97315216064453, -89.39277648925781, -80.81239318847656, -72.23201751708984, -63.65163803100586, -55.071258544921875, -46.49087905883789, -37.910499572753906, -29.330123901367188, -20.749744415283203, -12.169364929199219, -3.5889892578125, 4.991390228271484, 13.571769714355469, 22.152149200439453, 30.732526779174805, 39.312904357910156, 47.89328384399414, 56.473663330078125, 65.05403900146484, 73.63441467285156, 82.21481323242188, 90.7951889038086, 99.37557220458984, 107.95594787597656, 116.53633117675781, 125.11670684814453, 133.69708251953125, 142.2774658203125, 150.85784912109375, 159.438232421875, 168.0186004638672, 176.59898376464844, 185.1793670654297, 193.75973510742188, 202.34011840820312, 210.92050170898438, 219.50086975097656, 228.0812530517578, 236.66162109375, 245.24200439453125, 253.8223876953125, 262.40277099609375, 270.983154296875, 279.5635070800781, 288.1438903808594, 296.7242736816406, 305.3046569824219, 313.885009765625, 322.46539306640625, 331.0457763671875, 339.62615966796875, 348.20654296875, 356.78692626953125]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 9.0, 8.0, 12.0, 21.0, 23.0, 24.0, 29.0, 28.0, 34.0, 34.0, 30.0, 38.0, 42.0, 47.0, 42.0, 42.0, 44.0, 31.0, 46.0, 45.0, 45.0, 43.0, 50.0, 34.0, 33.0, 26.0, 24.0, 24.0, 13.0, 15.0, 11.0, 13.0, 9.0, 9.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.67426300048828, -97.41069030761719, -94.14712524414062, -90.88355255126953, -87.61997985839844, -84.35641479492188, -81.09284210205078, -77.82926940917969, -74.56570434570312, -71.30213165283203, -68.03856658935547, -64.77499389648438, -61.51142501831055, -58.24785614013672, -54.984283447265625, -51.7207145690918, -48.45714569091797, -45.19357681274414, -41.93000793457031, -38.66643524169922, -35.40286636352539, -32.13929748535156, -28.8757266998291, -25.61215591430664, -22.348587036132812, -19.085018157958984, -15.821447372436523, -12.557877540588379, -9.294307708740234, -6.030738830566406, -2.7671680450439453, 0.4964027404785156, 3.7599639892578125, 7.023533821105957, 10.287103652954102, 13.550673484802246, 16.81424331665039, 20.07781219482422, 23.34138298034668, 26.60495376586914, 29.86852264404297, 33.1320915222168, 36.395660400390625, 39.65923309326172, 42.92280197143555, 46.186370849609375, 49.44994354248047, 52.7135124206543, 55.977081298828125, 59.24065017700195, 62.50421905517578, 65.76779174804688, 69.03135681152344, 72.29492950439453, 75.55850219726562, 78.82206726074219, 82.08563995361328, 85.34921264648438, 88.61277770996094, 91.87635040283203, 95.13992309570312, 98.40348815917969, 101.66706085205078, 104.93063354492188, 108.19419860839844]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 8.0, 7.0, 11.0, 19.0, 16.0, 21.0, 21.0, 22.0, 24.0, 23.0, 22.0, 31.0, 29.0, 36.0, 40.0, 39.0, 46.0, 38.0, 37.0, 39.0, 51.0, 52.0, 28.0, 36.0, 36.0, 43.0, 32.0, 29.0, 29.0, 26.0, 16.0, 15.0, 17.0, 10.0, 10.0, 13.0, 8.0, 9.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.0859375, -8.7813720703125, -8.476806640625, -8.1722412109375, -7.86767578125, -7.5631103515625, -7.258544921875, -6.9539794921875, -6.6494140625, -6.3448486328125, -6.040283203125, -5.7357177734375, -5.43115234375, -5.1265869140625, -4.822021484375, -4.5174560546875, -4.212890625, -3.9083251953125, -3.603759765625, -3.2991943359375, -2.99462890625, -2.6900634765625, -2.385498046875, -2.0809326171875, -1.7763671875, -1.4718017578125, -1.167236328125, -0.8626708984375, -0.55810546875, -0.2535400390625, 0.051025390625, 0.3555908203125, 0.66015625, 0.9647216796875, 1.269287109375, 1.5738525390625, 1.87841796875, 2.1829833984375, 2.487548828125, 2.7921142578125, 3.0966796875, 3.4012451171875, 3.705810546875, 4.0103759765625, 4.31494140625, 4.6195068359375, 4.924072265625, 5.2286376953125, 5.533203125, 5.8377685546875, 6.142333984375, 6.4468994140625, 6.75146484375, 7.0560302734375, 7.360595703125, 7.6651611328125, 7.9697265625, 8.2742919921875, 8.578857421875, 8.8834228515625, 9.18798828125, 9.4925537109375, 9.797119140625, 10.1016845703125, 10.40625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 11.0, 9.0, 12.0, 12.0, 15.0, 22.0, 43.0, 42.0, 63.0, 90.0, 125.0, 171.0, 224.0, 285.0, 400.0, 617.0, 1011.0, 2037.0, 6059.0, 30640.0, 272736.0, 3397397.0, 429825.0, 39615.0, 7240.0, 2253.0, 1086.0, 627.0, 464.0, 324.0, 224.0, 159.0, 112.0, 90.0, 62.0, 53.0, 43.0, 22.0, 18.0, 10.0, 8.0, 5.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-53.375, -51.62939453125, -49.8837890625, -48.13818359375, -46.392578125, -44.64697265625, -42.9013671875, -41.15576171875, -39.41015625, -37.66455078125, -35.9189453125, -34.17333984375, -32.427734375, -30.68212890625, -28.9365234375, -27.19091796875, -25.4453125, -23.69970703125, -21.9541015625, -20.20849609375, -18.462890625, -16.71728515625, -14.9716796875, -13.22607421875, -11.48046875, -9.73486328125, -7.9892578125, -6.24365234375, -4.498046875, -2.75244140625, -1.0068359375, 0.73876953125, 2.484375, 4.22998046875, 5.9755859375, 7.72119140625, 9.466796875, 11.21240234375, 12.9580078125, 14.70361328125, 16.44921875, 18.19482421875, 19.9404296875, 21.68603515625, 23.431640625, 25.17724609375, 26.9228515625, 28.66845703125, 30.4140625, 32.15966796875, 33.9052734375, 35.65087890625, 37.396484375, 39.14208984375, 40.8876953125, 42.63330078125, 44.37890625, 46.12451171875, 47.8701171875, 49.61572265625, 51.361328125, 53.10693359375, 54.8525390625, 56.59814453125, 58.34375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 4.0, 7.0, 8.0, 10.0, 18.0, 25.0, 39.0, 44.0, 56.0, 74.0, 105.0, 171.0, 211.0, 276.0, 387.0, 518.0, 562.0, 456.0, 293.0, 225.0, 158.0, 103.0, 76.0, 70.0, 45.0, 29.0, 24.0, 16.0, 12.0, 9.0, 3.0, 4.0, 6.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-28.078125, -27.36181640625, -26.6455078125, -25.92919921875, -25.212890625, -24.49658203125, -23.7802734375, -23.06396484375, -22.34765625, -21.63134765625, -20.9150390625, -20.19873046875, -19.482421875, -18.76611328125, -18.0498046875, -17.33349609375, -16.6171875, -15.90087890625, -15.1845703125, -14.46826171875, -13.751953125, -13.03564453125, -12.3193359375, -11.60302734375, -10.88671875, -10.17041015625, -9.4541015625, -8.73779296875, -8.021484375, -7.30517578125, -6.5888671875, -5.87255859375, -5.15625, -4.43994140625, -3.7236328125, -3.00732421875, -2.291015625, -1.57470703125, -0.8583984375, -0.14208984375, 0.57421875, 1.29052734375, 2.0068359375, 2.72314453125, 3.439453125, 4.15576171875, 4.8720703125, 5.58837890625, 6.3046875, 7.02099609375, 7.7373046875, 8.45361328125, 9.169921875, 9.88623046875, 10.6025390625, 11.31884765625, 12.03515625, 12.75146484375, 13.4677734375, 14.18408203125, 14.900390625, 15.61669921875, 16.3330078125, 17.04931640625, 17.765625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 12.0, 7.0, 10.0, 17.0, 17.0, 24.0, 41.0, 59.0, 83.0, 125.0, 194.0, 277.0, 476.0, 831.0, 1662.0, 3739.0, 10385.0, 35417.0, 155216.0, 965970.0, 2550630.0, 365915.0, 72655.0, 18931.0, 6195.0, 2539.0, 1155.0, 609.0, 367.0, 212.0, 183.0, 109.0, 56.0, 49.0, 32.0, 24.0, 14.0, 9.0, 12.0, 13.0, 6.0, 3.0, 3.0, 3.0, 2.0], "bins": [-37.03125, -36.087890625, -35.14453125, -34.201171875, -33.2578125, -32.314453125, -31.37109375, -30.427734375, -29.484375, -28.541015625, -27.59765625, -26.654296875, -25.7109375, -24.767578125, -23.82421875, -22.880859375, -21.9375, -20.994140625, -20.05078125, -19.107421875, -18.1640625, -17.220703125, -16.27734375, -15.333984375, -14.390625, -13.447265625, -12.50390625, -11.560546875, -10.6171875, -9.673828125, -8.73046875, -7.787109375, -6.84375, -5.900390625, -4.95703125, -4.013671875, -3.0703125, -2.126953125, -1.18359375, -0.240234375, 0.703125, 1.646484375, 2.58984375, 3.533203125, 4.4765625, 5.419921875, 6.36328125, 7.306640625, 8.25, 9.193359375, 10.13671875, 11.080078125, 12.0234375, 12.966796875, 13.91015625, 14.853515625, 15.796875, 16.740234375, 17.68359375, 18.626953125, 19.5703125, 20.513671875, 21.45703125, 22.400390625, 23.34375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 11.0, 10.0, 17.0, 19.0, 30.0, 33.0, 46.0, 53.0, 70.0, 60.0, 72.0, 97.0, 89.0, 80.0, 54.0, 55.0, 46.0, 33.0, 27.0, 23.0, 18.0, 12.0, 14.0, 6.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.49395751953125, -116.76133728027344, -111.0287094116211, -105.29608154296875, -99.56346130371094, -93.83084106445312, -88.09821319580078, -82.36558532714844, -76.63296508789062, -70.90034484863281, -65.16771697998047, -59.43509292602539, -53.70246887207031, -47.969844818115234, -42.237220764160156, -36.50459671020508, -30.77197265625, -25.039348602294922, -19.306724548339844, -13.574100494384766, -7.8414764404296875, -2.1088523864746094, 3.6237716674804688, 9.356395721435547, 15.089019775390625, 20.821643829345703, 26.55426788330078, 32.28689193725586, 38.01951599121094, 43.752140045166016, 49.484764099121094, 55.21738815307617, 60.95002746582031, 66.68264770507812, 72.41527557373047, 78.14790344238281, 83.88052368164062, 89.61314392089844, 95.34577178955078, 101.07839965820312, 106.81101989746094, 112.54364013671875, 118.2762680053711, 124.00889587402344, 129.74151611328125, 135.47413635253906, 141.20675659179688, 146.93939208984375, 152.67201232910156, 158.40463256835938, 164.13726806640625, 169.86988830566406, 175.60250854492188, 181.3351287841797, 187.0677490234375, 192.80038452148438, 198.5330047607422, 204.265625, 209.99826049804688, 215.7308807373047, 221.4635009765625, 227.1961212158203, 232.92874145507812, 238.661376953125, 244.3939971923828]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 10.0, 5.0, 12.0, 9.0, 8.0, 22.0, 10.0, 27.0, 16.0, 18.0, 36.0, 27.0, 25.0, 46.0, 41.0, 41.0, 55.0, 51.0, 38.0, 45.0, 54.0, 42.0, 37.0, 47.0, 34.0, 29.0, 35.0, 17.0, 29.0, 26.0, 19.0, 28.0, 13.0, 15.0, 8.0, 5.0, 3.0, 8.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.17784118652344, -100.6960220336914, -97.21420288085938, -93.73239135742188, -90.25057220458984, -86.76875305175781, -83.28693389892578, -79.80511474609375, -76.32330322265625, -72.84148406982422, -69.35966491699219, -65.87785339355469, -62.396034240722656, -58.914215087890625, -55.432395935058594, -51.95057678222656, -48.46875762939453, -44.9869384765625, -41.505123138427734, -38.0233039855957, -34.54148864746094, -31.059669494628906, -27.577850341796875, -24.096033096313477, -20.614215850830078, -17.13239860534668, -13.650580406188965, -10.16876220703125, -6.686944961547852, -3.205127716064453, 0.2766914367675781, 3.7585086822509766, 7.240325927734375, 10.722143173217773, 14.203961372375488, 17.685779571533203, 21.1675968170166, 24.6494140625, 28.13123321533203, 31.61305046081543, 35.09486770629883, 38.57668685913086, 42.058502197265625, 45.540321350097656, 49.02214050292969, 52.50395584106445, 55.985774993896484, 59.46759033203125, 62.94940948486328, 66.43122863769531, 69.91304779052734, 73.39486694335938, 76.87667846679688, 80.3584976196289, 83.84031677246094, 87.32213592529297, 90.803955078125, 94.28577423095703, 97.76759338378906, 101.24940490722656, 104.7312240600586, 108.21304321289062, 111.69486236572266, 115.17668151855469, 118.65849304199219]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 8.0, 2.0, 9.0, 3.0, 17.0, 13.0, 18.0, 21.0, 17.0, 26.0, 32.0, 32.0, 37.0, 41.0, 57.0, 53.0, 61.0, 47.0, 59.0, 49.0, 42.0, 43.0, 47.0, 35.0, 30.0, 32.0, 32.0, 24.0, 27.0, 19.0, 12.0, 17.0, 10.0, 8.0, 6.0, 7.0, 8.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.75, -204.296875, -196.84375, -189.390625, -181.9375, -174.484375, -167.03125, -159.578125, -152.125, -144.671875, -137.21875, -129.765625, -122.3125, -114.859375, -107.40625, -99.953125, -92.5, -85.046875, -77.59375, -70.140625, -62.6875, -55.234375, -47.78125, -40.328125, -32.875, -25.421875, -17.96875, -10.515625, -3.0625, 4.390625, 11.84375, 19.296875, 26.75, 34.203125, 41.65625, 49.109375, 56.5625, 64.015625, 71.46875, 78.921875, 86.375, 93.828125, 101.28125, 108.734375, 116.1875, 123.640625, 131.09375, 138.546875, 146.0, 153.453125, 160.90625, 168.359375, 175.8125, 183.265625, 190.71875, 198.171875, 205.625, 213.078125, 220.53125, 227.984375, 235.4375, 242.890625, 250.34375, 257.796875, 265.25]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 8.0, 15.0, 26.0, 32.0, 45.0, 71.0, 119.0, 151.0, 266.0, 454.0, 779.0, 1299.0, 2286.0, 4155.0, 7429.0, 13640.0, 26047.0, 51268.0, 112586.0, 329305.0, 294046.0, 103305.0, 47945.0, 24339.0, 12815.0, 7012.0, 3914.0, 2162.0, 1199.0, 708.0, 400.0, 284.0, 147.0, 107.0, 68.0, 39.0, 28.0, 18.0, 13.0, 5.0, 6.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.1640625, -13.7587890625, -13.353515625, -12.9482421875, -12.54296875, -12.1376953125, -11.732421875, -11.3271484375, -10.921875, -10.5166015625, -10.111328125, -9.7060546875, -9.30078125, -8.8955078125, -8.490234375, -8.0849609375, -7.6796875, -7.2744140625, -6.869140625, -6.4638671875, -6.05859375, -5.6533203125, -5.248046875, -4.8427734375, -4.4375, -4.0322265625, -3.626953125, -3.2216796875, -2.81640625, -2.4111328125, -2.005859375, -1.6005859375, -1.1953125, -0.7900390625, -0.384765625, 0.0205078125, 0.42578125, 0.8310546875, 1.236328125, 1.6416015625, 2.046875, 2.4521484375, 2.857421875, 3.2626953125, 3.66796875, 4.0732421875, 4.478515625, 4.8837890625, 5.2890625, 5.6943359375, 6.099609375, 6.5048828125, 6.91015625, 7.3154296875, 7.720703125, 8.1259765625, 8.53125, 8.9365234375, 9.341796875, 9.7470703125, 10.15234375, 10.5576171875, 10.962890625, 11.3681640625, 11.7734375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 6.0, 10.0, 7.0, 13.0, 7.0, 15.0, 19.0, 27.0, 22.0, 27.0, 26.0, 29.0, 37.0, 27.0, 33.0, 32.0, 41.0, 30.0, 40.0, 1059.0, 42.0, 38.0, 42.0, 43.0, 38.0, 36.0, 33.0, 39.0, 28.0, 23.0, 30.0, 13.0, 12.0, 15.0, 10.0, 13.0, 16.0, 10.0, 6.0, 7.0, 4.0, 7.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-164.25, -159.10546875, -153.9609375, -148.81640625, -143.671875, -138.52734375, -133.3828125, -128.23828125, -123.09375, -117.94921875, -112.8046875, -107.66015625, -102.515625, -97.37109375, -92.2265625, -87.08203125, -81.9375, -76.79296875, -71.6484375, -66.50390625, -61.359375, -56.21484375, -51.0703125, -45.92578125, -40.78125, -35.63671875, -30.4921875, -25.34765625, -20.203125, -15.05859375, -9.9140625, -4.76953125, 0.375, 5.51953125, 10.6640625, 15.80859375, 20.953125, 26.09765625, 31.2421875, 36.38671875, 41.53125, 46.67578125, 51.8203125, 56.96484375, 62.109375, 67.25390625, 72.3984375, 77.54296875, 82.6875, 87.83203125, 92.9765625, 98.12109375, 103.265625, 108.41015625, 113.5546875, 118.69921875, 123.84375, 128.98828125, 134.1328125, 139.27734375, 144.421875, 149.56640625, 154.7109375, 159.85546875, 165.0]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 3.0, 6.0, 12.0, 19.0, 30.0, 49.0, 62.0, 93.0, 156.0, 228.0, 349.0, 529.0, 870.0, 1288.0, 1995.0, 3080.0, 4808.0, 7543.0, 12568.0, 20088.0, 32865.0, 56048.0, 103534.0, 224629.0, 1326988.0, 130616.0, 67601.0, 38658.0, 23343.0, 14408.0, 8887.0, 5682.0, 3643.0, 2303.0, 1435.0, 950.0, 621.0, 406.0, 240.0, 159.0, 115.0, 81.0, 48.0, 43.0, 23.0, 7.0, 13.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.79296875, -5.61285400390625, -5.4327392578125, -5.25262451171875, -5.072509765625, -4.89239501953125, -4.7122802734375, -4.53216552734375, -4.35205078125, -4.17193603515625, -3.9918212890625, -3.81170654296875, -3.631591796875, -3.45147705078125, -3.2713623046875, -3.09124755859375, -2.9111328125, -2.73101806640625, -2.5509033203125, -2.37078857421875, -2.190673828125, -2.01055908203125, -1.8304443359375, -1.65032958984375, -1.47021484375, -1.29010009765625, -1.1099853515625, -0.92987060546875, -0.749755859375, -0.56964111328125, -0.3895263671875, -0.20941162109375, -0.029296875, 0.15081787109375, 0.3309326171875, 0.51104736328125, 0.691162109375, 0.87127685546875, 1.0513916015625, 1.23150634765625, 1.41162109375, 1.59173583984375, 1.7718505859375, 1.95196533203125, 2.132080078125, 2.31219482421875, 2.4923095703125, 2.67242431640625, 2.8525390625, 3.03265380859375, 3.2127685546875, 3.39288330078125, 3.572998046875, 3.75311279296875, 3.9332275390625, 4.11334228515625, 4.29345703125, 4.47357177734375, 4.6536865234375, 4.83380126953125, 5.013916015625, 5.19403076171875, 5.3741455078125, 5.55426025390625, 5.734375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 11.0, 12.0, 12.0, 23.0, 23.0, 20.0, 30.0, 41.0, 47.0, 63.0, 55.0, 65.0, 55.0, 66.0, 66.0, 73.0, 54.0, 44.0, 39.0, 34.0, 32.0, 37.0, 20.0, 20.0, 14.0, 8.0, 8.0, 9.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004856109619140625, -0.004707217216491699, -0.0045583248138427734, -0.004409432411193848, -0.004260540008544922, -0.004111647605895996, -0.00396275520324707, -0.0038138628005981445, -0.0036649703979492188, -0.003516077995300293, -0.003367185592651367, -0.0032182931900024414, -0.0030694007873535156, -0.00292050838470459, -0.002771615982055664, -0.0026227235794067383, -0.0024738311767578125, -0.0023249387741088867, -0.002176046371459961, -0.002027153968811035, -0.0018782615661621094, -0.0017293691635131836, -0.0015804767608642578, -0.001431584358215332, -0.0012826919555664062, -0.0011337995529174805, -0.0009849071502685547, -0.0008360147476196289, -0.0006871223449707031, -0.0005382299423217773, -0.00038933753967285156, -0.00024044513702392578, -9.1552734375e-05, 5.733966827392578e-05, 0.00020623207092285156, 0.00035512447357177734, 0.0005040168762207031, 0.0006529092788696289, 0.0008018016815185547, 0.0009506940841674805, 0.0010995864868164062, 0.001248478889465332, 0.0013973712921142578, 0.0015462636947631836, 0.0016951560974121094, 0.0018440485000610352, 0.001992940902709961, 0.0021418333053588867, 0.0022907257080078125, 0.0024396181106567383, 0.002588510513305664, 0.00273740291595459, 0.0028862953186035156, 0.0030351877212524414, 0.003184080123901367, 0.003332972526550293, 0.0034818649291992188, 0.0036307573318481445, 0.0037796497344970703, 0.003928542137145996, 0.004077434539794922, 0.004226326942443848, 0.0043752193450927734, 0.004524111747741699, 0.004673004150390625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 10.0, 11.0, 8.0, 17.0, 27.0, 53.0, 72.0, 110.0, 195.0, 376.0, 677.0, 1268.0, 2341.0, 4920.0, 10375.0, 22791.0, 52529.0, 119855.0, 237491.0, 281996.0, 172110.0, 78535.0, 33852.0, 14987.0, 6864.0, 3353.0, 1701.0, 870.0, 464.0, 283.0, 160.0, 91.0, 63.0, 32.0, 24.0, 13.0, 15.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0196380615234375, -0.019028902053833008, -0.018419742584228516, -0.017810583114624023, -0.01720142364501953, -0.01659226417541504, -0.015983104705810547, -0.015373945236206055, -0.014764785766601562, -0.01415562629699707, -0.013546466827392578, -0.012937307357788086, -0.012328147888183594, -0.011718988418579102, -0.01110982894897461, -0.010500669479370117, -0.009891510009765625, -0.009282350540161133, -0.00867319107055664, -0.008064031600952148, -0.007454872131347656, -0.006845712661743164, -0.006236553192138672, -0.00562739372253418, -0.0050182342529296875, -0.004409074783325195, -0.003799915313720703, -0.003190755844116211, -0.0025815963745117188, -0.0019724369049072266, -0.0013632774353027344, -0.0007541179656982422, -0.00014495849609375, 0.0004642009735107422, 0.0010733604431152344, 0.0016825199127197266, 0.0022916793823242188, 0.002900838851928711, 0.003509998321533203, 0.004119157791137695, 0.0047283172607421875, 0.00533747673034668, 0.005946636199951172, 0.006555795669555664, 0.007164955139160156, 0.0077741146087646484, 0.00838327407836914, 0.008992433547973633, 0.009601593017578125, 0.010210752487182617, 0.01081991195678711, 0.011429071426391602, 0.012038230895996094, 0.012647390365600586, 0.013256549835205078, 0.01386570930480957, 0.014474868774414062, 0.015084028244018555, 0.015693187713623047, 0.01630234718322754, 0.01691150665283203, 0.017520666122436523, 0.018129825592041016, 0.018738985061645508, 0.01934814453125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 2.0, 9.0, 7.0, 10.0, 9.0, 22.0, 37.0, 35.0, 53.0, 59.0, 86.0, 92.0, 74.0, 84.0, 95.0, 78.0, 57.0, 33.0, 43.0, 26.0, 26.0, 19.0, 5.0, 9.0, 6.0, 6.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.011856141500175, -0.011549847200512886, -0.011243552900850773, -0.010937259532511234, -0.010630965232849121, -0.010324670933187008, -0.010018376633524895, -0.009712083265185356, -0.009405788965523243, -0.00909949466586113, -0.008793200366199017, -0.008486906997859478, -0.008180612698197365, -0.007874318398535252, -0.007568024098873138, -0.0072617302648723125, -0.006955435965210199, -0.006649141665548086, -0.00634284783154726, -0.006036553531885147, -0.005730259697884321, -0.005423965398222208, -0.005117671564221382, -0.004811377264559269, -0.004505082964897156, -0.004198788665235043, -0.0038924948312342167, -0.0035862005315721035, -0.0032799066975712776, -0.0029736123979091644, -0.002667318331077695, -0.0023610242642462254, -0.0020547308959066868, -0.0017484368290752172, -0.0014421427622437477, -0.0011358485789969563, -0.0008295545121654868, -0.0005232604453340173, -0.00021696626208722591, 8.932780474424362e-05, 0.00039562187157571316, 0.0007019159384071827, 0.0010082100052386522, 0.0013145041884854436, 0.0016207982553169131, 0.0019270923221483827, 0.002233386505395174, 0.0025396805722266436, 0.002845974639058113, 0.0031522687058895826, 0.003458562772721052, 0.0037648570723831654, 0.004071150906383991, 0.004377445206046104, 0.004683739505708218, 0.0049900333397090435, 0.005296327173709869, 0.005602621473371983, 0.0059089153073728085, 0.006215209607034922, 0.0065215034410357475, 0.006827797740697861, 0.007134092040359974, 0.0074403858743608, 0.007746680174022913]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 6.0, 5.0, 5.0, 4.0, 4.0, 13.0, 7.0, 9.0, 15.0, 16.0, 22.0, 24.0, 14.0, 29.0, 28.0, 43.0, 34.0, 31.0, 32.0, 40.0, 37.0, 45.0, 36.0, 32.0, 38.0, 42.0, 37.0, 28.0, 32.0, 30.0, 35.0, 28.0, 17.0, 29.0, 27.0, 22.0, 15.0, 14.0, 16.0, 5.0, 17.0, 5.0, 9.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.003509044647216797, -0.0034059500321745872, -0.0033028554171323776, -0.003199760802090168, -0.0030966661870479584, -0.0029935715720057487, -0.002890476956963539, -0.0027873823419213295, -0.00268428772687912, -0.0025811931118369102, -0.0024780984967947006, -0.002375003881752491, -0.0022719092667102814, -0.0021688146516680717, -0.002065720036625862, -0.0019626254215836525, -0.0018595308065414429, -0.0017564361914992332, -0.0016533415764570236, -0.001550246961414814, -0.0014471523463726044, -0.0013440577313303947, -0.0012409631162881851, -0.0011378685012459755, -0.0010347738862037659, -0.0009316792711615562, -0.0008285846561193466, -0.000725490041077137, -0.0006223954260349274, -0.0005193008109927177, -0.0004162061959505081, -0.0003131115809082985, -0.00021001696586608887, -0.00010692235082387924, -3.827735781669617e-06, 9.926687926054001e-05, 0.00020236149430274963, 0.00030545610934495926, 0.0004085507243871689, 0.0005116453394293785, 0.0006147399544715881, 0.0007178345695137978, 0.0008209291845560074, 0.000924023799598217, 0.0010271184146404266, 0.0011302130296826363, 0.0012333076447248459, 0.0013364022597670555, 0.0014394968748092651, 0.0015425914898514748, 0.0016456861048936844, 0.001748780719935894, 0.0018518753349781036, 0.0019549699500203133, 0.002058064565062523, 0.0021611591801047325, 0.002264253795146942, 0.0023673484101891518, 0.0024704430252313614, 0.002573537640273571, 0.0026766322553157806, 0.0027797268703579903, 0.0028828214854002, 0.0029859161004424095, 0.003089010715484619]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 8.0, 2.0, 9.0, 3.0, 17.0, 13.0, 18.0, 21.0, 17.0, 26.0, 32.0, 32.0, 37.0, 41.0, 57.0, 53.0, 61.0, 47.0, 59.0, 49.0, 42.0, 43.0, 47.0, 35.0, 30.0, 32.0, 32.0, 24.0, 27.0, 19.0, 12.0, 17.0, 10.0, 8.0, 6.0, 7.0, 7.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.75, -204.296875, -196.84375, -189.390625, -181.9375, -174.484375, -167.03125, -159.578125, -152.125, -144.671875, -137.21875, -129.765625, -122.3125, -114.859375, -107.40625, -99.953125, -92.5, -85.046875, -77.59375, -70.140625, -62.6875, -55.234375, -47.78125, -40.328125, -32.875, -25.421875, -17.96875, -10.515625, -3.0625, 4.390625, 11.84375, 19.296875, 26.75, 34.203125, 41.65625, 49.109375, 56.5625, 64.015625, 71.46875, 78.921875, 86.375, 93.828125, 101.28125, 108.734375, 116.1875, 123.640625, 131.09375, 138.546875, 146.0, 153.453125, 160.90625, 168.359375, 175.8125, 183.265625, 190.71875, 198.171875, 205.625, 213.078125, 220.53125, 227.984375, 235.4375, 242.890625, 250.34375, 257.796875, 265.25]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 11.0, 8.0, 8.0, 15.0, 25.0, 24.0, 27.0, 38.0, 35.0, 78.0, 98.0, 163.0, 364.0, 1003.0, 3312.0, 12105.0, 52519.0, 266124.0, 518612.0, 152183.0, 30660.0, 7539.0, 2191.0, 668.0, 267.0, 142.0, 89.0, 55.0, 51.0, 41.0, 18.0, 27.0, 14.0, 8.0, 11.0, 10.0, 7.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.0625, -37.73046875, -36.3984375, -35.06640625, -33.734375, -32.40234375, -31.0703125, -29.73828125, -28.40625, -27.07421875, -25.7421875, -24.41015625, -23.078125, -21.74609375, -20.4140625, -19.08203125, -17.75, -16.41796875, -15.0859375, -13.75390625, -12.421875, -11.08984375, -9.7578125, -8.42578125, -7.09375, -5.76171875, -4.4296875, -3.09765625, -1.765625, -0.43359375, 0.8984375, 2.23046875, 3.5625, 4.89453125, 6.2265625, 7.55859375, 8.890625, 10.22265625, 11.5546875, 12.88671875, 14.21875, 15.55078125, 16.8828125, 18.21484375, 19.546875, 20.87890625, 22.2109375, 23.54296875, 24.875, 26.20703125, 27.5390625, 28.87109375, 30.203125, 31.53515625, 32.8671875, 34.19921875, 35.53125, 36.86328125, 38.1953125, 39.52734375, 40.859375, 42.19140625, 43.5234375, 44.85546875, 46.1875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 6.0, 6.0, 14.0, 16.0, 16.0, 25.0, 26.0, 39.0, 53.0, 62.0, 70.0, 59.0, 80.0, 2119.0, 68.0, 50.0, 62.0, 45.0, 53.0, 37.0, 27.0, 28.0, 23.0, 23.0, 16.0, 15.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-393.0, -380.04296875, -367.0859375, -354.12890625, -341.171875, -328.21484375, -315.2578125, -302.30078125, -289.34375, -276.38671875, -263.4296875, -250.47265625, -237.515625, -224.55859375, -211.6015625, -198.64453125, -185.6875, -172.73046875, -159.7734375, -146.81640625, -133.859375, -120.90234375, -107.9453125, -94.98828125, -82.03125, -69.07421875, -56.1171875, -43.16015625, -30.203125, -17.24609375, -4.2890625, 8.66796875, 21.625, 34.58203125, 47.5390625, 60.49609375, 73.453125, 86.41015625, 99.3671875, 112.32421875, 125.28125, 138.23828125, 151.1953125, 164.15234375, 177.109375, 190.06640625, 203.0234375, 215.98046875, 228.9375, 241.89453125, 254.8515625, 267.80859375, 280.765625, 293.72265625, 306.6796875, 319.63671875, 332.59375, 345.55078125, 358.5078125, 371.46484375, 384.421875, 397.37890625, 410.3359375, 423.29296875, 436.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 11.0, 8.0, 22.0, 35.0, 45.0, 98.0, 128.0, 264.0, 516.0, 1178.0, 3679.0, 20693.0, 249332.0, 2779169.0, 78138.0, 8670.0, 2084.0, 805.0, 375.0, 178.0, 129.0, 47.0, 38.0, 24.0, 15.0, 13.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.28125, -35.91455078125, -34.5478515625, -33.18115234375, -31.814453125, -30.44775390625, -29.0810546875, -27.71435546875, -26.34765625, -24.98095703125, -23.6142578125, -22.24755859375, -20.880859375, -19.51416015625, -18.1474609375, -16.78076171875, -15.4140625, -14.04736328125, -12.6806640625, -11.31396484375, -9.947265625, -8.58056640625, -7.2138671875, -5.84716796875, -4.48046875, -3.11376953125, -1.7470703125, -0.38037109375, 0.986328125, 2.35302734375, 3.7197265625, 5.08642578125, 6.453125, 7.81982421875, 9.1865234375, 10.55322265625, 11.919921875, 13.28662109375, 14.6533203125, 16.02001953125, 17.38671875, 18.75341796875, 20.1201171875, 21.48681640625, 22.853515625, 24.22021484375, 25.5869140625, 26.95361328125, 28.3203125, 29.68701171875, 31.0537109375, 32.42041015625, 33.787109375, 35.15380859375, 36.5205078125, 37.88720703125, 39.25390625, 40.62060546875, 41.9873046875, 43.35400390625, 44.720703125, 46.08740234375, 47.4541015625, 48.82080078125, 50.1875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 7.0, 10.0, 18.0, 38.0, 115.0, 178.0, 194.0, 173.0, 108.0, 59.0, 29.0, 17.0, 12.0, 7.0, 8.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1047.2930908203125, -1024.2669677734375, -1001.2409057617188, -978.21484375, -955.1887817382812, -932.1627197265625, -909.1365966796875, -886.1105346679688, -863.08447265625, -840.0584106445312, -817.0322875976562, -794.0062255859375, -770.9801635742188, -747.9541015625, -724.927978515625, -701.9019165039062, -678.8758544921875, -655.8497924804688, -632.8236694335938, -609.797607421875, -586.7715454101562, -563.7454833984375, -540.7193603515625, -517.6932983398438, -494.66717529296875, -471.6410827636719, -448.6150207519531, -425.58892822265625, -402.5628662109375, -379.5367736816406, -356.51068115234375, -333.484619140625, -310.45855712890625, -287.4324645996094, -264.4064025878906, -241.38031005859375, -218.354248046875, -195.32815551757812, -172.3020782470703, -149.2760009765625, -126.24992370605469, -103.22384643554688, -80.19776916503906, -57.17168426513672, -34.145606994628906, -11.119529724121094, 11.90655517578125, 34.93263244628906, 57.958709716796875, 80.98478698730469, 104.0108642578125, 127.03694915771484, 150.06301879882812, 173.089111328125, 196.1151885986328, 219.14126586914062, 242.16734313964844, 265.19342041015625, 288.2195129394531, 311.2455749511719, 334.27166748046875, 357.2977294921875, 380.3238220214844, 403.34991455078125, 426.3759765625]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 5.0, 6.0, 6.0, 9.0, 5.0, 14.0, 9.0, 10.0, 15.0, 16.0, 18.0, 24.0, 24.0, 31.0, 32.0, 33.0, 29.0, 52.0, 35.0, 38.0, 36.0, 46.0, 38.0, 44.0, 37.0, 31.0, 37.0, 29.0, 44.0, 29.0, 33.0, 28.0, 19.0, 24.0, 21.0, 15.0, 21.0, 8.0, 7.0, 10.0, 6.0, 7.0, 6.0, 7.0, 7.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-446.8499450683594, -432.5949401855469, -418.33990478515625, -404.08489990234375, -389.8298645019531, -375.5748596191406, -361.31982421875, -347.0648193359375, -332.809814453125, -318.5548095703125, -304.2997741699219, -290.0447692871094, -275.78973388671875, -261.53472900390625, -247.2797088623047, -233.02468872070312, -218.7696533203125, -204.51463317871094, -190.25961303710938, -176.00460815429688, -161.74957275390625, -147.49456787109375, -133.2395477294922, -118.98452758789062, -104.72950744628906, -90.4744873046875, -76.21946716308594, -61.964454650878906, -47.709434509277344, -33.45441436767578, -19.19940185546875, -4.9443817138671875, 9.31060791015625, 23.56562614440918, 37.82064437866211, 52.075660705566406, 66.33068084716797, 80.58570098876953, 94.84071350097656, 109.09573364257812, 123.35075378417969, 137.60577392578125, 151.8607940673828, 166.11581420898438, 180.37081909179688, 194.6258544921875, 208.880859375, 223.13587951660156, 237.39089965820312, 251.6459197998047, 265.90093994140625, 280.15594482421875, 294.4109802246094, 308.6659851074219, 322.9210205078125, 337.176025390625, 351.4310302734375, 365.68603515625, 379.9410705566406, 394.1960754394531, 408.45111083984375, 422.70611572265625, 436.96112060546875, 451.2161560058594, 465.47119140625]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 12.0, 12.0, 14.0, 27.0, 29.0, 38.0, 65.0, 88.0, 100.0, 154.0, 247.0, 273.0, 381.0, 557.0, 731.0, 1130.0, 1041128.0, 995.0, 700.0, 514.0, 373.0, 257.0, 186.0, 158.0, 99.0, 74.0, 65.0, 39.0, 30.0, 15.0, 16.0, 2.0, 9.0, 6.0, 10.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.6254425048828, -158.5720977783203, -153.5187530517578, -148.4654083251953, -143.4120635986328, -138.3587188720703, -133.3053741455078, -128.25204467773438, -123.19869232177734, -118.14534759521484, -113.09200286865234, -108.03865814208984, -102.98532104492188, -97.93197631835938, -92.87863159179688, -87.82528686523438, -82.77194213867188, -77.71859741210938, -72.66525268554688, -67.61190795898438, -62.55856704711914, -57.50522232055664, -52.451881408691406, -47.398536682128906, -42.345191955566406, -37.291847229003906, -32.238502502441406, -27.185161590576172, -22.131816864013672, -17.078472137451172, -12.025129318237305, -6.9717864990234375, -1.9184417724609375, 3.134902000427246, 8.18824577331543, 13.241589546203613, 18.294933319091797, 23.348278045654297, 28.401620864868164, 33.45496368408203, 38.50830841064453, 43.56165313720703, 48.61499786376953, 53.668338775634766, 58.721683502197266, 63.775028228759766, 68.828369140625, 73.8817138671875, 78.93505859375, 83.9884033203125, 89.041748046875, 94.0950927734375, 99.1484375, 104.2017822265625, 109.25511932373047, 114.30846405029297, 119.36180877685547, 124.41515350341797, 129.46849060058594, 134.52183532714844, 139.57518005371094, 144.62852478027344, 149.68186950683594, 154.73521423339844, 159.78855895996094]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 5.0, 10.0, 7.0, 14.0, 15.0, 24.0, 31.0, 130.0, 1065.0, 51457080.0, 4463.0, 156.0, 57.0, 22.0, 15.0, 18.0, 8.0, 5.0, 7.0, 6.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1546.0, -1463.11474609375, -1380.2293701171875, -1297.3441162109375, -1214.458740234375, -1131.573486328125, -1048.688232421875, -965.8029174804688, -882.9176025390625, -800.0322875976562, -717.14697265625, -634.26171875, -551.3764038085938, -468.4910888671875, -385.6058044433594, -302.72052001953125, -219.835205078125, -136.9499053955078, -54.064605712890625, 28.820693969726562, 111.70599365234375, 194.59130859375, 277.4765930175781, 360.36187744140625, 443.2471923828125, 526.1325073242188, 609.017822265625, 691.903076171875, 774.7883911132812, 857.6737060546875, 940.5589599609375, 1023.4442749023438, 1106.329345703125, 1189.214599609375, 1272.0999755859375, 1354.9852294921875, 1437.87060546875, 1520.755859375, 1603.64111328125, 1686.5263671875, 1769.4117431640625, 1852.2969970703125, 1935.182373046875, 2018.067626953125, 2100.952880859375, 2183.83837890625, 2266.7236328125, 2349.60888671875, 2432.494140625, 2515.37939453125, 2598.2646484375, 2681.150146484375, 2764.035400390625, 2846.920654296875, 2929.805908203125, 3012.691162109375, 3095.57666015625, 3178.4619140625, 3261.34716796875, 3344.232666015625, 3427.117919921875, 3510.003173828125, 3592.888427734375, 3675.773681640625, 3758.658935546875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 8.0, 7.0, 14.0, 27.0, 34.0, 54.0, 87.0, 137.0, 195.0, 317.0, 457.0, 853.0, 1297.0, 1931.0, 2894.0, 4833.0, 7239.0, 11144.0, 17371.0, 26815.0, 41376.0, 64451.0, 100876.0, 162293.0, 278835.0, 570150.0, 3964363.0, 430538.0, 227760.0, 135713.0, 85181.0, 54167.0, 35340.0, 22956.0, 14850.0, 9479.0, 6263.0, 4014.0, 2579.0, 1674.0, 1042.0, 647.0, 427.0, 288.0, 181.0, 106.0, 65.0, 43.0, 34.0, 15.0, 10.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.14453125, -2.07379150390625, -2.0030517578125, -1.93231201171875, -1.861572265625, -1.79083251953125, -1.7200927734375, -1.64935302734375, -1.57861328125, -1.50787353515625, -1.4371337890625, -1.36639404296875, -1.295654296875, -1.22491455078125, -1.1541748046875, -1.08343505859375, -1.0126953125, -0.94195556640625, -0.8712158203125, -0.80047607421875, -0.729736328125, -0.65899658203125, -0.5882568359375, -0.51751708984375, -0.44677734375, -0.37603759765625, -0.3052978515625, -0.23455810546875, -0.163818359375, -0.09307861328125, -0.0223388671875, 0.04840087890625, 0.119140625, 0.18988037109375, 0.2606201171875, 0.33135986328125, 0.402099609375, 0.47283935546875, 0.5435791015625, 0.61431884765625, 0.68505859375, 0.75579833984375, 0.8265380859375, 0.89727783203125, 0.968017578125, 1.03875732421875, 1.1094970703125, 1.18023681640625, 1.2509765625, 1.32171630859375, 1.3924560546875, 1.46319580078125, 1.533935546875, 1.60467529296875, 1.6754150390625, 1.74615478515625, 1.81689453125, 1.88763427734375, 1.9583740234375, 2.02911376953125, 2.099853515625, 2.17059326171875, 2.2413330078125, 2.31207275390625, 2.3828125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 8.0, 9.0, 7.0, 12.0, 12.0, 17.0, 26.0, 23.0, 28.0, 28.0, 29.0, 31.0, 43.0, 25.0, 31.0, 38.0, 29.0, 45.0, 34.0, 1050.0, 61.0, 41.0, 33.0, 38.0, 31.0, 22.0, 32.0, 20.0, 33.0, 25.0, 17.0, 25.0, 17.0, 19.0, 14.0, 16.0, 16.0, 9.0, 6.0, 3.0, 6.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-101.3125, -98.220703125, -95.12890625, -92.037109375, -88.9453125, -85.853515625, -82.76171875, -79.669921875, -76.578125, -73.486328125, -70.39453125, -67.302734375, -64.2109375, -61.119140625, -58.02734375, -54.935546875, -51.84375, -48.751953125, -45.66015625, -42.568359375, -39.4765625, -36.384765625, -33.29296875, -30.201171875, -27.109375, -24.017578125, -20.92578125, -17.833984375, -14.7421875, -11.650390625, -8.55859375, -5.466796875, -2.375, 0.716796875, 3.80859375, 6.900390625, 9.9921875, 13.083984375, 16.17578125, 19.267578125, 22.359375, 25.451171875, 28.54296875, 31.634765625, 34.7265625, 37.818359375, 40.91015625, 44.001953125, 47.09375, 50.185546875, 53.27734375, 56.369140625, 59.4609375, 62.552734375, 65.64453125, 68.736328125, 71.828125, 74.919921875, 78.01171875, 81.103515625, 84.1953125, 87.287109375, 90.37890625, 93.470703125, 96.5625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [4.0, 3.0, 9.0, 11.0, 11.0, 19.0, 24.0, 44.0, 74.0, 139.0, 178.0, 257.0, 383.0, 520.0, 779.0, 1084.0, 1568.0, 2342.0, 3324.0, 4751.0, 7094.0, 9699.0, 14167.0, 21022.0, 30238.0, 44303.0, 66780.0, 105286.0, 171900.0, 307493.0, 555192.0, 3828524.0, 453302.0, 247063.0, 143698.0, 88866.0, 57552.0, 38200.0, 26226.0, 18260.0, 12424.0, 8763.0, 6003.0, 4215.0, 3033.0, 2040.0, 1423.0, 979.0, 644.0, 489.0, 331.0, 217.0, 139.0, 104.0, 84.0, 48.0, 38.0, 29.0, 17.0, 20.0, 14.0, 8.0, 1.0, 4.0], "bins": [-1.796875, -1.739501953125, -1.68212890625, -1.624755859375, -1.5673828125, -1.510009765625, -1.45263671875, -1.395263671875, -1.337890625, -1.280517578125, -1.22314453125, -1.165771484375, -1.1083984375, -1.051025390625, -0.99365234375, -0.936279296875, -0.87890625, -0.821533203125, -0.76416015625, -0.706787109375, -0.6494140625, -0.592041015625, -0.53466796875, -0.477294921875, -0.419921875, -0.362548828125, -0.30517578125, -0.247802734375, -0.1904296875, -0.133056640625, -0.07568359375, -0.018310546875, 0.0390625, 0.096435546875, 0.15380859375, 0.211181640625, 0.2685546875, 0.325927734375, 0.38330078125, 0.440673828125, 0.498046875, 0.555419921875, 0.61279296875, 0.670166015625, 0.7275390625, 0.784912109375, 0.84228515625, 0.899658203125, 0.95703125, 1.014404296875, 1.07177734375, 1.129150390625, 1.1865234375, 1.243896484375, 1.30126953125, 1.358642578125, 1.416015625, 1.473388671875, 1.53076171875, 1.588134765625, 1.6455078125, 1.702880859375, 1.76025390625, 1.817626953125, 1.875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 11.0, 11.0, 6.0, 4.0, 10.0, 9.0, 11.0, 9.0, 13.0, 14.0, 19.0, 18.0, 18.0, 23.0, 30.0, 27.0, 35.0, 25.0, 39.0, 29.0, 30.0, 42.0, 1004.0, 104.0, 36.0, 36.0, 36.0, 43.0, 37.0, 41.0, 25.0, 20.0, 22.0, 22.0, 26.0, 18.0, 18.0, 10.0, 14.0, 8.0, 11.0, 12.0, 14.0, 10.0, 4.0, 3.0, 6.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0], "bins": [-94.6875, -91.7177734375, -88.748046875, -85.7783203125, -82.80859375, -79.8388671875, -76.869140625, -73.8994140625, -70.9296875, -67.9599609375, -64.990234375, -62.0205078125, -59.05078125, -56.0810546875, -53.111328125, -50.1416015625, -47.171875, -44.2021484375, -41.232421875, -38.2626953125, -35.29296875, -32.3232421875, -29.353515625, -26.3837890625, -23.4140625, -20.4443359375, -17.474609375, -14.5048828125, -11.53515625, -8.5654296875, -5.595703125, -2.6259765625, 0.34375, 3.3134765625, 6.283203125, 9.2529296875, 12.22265625, 15.1923828125, 18.162109375, 21.1318359375, 24.1015625, 27.0712890625, 30.041015625, 33.0107421875, 35.98046875, 38.9501953125, 41.919921875, 44.8896484375, 47.859375, 50.8291015625, 53.798828125, 56.7685546875, 59.73828125, 62.7080078125, 65.677734375, 68.6474609375, 71.6171875, 74.5869140625, 77.556640625, 80.5263671875, 83.49609375, 86.4658203125, 89.435546875, 92.4052734375, 95.375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 16.0, 20.0, 18.0, 21.0, 29.0, 35.0, 74.0, 84.0, 108.0, 143.0, 208.0, 260.0, 427.0, 573.0, 820.0, 1159.0, 1758.0, 2765.0, 4329.0, 6977.0, 11145.0, 19208.0, 36271.0, 84451.0, 914643.0, 5017124.0, 96060.0, 38967.0, 20871.0, 12191.0, 7367.0, 4455.0, 2880.0, 1774.0, 1239.0, 858.0, 589.0, 416.0, 298.0, 214.0, 170.0, 101.0, 100.0, 71.0, 30.0, 29.0, 18.0, 31.0, 12.0, 9.0, 10.0, 7.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-4.37890625, -4.2423095703125, -4.105712890625, -3.9691162109375, -3.83251953125, -3.6959228515625, -3.559326171875, -3.4227294921875, -3.2861328125, -3.1495361328125, -3.012939453125, -2.8763427734375, -2.73974609375, -2.6031494140625, -2.466552734375, -2.3299560546875, -2.193359375, -2.0567626953125, -1.920166015625, -1.7835693359375, -1.64697265625, -1.5103759765625, -1.373779296875, -1.2371826171875, -1.1005859375, -0.9639892578125, -0.827392578125, -0.6907958984375, -0.55419921875, -0.4176025390625, -0.281005859375, -0.1444091796875, -0.0078125, 0.1287841796875, 0.265380859375, 0.4019775390625, 0.53857421875, 0.6751708984375, 0.811767578125, 0.9483642578125, 1.0849609375, 1.2215576171875, 1.358154296875, 1.4947509765625, 1.63134765625, 1.7679443359375, 1.904541015625, 2.0411376953125, 2.177734375, 2.3143310546875, 2.450927734375, 2.5875244140625, 2.72412109375, 2.8607177734375, 2.997314453125, 3.1339111328125, 3.2705078125, 3.4071044921875, 3.543701171875, 3.6802978515625, 3.81689453125, 3.9534912109375, 4.090087890625, 4.2266845703125, 4.36328125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 8.0, 15.0, 7.0, 6.0, 17.0, 15.0, 15.0, 26.0, 24.0, 19.0, 35.0, 52.0, 30.0, 40.0, 43.0, 33.0, 51.0, 41.0, 1062.0, 44.0, 47.0, 36.0, 39.0, 37.0, 30.0, 35.0, 16.0, 35.0, 22.0, 17.0, 20.0, 23.0, 10.0, 12.0, 11.0, 10.0, 6.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-82.5625, -79.75, -76.9375, -74.125, -71.3125, -68.5, -65.6875, -62.875, -60.0625, -57.25, -54.4375, -51.625, -48.8125, -46.0, -43.1875, -40.375, -37.5625, -34.75, -31.9375, -29.125, -26.3125, -23.5, -20.6875, -17.875, -15.0625, -12.25, -9.4375, -6.625, -3.8125, -1.0, 1.8125, 4.625, 7.4375, 10.25, 13.0625, 15.875, 18.6875, 21.5, 24.3125, 27.125, 29.9375, 32.75, 35.5625, 38.375, 41.1875, 44.0, 46.8125, 49.625, 52.4375, 55.25, 58.0625, 60.875, 63.6875, 66.5, 69.3125, 72.125, 74.9375, 77.75, 80.5625, 83.375, 86.1875, 89.0, 91.8125, 94.625, 97.4375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 932.0, 66.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2995.4453125, -2939.714599609375, -2883.98388671875, -2828.2529296875, -2772.522216796875, -2716.79150390625, -2661.060791015625, -2605.329833984375, -2549.59912109375, -2493.868408203125, -2438.1376953125, -2382.40673828125, -2326.676025390625, -2270.9453125, -2215.214599609375, -2159.483642578125, -2103.7529296875, -2048.022216796875, -1992.2913818359375, -1936.5606689453125, -1880.829833984375, -1825.09912109375, -1769.3682861328125, -1713.6375732421875, -1657.9068603515625, -1602.1761474609375, -1546.4453125, -1490.714599609375, -1434.9837646484375, -1379.2530517578125, -1323.522216796875, -1267.79150390625, -1212.060791015625, -1156.330078125, -1100.5992431640625, -1044.8685302734375, -989.1376953125, -933.406982421875, -877.6761474609375, -821.9454345703125, -766.214599609375, -710.4838256835938, -654.7530517578125, -599.0222778320312, -543.29150390625, -487.5607604980469, -431.8299865722656, -376.0992126464844, -320.368408203125, -264.63763427734375, -208.9068603515625, -153.1761016845703, -97.44532775878906, -41.714569091796875, 14.016204833984375, 69.74697875976562, 125.47775268554688, 181.20852661132812, 236.93930053710938, 292.6700439453125, 348.40081787109375, 404.131591796875, 459.86236572265625, 515.5931396484375, 571.3239135742188]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 9.0, 8.0, 6.0, 7.0, 10.0, 8.0, 9.0, 18.0, 16.0, 18.0, 23.0, 24.0, 22.0, 26.0, 37.0, 35.0, 40.0, 50.0, 47.0, 32.0, 37.0, 47.0, 40.0, 37.0, 46.0, 25.0, 40.0, 35.0, 35.0, 24.0, 24.0, 28.0, 19.0, 20.0, 11.0, 12.0, 14.0, 12.0, 4.0, 9.0, 7.0, 10.0, 5.0, 1.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-203.13497924804688, -196.5615997314453, -189.98822021484375, -183.4148406982422, -176.84146118164062, -170.26808166503906, -163.6947021484375, -157.121337890625, -150.54794311523438, -143.9745635986328, -137.40118408203125, -130.8278045654297, -124.25442504882812, -117.68104553222656, -111.10767364501953, -104.53429412841797, -97.96092224121094, -91.38754272460938, -84.81416320800781, -78.24078369140625, -71.66740417480469, -65.09402465820312, -58.520652770996094, -51.94727325439453, -45.37389373779297, -38.800514221191406, -32.227134704589844, -25.653759002685547, -19.080379486083984, -12.506999969482422, -5.933624267578125, 0.6397552490234375, 7.213134765625, 13.786513328552246, 20.359891891479492, 26.933269500732422, 33.506649017333984, 40.08002853393555, 46.653404235839844, 53.226783752441406, 59.80016326904297, 66.37354278564453, 72.9469223022461, 79.52029418945312, 86.09367370605469, 92.66705322265625, 99.24043273925781, 105.81381225585938, 112.38719177246094, 118.9605712890625, 125.53395080566406, 132.10733032226562, 138.6807098388672, 145.25408935546875, 151.82745361328125, 158.40084838867188, 164.97421264648438, 171.54759216308594, 178.1209716796875, 184.69435119628906, 191.26773071289062, 197.8411102294922, 204.41448974609375, 210.98785400390625, 217.56124877929688]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 3.0, 2.0, 0.0, 4.0, 9.0, 4.0, 4.0, 12.0, 9.0, 5.0, 6.0, 7.0, 11.0, 6.0, 18.0, 21.0, 25.0, 17.0, 53.0, 72.0, 132.0, 276.0, 1414.0, 24070.0, 4136401.0, 27445.0, 3335.0, 535.0, 110.0, 74.0, 54.0, 22.0, 22.0, 16.0, 17.0, 11.0, 17.0, 13.0, 0.0, 8.0, 6.0, 5.0, 3.0, 3.0, 9.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.5009765625, -0.4868659973144531, -0.47275543212890625, -0.4586448669433594, -0.4445343017578125, -0.4304237365722656, -0.41631317138671875, -0.4022026062011719, -0.388092041015625, -0.3739814758300781, -0.35987091064453125, -0.3457603454589844, -0.3316497802734375, -0.3175392150878906, -0.30342864990234375, -0.2893180847167969, -0.27520751953125, -0.2610969543457031, -0.24698638916015625, -0.23287582397460938, -0.2187652587890625, -0.20465469360351562, -0.19054412841796875, -0.17643356323242188, -0.162322998046875, -0.14821243286132812, -0.13410186767578125, -0.11999130249023438, -0.1058807373046875, -0.09177017211914062, -0.07765960693359375, -0.06354904174804688, -0.0494384765625, -0.035327911376953125, -0.02121734619140625, -0.007106781005859375, 0.0070037841796875, 0.021114349365234375, 0.03522491455078125, 0.049335479736328125, 0.063446044921875, 0.07755661010742188, 0.09166717529296875, 0.10577774047851562, 0.1198883056640625, 0.13399887084960938, 0.14810943603515625, 0.16222000122070312, 0.17633056640625, 0.19044113159179688, 0.20455169677734375, 0.21866226196289062, 0.2327728271484375, 0.24688339233398438, 0.26099395751953125, 0.2751045227050781, 0.289215087890625, 0.3033256530761719, 0.31743621826171875, 0.3315467834472656, 0.3456573486328125, 0.3597679138183594, 0.37387847900390625, 0.3879890441894531, 0.402099609375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 1.0, 6.0, 7.0, 15.0, 14.0, 19.0, 23.0, 781.0, 22.0, 14.0, 15.0, 13.0, 12.0, 9.0, 4.0, 2.0, 6.0, 5.0, 5.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310791015625, -0.3019981384277344, -0.29320526123046875, -0.2844123840332031, -0.2756195068359375, -0.2668266296386719, -0.25803375244140625, -0.24924087524414062, -0.240447998046875, -0.23165512084960938, -0.22286224365234375, -0.21406936645507812, -0.2052764892578125, -0.19648361206054688, -0.18769073486328125, -0.17889785766601562, -0.17010498046875, -0.16131210327148438, -0.15251922607421875, -0.14372634887695312, -0.1349334716796875, -0.12614059448242188, -0.11734771728515625, -0.10855484008789062, -0.099761962890625, -0.09096908569335938, -0.08217620849609375, -0.07338333129882812, -0.0645904541015625, -0.055797576904296875, -0.04700469970703125, -0.038211822509765625, -0.0294189453125, -0.020626068115234375, -0.01183319091796875, -0.003040313720703125, 0.0057525634765625, 0.014545440673828125, 0.02333831787109375, 0.032131195068359375, 0.040924072265625, 0.049716949462890625, 0.05850982666015625, 0.06730270385742188, 0.0760955810546875, 0.08488845825195312, 0.09368133544921875, 0.10247421264648438, 0.11126708984375, 0.12005996704101562, 0.12885284423828125, 0.13764572143554688, 0.1464385986328125, 0.15523147583007812, 0.16402435302734375, 0.17281723022460938, 0.181610107421875, 0.19040298461914062, 0.19919586181640625, 0.20798873901367188, 0.2167816162109375, 0.22557449340820312, 0.23436737060546875, 0.24316024780273438, 0.251953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 10.0, 24.0, 22.0, 29.0, 52.0, 116.0, 270.0, 572.0, 1960.0, 10904.0, 4145896.0, 31254.0, 2314.0, 500.0, 165.0, 66.0, 44.0, 28.0, 15.0, 19.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.732421875, -0.7118911743164062, -0.6913604736328125, -0.6708297729492188, -0.650299072265625, -0.6297683715820312, -0.6092376708984375, -0.5887069702148438, -0.56817626953125, -0.5476455688476562, -0.5271148681640625, -0.5065841674804688, -0.486053466796875, -0.46552276611328125, -0.4449920654296875, -0.42446136474609375, -0.4039306640625, -0.38339996337890625, -0.3628692626953125, -0.34233856201171875, -0.321807861328125, -0.30127716064453125, -0.2807464599609375, -0.26021575927734375, -0.23968505859375, -0.21915435791015625, -0.1986236572265625, -0.17809295654296875, -0.157562255859375, -0.13703155517578125, -0.1165008544921875, -0.09597015380859375, -0.075439453125, -0.05490875244140625, -0.0343780517578125, -0.01384735107421875, 0.006683349609375, 0.02721405029296875, 0.0477447509765625, 0.06827545166015625, 0.08880615234375, 0.10933685302734375, 0.1298675537109375, 0.15039825439453125, 0.170928955078125, 0.19145965576171875, 0.2119903564453125, 0.23252105712890625, 0.2530517578125, 0.27358245849609375, 0.2941131591796875, 0.31464385986328125, 0.335174560546875, 0.35570526123046875, 0.3762359619140625, 0.39676666259765625, 0.41729736328125, 0.43782806396484375, 0.4583587646484375, 0.47888946533203125, 0.499420166015625, 0.5199508666992188, 0.5404815673828125, 0.5610122680664062, 0.58154296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 2.0, 7.0, 5.0, 14.0, 15.0, 41.0, 160.0, 801.0, 2599.0, 288.0, 69.0, 18.0, 19.0, 5.0, 4.0, 4.0, 1.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.332763671875, -0.3238239288330078, -0.3148841857910156, -0.30594444274902344, -0.29700469970703125, -0.28806495666503906, -0.2791252136230469, -0.2701854705810547, -0.2612457275390625, -0.2523059844970703, -0.24336624145507812, -0.23442649841308594, -0.22548675537109375, -0.21654701232910156, -0.20760726928710938, -0.1986675262451172, -0.189727783203125, -0.1807880401611328, -0.17184829711914062, -0.16290855407714844, -0.15396881103515625, -0.14502906799316406, -0.13608932495117188, -0.1271495819091797, -0.1182098388671875, -0.10927009582519531, -0.10033035278320312, -0.09139060974121094, -0.08245086669921875, -0.07351112365722656, -0.06457138061523438, -0.05563163757324219, -0.04669189453125, -0.03775215148925781, -0.028812408447265625, -0.019872665405273438, -0.01093292236328125, -0.0019931793212890625, 0.006946563720703125, 0.015886306762695312, 0.0248260498046875, 0.03376579284667969, 0.042705535888671875, 0.05164527893066406, 0.06058502197265625, 0.06952476501464844, 0.07846450805664062, 0.08740425109863281, 0.096343994140625, 0.10528373718261719, 0.11422348022460938, 0.12316322326660156, 0.13210296630859375, 0.14104270935058594, 0.14998245239257812, 0.1589221954345703, 0.1678619384765625, 0.1768016815185547, 0.18574142456054688, 0.19468116760253906, 0.20362091064453125, 0.21256065368652344, 0.22150039672851562, 0.2304401397705078, 0.2393798828125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 11.0, 28.0, 104.0, 557.0, 198.0, 49.0, 27.0, 11.0, 7.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5676230192184448, -0.5529505014419556, -0.5382780432701111, -0.5236055254936218, -0.5089330673217773, -0.4942605495452881, -0.4795880615711212, -0.46491557359695435, -0.4502430558204651, -0.4355705678462982, -0.42089807987213135, -0.4062255620956421, -0.3915530741214752, -0.37688058614730835, -0.3622080981731415, -0.3475356101989746, -0.33286312222480774, -0.31819063425064087, -0.303518146276474, -0.28884565830230713, -0.27417314052581787, -0.259500652551651, -0.24482816457748413, -0.23015567660331726, -0.2154831737279892, -0.20081068575382233, -0.18613818287849426, -0.1714656949043274, -0.15679320693016052, -0.14212070405483246, -0.1274482160806656, -0.11277572065591812, -0.09810322523117065, -0.08343072980642319, -0.06875823438167572, -0.05408574640750885, -0.03941325098276138, -0.024740755558013916, -0.010068267583847046, 0.004604227840900421, 0.019276723265647888, 0.033949218690395355, 0.048621710389852524, 0.06329420208930969, 0.07796669751405716, 0.09263919293880463, 0.1073116809129715, 0.12198417633771896, 0.13665667176246643, 0.1513291597366333, 0.16600166261196136, 0.18067415058612823, 0.1953466534614563, 0.21001914143562317, 0.22469162940979004, 0.2393641173839569, 0.2540366053581238, 0.26870909333229065, 0.2833815813064575, 0.2980540990829468, 0.31272658705711365, 0.3273990750312805, 0.3420715630054474, 0.35674405097961426, 0.3714165687561035]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 2.0, 0.0, 4.0, 4.0, 5.0, 6.0, 9.0, 4.0, 8.0, 14.0, 26.0, 48.0, 83.0, 100.0, 115.0, 143.0, 117.0, 95.0, 61.0, 46.0, 27.0, 16.0, 17.0, 6.0, 8.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1085833311080933, -1.0783967971801758, -1.0482103824615479, -1.01802396774292, -0.9878374338150024, -0.9576509594917297, -0.927464485168457, -0.8972780108451843, -0.8670915365219116, -0.8369050621986389, -0.8067185878753662, -0.7765321135520935, -0.7463456392288208, -0.7161591649055481, -0.6859726905822754, -0.6557862162590027, -0.62559974193573, -0.5954132676124573, -0.5652267932891846, -0.5350403189659119, -0.5048538446426392, -0.47466737031936646, -0.44448089599609375, -0.41429442167282104, -0.38410794734954834, -0.35392147302627563, -0.32373499870300293, -0.2935485243797302, -0.2633620500564575, -0.23317557573318481, -0.2029891014099121, -0.1728026270866394, -0.1426161527633667, -0.112429678440094, -0.08224320411682129, -0.052056729793548584, -0.02187025547027588, 0.008316218852996826, 0.03850269317626953, 0.06868916749954224, 0.09887564182281494, 0.12906211614608765, 0.15924859046936035, 0.18943506479263306, 0.21962153911590576, 0.24980801343917847, 0.27999448776245117, 0.3101809620857239, 0.3403674364089966, 0.3705539107322693, 0.400740385055542, 0.4309268593788147, 0.4611133337020874, 0.4912998080253601, 0.5214862823486328, 0.5516727566719055, 0.5818592309951782, 0.6120457053184509, 0.6422321796417236, 0.6724186539649963, 0.702605128288269, 0.7327916026115417, 0.7629780769348145, 0.7931645512580872, 0.8233510255813599]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 11.0, 9.0, 13.0, 26.0, 23.0, 42.0, 59.0, 75.0, 87.0, 138.0, 192.0, 301.0, 394.0, 583.0, 838.0, 1261.0, 1947.0, 3203.0, 5594.0, 11846.0, 33046.0, 921792.0, 38321.0, 13032.0, 6133.0, 3414.0, 2112.0, 1305.0, 838.0, 578.0, 362.0, 281.0, 177.0, 128.0, 107.0, 63.0, 56.0, 33.0, 40.0, 24.0, 15.0, 13.0, 5.0, 10.0, 8.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.9990234375, -0.9640350341796875, -0.929046630859375, -0.8940582275390625, -0.85906982421875, -0.8240814208984375, -0.789093017578125, -0.7541046142578125, -0.7191162109375, -0.6841278076171875, -0.649139404296875, -0.6141510009765625, -0.57916259765625, -0.5441741943359375, -0.509185791015625, -0.4741973876953125, -0.439208984375, -0.4042205810546875, -0.369232177734375, -0.3342437744140625, -0.29925537109375, -0.2642669677734375, -0.229278564453125, -0.1942901611328125, -0.1593017578125, -0.1243133544921875, -0.089324951171875, -0.0543365478515625, -0.01934814453125, 0.0156402587890625, 0.050628662109375, 0.0856170654296875, 0.12060546875, 0.1555938720703125, 0.190582275390625, 0.2255706787109375, 0.26055908203125, 0.2955474853515625, 0.330535888671875, 0.3655242919921875, 0.4005126953125, 0.4355010986328125, 0.470489501953125, 0.5054779052734375, 0.54046630859375, 0.5754547119140625, 0.610443115234375, 0.6454315185546875, 0.680419921875, 0.7154083251953125, 0.750396728515625, 0.7853851318359375, 0.82037353515625, 0.8553619384765625, 0.890350341796875, 0.9253387451171875, 0.9603271484375, 0.9953155517578125, 1.030303955078125, 1.0652923583984375, 1.10028076171875, 1.1352691650390625, 1.170257568359375, 1.2052459716796875, 1.240234375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 6.0, 3.0, 18.0, 11.0, 17.0, 20.0, 739.0, 65.0, 15.0, 14.0, 17.0, 8.0, 15.0, 5.0, 2.0, 4.0, 7.0, 5.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30859375, -0.2999687194824219, -0.29134368896484375, -0.2827186584472656, -0.2740936279296875, -0.2654685974121094, -0.25684356689453125, -0.24821853637695312, -0.239593505859375, -0.23096847534179688, -0.22234344482421875, -0.21371841430664062, -0.2050933837890625, -0.19646835327148438, -0.18784332275390625, -0.17921829223632812, -0.17059326171875, -0.16196823120117188, -0.15334320068359375, -0.14471817016601562, -0.1360931396484375, -0.12746810913085938, -0.11884307861328125, -0.11021804809570312, -0.101593017578125, -0.09296798706054688, -0.08434295654296875, -0.07571792602539062, -0.0670928955078125, -0.058467864990234375, -0.04984283447265625, -0.041217803955078125, -0.0325927734375, -0.023967742919921875, -0.01534271240234375, -0.006717681884765625, 0.0019073486328125, 0.010532379150390625, 0.01915740966796875, 0.027782440185546875, 0.036407470703125, 0.045032501220703125, 0.05365753173828125, 0.062282562255859375, 0.0709075927734375, 0.07953262329101562, 0.08815765380859375, 0.09678268432617188, 0.10540771484375, 0.11403274536132812, 0.12265777587890625, 0.13128280639648438, 0.1399078369140625, 0.14853286743164062, 0.15715789794921875, 0.16578292846679688, 0.174407958984375, 0.18303298950195312, 0.19165802001953125, 0.20028305053710938, 0.2089080810546875, 0.21753311157226562, 0.22615814208984375, 0.23478317260742188, 0.243408203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 7.0, 5.0, 18.0, 20.0, 22.0, 21.0, 32.0, 42.0, 51.0, 60.0, 74.0, 107.0, 160.0, 265.0, 550.0, 1140.0, 2855.0, 8891.0, 36238.0, 324032.0, 607683.0, 48886.0, 11054.0, 3414.0, 1381.0, 591.0, 279.0, 155.0, 101.0, 80.0, 68.0, 57.0, 45.0, 47.0, 31.0, 18.0, 13.0, 12.0, 9.0, 10.0, 8.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.83251953125, -0.8087921142578125, -0.785064697265625, -0.7613372802734375, -0.73760986328125, -0.7138824462890625, -0.690155029296875, -0.6664276123046875, -0.6427001953125, -0.6189727783203125, -0.595245361328125, -0.5715179443359375, -0.54779052734375, -0.5240631103515625, -0.500335693359375, -0.4766082763671875, -0.452880859375, -0.4291534423828125, -0.405426025390625, -0.3816986083984375, -0.35797119140625, -0.3342437744140625, -0.310516357421875, -0.2867889404296875, -0.2630615234375, -0.2393341064453125, -0.215606689453125, -0.1918792724609375, -0.16815185546875, -0.1444244384765625, -0.120697021484375, -0.0969696044921875, -0.0732421875, -0.0495147705078125, -0.025787353515625, -0.0020599365234375, 0.02166748046875, 0.0453948974609375, 0.069122314453125, 0.0928497314453125, 0.1165771484375, 0.1403045654296875, 0.164031982421875, 0.1877593994140625, 0.21148681640625, 0.2352142333984375, 0.258941650390625, 0.2826690673828125, 0.306396484375, 0.3301239013671875, 0.353851318359375, 0.3775787353515625, 0.40130615234375, 0.4250335693359375, 0.448760986328125, 0.4724884033203125, 0.4962158203125, 0.5199432373046875, 0.543670654296875, 0.5673980712890625, 0.59112548828125, 0.6148529052734375, 0.638580322265625, 0.6623077392578125, 0.68603515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 11.0, 9.0, 2.0, 7.0, 20.0, 11.0, 9.0, 14.0, 18.0, 20.0, 16.0, 19.0, 32.0, 29.0, 29.0, 27.0, 38.0, 40.0, 30.0, 37.0, 35.0, 32.0, 48.0, 34.0, 26.0, 39.0, 25.0, 23.0, 39.0, 25.0, 29.0, 29.0, 28.0, 29.0, 19.0, 20.0, 24.0, 15.0, 12.0, 4.0, 10.0, 8.0, 6.0, 3.0, 5.0, 5.0, 6.0, 3.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.9501953125, -0.92230224609375, -0.8944091796875, -0.86651611328125, -0.838623046875, -0.81072998046875, -0.7828369140625, -0.75494384765625, -0.72705078125, -0.69915771484375, -0.6712646484375, -0.64337158203125, -0.615478515625, -0.58758544921875, -0.5596923828125, -0.53179931640625, -0.50390625, -0.47601318359375, -0.4481201171875, -0.42022705078125, -0.392333984375, -0.36444091796875, -0.3365478515625, -0.30865478515625, -0.28076171875, -0.25286865234375, -0.2249755859375, -0.19708251953125, -0.169189453125, -0.14129638671875, -0.1134033203125, -0.08551025390625, -0.0576171875, -0.02972412109375, -0.0018310546875, 0.02606201171875, 0.053955078125, 0.08184814453125, 0.1097412109375, 0.13763427734375, 0.16552734375, 0.19342041015625, 0.2213134765625, 0.24920654296875, 0.277099609375, 0.30499267578125, 0.3328857421875, 0.36077880859375, 0.388671875, 0.41656494140625, 0.4444580078125, 0.47235107421875, 0.500244140625, 0.52813720703125, 0.5560302734375, 0.58392333984375, 0.61181640625, 0.63970947265625, 0.6676025390625, 0.69549560546875, 0.723388671875, 0.75128173828125, 0.7791748046875, 0.80706787109375, 0.8349609375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 15.0, 22.0, 32.0, 56.0, 102.0, 260.0, 595.0, 1904.0, 16153.0, 1012378.0, 14131.0, 1725.0, 593.0, 274.0, 114.0, 64.0, 40.0, 14.0, 16.0, 14.0, 4.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.240234375, -0.230804443359375, -0.22137451171875, -0.211944580078125, -0.2025146484375, -0.193084716796875, -0.18365478515625, -0.174224853515625, -0.164794921875, -0.155364990234375, -0.14593505859375, -0.136505126953125, -0.1270751953125, -0.117645263671875, -0.10821533203125, -0.098785400390625, -0.08935546875, -0.079925537109375, -0.07049560546875, -0.061065673828125, -0.0516357421875, -0.042205810546875, -0.03277587890625, -0.023345947265625, -0.013916015625, -0.004486083984375, 0.00494384765625, 0.014373779296875, 0.0238037109375, 0.033233642578125, 0.04266357421875, 0.052093505859375, 0.0615234375, 0.070953369140625, 0.08038330078125, 0.089813232421875, 0.0992431640625, 0.108673095703125, 0.11810302734375, 0.127532958984375, 0.136962890625, 0.146392822265625, 0.15582275390625, 0.165252685546875, 0.1746826171875, 0.184112548828125, 0.19354248046875, 0.202972412109375, 0.21240234375, 0.221832275390625, 0.23126220703125, 0.240692138671875, 0.2501220703125, 0.259552001953125, 0.26898193359375, 0.278411865234375, 0.287841796875, 0.297271728515625, 0.30670166015625, 0.316131591796875, 0.3255615234375, 0.334991455078125, 0.34442138671875, 0.353851318359375, 0.36328125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 7.0, 6.0, 13.0, 16.0, 41.0, 91.0, 234.0, 309.0, 161.0, 52.0, 34.0, 17.0, 9.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2292137145996094e-05, -2.1676532924175262e-05, -2.106092870235443e-05, -2.04453244805336e-05, -1.982972025871277e-05, -1.9214116036891937e-05, -1.8598511815071106e-05, -1.7982907593250275e-05, -1.7367303371429443e-05, -1.6751699149608612e-05, -1.613609492778778e-05, -1.552049070596695e-05, -1.4904886484146118e-05, -1.4289282262325287e-05, -1.3673678040504456e-05, -1.3058073818683624e-05, -1.2442469596862793e-05, -1.1826865375041962e-05, -1.121126115322113e-05, -1.0595656931400299e-05, -9.980052709579468e-06, -9.364448487758636e-06, -8.748844265937805e-06, -8.133240044116974e-06, -7.517635822296143e-06, -6.902031600475311e-06, -6.28642737865448e-06, -5.670823156833649e-06, -5.055218935012817e-06, -4.439614713191986e-06, -3.824010491371155e-06, -3.2084062695503235e-06, -2.592802047729492e-06, -1.977197825908661e-06, -1.3615936040878296e-06, -7.459893822669983e-07, -1.30385160446167e-07, 4.852190613746643e-07, 1.1008232831954956e-06, 1.716427505016327e-06, 2.332031726837158e-06, 2.9476359486579895e-06, 3.563240170478821e-06, 4.178844392299652e-06, 4.794448614120483e-06, 5.410052835941315e-06, 6.025657057762146e-06, 6.641261279582977e-06, 7.256865501403809e-06, 7.87246972322464e-06, 8.488073945045471e-06, 9.103678166866302e-06, 9.719282388687134e-06, 1.0334886610507965e-05, 1.0950490832328796e-05, 1.1566095054149628e-05, 1.2181699275970459e-05, 1.279730349779129e-05, 1.3412907719612122e-05, 1.4028511941432953e-05, 1.4644116163253784e-05, 1.5259720385074615e-05, 1.5875324606895447e-05, 1.6490928828716278e-05, 1.710653305053711e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 9.0, 16.0, 38.0, 57.0, 96.0, 197.0, 748.0, 5253.0, 1008671.0, 31110.0, 1621.0, 435.0, 138.0, 69.0, 28.0, 24.0, 14.0, 11.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4365234375, -0.417327880859375, -0.39813232421875, -0.378936767578125, -0.3597412109375, -0.340545654296875, -0.32135009765625, -0.302154541015625, -0.282958984375, -0.263763427734375, -0.24456787109375, -0.225372314453125, -0.2061767578125, -0.186981201171875, -0.16778564453125, -0.148590087890625, -0.12939453125, -0.110198974609375, -0.09100341796875, -0.071807861328125, -0.0526123046875, -0.033416748046875, -0.01422119140625, 0.004974365234375, 0.024169921875, 0.043365478515625, 0.06256103515625, 0.081756591796875, 0.1009521484375, 0.120147705078125, 0.13934326171875, 0.158538818359375, 0.177734375, 0.196929931640625, 0.21612548828125, 0.235321044921875, 0.2545166015625, 0.273712158203125, 0.29290771484375, 0.312103271484375, 0.331298828125, 0.350494384765625, 0.36968994140625, 0.388885498046875, 0.4080810546875, 0.427276611328125, 0.44647216796875, 0.465667724609375, 0.48486328125, 0.504058837890625, 0.52325439453125, 0.542449951171875, 0.5616455078125, 0.580841064453125, 0.60003662109375, 0.619232177734375, 0.638427734375, 0.657623291015625, 0.67681884765625, 0.696014404296875, 0.7152099609375, 0.734405517578125, 0.75360107421875, 0.772796630859375, 0.7919921875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 16.0, 16.0, 29.0, 35.0, 84.0, 228.0, 307.0, 141.0, 48.0, 34.0, 14.0, 15.0, 5.0, 4.0, 4.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36572265625, -0.3456573486328125, -0.325592041015625, -0.3055267333984375, -0.28546142578125, -0.2653961181640625, -0.245330810546875, -0.2252655029296875, -0.2052001953125, -0.1851348876953125, -0.165069580078125, -0.1450042724609375, -0.12493896484375, -0.1048736572265625, -0.084808349609375, -0.0647430419921875, -0.044677734375, -0.0246124267578125, -0.004547119140625, 0.0155181884765625, 0.03558349609375, 0.0556488037109375, 0.075714111328125, 0.0957794189453125, 0.1158447265625, 0.1359100341796875, 0.155975341796875, 0.1760406494140625, 0.19610595703125, 0.2161712646484375, 0.236236572265625, 0.2563018798828125, 0.2763671875, 0.2964324951171875, 0.316497802734375, 0.3365631103515625, 0.35662841796875, 0.3766937255859375, 0.396759033203125, 0.4168243408203125, 0.4368896484375, 0.4569549560546875, 0.477020263671875, 0.4970855712890625, 0.51715087890625, 0.5372161865234375, 0.557281494140625, 0.5773468017578125, 0.597412109375, 0.6174774169921875, 0.637542724609375, 0.6576080322265625, 0.67767333984375, 0.6977386474609375, 0.717803955078125, 0.7378692626953125, 0.7579345703125, 0.7779998779296875, 0.798065185546875, 0.8181304931640625, 0.83819580078125, 0.8582611083984375, 0.878326416015625, 0.8983917236328125, 0.91845703125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 9.0, 33.0, 71.0, 666.0, 164.0, 49.0, 9.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.288055896759033, -2.9463248252868652, -2.6045937538146973, -2.2628629207611084, -1.9211318492889404, -1.5794007778167725, -1.2376699447631836, -0.8959388732910156, -0.5542078018188477, -0.21247678995132446, 0.12925422191619873, 0.47098517417907715, 0.8127162456512451, 1.154447317123413, 1.496178150177002, 1.83790922164917, 2.179640293121338, 2.521371364593506, 2.863102436065674, 3.2048332691192627, 3.5465643405914307, 3.8882954120635986, 4.2300262451171875, 4.5717573165893555, 4.913488388061523, 5.255219459533691, 5.596950531005859, 5.938681602478027, 6.280412673950195, 6.622143745422363, 6.963874340057373, 7.305605411529541, 7.647336959838867, 7.989068031311035, 8.330799102783203, 8.672530174255371, 9.014261245727539, 9.355992317199707, 9.697723388671875, 10.039453506469727, 10.381185531616211, 10.722916603088379, 11.064647674560547, 11.406378746032715, 11.748109817504883, 12.08984088897705, 12.431571960449219, 12.77330207824707, 13.115033149719238, 13.456764221191406, 13.798495292663574, 14.140226364135742, 14.48195743560791, 14.823688507080078, 15.16541862487793, 15.507150650024414, 15.848880767822266, 16.190610885620117, 16.5323429107666, 16.874073028564453, 17.215805053710938, 17.55753517150879, 17.899267196655273, 18.240997314453125, 18.58272933959961]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 3.0, 3.0, 5.0, 7.0, 11.0, 15.0, 15.0, 32.0, 47.0, 85.0, 150.0, 202.0, 173.0, 97.0, 55.0, 24.0, 15.0, 14.0, 10.0, 7.0, 7.0, 2.0, 2.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.72482681274414, -22.995487213134766, -22.26614761352539, -21.536808013916016, -20.80746841430664, -20.078128814697266, -19.34878921508789, -18.619449615478516, -17.89011001586914, -17.160770416259766, -16.43143081665039, -15.702091217041016, -14.97275161743164, -14.243412017822266, -13.514073371887207, -12.784733772277832, -12.055395126342773, -11.326055526733398, -10.596715927124023, -9.867376327514648, -9.138036727905273, -8.408697128295898, -7.67935848236084, -6.950018882751465, -6.22067928314209, -5.491339683532715, -4.76200008392334, -4.032660961151123, -3.303321361541748, -2.573981761932373, -1.8446426391601562, -1.1153030395507812, -0.38596153259277344, 0.343377947807312, 1.0727174282073975, 1.8020567893981934, 2.5313963890075684, 3.2607359886169434, 3.99007511138916, 4.719414710998535, 5.44875431060791, 6.178093910217285, 6.90743350982666, 7.636772632598877, 8.366111755371094, 9.095451354980469, 9.824790954589844, 10.554130554199219, 11.283470153808594, 12.012809753417969, 12.742149353027344, 13.471488952636719, 14.200828552246094, 14.930168151855469, 15.659506797790527, 16.38884735107422, 17.118186950683594, 17.84752655029297, 18.576866149902344, 19.30620574951172, 20.035545349121094, 20.76488494873047, 21.494224548339844, 22.22356414794922, 22.95290184020996]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 4.0, 6.0, 6.0, 6.0, 10.0, 14.0, 20.0, 18.0, 36.0, 37.0, 49.0, 78.0, 138.0, 219.0, 349.0, 545.0, 803.0, 1421.0, 2305.0, 4608.0, 10417.0, 34878.0, 4080996.0, 37522.0, 10805.0, 4389.0, 2115.0, 1097.0, 571.0, 344.0, 191.0, 117.0, 60.0, 45.0, 19.0, 13.0, 11.0, 10.0, 4.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.228515625, -2.1690826416015625, -2.109649658203125, -2.0502166748046875, -1.99078369140625, -1.9313507080078125, -1.871917724609375, -1.8124847412109375, -1.7530517578125, -1.6936187744140625, -1.634185791015625, -1.5747528076171875, -1.51531982421875, -1.4558868408203125, -1.396453857421875, -1.3370208740234375, -1.277587890625, -1.2181549072265625, -1.158721923828125, -1.0992889404296875, -1.03985595703125, -0.9804229736328125, -0.920989990234375, -0.8615570068359375, -0.8021240234375, -0.7426910400390625, -0.683258056640625, -0.6238250732421875, -0.56439208984375, -0.5049591064453125, -0.445526123046875, -0.3860931396484375, -0.32666015625, -0.2672271728515625, -0.207794189453125, -0.1483612060546875, -0.08892822265625, -0.0294952392578125, 0.029937744140625, 0.0893707275390625, 0.1488037109375, 0.2082366943359375, 0.267669677734375, 0.3271026611328125, 0.38653564453125, 0.4459686279296875, 0.505401611328125, 0.5648345947265625, 0.624267578125, 0.6837005615234375, 0.743133544921875, 0.8025665283203125, 0.86199951171875, 0.9214324951171875, 0.980865478515625, 1.0402984619140625, 1.0997314453125, 1.1591644287109375, 1.218597412109375, 1.2780303955078125, 1.33746337890625, 1.3968963623046875, 1.456329345703125, 1.5157623291015625, 1.5751953125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 6.0, 6.0, 15.0, 11.0, 8.0, 11.0, 20.0, 223.0, 553.0, 34.0, 13.0, 7.0, 13.0, 14.0, 15.0, 4.0, 10.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2432861328125, -0.23690032958984375, -0.2305145263671875, -0.22412872314453125, -0.217742919921875, -0.21135711669921875, -0.2049713134765625, -0.19858551025390625, -0.19219970703125, -0.18581390380859375, -0.1794281005859375, -0.17304229736328125, -0.166656494140625, -0.16027069091796875, -0.1538848876953125, -0.14749908447265625, -0.14111328125, -0.13472747802734375, -0.1283416748046875, -0.12195587158203125, -0.115570068359375, -0.10918426513671875, -0.1027984619140625, -0.09641265869140625, -0.09002685546875, -0.08364105224609375, -0.0772552490234375, -0.07086944580078125, -0.064483642578125, -0.05809783935546875, -0.0517120361328125, -0.04532623291015625, -0.0389404296875, -0.03255462646484375, -0.0261688232421875, -0.01978302001953125, -0.013397216796875, -0.00701141357421875, -0.0006256103515625, 0.00576019287109375, 0.01214599609375, 0.01853179931640625, 0.0249176025390625, 0.03130340576171875, 0.037689208984375, 0.04407501220703125, 0.0504608154296875, 0.05684661865234375, 0.063232421875, 0.06961822509765625, 0.0760040283203125, 0.08238983154296875, 0.088775634765625, 0.09516143798828125, 0.1015472412109375, 0.10793304443359375, 0.11431884765625, 0.12070465087890625, 0.1270904541015625, 0.13347625732421875, 0.139862060546875, 0.14624786376953125, 0.1526336669921875, 0.15901947021484375, 0.1654052734375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 4.0, 3.0, 6.0, 11.0, 9.0, 15.0, 11.0, 20.0, 26.0, 41.0, 73.0, 104.0, 228.0, 502.0, 1640.0, 6391.0, 48980.0, 4051227.0, 73738.0, 8093.0, 1889.0, 644.0, 256.0, 117.0, 65.0, 41.0, 22.0, 23.0, 23.0, 13.0, 16.0, 7.0, 10.0, 4.0, 6.0, 0.0, 5.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4189453125, -1.3753814697265625, -1.331817626953125, -1.2882537841796875, -1.24468994140625, -1.2011260986328125, -1.157562255859375, -1.1139984130859375, -1.0704345703125, -1.0268707275390625, -0.983306884765625, -0.9397430419921875, -0.89617919921875, -0.8526153564453125, -0.809051513671875, -0.7654876708984375, -0.721923828125, -0.6783599853515625, -0.634796142578125, -0.5912322998046875, -0.54766845703125, -0.5041046142578125, -0.460540771484375, -0.4169769287109375, -0.3734130859375, -0.3298492431640625, -0.286285400390625, -0.2427215576171875, -0.19915771484375, -0.1555938720703125, -0.112030029296875, -0.0684661865234375, -0.02490234375, 0.0186614990234375, 0.062225341796875, 0.1057891845703125, 0.14935302734375, 0.1929168701171875, 0.236480712890625, 0.2800445556640625, 0.3236083984375, 0.3671722412109375, 0.410736083984375, 0.4542999267578125, 0.49786376953125, 0.5414276123046875, 0.584991455078125, 0.6285552978515625, 0.672119140625, 0.7156829833984375, 0.759246826171875, 0.8028106689453125, 0.84637451171875, 0.8899383544921875, 0.933502197265625, 0.9770660400390625, 1.0206298828125, 1.0641937255859375, 1.107757568359375, 1.1513214111328125, 1.19488525390625, 1.2384490966796875, 1.282012939453125, 1.3255767822265625, 1.369140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 8.0, 8.0, 4.0, 7.0, 9.0, 7.0, 14.0, 14.0, 26.0, 31.0, 35.0, 68.0, 100.0, 196.0, 2470.0, 672.0, 126.0, 78.0, 42.0, 22.0, 22.0, 18.0, 12.0, 11.0, 7.0, 9.0, 7.0, 6.0, 6.0, 3.0, 5.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2734375, -0.2651214599609375, -0.256805419921875, -0.2484893798828125, -0.24017333984375, -0.2318572998046875, -0.223541259765625, -0.2152252197265625, -0.2069091796875, -0.1985931396484375, -0.190277099609375, -0.1819610595703125, -0.17364501953125, -0.1653289794921875, -0.157012939453125, -0.1486968994140625, -0.140380859375, -0.1320648193359375, -0.123748779296875, -0.1154327392578125, -0.10711669921875, -0.0988006591796875, -0.090484619140625, -0.0821685791015625, -0.0738525390625, -0.0655364990234375, -0.057220458984375, -0.0489044189453125, -0.04058837890625, -0.0322723388671875, -0.023956298828125, -0.0156402587890625, -0.00732421875, 0.0009918212890625, 0.009307861328125, 0.0176239013671875, 0.02593994140625, 0.0342559814453125, 0.042572021484375, 0.0508880615234375, 0.0592041015625, 0.0675201416015625, 0.075836181640625, 0.0841522216796875, 0.09246826171875, 0.1007843017578125, 0.109100341796875, 0.1174163818359375, 0.125732421875, 0.1340484619140625, 0.142364501953125, 0.1506805419921875, 0.15899658203125, 0.1673126220703125, 0.175628662109375, 0.1839447021484375, 0.1922607421875, 0.2005767822265625, 0.208892822265625, 0.2172088623046875, 0.22552490234375, 0.2338409423828125, 0.242156982421875, 0.2504730224609375, 0.2587890625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 31.0, 970.0, 10.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5032474994659424, -1.225464105606079, -0.9476807713508606, -0.6698974370956421, -0.3921140432357788, -0.11433064937591553, 0.1634526252746582, 0.4412360191345215, 0.7190194129943848, 0.996802806854248, 1.2745862007141113, 1.552369475364685, 1.8301528692245483, 2.107936382293701, 2.3857195377349854, 2.6635029315948486, 2.941286325454712, 3.219069719314575, 3.4968531131744385, 3.7746362686157227, 4.052419662475586, 4.330203056335449, 4.6079864501953125, 4.885769844055176, 5.163553237915039, 5.441336631774902, 5.719120025634766, 5.996903419494629, 6.274686813354492, 6.5524702072143555, 6.830253601074219, 7.108036994934082, 7.385819435119629, 7.663602828979492, 7.9413862228393555, 8.219169616699219, 8.496953010559082, 8.774736404418945, 9.052519798278809, 9.330303192138672, 9.608086585998535, 9.885869979858398, 10.163653373718262, 10.441436767578125, 10.719220161437988, 10.997003555297852, 11.274786949157715, 11.552570343017578, 11.830352783203125, 12.108136177062988, 12.385919570922852, 12.663702964782715, 12.941486358642578, 13.219269752502441, 13.497053146362305, 13.774836540222168, 14.052619934082031, 14.330403327941895, 14.608186721801758, 14.885970115661621, 15.163753509521484, 15.441536903381348, 15.719320297241211, 15.997103691101074, 16.274887084960938]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 4.0, 6.0, 4.0, 5.0, 6.0, 9.0, 14.0, 24.0, 42.0, 40.0, 59.0, 79.0, 103.0, 102.0, 113.0, 96.0, 73.0, 73.0, 47.0, 22.0, 18.0, 6.0, 6.0, 5.0, 4.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2213718891143799, -1.1778141260147095, -1.134256362915039, -1.0906985998153687, -1.0471408367156982, -1.0035831928253174, -0.960025429725647, -0.9164676666259766, -0.8729099035263062, -0.8293521404266357, -0.7857943773269653, -0.7422366738319397, -0.6986789107322693, -0.6551211476325989, -0.6115634441375732, -0.5680056810379028, -0.5244479179382324, -0.480890154838562, -0.437332421541214, -0.39377468824386597, -0.35021692514419556, -0.30665916204452515, -0.2631014287471771, -0.2195436954498291, -0.1759859323501587, -0.13242818415164948, -0.08887043595314026, -0.04531268775463104, -0.0017549395561218262, 0.04180280864238739, 0.0853605568408966, 0.12891829013824463, 0.17247605323791504, 0.21603380143642426, 0.25959154963493347, 0.3031492829322815, 0.3467070460319519, 0.3902648091316223, 0.43382254242897034, 0.47738027572631836, 0.5209380388259888, 0.5644958019256592, 0.6080535650253296, 0.6516112685203552, 0.6951690316200256, 0.738726794719696, 0.7822844982147217, 0.8258422613143921, 0.8694000244140625, 0.9129577875137329, 0.9565155506134033, 1.0000733137130737, 1.0436310768127441, 1.087188720703125, 1.1307464838027954, 1.1743042469024658, 1.2178620100021362, 1.2614197731018066, 1.304977536201477, 1.3485352993011475, 1.3920929431915283, 1.4356507062911987, 1.4792084693908691, 1.5227662324905396, 1.56632399559021]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 3.0, 14.0, 11.0, 16.0, 37.0, 39.0, 62.0, 108.0, 129.0, 237.0, 453.0, 760.0, 1480.0, 2873.0, 5932.0, 14959.0, 55013.0, 912031.0, 33117.0, 11224.0, 4853.0, 2309.0, 1226.0, 631.0, 406.0, 230.0, 137.0, 82.0, 64.0, 36.0, 23.0, 18.0, 10.0, 13.0, 6.0, 3.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0439453125, -1.009552001953125, -0.97515869140625, -0.940765380859375, -0.9063720703125, -0.871978759765625, -0.83758544921875, -0.803192138671875, -0.768798828125, -0.734405517578125, -0.70001220703125, -0.665618896484375, -0.6312255859375, -0.596832275390625, -0.56243896484375, -0.528045654296875, -0.49365234375, -0.459259033203125, -0.42486572265625, -0.390472412109375, -0.3560791015625, -0.321685791015625, -0.28729248046875, -0.252899169921875, -0.218505859375, -0.184112548828125, -0.14971923828125, -0.115325927734375, -0.0809326171875, -0.046539306640625, -0.01214599609375, 0.022247314453125, 0.056640625, 0.091033935546875, 0.12542724609375, 0.159820556640625, 0.1942138671875, 0.228607177734375, 0.26300048828125, 0.297393798828125, 0.331787109375, 0.366180419921875, 0.40057373046875, 0.434967041015625, 0.4693603515625, 0.503753662109375, 0.53814697265625, 0.572540283203125, 0.60693359375, 0.641326904296875, 0.67572021484375, 0.710113525390625, 0.7445068359375, 0.778900146484375, 0.81329345703125, 0.847686767578125, 0.882080078125, 0.916473388671875, 0.95086669921875, 0.985260009765625, 1.0196533203125, 1.054046630859375, 1.08843994140625, 1.122833251953125, 1.1572265625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 4.0, 10.0, 12.0, 7.0, 11.0, 18.0, 25.0, 303.0, 441.0, 50.0, 12.0, 16.0, 11.0, 13.0, 7.0, 11.0, 6.0, 2.0, 9.0, 3.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2109375, -0.20508766174316406, -0.19923782348632812, -0.1933879852294922, -0.18753814697265625, -0.1816883087158203, -0.17583847045898438, -0.16998863220214844, -0.1641387939453125, -0.15828895568847656, -0.15243911743164062, -0.1465892791748047, -0.14073944091796875, -0.1348896026611328, -0.12903976440429688, -0.12318992614746094, -0.117340087890625, -0.11149024963378906, -0.10564041137695312, -0.09979057312011719, -0.09394073486328125, -0.08809089660644531, -0.08224105834960938, -0.07639122009277344, -0.0705413818359375, -0.06469154357910156, -0.058841705322265625, -0.05299186706542969, -0.04714202880859375, -0.04129219055175781, -0.035442352294921875, -0.029592514038085938, -0.02374267578125, -0.017892837524414062, -0.012042999267578125, -0.0061931610107421875, -0.00034332275390625, 0.0055065155029296875, 0.011356353759765625, 0.017206192016601562, 0.0230560302734375, 0.028905868530273438, 0.034755706787109375, 0.04060554504394531, 0.04645538330078125, 0.05230522155761719, 0.058155059814453125, 0.06400489807128906, 0.069854736328125, 0.07570457458496094, 0.08155441284179688, 0.08740425109863281, 0.09325408935546875, 0.09910392761230469, 0.10495376586914062, 0.11080360412597656, 0.1166534423828125, 0.12250328063964844, 0.12835311889648438, 0.1342029571533203, 0.14005279541015625, 0.1459026336669922, 0.15175247192382812, 0.15760231018066406, 0.1634521484375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 7.0, 7.0, 6.0, 12.0, 17.0, 15.0, 19.0, 20.0, 20.0, 37.0, 48.0, 40.0, 83.0, 116.0, 205.0, 539.0, 2788.0, 58402.0, 941473.0, 40812.0, 2665.0, 549.0, 210.0, 126.0, 68.0, 50.0, 26.0, 41.0, 24.0, 27.0, 18.0, 22.0, 10.0, 13.0, 15.0, 5.0, 7.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9482421875, -0.9136810302734375, -0.879119873046875, -0.8445587158203125, -0.80999755859375, -0.7754364013671875, -0.740875244140625, -0.7063140869140625, -0.6717529296875, -0.6371917724609375, -0.602630615234375, -0.5680694580078125, -0.53350830078125, -0.4989471435546875, -0.464385986328125, -0.4298248291015625, -0.395263671875, -0.3607025146484375, -0.326141357421875, -0.2915802001953125, -0.25701904296875, -0.2224578857421875, -0.187896728515625, -0.1533355712890625, -0.1187744140625, -0.0842132568359375, -0.049652099609375, -0.0150909423828125, 0.01947021484375, 0.0540313720703125, 0.088592529296875, 0.1231536865234375, 0.15771484375, 0.1922760009765625, 0.226837158203125, 0.2613983154296875, 0.29595947265625, 0.3305206298828125, 0.365081787109375, 0.3996429443359375, 0.4342041015625, 0.4687652587890625, 0.503326416015625, 0.5378875732421875, 0.57244873046875, 0.6070098876953125, 0.641571044921875, 0.6761322021484375, 0.710693359375, 0.7452545166015625, 0.779815673828125, 0.8143768310546875, 0.84893798828125, 0.8834991455078125, 0.918060302734375, 0.9526214599609375, 0.9871826171875, 1.0217437744140625, 1.056304931640625, 1.0908660888671875, 1.12542724609375, 1.1599884033203125, 1.194549560546875, 1.2291107177734375, 1.263671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 9.0, 6.0, 18.0, 11.0, 15.0, 15.0, 19.0, 30.0, 27.0, 34.0, 35.0, 33.0, 36.0, 45.0, 45.0, 43.0, 49.0, 44.0, 42.0, 56.0, 41.0, 50.0, 37.0, 30.0, 34.0, 23.0, 31.0, 15.0, 19.0, 23.0, 16.0, 17.0, 15.0, 6.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.48046875, -0.46387481689453125, -0.4472808837890625, -0.43068695068359375, -0.414093017578125, -0.39749908447265625, -0.3809051513671875, -0.36431121826171875, -0.34771728515625, -0.33112335205078125, -0.3145294189453125, -0.29793548583984375, -0.281341552734375, -0.26474761962890625, -0.2481536865234375, -0.23155975341796875, -0.2149658203125, -0.19837188720703125, -0.1817779541015625, -0.16518402099609375, -0.148590087890625, -0.13199615478515625, -0.1154022216796875, -0.09880828857421875, -0.08221435546875, -0.06562042236328125, -0.0490264892578125, -0.03243255615234375, -0.015838623046875, 0.00075531005859375, 0.0173492431640625, 0.03394317626953125, 0.050537109375, 0.06713104248046875, 0.0837249755859375, 0.10031890869140625, 0.116912841796875, 0.13350677490234375, 0.1501007080078125, 0.16669464111328125, 0.18328857421875, 0.19988250732421875, 0.2164764404296875, 0.23307037353515625, 0.249664306640625, 0.26625823974609375, 0.2828521728515625, 0.29944610595703125, 0.3160400390625, 0.33263397216796875, 0.3492279052734375, 0.36582183837890625, 0.382415771484375, 0.39900970458984375, 0.4156036376953125, 0.43219757080078125, 0.44879150390625, 0.46538543701171875, 0.4819793701171875, 0.49857330322265625, 0.515167236328125, 0.5317611694335938, 0.5483551025390625, 0.5649490356445312, 0.58154296875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 2.0, 7.0, 10.0, 16.0, 32.0, 47.0, 115.0, 239.0, 879.0, 8536.0, 1034057.0, 3641.0, 605.0, 185.0, 73.0, 38.0, 23.0, 11.0, 10.0, 5.0, 4.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62744140625, -0.6086349487304688, -0.5898284912109375, -0.5710220336914062, -0.552215576171875, -0.5334091186523438, -0.5146026611328125, -0.49579620361328125, -0.47698974609375, -0.45818328857421875, -0.4393768310546875, -0.42057037353515625, -0.401763916015625, -0.38295745849609375, -0.3641510009765625, -0.34534454345703125, -0.3265380859375, -0.30773162841796875, -0.2889251708984375, -0.27011871337890625, -0.251312255859375, -0.23250579833984375, -0.2136993408203125, -0.19489288330078125, -0.17608642578125, -0.15727996826171875, -0.1384735107421875, -0.11966705322265625, -0.100860595703125, -0.08205413818359375, -0.0632476806640625, -0.04444122314453125, -0.025634765625, -0.00682830810546875, 0.0119781494140625, 0.03078460693359375, 0.049591064453125, 0.06839752197265625, 0.0872039794921875, 0.10601043701171875, 0.12481689453125, 0.14362335205078125, 0.1624298095703125, 0.18123626708984375, 0.200042724609375, 0.21884918212890625, 0.2376556396484375, 0.25646209716796875, 0.2752685546875, 0.29407501220703125, 0.3128814697265625, 0.33168792724609375, 0.350494384765625, 0.36930084228515625, 0.3881072998046875, 0.40691375732421875, 0.42572021484375, 0.44452667236328125, 0.4633331298828125, 0.48213958740234375, 0.500946044921875, 0.5197525024414062, 0.5385589599609375, 0.5573654174804688, 0.576171875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 6.0, 5.0, 19.0, 31.0, 83.0, 118.0, 204.0, 197.0, 149.0, 79.0, 43.0, 23.0, 9.0, 5.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5020370483398438e-05, -1.4564022421836853e-05, -1.4107674360275269e-05, -1.3651326298713684e-05, -1.31949782371521e-05, -1.2738630175590515e-05, -1.228228211402893e-05, -1.1825934052467346e-05, -1.1369585990905762e-05, -1.0913237929344177e-05, -1.0456889867782593e-05, -1.0000541806221008e-05, -9.544193744659424e-06, -9.08784568309784e-06, -8.631497621536255e-06, -8.17514955997467e-06, -7.718801498413086e-06, -7.2624534368515015e-06, -6.806105375289917e-06, -6.3497573137283325e-06, -5.893409252166748e-06, -5.4370611906051636e-06, -4.980713129043579e-06, -4.524365067481995e-06, -4.06801700592041e-06, -3.6116689443588257e-06, -3.155320882797241e-06, -2.6989728212356567e-06, -2.2426247596740723e-06, -1.7862766981124878e-06, -1.3299286365509033e-06, -8.735805749893188e-07, -4.172325134277344e-07, 3.91155481338501e-08, 4.954636096954346e-07, 9.51811671257019e-07, 1.4081597328186035e-06, 1.864507794380188e-06, 2.3208558559417725e-06, 2.777203917503357e-06, 3.2335519790649414e-06, 3.689900040626526e-06, 4.14624810218811e-06, 4.602596163749695e-06, 5.058944225311279e-06, 5.515292286872864e-06, 5.971640348434448e-06, 6.427988409996033e-06, 6.884336471557617e-06, 7.340684533119202e-06, 7.797032594680786e-06, 8.25338065624237e-06, 8.709728717803955e-06, 9.16607677936554e-06, 9.622424840927124e-06, 1.0078772902488708e-05, 1.0535120964050293e-05, 1.0991469025611877e-05, 1.1447817087173462e-05, 1.1904165148735046e-05, 1.2360513210296631e-05, 1.2816861271858215e-05, 1.32732093334198e-05, 1.3729557394981384e-05, 1.4185905456542969e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 0.0, 5.0, 1.0, 9.0, 18.0, 17.0, 28.0, 51.0, 142.0, 400.0, 2134.0, 123357.0, 918986.0, 2867.0, 307.0, 108.0, 37.0, 18.0, 19.0, 13.0, 7.0, 7.0, 9.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53076171875, -0.5175247192382812, -0.5042877197265625, -0.49105072021484375, -0.477813720703125, -0.46457672119140625, -0.4513397216796875, -0.43810272216796875, -0.42486572265625, -0.41162872314453125, -0.3983917236328125, -0.38515472412109375, -0.371917724609375, -0.35868072509765625, -0.3454437255859375, -0.33220672607421875, -0.3189697265625, -0.30573272705078125, -0.2924957275390625, -0.27925872802734375, -0.266021728515625, -0.25278472900390625, -0.2395477294921875, -0.22631072998046875, -0.21307373046875, -0.19983673095703125, -0.1865997314453125, -0.17336273193359375, -0.160125732421875, -0.14688873291015625, -0.1336517333984375, -0.12041473388671875, -0.107177734375, -0.09394073486328125, -0.0807037353515625, -0.06746673583984375, -0.054229736328125, -0.04099273681640625, -0.0277557373046875, -0.01451873779296875, -0.00128173828125, 0.01195526123046875, 0.0251922607421875, 0.03842926025390625, 0.051666259765625, 0.06490325927734375, 0.0781402587890625, 0.09137725830078125, 0.1046142578125, 0.11785125732421875, 0.1310882568359375, 0.14432525634765625, 0.157562255859375, 0.17079925537109375, 0.1840362548828125, 0.19727325439453125, 0.21051025390625, 0.22374725341796875, 0.2369842529296875, 0.25022125244140625, 0.263458251953125, 0.27669525146484375, 0.2899322509765625, 0.30316925048828125, 0.31640625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 11.0, 6.0, 10.0, 11.0, 20.0, 39.0, 49.0, 94.0, 203.0, 260.0, 122.0, 52.0, 36.0, 21.0, 8.0, 13.0, 7.0, 7.0, 4.0, 10.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26171875, -0.25536155700683594, -0.24900436401367188, -0.2426471710205078, -0.23628997802734375, -0.2299327850341797, -0.22357559204101562, -0.21721839904785156, -0.2108612060546875, -0.20450401306152344, -0.19814682006835938, -0.1917896270751953, -0.18543243408203125, -0.1790752410888672, -0.17271804809570312, -0.16636085510253906, -0.160003662109375, -0.15364646911621094, -0.14728927612304688, -0.1409320831298828, -0.13457489013671875, -0.1282176971435547, -0.12186050415039062, -0.11550331115722656, -0.1091461181640625, -0.10278892517089844, -0.09643173217773438, -0.09007453918457031, -0.08371734619140625, -0.07736015319824219, -0.07100296020507812, -0.06464576721191406, -0.05828857421875, -0.05193138122558594, -0.045574188232421875, -0.03921699523925781, -0.03285980224609375, -0.026502609252929688, -0.020145416259765625, -0.013788223266601562, -0.0074310302734375, -0.0010738372802734375, 0.005283355712890625, 0.011640548706054688, 0.01799774169921875, 0.024354934692382812, 0.030712127685546875, 0.03706932067871094, 0.043426513671875, 0.04978370666503906, 0.056140899658203125, 0.06249809265136719, 0.06885528564453125, 0.07521247863769531, 0.08156967163085938, 0.08792686462402344, 0.0942840576171875, 0.10064125061035156, 0.10699844360351562, 0.11335563659667969, 0.11971282958984375, 0.1260700225830078, 0.13242721557617188, 0.13878440856933594, 0.1451416015625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 13.0, 83.0, 803.0, 96.0, 11.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0751290321350098, -1.829355239868164, -1.5835813283920288, -1.3378074169158936, -1.0920336246490479, -0.8462598323822021, -0.6004859209060669, -0.35471200942993164, -0.10893821716308594, 0.13683563470840454, 0.382609486579895, 0.6283833384513855, 0.874157190322876, 1.1199309825897217, 1.365704894065857, 1.6114788055419922, 1.857252597808838, 2.1030263900756836, 2.3488001823425293, 2.594574213027954, 2.8403480052948, 3.0861217975616455, 3.3318958282470703, 3.577669620513916, 3.8234434127807617, 4.069217205047607, 4.314990997314453, 4.560764789581299, 4.8065385818481445, 5.052312850952148, 5.298086643218994, 5.54386043548584, 5.789633750915527, 6.035407543182373, 6.281181335449219, 6.5269551277160645, 6.77272891998291, 7.018503189086914, 7.26427698135376, 7.5100507736206055, 7.755824565887451, 8.001598358154297, 8.2473726272583, 8.493145942687988, 8.738920211791992, 8.98469352722168, 9.230467796325684, 9.476242065429688, 9.722015380859375, 9.967789649963379, 10.213562965393066, 10.45933723449707, 10.705110549926758, 10.950884819030762, 11.19665813446045, 11.442432403564453, 11.68820571899414, 11.933979988098145, 12.179753303527832, 12.425527572631836, 12.671300888061523, 12.917075157165527, 13.162848472595215, 13.408622741699219, 13.654397010803223]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 11.0, 8.0, 10.0, 16.0, 30.0, 35.0, 58.0, 78.0, 95.0, 99.0, 110.0, 95.0, 87.0, 86.0, 57.0, 34.0, 28.0, 19.0, 7.0, 6.0, 4.0, 1.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.831767559051514, -7.628604412078857, -7.425441265106201, -7.222278118133545, -7.019115447998047, -6.815952301025391, -6.612789154052734, -6.409626007080078, -6.206462860107422, -6.003299713134766, -5.800136566162109, -5.596973419189453, -5.393810272216797, -5.190647125244141, -4.987484455108643, -4.784321308135986, -4.58115816116333, -4.377995014190674, -4.174831867218018, -3.9716689586639404, -3.768505811691284, -3.565342664718628, -3.362179756164551, -3.1590166091918945, -2.9558534622192383, -2.752690315246582, -2.549527168273926, -2.3463642597198486, -2.1432011127471924, -1.9400379657745361, -1.7368749380111694, -1.5337119102478027, -1.3305482864379883, -1.127385139465332, -0.9242221117019653, -0.7210590243339539, -0.5178959369659424, -0.31473278999328613, -0.11156976222991943, 0.09159326553344727, 0.2947564125061035, 0.497919499874115, 0.7010825872421265, 0.9042456746101379, 1.1074087619781494, 1.3105719089508057, 1.5137349367141724, 1.716897964477539, 1.9200611114501953, 2.1232242584228516, 2.326387405395508, 2.529550313949585, 2.732713460922241, 2.9358766078948975, 3.1390395164489746, 3.342202663421631, 3.545365810394287, 3.7485289573669434, 3.9516921043395996, 4.154855251312256, 4.358017921447754, 4.56118106842041, 4.764344215393066, 4.967507362365723, 5.170670509338379]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 12.0, 10.0, 10.0, 13.0, 30.0, 36.0, 58.0, 90.0, 111.0, 187.0, 348.0, 495.0, 807.0, 1454.0, 2758.0, 6191.0, 27094.0, 4114385.0, 28525.0, 6119.0, 2589.0, 1335.0, 698.0, 366.0, 218.0, 122.0, 59.0, 50.0, 27.0, 22.0, 19.0, 8.0, 7.0, 12.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.927734375, -1.868408203125, -1.80908203125, -1.749755859375, -1.6904296875, -1.631103515625, -1.57177734375, -1.512451171875, -1.453125, -1.393798828125, -1.33447265625, -1.275146484375, -1.2158203125, -1.156494140625, -1.09716796875, -1.037841796875, -0.978515625, -0.919189453125, -0.85986328125, -0.800537109375, -0.7412109375, -0.681884765625, -0.62255859375, -0.563232421875, -0.50390625, -0.444580078125, -0.38525390625, -0.325927734375, -0.2666015625, -0.207275390625, -0.14794921875, -0.088623046875, -0.029296875, 0.030029296875, 0.08935546875, 0.148681640625, 0.2080078125, 0.267333984375, 0.32666015625, 0.385986328125, 0.4453125, 0.504638671875, 0.56396484375, 0.623291015625, 0.6826171875, 0.741943359375, 0.80126953125, 0.860595703125, 0.919921875, 0.979248046875, 1.03857421875, 1.097900390625, 1.1572265625, 1.216552734375, 1.27587890625, 1.335205078125, 1.39453125, 1.453857421875, 1.51318359375, 1.572509765625, 1.6318359375, 1.691162109375, 1.75048828125, 1.809814453125, 1.869140625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 2.0, 0.0, 4.0, 7.0, 4.0, 3.0, 8.0, 8.0, 18.0, 9.0, 14.0, 27.0, 159.0, 498.0, 138.0, 17.0, 15.0, 11.0, 12.0, 10.0, 10.0, 5.0, 9.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18212890625, -0.17650413513183594, -0.17087936401367188, -0.1652545928955078, -0.15962982177734375, -0.1540050506591797, -0.14838027954101562, -0.14275550842285156, -0.1371307373046875, -0.13150596618652344, -0.12588119506835938, -0.12025642395019531, -0.11463165283203125, -0.10900688171386719, -0.10338211059570312, -0.09775733947753906, -0.092132568359375, -0.08650779724121094, -0.08088302612304688, -0.07525825500488281, -0.06963348388671875, -0.06400871276855469, -0.058383941650390625, -0.05275917053222656, -0.0471343994140625, -0.04150962829589844, -0.035884857177734375, -0.030260086059570312, -0.02463531494140625, -0.019010543823242188, -0.013385772705078125, -0.0077610015869140625, -0.00213623046875, 0.0034885406494140625, 0.009113311767578125, 0.014738082885742188, 0.02036285400390625, 0.025987625122070312, 0.031612396240234375, 0.03723716735839844, 0.0428619384765625, 0.04848670959472656, 0.054111480712890625, 0.05973625183105469, 0.06536102294921875, 0.07098579406738281, 0.07661056518554688, 0.08223533630371094, 0.087860107421875, 0.09348487854003906, 0.09910964965820312, 0.10473442077636719, 0.11035919189453125, 0.11598396301269531, 0.12160873413085938, 0.12723350524902344, 0.1328582763671875, 0.13848304748535156, 0.14410781860351562, 0.1497325897216797, 0.15535736083984375, 0.1609821319580078, 0.16660690307617188, 0.17223167419433594, 0.1778564453125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 8.0, 11.0, 12.0, 6.0, 25.0, 23.0, 35.0, 36.0, 81.0, 104.0, 214.0, 777.0, 5948.0, 4059704.0, 123447.0, 2844.0, 535.0, 171.0, 90.0, 71.0, 30.0, 29.0, 16.0, 11.0, 10.0, 10.0, 10.0, 6.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.33984375, -2.26861572265625, -2.1973876953125, -2.12615966796875, -2.054931640625, -1.98370361328125, -1.9124755859375, -1.84124755859375, -1.77001953125, -1.69879150390625, -1.6275634765625, -1.55633544921875, -1.485107421875, -1.41387939453125, -1.3426513671875, -1.27142333984375, -1.2001953125, -1.12896728515625, -1.0577392578125, -0.98651123046875, -0.915283203125, -0.84405517578125, -0.7728271484375, -0.70159912109375, -0.63037109375, -0.55914306640625, -0.4879150390625, -0.41668701171875, -0.345458984375, -0.27423095703125, -0.2030029296875, -0.13177490234375, -0.060546875, 0.01068115234375, 0.0819091796875, 0.15313720703125, 0.224365234375, 0.29559326171875, 0.3668212890625, 0.43804931640625, 0.50927734375, 0.58050537109375, 0.6517333984375, 0.72296142578125, 0.794189453125, 0.86541748046875, 0.9366455078125, 1.00787353515625, 1.0791015625, 1.15032958984375, 1.2215576171875, 1.29278564453125, 1.364013671875, 1.43524169921875, 1.5064697265625, 1.57769775390625, 1.64892578125, 1.72015380859375, 1.7913818359375, 1.86260986328125, 1.933837890625, 2.00506591796875, 2.0762939453125, 2.14752197265625, 2.21875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 6.0, 11.0, 4.0, 7.0, 18.0, 21.0, 19.0, 31.0, 53.0, 92.0, 564.0, 2863.0, 136.0, 66.0, 51.0, 23.0, 17.0, 26.0, 14.0, 5.0, 10.0, 8.0, 4.0, 0.0, 6.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3173828125, -0.30651092529296875, -0.2956390380859375, -0.28476715087890625, -0.273895263671875, -0.26302337646484375, -0.2521514892578125, -0.24127960205078125, -0.23040771484375, -0.21953582763671875, -0.2086639404296875, -0.19779205322265625, -0.186920166015625, -0.17604827880859375, -0.1651763916015625, -0.15430450439453125, -0.1434326171875, -0.13256072998046875, -0.1216888427734375, -0.11081695556640625, -0.099945068359375, -0.08907318115234375, -0.0782012939453125, -0.06732940673828125, -0.05645751953125, -0.04558563232421875, -0.0347137451171875, -0.02384185791015625, -0.012969970703125, -0.00209808349609375, 0.0087738037109375, 0.01964569091796875, 0.030517578125, 0.04138946533203125, 0.0522613525390625, 0.06313323974609375, 0.074005126953125, 0.08487701416015625, 0.0957489013671875, 0.10662078857421875, 0.11749267578125, 0.12836456298828125, 0.1392364501953125, 0.15010833740234375, 0.160980224609375, 0.17185211181640625, 0.1827239990234375, 0.19359588623046875, 0.2044677734375, 0.21533966064453125, 0.2262115478515625, 0.23708343505859375, 0.247955322265625, 0.25882720947265625, 0.2696990966796875, 0.28057098388671875, 0.29144287109375, 0.30231475830078125, 0.3131866455078125, 0.32405853271484375, 0.334930419921875, 0.34580230712890625, 0.3566741943359375, 0.36754608154296875, 0.37841796875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 25.0, 962.0, 25.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5877652168273926, -1.418749213218689, -1.2497332096099854, -1.0807172060012817, -0.9117012023925781, -0.7426851987838745, -0.5736691951751709, -0.4046531915664673, -0.23563718795776367, -0.06662118434906006, 0.10239481925964355, 0.27141082286834717, 0.4404268264770508, 0.6094428300857544, 0.778458833694458, 0.9474748373031616, 1.1164908409118652, 1.2855068445205688, 1.4545228481292725, 1.623538851737976, 1.7925548553466797, 1.9615708589553833, 2.130586862564087, 2.29960298538208, 2.468618869781494, 2.637634754180908, 2.8066508769989014, 2.9756669998168945, 3.1446828842163086, 3.3136987686157227, 3.482714891433716, 3.651731014251709, 3.8207473754882812, 3.9897632598876953, 4.158779144287109, 4.327795505523682, 4.496811389923096, 4.66582727432251, 4.834843635559082, 5.003859519958496, 5.17287540435791, 5.341891288757324, 5.510907173156738, 5.6799235343933105, 5.848939418792725, 6.017955303192139, 6.186971664428711, 6.355987548828125, 6.525003433227539, 6.694019317626953, 6.863035202026367, 7.0320515632629395, 7.2010674476623535, 7.370083332061768, 7.53909969329834, 7.708115577697754, 7.877131462097168, 8.046147346496582, 8.215163230895996, 8.38417911529541, 8.55319595336914, 8.722211837768555, 8.891227722167969, 9.060243606567383, 9.229259490966797]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 6.0, 5.0, 4.0, 5.0, 9.0, 20.0, 18.0, 37.0, 61.0, 56.0, 67.0, 111.0, 105.0, 107.0, 105.0, 84.0, 68.0, 41.0, 22.0, 17.0, 9.0, 11.0, 4.0, 2.0, 2.0, 4.0, 7.0, 3.0, 1.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1792802810668945, -1.1334666013717651, -1.0876529216766357, -1.041839361190796, -0.9960256218910217, -0.9502120018005371, -0.9043983221054077, -0.8585846424102783, -0.8127709627151489, -0.7669572830200195, -0.7211436629295349, -0.6753299832344055, -0.6295163035392761, -0.5837026834487915, -0.5378890037536621, -0.4920753240585327, -0.4462617039680481, -0.4004480540752411, -0.3546343743801117, -0.3088207244873047, -0.2630070447921753, -0.2171933948993683, -0.17137974500656128, -0.12556606531143188, -0.07975241541862488, -0.033938754349946976, 0.011874906718730927, 0.05768856406211853, 0.10350222885608673, 0.14931589365005493, 0.19512954354286194, 0.24094322323799133, 0.28675687313079834, 0.33257052302360535, 0.37838420271873474, 0.42419785261154175, 0.47001153230667114, 0.5158251523971558, 0.5616388320922852, 0.6074525117874146, 0.653266191482544, 0.6990798711776733, 0.744893491268158, 0.7907071709632874, 0.8365208506584167, 0.8823344707489014, 0.9281481504440308, 0.9739618301391602, 1.019775390625, 1.0655890703201294, 1.1114027500152588, 1.1572163105010986, 1.203029990196228, 1.2488436698913574, 1.2946573495864868, 1.3404710292816162, 1.3862847089767456, 1.432098388671875, 1.4779120683670044, 1.5237257480621338, 1.5695393085479736, 1.615352988243103, 1.6611666679382324, 1.7069803476333618, 1.7527940273284912]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 8.0, 10.0, 17.0, 26.0, 34.0, 56.0, 62.0, 118.0, 160.0, 260.0, 469.0, 835.0, 1582.0, 3547.0, 9843.0, 56111.0, 926437.0, 35009.0, 7851.0, 2933.0, 1348.0, 738.0, 391.0, 219.0, 151.0, 90.0, 63.0, 43.0, 41.0, 21.0, 14.0, 15.0, 12.0, 12.0, 5.0, 4.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.96533203125, -0.9372711181640625, -0.909210205078125, -0.8811492919921875, -0.85308837890625, -0.8250274658203125, -0.796966552734375, -0.7689056396484375, -0.7408447265625, -0.7127838134765625, -0.684722900390625, -0.6566619873046875, -0.62860107421875, -0.6005401611328125, -0.572479248046875, -0.5444183349609375, -0.516357421875, -0.4882965087890625, -0.460235595703125, -0.4321746826171875, -0.40411376953125, -0.3760528564453125, -0.347991943359375, -0.3199310302734375, -0.2918701171875, -0.2638092041015625, -0.235748291015625, -0.2076873779296875, -0.17962646484375, -0.1515655517578125, -0.123504638671875, -0.0954437255859375, -0.0673828125, -0.0393218994140625, -0.011260986328125, 0.0167999267578125, 0.04486083984375, 0.0729217529296875, 0.100982666015625, 0.1290435791015625, 0.1571044921875, 0.1851654052734375, 0.213226318359375, 0.2412872314453125, 0.26934814453125, 0.2974090576171875, 0.325469970703125, 0.3535308837890625, 0.381591796875, 0.4096527099609375, 0.437713623046875, 0.4657745361328125, 0.49383544921875, 0.5218963623046875, 0.549957275390625, 0.5780181884765625, 0.6060791015625, 0.6341400146484375, 0.662200927734375, 0.6902618408203125, 0.71832275390625, 0.7463836669921875, 0.774444580078125, 0.8025054931640625, 0.83056640625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 4.0, 5.0, 3.0, 6.0, 11.0, 7.0, 13.0, 10.0, 24.0, 59.0, 295.0, 374.0, 86.0, 20.0, 13.0, 21.0, 7.0, 10.0, 8.0, 9.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1527099609375, -0.1476287841796875, -0.142547607421875, -0.1374664306640625, -0.13238525390625, -0.1273040771484375, -0.122222900390625, -0.1171417236328125, -0.112060546875, -0.1069793701171875, -0.101898193359375, -0.0968170166015625, -0.09173583984375, -0.0866546630859375, -0.081573486328125, -0.0764923095703125, -0.0714111328125, -0.0663299560546875, -0.061248779296875, -0.0561676025390625, -0.05108642578125, -0.0460052490234375, -0.040924072265625, -0.0358428955078125, -0.03076171875, -0.0256805419921875, -0.020599365234375, -0.0155181884765625, -0.01043701171875, -0.0053558349609375, -0.000274658203125, 0.0048065185546875, 0.0098876953125, 0.0149688720703125, 0.020050048828125, 0.0251312255859375, 0.03021240234375, 0.0352935791015625, 0.040374755859375, 0.0454559326171875, 0.050537109375, 0.0556182861328125, 0.060699462890625, 0.0657806396484375, 0.07086181640625, 0.0759429931640625, 0.081024169921875, 0.0861053466796875, 0.0911865234375, 0.0962677001953125, 0.101348876953125, 0.1064300537109375, 0.11151123046875, 0.1165924072265625, 0.121673583984375, 0.1267547607421875, 0.1318359375, 0.1369171142578125, 0.141998291015625, 0.1470794677734375, 0.15216064453125, 0.1572418212890625, 0.162322998046875, 0.1674041748046875, 0.1724853515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 1.0, 15.0, 7.0, 15.0, 9.0, 16.0, 23.0, 27.0, 16.0, 21.0, 44.0, 60.0, 98.0, 125.0, 159.0, 258.0, 477.0, 1342.0, 7074.0, 362978.0, 663080.0, 9678.0, 1544.0, 520.0, 272.0, 168.0, 114.0, 101.0, 63.0, 45.0, 39.0, 31.0, 25.0, 12.0, 14.0, 21.0, 17.0, 8.0, 6.0, 8.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.890625, -0.860992431640625, -0.83135986328125, -0.801727294921875, -0.7720947265625, -0.742462158203125, -0.71282958984375, -0.683197021484375, -0.653564453125, -0.623931884765625, -0.59429931640625, -0.564666748046875, -0.5350341796875, -0.505401611328125, -0.47576904296875, -0.446136474609375, -0.41650390625, -0.386871337890625, -0.35723876953125, -0.327606201171875, -0.2979736328125, -0.268341064453125, -0.23870849609375, -0.209075927734375, -0.179443359375, -0.149810791015625, -0.12017822265625, -0.090545654296875, -0.0609130859375, -0.031280517578125, -0.00164794921875, 0.027984619140625, 0.0576171875, 0.087249755859375, 0.11688232421875, 0.146514892578125, 0.1761474609375, 0.205780029296875, 0.23541259765625, 0.265045166015625, 0.294677734375, 0.324310302734375, 0.35394287109375, 0.383575439453125, 0.4132080078125, 0.442840576171875, 0.47247314453125, 0.502105712890625, 0.53173828125, 0.561370849609375, 0.59100341796875, 0.620635986328125, 0.6502685546875, 0.679901123046875, 0.70953369140625, 0.739166259765625, 0.768798828125, 0.798431396484375, 0.82806396484375, 0.857696533203125, 0.8873291015625, 0.916961669921875, 0.94659423828125, 0.976226806640625, 1.005859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 5.0, 2.0, 2.0, 3.0, 5.0, 11.0, 12.0, 15.0, 10.0, 11.0, 19.0, 21.0, 9.0, 20.0, 26.0, 31.0, 31.0, 33.0, 37.0, 34.0, 41.0, 45.0, 42.0, 35.0, 41.0, 29.0, 45.0, 40.0, 40.0, 31.0, 17.0, 32.0, 30.0, 27.0, 28.0, 25.0, 21.0, 9.0, 9.0, 20.0, 15.0, 8.0, 5.0, 12.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.297119140625, -0.2871971130371094, -0.27727508544921875, -0.2673530578613281, -0.2574310302734375, -0.24750900268554688, -0.23758697509765625, -0.22766494750976562, -0.217742919921875, -0.20782089233398438, -0.19789886474609375, -0.18797683715820312, -0.1780548095703125, -0.16813278198242188, -0.15821075439453125, -0.14828872680664062, -0.13836669921875, -0.12844467163085938, -0.11852264404296875, -0.10860061645507812, -0.0986785888671875, -0.08875656127929688, -0.07883453369140625, -0.06891250610351562, -0.058990478515625, -0.049068450927734375, -0.03914642333984375, -0.029224395751953125, -0.0193023681640625, -0.009380340576171875, 0.00054168701171875, 0.010463714599609375, 0.0203857421875, 0.030307769775390625, 0.04022979736328125, 0.050151824951171875, 0.0600738525390625, 0.06999588012695312, 0.07991790771484375, 0.08983993530273438, 0.099761962890625, 0.10968399047851562, 0.11960601806640625, 0.12952804565429688, 0.1394500732421875, 0.14937210083007812, 0.15929412841796875, 0.16921615600585938, 0.17913818359375, 0.18906021118164062, 0.19898223876953125, 0.20890426635742188, 0.2188262939453125, 0.22874832153320312, 0.23867034912109375, 0.24859237670898438, 0.258514404296875, 0.2684364318847656, 0.27835845947265625, 0.2882804870605469, 0.2982025146484375, 0.3081245422363281, 0.31804656982421875, 0.3279685974121094, 0.337890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 2.0, 5.0, 4.0, 7.0, 14.0, 12.0, 13.0, 24.0, 39.0, 46.0, 98.0, 136.0, 280.0, 622.0, 1628.0, 5457.0, 30748.0, 703028.0, 281209.0, 18688.0, 4071.0, 1253.0, 532.0, 248.0, 125.0, 83.0, 56.0, 28.0, 22.0, 19.0, 18.0, 9.0, 11.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.193359375, -0.18811607360839844, -0.18287277221679688, -0.1776294708251953, -0.17238616943359375, -0.1671428680419922, -0.16189956665039062, -0.15665626525878906, -0.1514129638671875, -0.14616966247558594, -0.14092636108398438, -0.1356830596923828, -0.13043975830078125, -0.1251964569091797, -0.11995315551757812, -0.11470985412597656, -0.109466552734375, -0.10422325134277344, -0.09897994995117188, -0.09373664855957031, -0.08849334716796875, -0.08325004577636719, -0.07800674438476562, -0.07276344299316406, -0.0675201416015625, -0.06227684020996094, -0.057033538818359375, -0.05179023742675781, -0.04654693603515625, -0.04130363464355469, -0.036060333251953125, -0.030817031860351562, -0.02557373046875, -0.020330429077148438, -0.015087127685546875, -0.009843826293945312, -0.00460052490234375, 0.0006427764892578125, 0.005886077880859375, 0.011129379272460938, 0.0163726806640625, 0.021615982055664062, 0.026859283447265625, 0.03210258483886719, 0.03734588623046875, 0.04258918762207031, 0.047832489013671875, 0.05307579040527344, 0.058319091796875, 0.06356239318847656, 0.06880569458007812, 0.07404899597167969, 0.07929229736328125, 0.08453559875488281, 0.08977890014648438, 0.09502220153808594, 0.1002655029296875, 0.10550880432128906, 0.11075210571289062, 0.11599540710449219, 0.12123870849609375, 0.1264820098876953, 0.13172531127929688, 0.13696861267089844, 0.1422119140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 7.0, 11.0, 7.0, 15.0, 10.0, 15.0, 27.0, 49.0, 71.0, 140.0, 217.0, 159.0, 85.0, 48.0, 43.0, 25.0, 18.0, 15.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.568960189819336e-05, -2.497062087059021e-05, -2.425163984298706e-05, -2.353265881538391e-05, -2.2813677787780762e-05, -2.2094696760177612e-05, -2.1375715732574463e-05, -2.0656734704971313e-05, -1.9937753677368164e-05, -1.9218772649765015e-05, -1.8499791622161865e-05, -1.7780810594558716e-05, -1.7061829566955566e-05, -1.6342848539352417e-05, -1.5623867511749268e-05, -1.4904886484146118e-05, -1.4185905456542969e-05, -1.346692442893982e-05, -1.274794340133667e-05, -1.202896237373352e-05, -1.1309981346130371e-05, -1.0591000318527222e-05, -9.872019290924072e-06, -9.153038263320923e-06, -8.434057235717773e-06, -7.715076208114624e-06, -6.996095180511475e-06, -6.277114152908325e-06, -5.558133125305176e-06, -4.839152097702026e-06, -4.120171070098877e-06, -3.4011900424957275e-06, -2.682209014892578e-06, -1.9632279872894287e-06, -1.2442469596862793e-06, -5.252659320831299e-07, 1.9371509552001953e-07, 9.126961231231689e-07, 1.6316771507263184e-06, 2.3506581783294678e-06, 3.069639205932617e-06, 3.7886202335357666e-06, 4.507601261138916e-06, 5.2265822887420654e-06, 5.945563316345215e-06, 6.664544343948364e-06, 7.383525371551514e-06, 8.102506399154663e-06, 8.821487426757812e-06, 9.540468454360962e-06, 1.0259449481964111e-05, 1.097843050956726e-05, 1.169741153717041e-05, 1.241639256477356e-05, 1.3135373592376709e-05, 1.3854354619979858e-05, 1.4573335647583008e-05, 1.5292316675186157e-05, 1.6011297702789307e-05, 1.6730278730392456e-05, 1.7449259757995605e-05, 1.8168240785598755e-05, 1.8887221813201904e-05, 1.9606202840805054e-05, 2.0325183868408203e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 5.0, 4.0, 12.0, 10.0, 14.0, 23.0, 41.0, 74.0, 171.0, 506.0, 2802.0, 151250.0, 887201.0, 5301.0, 690.0, 208.0, 98.0, 45.0, 35.0, 21.0, 6.0, 5.0, 9.0, 5.0, 5.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.611328125, -0.595703125, -0.580078125, -0.564453125, -0.548828125, -0.533203125, -0.517578125, -0.501953125, -0.486328125, -0.470703125, -0.455078125, -0.439453125, -0.423828125, -0.408203125, -0.392578125, -0.376953125, -0.361328125, -0.345703125, -0.330078125, -0.314453125, -0.298828125, -0.283203125, -0.267578125, -0.251953125, -0.236328125, -0.220703125, -0.205078125, -0.189453125, -0.173828125, -0.158203125, -0.142578125, -0.126953125, -0.111328125, -0.095703125, -0.080078125, -0.064453125, -0.048828125, -0.033203125, -0.017578125, -0.001953125, 0.013671875, 0.029296875, 0.044921875, 0.060546875, 0.076171875, 0.091796875, 0.107421875, 0.123046875, 0.138671875, 0.154296875, 0.169921875, 0.185546875, 0.201171875, 0.216796875, 0.232421875, 0.248046875, 0.263671875, 0.279296875, 0.294921875, 0.310546875, 0.326171875, 0.341796875, 0.357421875, 0.373046875, 0.388671875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 2.0, 6.0, 6.0, 14.0, 12.0, 18.0, 27.0, 45.0, 69.0, 85.0, 126.0, 165.0, 128.0, 84.0, 49.0, 52.0, 37.0, 19.0, 18.0, 11.0, 5.0, 1.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.191162109375, -0.18642425537109375, -0.1816864013671875, -0.17694854736328125, -0.172210693359375, -0.16747283935546875, -0.1627349853515625, -0.15799713134765625, -0.15325927734375, -0.14852142333984375, -0.1437835693359375, -0.13904571533203125, -0.134307861328125, -0.12957000732421875, -0.1248321533203125, -0.12009429931640625, -0.1153564453125, -0.11061859130859375, -0.1058807373046875, -0.10114288330078125, -0.096405029296875, -0.09166717529296875, -0.0869293212890625, -0.08219146728515625, -0.07745361328125, -0.07271575927734375, -0.0679779052734375, -0.06324005126953125, -0.058502197265625, -0.05376434326171875, -0.0490264892578125, -0.04428863525390625, -0.03955078125, -0.03481292724609375, -0.0300750732421875, -0.02533721923828125, -0.020599365234375, -0.01586151123046875, -0.0111236572265625, -0.00638580322265625, -0.00164794921875, 0.00308990478515625, 0.0078277587890625, 0.01256561279296875, 0.017303466796875, 0.02204132080078125, 0.0267791748046875, 0.03151702880859375, 0.0362548828125, 0.04099273681640625, 0.0457305908203125, 0.05046844482421875, 0.055206298828125, 0.05994415283203125, 0.0646820068359375, 0.06941986083984375, 0.07415771484375, 0.07889556884765625, 0.0836334228515625, 0.08837127685546875, 0.093109130859375, 0.09784698486328125, 0.1025848388671875, 0.10732269287109375, 0.112060546875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 11.0, 84.0, 712.0, 173.0, 24.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.296865463256836, -12.075573921203613, -11.85428237915039, -11.632990837097168, -11.411699295043945, -11.190407752990723, -10.9691162109375, -10.747824668884277, -10.526533126831055, -10.305241584777832, -10.08395004272461, -9.862658500671387, -9.641366958618164, -9.420075416564941, -9.198783874511719, -8.977492332458496, -8.756200790405273, -8.53490924835205, -8.313617706298828, -8.092326164245605, -7.871034622192383, -7.64974308013916, -7.4284515380859375, -7.207159996032715, -6.98586893081665, -6.764577388763428, -6.543285846710205, -6.321994304656982, -6.10070276260376, -5.879411220550537, -5.6581196784973145, -5.436828136444092, -5.215536594390869, -4.9942450523376465, -4.772953510284424, -4.551661968231201, -4.3303704261779785, -4.109078884124756, -3.887787342071533, -3.6664958000183105, -3.445204257965088, -3.2239127159118652, -3.0026211738586426, -2.78132963180542, -2.5600380897521973, -2.3387465476989746, -2.117455005645752, -1.8961635828018188, -1.6748721599578857, -1.453580617904663, -1.2322890758514404, -1.0109975337982178, -0.7897060513496399, -0.568414568901062, -0.34712302684783936, -0.1258314847946167, 0.09546005725860596, 0.3167515993118286, 0.5380431413650513, 0.7593346238136292, 0.9806261658668518, 1.2019176483154297, 1.4232091903686523, 1.644500732421875, 1.8657922744750977]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 3.0, 11.0, 12.0, 15.0, 18.0, 18.0, 22.0, 28.0, 20.0, 37.0, 50.0, 61.0, 63.0, 58.0, 72.0, 48.0, 69.0, 58.0, 54.0, 42.0, 50.0, 36.0, 29.0, 24.0, 23.0, 22.0, 12.0, 11.0, 10.0, 8.0, 2.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.9163193702697754, -3.8081178665161133, -3.6999166011810303, -3.591715097427368, -3.483513832092285, -3.375312328338623, -3.267110824584961, -3.158909320831299, -3.050708055496216, -2.9425065517425537, -2.8343052864074707, -2.7261037826538086, -2.6179022789001465, -2.5097010135650635, -2.4014995098114014, -2.2932982444763184, -2.1850967407226562, -2.076895236968994, -1.9686939716339111, -1.860492467880249, -1.7522910833358765, -1.644089698791504, -1.5358881950378418, -1.4276868104934692, -1.3194854259490967, -1.2112840414047241, -1.1030826568603516, -0.9948811531066895, -0.8866797685623169, -0.7784783840179443, -0.670276939868927, -0.5620754957199097, -0.4538741111755371, -0.34567269682884216, -0.23747128248214722, -0.12926986813545227, -0.021068453788757324, 0.08713293075561523, 0.19533437490463257, 0.3035358190536499, 0.41173720359802246, 0.519938588142395, 0.6281400322914124, 0.7363414764404297, 0.8445428609848022, 0.9527442455291748, 1.060945749282837, 1.1691471338272095, 1.277348518371582, 1.3855499029159546, 1.4937512874603271, 1.6019527912139893, 1.7101541757583618, 1.8183555603027344, 1.9265570640563965, 2.0347585678100586, 2.1429598331451416, 2.2511613368988037, 2.3593626022338867, 2.467564105987549, 2.575765609741211, 2.683966875076294, 2.792168378829956, 2.900369644165039, 3.008571147918701]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 4.0, 6.0, 6.0, 16.0, 21.0, 39.0, 102.0, 515.0, 5791.0, 4183666.0, 3544.0, 387.0, 84.0, 23.0, 18.0, 19.0, 12.0, 12.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.490234375, -3.352996826171875, -3.21575927734375, -3.078521728515625, -2.9412841796875, -2.804046630859375, -2.66680908203125, -2.529571533203125, -2.392333984375, -2.255096435546875, -2.11785888671875, -1.980621337890625, -1.8433837890625, -1.706146240234375, -1.56890869140625, -1.431671142578125, -1.29443359375, -1.157196044921875, -1.01995849609375, -0.882720947265625, -0.7454833984375, -0.608245849609375, -0.47100830078125, -0.333770751953125, -0.196533203125, -0.059295654296875, 0.07794189453125, 0.215179443359375, 0.3524169921875, 0.489654541015625, 0.62689208984375, 0.764129638671875, 0.9013671875, 1.038604736328125, 1.17584228515625, 1.313079833984375, 1.4503173828125, 1.587554931640625, 1.72479248046875, 1.862030029296875, 1.999267578125, 2.136505126953125, 2.27374267578125, 2.410980224609375, 2.5482177734375, 2.685455322265625, 2.82269287109375, 2.959930419921875, 3.09716796875, 3.234405517578125, 3.37164306640625, 3.508880615234375, 3.6461181640625, 3.783355712890625, 3.92059326171875, 4.057830810546875, 4.195068359375, 4.332305908203125, 4.46954345703125, 4.606781005859375, 4.7440185546875, 4.881256103515625, 5.01849365234375, 5.155731201171875, 5.29296875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 3.0, 6.0, 6.0, 8.0, 15.0, 14.0, 19.0, 36.0, 118.0, 345.0, 248.0, 82.0, 32.0, 9.0, 11.0, 6.0, 8.0, 12.0, 7.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1424560546875, -0.13712501525878906, -0.13179397583007812, -0.1264629364013672, -0.12113189697265625, -0.11580085754394531, -0.11046981811523438, -0.10513877868652344, -0.0998077392578125, -0.09447669982910156, -0.08914566040039062, -0.08381462097167969, -0.07848358154296875, -0.07315254211425781, -0.06782150268554688, -0.06249046325683594, -0.057159423828125, -0.05182838439941406, -0.046497344970703125, -0.04116630554199219, -0.03583526611328125, -0.030504226684570312, -0.025173187255859375, -0.019842147827148438, -0.0145111083984375, -0.009180068969726562, -0.003849029541015625, 0.0014820098876953125, 0.00681304931640625, 0.012144088745117188, 0.017475128173828125, 0.022806167602539062, 0.02813720703125, 0.03346824645996094, 0.038799285888671875, 0.04413032531738281, 0.04946136474609375, 0.05479240417480469, 0.060123443603515625, 0.06545448303222656, 0.0707855224609375, 0.07611656188964844, 0.08144760131835938, 0.08677864074707031, 0.09210968017578125, 0.09744071960449219, 0.10277175903320312, 0.10810279846191406, 0.113433837890625, 0.11876487731933594, 0.12409591674804688, 0.1294269561767578, 0.13475799560546875, 0.1400890350341797, 0.14542007446289062, 0.15075111389160156, 0.1560821533203125, 0.16141319274902344, 0.16674423217773438, 0.1720752716064453, 0.17740631103515625, 0.1827373504638672, 0.18806838989257812, 0.19339942932128906, 0.19873046875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 5.0, 8.0, 10.0, 8.0, 18.0, 12.0, 26.0, 20.0, 68.0, 108.0, 255.0, 1000.0, 11580.0, 4123726.0, 54199.0, 2421.0, 415.0, 153.0, 95.0, 48.0, 26.0, 22.0, 11.0, 7.0, 6.0, 8.0, 2.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.1337890625, -1.0942535400390625, -1.054718017578125, -1.0151824951171875, -0.97564697265625, -0.9361114501953125, -0.896575927734375, -0.8570404052734375, -0.8175048828125, -0.7779693603515625, -0.738433837890625, -0.6988983154296875, -0.65936279296875, -0.6198272705078125, -0.580291748046875, -0.5407562255859375, -0.501220703125, -0.4616851806640625, -0.422149658203125, -0.3826141357421875, -0.34307861328125, -0.3035430908203125, -0.264007568359375, -0.2244720458984375, -0.1849365234375, -0.1454010009765625, -0.105865478515625, -0.0663299560546875, -0.02679443359375, 0.0127410888671875, 0.052276611328125, 0.0918121337890625, 0.13134765625, 0.1708831787109375, 0.210418701171875, 0.2499542236328125, 0.28948974609375, 0.3290252685546875, 0.368560791015625, 0.4080963134765625, 0.4476318359375, 0.4871673583984375, 0.526702880859375, 0.5662384033203125, 0.60577392578125, 0.6453094482421875, 0.684844970703125, 0.7243804931640625, 0.763916015625, 0.8034515380859375, 0.842987060546875, 0.8825225830078125, 0.92205810546875, 0.9615936279296875, 1.001129150390625, 1.0406646728515625, 1.0802001953125, 1.1197357177734375, 1.159271240234375, 1.1988067626953125, 1.23834228515625, 1.2778778076171875, 1.317413330078125, 1.3569488525390625, 1.396484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 10.0, 6.0, 6.0, 11.0, 12.0, 20.0, 30.0, 37.0, 107.0, 543.0, 2766.0, 308.0, 66.0, 33.0, 24.0, 14.0, 14.0, 6.0, 12.0, 6.0, 4.0, 5.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1854248046875, -0.17910385131835938, -0.17278289794921875, -0.16646194458007812, -0.1601409912109375, -0.15382003784179688, -0.14749908447265625, -0.14117813110351562, -0.134857177734375, -0.12853622436523438, -0.12221527099609375, -0.11589431762695312, -0.1095733642578125, -0.10325241088867188, -0.09693145751953125, -0.09061050415039062, -0.08428955078125, -0.07796859741210938, -0.07164764404296875, -0.06532669067382812, -0.0590057373046875, -0.052684783935546875, -0.04636383056640625, -0.040042877197265625, -0.033721923828125, -0.027400970458984375, -0.02108001708984375, -0.014759063720703125, -0.0084381103515625, -0.002117156982421875, 0.00420379638671875, 0.010524749755859375, 0.016845703125, 0.023166656494140625, 0.02948760986328125, 0.035808563232421875, 0.0421295166015625, 0.048450469970703125, 0.05477142333984375, 0.061092376708984375, 0.067413330078125, 0.07373428344726562, 0.08005523681640625, 0.08637619018554688, 0.0926971435546875, 0.09901809692382812, 0.10533905029296875, 0.11166000366210938, 0.11798095703125, 0.12430191040039062, 0.13062286376953125, 0.13694381713867188, 0.1432647705078125, 0.14958572387695312, 0.15590667724609375, 0.16222763061523438, 0.168548583984375, 0.17486953735351562, 0.18119049072265625, 0.18751144409179688, 0.1938323974609375, 0.20015335083007812, 0.20647430419921875, 0.21279525756835938, 0.2191162109375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 9.0, 804.0, 199.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5977959632873535, -0.4951344430446625, -0.39247292280197144, -0.2898114323616028, -0.18714991211891174, -0.0844883918762207, 0.01817309856414795, 0.12083464860916138, 0.22349613904953003, 0.32615765929222107, 0.4288191795349121, 0.5314806699752808, 0.6341421604156494, 0.7368037104606628, 0.8394652009010315, 0.9421267509460449, 1.0447882413864136, 1.1474497318267822, 1.2501112222671509, 1.3527727127075195, 1.4554343223571777, 1.5580958127975464, 1.660757303237915, 1.7634189128875732, 1.8660802841186523, 1.968741774559021, 2.0714032649993896, 2.174064874649048, 2.276726245880127, 2.379387855529785, 2.4820494651794434, 2.5847108364105225, 2.6873724460601807, 2.790034055709839, 2.892695426940918, 2.995357036590576, 3.0980184078216553, 3.2006800174713135, 3.3033413887023926, 3.406002998352051, 3.508664608001709, 3.611326217651367, 3.7139875888824463, 3.8166491985321045, 3.9193105697631836, 4.021972179412842, 4.1246337890625, 4.227295398712158, 4.329956531524658, 4.432618141174316, 4.535279750823975, 4.637940883636475, 4.740602493286133, 4.843264102935791, 4.945925712585449, 5.048587322235107, 5.151248931884766, 5.253910541534424, 5.356572151184082, 5.459233283996582, 5.56189489364624, 5.664556503295898, 5.767218112945557, 5.869879722595215, 5.972540855407715]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 5.0, 13.0, 9.0, 13.0, 14.0, 23.0, 21.0, 26.0, 48.0, 50.0, 52.0, 60.0, 58.0, 51.0, 73.0, 69.0, 62.0, 60.0, 54.0, 45.0, 35.0, 43.0, 22.0, 17.0, 10.0, 18.0, 7.0, 13.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6082558631896973, -0.5892598628997803, -0.5702638626098633, -0.5512679219245911, -0.5322719216346741, -0.5132759213447571, -0.4942799210548401, -0.4752839207649231, -0.4562879502773285, -0.4372919499874115, -0.4182959794998169, -0.3992999792098999, -0.3803039789199829, -0.3613080084323883, -0.3423120081424713, -0.3233160376548767, -0.3043200373649597, -0.2853240370750427, -0.2663280665874481, -0.24733206629753113, -0.22833608090877533, -0.20934009552001953, -0.19034409523010254, -0.17134810984134674, -0.15235212445259094, -0.13335613906383514, -0.11436014622449875, -0.09536415338516235, -0.07636816799640656, -0.05737218260765076, -0.03837618976831436, -0.019380196928977966, -0.00038421154022216797, 0.01861177757382393, 0.037607766687870026, 0.05660375580191612, 0.07559974491596222, 0.09459573030471802, 0.11359172314405441, 0.1325877159833908, 0.1515837013721466, 0.1705796867609024, 0.1895756721496582, 0.2085716724395752, 0.227567657828331, 0.2465636432170868, 0.2655596435070038, 0.2845556139945984, 0.3035516142845154, 0.3225476145744324, 0.341543585062027, 0.36053958535194397, 0.3795355558395386, 0.39853155612945557, 0.41752755641937256, 0.43652355670928955, 0.45551952719688416, 0.47451552748680115, 0.49351149797439575, 0.5125074982643127, 0.5315034985542297, 0.550499439239502, 0.569495439529419, 0.5884914398193359, 0.6074874401092529]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 2.0, 2.0, 9.0, 9.0, 18.0, 20.0, 42.0, 51.0, 111.0, 145.0, 293.0, 557.0, 1340.0, 3348.0, 10563.0, 53998.0, 896361.0, 64005.0, 11364.0, 3657.0, 1354.0, 584.0, 294.0, 142.0, 108.0, 47.0, 34.0, 26.0, 26.0, 14.0, 7.0, 8.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.400390625, -0.3852996826171875, -0.370208740234375, -0.3551177978515625, -0.34002685546875, -0.3249359130859375, -0.309844970703125, -0.2947540283203125, -0.2796630859375, -0.2645721435546875, -0.249481201171875, -0.2343902587890625, -0.21929931640625, -0.2042083740234375, -0.189117431640625, -0.1740264892578125, -0.158935546875, -0.1438446044921875, -0.128753662109375, -0.1136627197265625, -0.09857177734375, -0.0834808349609375, -0.068389892578125, -0.0532989501953125, -0.0382080078125, -0.0231170654296875, -0.008026123046875, 0.0070648193359375, 0.02215576171875, 0.0372467041015625, 0.052337646484375, 0.0674285888671875, 0.08251953125, 0.0976104736328125, 0.112701416015625, 0.1277923583984375, 0.14288330078125, 0.1579742431640625, 0.173065185546875, 0.1881561279296875, 0.2032470703125, 0.2183380126953125, 0.233428955078125, 0.2485198974609375, 0.26361083984375, 0.2787017822265625, 0.293792724609375, 0.3088836669921875, 0.323974609375, 0.3390655517578125, 0.354156494140625, 0.3692474365234375, 0.38433837890625, 0.3994293212890625, 0.414520263671875, 0.4296112060546875, 0.4447021484375, 0.4597930908203125, 0.474884033203125, 0.4899749755859375, 0.50506591796875, 0.5201568603515625, 0.535247802734375, 0.5503387451171875, 0.5654296875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 8.0, 6.0, 8.0, 12.0, 18.0, 14.0, 40.0, 122.0, 310.0, 261.0, 104.0, 28.0, 11.0, 12.0, 8.0, 8.0, 13.0, 7.0, 1.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1365966796875, -0.1314983367919922, -0.12639999389648438, -0.12130165100097656, -0.11620330810546875, -0.11110496520996094, -0.10600662231445312, -0.10090827941894531, -0.0958099365234375, -0.09071159362792969, -0.08561325073242188, -0.08051490783691406, -0.07541656494140625, -0.07031822204589844, -0.06521987915039062, -0.06012153625488281, -0.055023193359375, -0.04992485046386719, -0.044826507568359375, -0.03972816467285156, -0.03462982177734375, -0.029531478881835938, -0.024433135986328125, -0.019334793090820312, -0.0142364501953125, -0.009138107299804688, -0.004039764404296875, 0.0010585784912109375, 0.00615692138671875, 0.011255264282226562, 0.016353607177734375, 0.021451950073242188, 0.02655029296875, 0.03164863586425781, 0.036746978759765625, 0.04184532165527344, 0.04694366455078125, 0.05204200744628906, 0.057140350341796875, 0.06223869323730469, 0.0673370361328125, 0.07243537902832031, 0.07753372192382812, 0.08263206481933594, 0.08773040771484375, 0.09282875061035156, 0.09792709350585938, 0.10302543640136719, 0.108123779296875, 0.11322212219238281, 0.11832046508789062, 0.12341880798339844, 0.12851715087890625, 0.13361549377441406, 0.13871383666992188, 0.1438121795654297, 0.1489105224609375, 0.1540088653564453, 0.15910720825195312, 0.16420555114746094, 0.16930389404296875, 0.17440223693847656, 0.17950057983398438, 0.1845989227294922, 0.189697265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 10.0, 12.0, 14.0, 23.0, 37.0, 23.0, 46.0, 56.0, 57.0, 89.0, 86.0, 85.0, 116.0, 199.0, 240.0, 486.0, 1365.0, 7035.0, 269764.0, 750022.0, 14965.0, 1907.0, 651.0, 309.0, 205.0, 150.0, 78.0, 105.0, 71.0, 76.0, 52.0, 44.0, 26.0, 40.0, 36.0, 17.0, 11.0, 8.0, 5.0, 7.0, 9.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.56494140625, -0.54736328125, -0.52978515625, -0.51220703125, -0.49462890625, -0.47705078125, -0.45947265625, -0.44189453125, -0.42431640625, -0.40673828125, -0.38916015625, -0.37158203125, -0.35400390625, -0.33642578125, -0.31884765625, -0.30126953125, -0.28369140625, -0.26611328125, -0.24853515625, -0.23095703125, -0.21337890625, -0.19580078125, -0.17822265625, -0.16064453125, -0.14306640625, -0.12548828125, -0.10791015625, -0.09033203125, -0.07275390625, -0.05517578125, -0.03759765625, -0.02001953125, -0.00244140625, 0.01513671875, 0.03271484375, 0.05029296875, 0.06787109375, 0.08544921875, 0.10302734375, 0.12060546875, 0.13818359375, 0.15576171875, 0.17333984375, 0.19091796875, 0.20849609375, 0.22607421875, 0.24365234375, 0.26123046875, 0.27880859375, 0.29638671875, 0.31396484375, 0.33154296875, 0.34912109375, 0.36669921875, 0.38427734375, 0.40185546875, 0.41943359375, 0.43701171875, 0.45458984375, 0.47216796875, 0.48974609375, 0.50732421875, 0.52490234375, 0.54248046875, 0.56005859375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 7.0, 6.0, 9.0, 7.0, 15.0, 21.0, 26.0, 29.0, 28.0, 25.0, 18.0, 24.0, 36.0, 42.0, 42.0, 60.0, 48.0, 43.0, 43.0, 59.0, 38.0, 36.0, 58.0, 35.0, 36.0, 26.0, 21.0, 32.0, 23.0, 20.0, 21.0, 16.0, 11.0, 11.0, 12.0, 2.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.337158203125, -0.3266334533691406, -0.31610870361328125, -0.3055839538574219, -0.2950592041015625, -0.2845344543457031, -0.27400970458984375, -0.2634849548339844, -0.252960205078125, -0.24243545532226562, -0.23191070556640625, -0.22138595581054688, -0.2108612060546875, -0.20033645629882812, -0.18981170654296875, -0.17928695678710938, -0.16876220703125, -0.15823745727539062, -0.14771270751953125, -0.13718795776367188, -0.1266632080078125, -0.11613845825195312, -0.10561370849609375, -0.09508895874023438, -0.084564208984375, -0.07403945922851562, -0.06351470947265625, -0.052989959716796875, -0.0424652099609375, -0.031940460205078125, -0.02141571044921875, -0.010890960693359375, -0.0003662109375, 0.010158538818359375, 0.02068328857421875, 0.031208038330078125, 0.0417327880859375, 0.052257537841796875, 0.06278228759765625, 0.07330703735351562, 0.083831787109375, 0.09435653686523438, 0.10488128662109375, 0.11540603637695312, 0.1259307861328125, 0.13645553588867188, 0.14698028564453125, 0.15750503540039062, 0.16802978515625, 0.17855453491210938, 0.18907928466796875, 0.19960403442382812, 0.2101287841796875, 0.22065353393554688, 0.23117828369140625, 0.24170303344726562, 0.252227783203125, 0.2627525329589844, 0.27327728271484375, 0.2838020324707031, 0.2943267822265625, 0.3048515319824219, 0.31537628173828125, 0.3259010314941406, 0.33642578125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 6.0, 2.0, 1.0, 4.0, 3.0, 6.0, 13.0, 10.0, 10.0, 16.0, 18.0, 28.0, 49.0, 88.0, 156.0, 286.0, 702.0, 1808.0, 6031.0, 37368.0, 781837.0, 199807.0, 14823.0, 3410.0, 1092.0, 460.0, 217.0, 102.0, 61.0, 41.0, 24.0, 21.0, 22.0, 10.0, 7.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.174072265625, -0.16958332061767578, -0.16509437561035156, -0.16060543060302734, -0.15611648559570312, -0.1516275405883789, -0.1471385955810547, -0.14264965057373047, -0.13816070556640625, -0.13367176055908203, -0.1291828155517578, -0.1246938705444336, -0.12020492553710938, -0.11571598052978516, -0.11122703552246094, -0.10673809051513672, -0.1022491455078125, -0.09776020050048828, -0.09327125549316406, -0.08878231048583984, -0.08429336547851562, -0.0798044204711914, -0.07531547546386719, -0.07082653045654297, -0.06633758544921875, -0.06184864044189453, -0.05735969543457031, -0.052870750427246094, -0.048381805419921875, -0.043892860412597656, -0.03940391540527344, -0.03491497039794922, -0.030426025390625, -0.02593708038330078, -0.021448135375976562, -0.016959190368652344, -0.012470245361328125, -0.007981300354003906, -0.0034923553466796875, 0.0009965896606445312, 0.00548553466796875, 0.009974479675292969, 0.014463424682617188, 0.018952369689941406, 0.023441314697265625, 0.027930259704589844, 0.03241920471191406, 0.03690814971923828, 0.0413970947265625, 0.04588603973388672, 0.05037498474121094, 0.054863929748535156, 0.059352874755859375, 0.0638418197631836, 0.06833076477050781, 0.07281970977783203, 0.07730865478515625, 0.08179759979248047, 0.08628654479980469, 0.0907754898071289, 0.09526443481445312, 0.09975337982177734, 0.10424232482910156, 0.10873126983642578, 0.11322021484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 5.0, 5.0, 11.0, 18.0, 18.0, 27.0, 26.0, 55.0, 76.0, 170.0, 185.0, 145.0, 85.0, 41.0, 32.0, 16.0, 19.0, 15.0, 13.0, 9.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0265579223632812e-05, -1.9599683582782745e-05, -1.8933787941932678e-05, -1.826789230108261e-05, -1.7601996660232544e-05, -1.6936101019382477e-05, -1.627020537853241e-05, -1.5604309737682343e-05, -1.4938414096832275e-05, -1.4272518455982208e-05, -1.3606622815132141e-05, -1.2940727174282074e-05, -1.2274831533432007e-05, -1.160893589258194e-05, -1.0943040251731873e-05, -1.0277144610881805e-05, -9.611248970031738e-06, -8.945353329181671e-06, -8.279457688331604e-06, -7.613562047481537e-06, -6.94766640663147e-06, -6.281770765781403e-06, -5.6158751249313354e-06, -4.949979484081268e-06, -4.284083843231201e-06, -3.618188202381134e-06, -2.952292561531067e-06, -2.2863969206809998e-06, -1.6205012798309326e-06, -9.546056389808655e-07, -2.8870999813079834e-07, 3.771856427192688e-07, 1.043081283569336e-06, 1.708976924419403e-06, 2.3748725652694702e-06, 3.0407682061195374e-06, 3.7066638469696045e-06, 4.372559487819672e-06, 5.038455128669739e-06, 5.704350769519806e-06, 6.370246410369873e-06, 7.03614205121994e-06, 7.702037692070007e-06, 8.367933332920074e-06, 9.033828973770142e-06, 9.699724614620209e-06, 1.0365620255470276e-05, 1.1031515896320343e-05, 1.169741153717041e-05, 1.2363307178020477e-05, 1.3029202818870544e-05, 1.3695098459720612e-05, 1.4360994100570679e-05, 1.5026889741420746e-05, 1.5692785382270813e-05, 1.635868102312088e-05, 1.7024576663970947e-05, 1.7690472304821014e-05, 1.835636794567108e-05, 1.902226358652115e-05, 1.9688159227371216e-05, 2.0354054868221283e-05, 2.101995050907135e-05, 2.1685846149921417e-05, 2.2351741790771484e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 14.0, 20.0, 34.0, 51.0, 138.0, 390.0, 2260.0, 78859.0, 958303.0, 7222.0, 869.0, 207.0, 86.0, 38.0, 22.0, 8.0, 8.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.390380859375, -0.3782691955566406, -0.36615753173828125, -0.3540458679199219, -0.3419342041015625, -0.3298225402832031, -0.31771087646484375, -0.3055992126464844, -0.293487548828125, -0.2813758850097656, -0.26926422119140625, -0.2571525573730469, -0.2450408935546875, -0.23292922973632812, -0.22081756591796875, -0.20870590209960938, -0.19659423828125, -0.18448257446289062, -0.17237091064453125, -0.16025924682617188, -0.1481475830078125, -0.13603591918945312, -0.12392425537109375, -0.11181259155273438, -0.099700927734375, -0.08758926391601562, -0.07547760009765625, -0.06336593627929688, -0.0512542724609375, -0.039142608642578125, -0.02703094482421875, -0.014919281005859375, -0.0028076171875, 0.009304046630859375, 0.02141571044921875, 0.033527374267578125, 0.0456390380859375, 0.057750701904296875, 0.06986236572265625, 0.08197402954101562, 0.094085693359375, 0.10619735717773438, 0.11830902099609375, 0.13042068481445312, 0.1425323486328125, 0.15464401245117188, 0.16675567626953125, 0.17886734008789062, 0.19097900390625, 0.20309066772460938, 0.21520233154296875, 0.22731399536132812, 0.2394256591796875, 0.2515373229980469, 0.26364898681640625, 0.2757606506347656, 0.287872314453125, 0.2999839782714844, 0.31209564208984375, 0.3242073059082031, 0.3363189697265625, 0.3484306335449219, 0.36054229736328125, 0.3726539611816406, 0.384765625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 15.0, 31.0, 50.0, 73.0, 180.0, 244.0, 197.0, 97.0, 46.0, 26.0, 12.0, 10.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2196044921875, -0.213043212890625, -0.20648193359375, -0.199920654296875, -0.193359375, -0.186798095703125, -0.18023681640625, -0.173675537109375, -0.1671142578125, -0.160552978515625, -0.15399169921875, -0.147430419921875, -0.140869140625, -0.134307861328125, -0.12774658203125, -0.121185302734375, -0.1146240234375, -0.108062744140625, -0.10150146484375, -0.094940185546875, -0.08837890625, -0.081817626953125, -0.07525634765625, -0.068695068359375, -0.0621337890625, -0.055572509765625, -0.04901123046875, -0.042449951171875, -0.035888671875, -0.029327392578125, -0.02276611328125, -0.016204833984375, -0.0096435546875, -0.003082275390625, 0.00347900390625, 0.010040283203125, 0.0166015625, 0.023162841796875, 0.02972412109375, 0.036285400390625, 0.0428466796875, 0.049407958984375, 0.05596923828125, 0.062530517578125, 0.069091796875, 0.075653076171875, 0.08221435546875, 0.088775634765625, 0.0953369140625, 0.101898193359375, 0.10845947265625, 0.115020751953125, 0.12158203125, 0.128143310546875, 0.13470458984375, 0.141265869140625, 0.1478271484375, 0.154388427734375, 0.16094970703125, 0.167510986328125, 0.174072265625, 0.180633544921875, 0.18719482421875, 0.193756103515625, 0.2003173828125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 11.0, 257.0, 718.0, 24.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2328357696533203, -2.0331013202667236, -1.833366870880127, -1.6336325407028198, -1.4338980913162231, -1.2341636419296265, -1.0344293117523193, -0.8346948623657227, -0.634960412979126, -0.4352259933948517, -0.2354915738105774, -0.03575718402862549, 0.1639772653579712, 0.36371171474456787, 0.563446044921875, 0.7631804943084717, 0.9629149436950684, 1.162649393081665, 1.3623838424682617, 1.5621181726455688, 1.7618526220321655, 1.9615870714187622, 2.1613214015960693, 2.361055850982666, 2.5607903003692627, 2.7605247497558594, 2.960259199142456, 3.1599936485290527, 3.3597278594970703, 3.559462547302246, 3.7591967582702637, 3.9589312076568604, 4.158665657043457, 4.358399868011475, 4.55813455581665, 4.757868766784668, 4.957603454589844, 5.157337665557861, 5.357071876525879, 5.556806564331055, 5.7565412521362305, 5.956275463104248, 6.156010150909424, 6.355744361877441, 6.555479049682617, 6.755213260650635, 6.954947471618652, 7.154682159423828, 7.354416370391846, 7.554150581359863, 7.753885269165039, 7.953619480133057, 8.153353691101074, 8.35308837890625, 8.552823066711426, 8.752557754516602, 8.952291488647461, 9.152026176452637, 9.351759910583496, 9.551494598388672, 9.751229286193848, 9.950963973999023, 10.150697708129883, 10.350432395935059, 10.550167083740234]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 0.0, 12.0, 11.0, 16.0, 15.0, 16.0, 28.0, 25.0, 32.0, 41.0, 28.0, 50.0, 47.0, 43.0, 44.0, 53.0, 52.0, 59.0, 53.0, 55.0, 49.0, 58.0, 35.0, 34.0, 29.0, 25.0, 20.0, 15.0, 13.0, 7.0, 12.0, 8.0, 6.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0935630798339844, -2.021535873413086, -1.949508547782898, -1.8774813413619995, -1.8054540157318115, -1.733426809310913, -1.6613996028900146, -1.5893723964691162, -1.5173450708389282, -1.4453178644180298, -1.3732905387878418, -1.3012633323669434, -1.229236125946045, -1.157208800315857, -1.0851815938949585, -1.0131542682647705, -0.9411270618438721, -0.8690997958183289, -0.7970725297927856, -0.7250453233718872, -0.653018057346344, -0.5809907913208008, -0.5089635848999023, -0.43693631887435913, -0.3649090528488159, -0.2928817868232727, -0.22085455060005188, -0.14882729947566986, -0.07680004835128784, -0.004772782325744629, 0.0672544538974762, 0.13928169012069702, 0.21130895614624023, 0.28333622217178345, 0.3553634583950043, 0.4273906946182251, 0.4994179606437683, 0.5714452266693115, 0.64347243309021, 0.7154996991157532, 0.7875269651412964, 0.8595542311668396, 0.9315814971923828, 1.0036087036132812, 1.0756359100341797, 1.1476632356643677, 1.2196904420852661, 1.291717767715454, 1.3637449741363525, 1.435772180557251, 1.507799506187439, 1.5798267126083374, 1.6518540382385254, 1.7238812446594238, 1.7959084510803223, 1.8679356575012207, 1.9399629831314087, 2.0119903087615967, 2.084017515182495, 2.1560447216033936, 2.228071928024292, 2.3000993728637695, 2.372126579284668, 2.4441537857055664, 2.516180992126465]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 6.0, 7.0, 9.0, 11.0, 24.0, 30.0, 61.0, 89.0, 169.0, 341.0, 895.0, 3733.0, 359098.0, 3823270.0, 4652.0, 1026.0, 410.0, 187.0, 110.0, 60.0, 35.0, 23.0, 13.0, 3.0, 4.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5791015625, -0.553985595703125, -0.52886962890625, -0.503753662109375, -0.4786376953125, -0.453521728515625, -0.42840576171875, -0.403289794921875, -0.378173828125, -0.353057861328125, -0.32794189453125, -0.302825927734375, -0.2777099609375, -0.252593994140625, -0.22747802734375, -0.202362060546875, -0.17724609375, -0.152130126953125, -0.12701416015625, -0.101898193359375, -0.0767822265625, -0.051666259765625, -0.02655029296875, -0.001434326171875, 0.023681640625, 0.048797607421875, 0.07391357421875, 0.099029541015625, 0.1241455078125, 0.149261474609375, 0.17437744140625, 0.199493408203125, 0.224609375, 0.249725341796875, 0.27484130859375, 0.299957275390625, 0.3250732421875, 0.350189208984375, 0.37530517578125, 0.400421142578125, 0.425537109375, 0.450653076171875, 0.47576904296875, 0.500885009765625, 0.5260009765625, 0.551116943359375, 0.57623291015625, 0.601348876953125, 0.62646484375, 0.651580810546875, 0.67669677734375, 0.701812744140625, 0.7269287109375, 0.752044677734375, 0.77716064453125, 0.802276611328125, 0.827392578125, 0.852508544921875, 0.87762451171875, 0.902740478515625, 0.9278564453125, 0.952972412109375, 0.97808837890625, 1.003204345703125, 1.0283203125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 2.0, 5.0, 11.0, 8.0, 17.0, 10.0, 25.0, 67.0, 172.0, 298.0, 227.0, 68.0, 27.0, 15.0, 6.0, 10.0, 10.0, 7.0, 4.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1331787109375, -0.12815475463867188, -0.12313079833984375, -0.11810684204101562, -0.1130828857421875, -0.10805892944335938, -0.10303497314453125, -0.09801101684570312, -0.092987060546875, -0.08796310424804688, -0.08293914794921875, -0.07791519165039062, -0.0728912353515625, -0.06786727905273438, -0.06284332275390625, -0.057819366455078125, -0.05279541015625, -0.047771453857421875, -0.04274749755859375, -0.037723541259765625, -0.0326995849609375, -0.027675628662109375, -0.02265167236328125, -0.017627716064453125, -0.012603759765625, -0.007579803466796875, -0.00255584716796875, 0.002468109130859375, 0.0074920654296875, 0.012516021728515625, 0.01753997802734375, 0.022563934326171875, 0.027587890625, 0.032611846923828125, 0.03763580322265625, 0.042659759521484375, 0.0476837158203125, 0.052707672119140625, 0.05773162841796875, 0.06275558471679688, 0.067779541015625, 0.07280349731445312, 0.07782745361328125, 0.08285140991210938, 0.0878753662109375, 0.09289932250976562, 0.09792327880859375, 0.10294723510742188, 0.10797119140625, 0.11299514770507812, 0.11801910400390625, 0.12304306030273438, 0.1280670166015625, 0.13309097290039062, 0.13811492919921875, 0.14313888549804688, 0.148162841796875, 0.15318679809570312, 0.15821075439453125, 0.16323471069335938, 0.1682586669921875, 0.17328262329101562, 0.17830657958984375, 0.18333053588867188, 0.1883544921875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 12.0, 3.0, 5.0, 7.0, 5.0, 14.0, 24.0, 27.0, 27.0, 62.0, 156.0, 417.0, 1742.0, 17594.0, 4104652.0, 66106.0, 2582.0, 422.0, 189.0, 73.0, 41.0, 32.0, 21.0, 16.0, 10.0, 15.0, 8.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7158203125, -0.6968154907226562, -0.6778106689453125, -0.6588058471679688, -0.639801025390625, -0.6207962036132812, -0.6017913818359375, -0.5827865600585938, -0.56378173828125, -0.5447769165039062, -0.5257720947265625, -0.5067672729492188, -0.487762451171875, -0.46875762939453125, -0.4497528076171875, -0.43074798583984375, -0.4117431640625, -0.39273834228515625, -0.3737335205078125, -0.35472869873046875, -0.335723876953125, -0.31671905517578125, -0.2977142333984375, -0.27870941162109375, -0.25970458984375, -0.24069976806640625, -0.2216949462890625, -0.20269012451171875, -0.183685302734375, -0.16468048095703125, -0.1456756591796875, -0.12667083740234375, -0.107666015625, -0.08866119384765625, -0.0696563720703125, -0.05065155029296875, -0.031646728515625, -0.01264190673828125, 0.0063629150390625, 0.02536773681640625, 0.04437255859375, 0.06337738037109375, 0.0823822021484375, 0.10138702392578125, 0.120391845703125, 0.13939666748046875, 0.1584014892578125, 0.17740631103515625, 0.1964111328125, 0.21541595458984375, 0.2344207763671875, 0.25342559814453125, 0.272430419921875, 0.29143524169921875, 0.3104400634765625, 0.32944488525390625, 0.34844970703125, 0.36745452880859375, 0.3864593505859375, 0.40546417236328125, 0.424468994140625, 0.44347381591796875, 0.4624786376953125, 0.48148345947265625, 0.50048828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 3.0, 2.0, 8.0, 13.0, 10.0, 21.0, 42.0, 85.0, 482.0, 2703.0, 493.0, 112.0, 24.0, 14.0, 12.0, 11.0, 4.0, 6.0, 2.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1695556640625, -0.16526126861572266, -0.1609668731689453, -0.15667247772216797, -0.15237808227539062, -0.14808368682861328, -0.14378929138183594, -0.1394948959350586, -0.13520050048828125, -0.1309061050415039, -0.12661170959472656, -0.12231731414794922, -0.11802291870117188, -0.11372852325439453, -0.10943412780761719, -0.10513973236083984, -0.1008453369140625, -0.09655094146728516, -0.09225654602050781, -0.08796215057373047, -0.08366775512695312, -0.07937335968017578, -0.07507896423339844, -0.0707845687866211, -0.06649017333984375, -0.062195777893066406, -0.05790138244628906, -0.05360698699951172, -0.049312591552734375, -0.04501819610595703, -0.04072380065917969, -0.036429405212402344, -0.032135009765625, -0.027840614318847656, -0.023546218872070312, -0.01925182342529297, -0.014957427978515625, -0.010663032531738281, -0.0063686370849609375, -0.0020742416381835938, 0.00222015380859375, 0.006514549255371094, 0.010808944702148438, 0.015103340148925781, 0.019397735595703125, 0.02369213104248047, 0.027986526489257812, 0.032280921936035156, 0.0365753173828125, 0.040869712829589844, 0.04516410827636719, 0.04945850372314453, 0.053752899169921875, 0.05804729461669922, 0.06234169006347656, 0.0666360855102539, 0.07093048095703125, 0.0752248764038086, 0.07951927185058594, 0.08381366729736328, 0.08810806274414062, 0.09240245819091797, 0.09669685363769531, 0.10099124908447266, 0.10528564453125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 14.0, 723.0, 273.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5706811547279358, -0.4876716136932373, -0.4046620726585388, -0.32165253162384033, -0.23864299058914185, -0.15563344955444336, -0.07262390851974487, 0.010385632514953613, 0.0933951735496521, 0.17640471458435059, 0.2594142556190491, 0.34242379665374756, 0.42543333768844604, 0.5084428787231445, 0.591452419757843, 0.6744619607925415, 0.75747150182724, 0.8404810428619385, 0.923490583896637, 1.0065001249313354, 1.0895097255706787, 1.1725192070007324, 1.2555286884307861, 1.3385382890701294, 1.4215478897094727, 1.5045573711395264, 1.5875669717788696, 1.670576572418213, 1.7535860538482666, 1.8365955352783203, 1.9196051359176636, 2.002614736557007, 2.0856242179870605, 2.1686336994171143, 2.251643180847168, 2.334652900695801, 2.4176623821258545, 2.500671863555908, 2.583681583404541, 2.6666910648345947, 2.7497005462646484, 2.832710027694702, 2.915719509124756, 2.9987292289733887, 3.0817387104034424, 3.164748191833496, 3.247757911682129, 3.3307673931121826, 3.4137768745422363, 3.49678635597229, 3.5797958374023438, 3.6628055572509766, 3.7458150386810303, 3.828824520111084, 3.911834239959717, 3.9948437213897705, 4.077853202819824, 4.160862922668457, 4.243872165679932, 4.3268818855285645, 4.409891128540039, 4.492900848388672, 4.575910568237305, 4.658919811248779, 4.741929531097412]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 2.0, 3.0, 5.0, 6.0, 14.0, 12.0, 16.0, 26.0, 20.0, 34.0, 37.0, 41.0, 53.0, 58.0, 56.0, 56.0, 63.0, 54.0, 68.0, 60.0, 40.0, 55.0, 39.0, 42.0, 28.0, 28.0, 17.0, 22.0, 13.0, 10.0, 9.0, 5.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4249011278152466, -0.4135485589504242, -0.4021959602832794, -0.39084339141845703, -0.37949079275131226, -0.36813822388648987, -0.3567856550216675, -0.3454330563545227, -0.3340804874897003, -0.32272791862487793, -0.31137531995773315, -0.30002275109291077, -0.2886701822280884, -0.2773175835609436, -0.2659650146961212, -0.25461244583129883, -0.24325984716415405, -0.23190726339817047, -0.2205546796321869, -0.2092021107673645, -0.19784952700138092, -0.18649694323539734, -0.17514437437057495, -0.16379179060459137, -0.1524392068386078, -0.1410866230726242, -0.12973403930664062, -0.11838147044181824, -0.10702888667583466, -0.09567630290985107, -0.08432372659444809, -0.0729711502790451, -0.06161856651306152, -0.05026598647236824, -0.03891340643167496, -0.027560826390981674, -0.01620824635028839, -0.004855666309595108, 0.006496913731098175, 0.01784949004650116, 0.02920207381248474, 0.040554653853178024, 0.05190723389387131, 0.06325981020927429, 0.07461239397525787, 0.08596497774124146, 0.09731755405664444, 0.10867013037204742, 0.120022714138031, 0.1313752979040146, 0.14272788166999817, 0.15408045053482056, 0.16543303430080414, 0.17678561806678772, 0.1881381869316101, 0.1994907706975937, 0.21084335446357727, 0.22219593822956085, 0.23354852199554443, 0.24490109086036682, 0.2562536597251892, 0.267606258392334, 0.27895882725715637, 0.29031139612197876, 0.30166399478912354]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 8.0, 17.0, 18.0, 28.0, 38.0, 58.0, 96.0, 140.0, 210.0, 387.0, 714.0, 1433.0, 3057.0, 7167.0, 23034.0, 238978.0, 706289.0, 47269.0, 11282.0, 4136.0, 1962.0, 904.0, 512.0, 301.0, 177.0, 99.0, 77.0, 47.0, 26.0, 27.0, 13.0, 14.0, 6.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.25244140625, -0.24460411071777344, -0.23676681518554688, -0.2289295196533203, -0.22109222412109375, -0.2132549285888672, -0.20541763305664062, -0.19758033752441406, -0.1897430419921875, -0.18190574645996094, -0.17406845092773438, -0.1662311553955078, -0.15839385986328125, -0.1505565643310547, -0.14271926879882812, -0.13488197326660156, -0.127044677734375, -0.11920738220214844, -0.11137008666992188, -0.10353279113769531, -0.09569549560546875, -0.08785820007324219, -0.08002090454101562, -0.07218360900878906, -0.0643463134765625, -0.05650901794433594, -0.048671722412109375, -0.04083442687988281, -0.03299713134765625, -0.025159835815429688, -0.017322540283203125, -0.009485244750976562, -0.00164794921875, 0.0061893463134765625, 0.014026641845703125, 0.021863937377929688, 0.02970123291015625, 0.03753852844238281, 0.045375823974609375, 0.05321311950683594, 0.0610504150390625, 0.06888771057128906, 0.07672500610351562, 0.08456230163574219, 0.09239959716796875, 0.10023689270019531, 0.10807418823242188, 0.11591148376464844, 0.123748779296875, 0.13158607482910156, 0.13942337036132812, 0.1472606658935547, 0.15509796142578125, 0.1629352569580078, 0.17077255249023438, 0.17860984802246094, 0.1864471435546875, 0.19428443908691406, 0.20212173461914062, 0.2099590301513672, 0.21779632568359375, 0.2256336212158203, 0.23347091674804688, 0.24130821228027344, 0.2491455078125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 1.0, 5.0, 10.0, 7.0, 21.0, 6.0, 22.0, 56.0, 160.0, 295.0, 245.0, 77.0, 31.0, 12.0, 7.0, 12.0, 10.0, 5.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.128662109375, -0.12383079528808594, -0.11899948120117188, -0.11416816711425781, -0.10933685302734375, -0.10450553894042969, -0.09967422485351562, -0.09484291076660156, -0.0900115966796875, -0.08518028259277344, -0.08034896850585938, -0.07551765441894531, -0.07068634033203125, -0.06585502624511719, -0.061023712158203125, -0.05619239807128906, -0.051361083984375, -0.04652976989746094, -0.041698455810546875, -0.03686714172363281, -0.03203582763671875, -0.027204513549804688, -0.022373199462890625, -0.017541885375976562, -0.0127105712890625, -0.007879257202148438, -0.003047943115234375, 0.0017833709716796875, 0.00661468505859375, 0.011445999145507812, 0.016277313232421875, 0.021108627319335938, 0.02593994140625, 0.030771255493164062, 0.035602569580078125, 0.04043388366699219, 0.04526519775390625, 0.05009651184082031, 0.054927825927734375, 0.05975914001464844, 0.0645904541015625, 0.06942176818847656, 0.07425308227539062, 0.07908439636230469, 0.08391571044921875, 0.08874702453613281, 0.09357833862304688, 0.09840965270996094, 0.103240966796875, 0.10807228088378906, 0.11290359497070312, 0.11773490905761719, 0.12256622314453125, 0.1273975372314453, 0.13222885131835938, 0.13706016540527344, 0.1418914794921875, 0.14672279357910156, 0.15155410766601562, 0.1563854217529297, 0.16121673583984375, 0.1660480499267578, 0.17087936401367188, 0.17571067810058594, 0.1805419921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 14.0, 32.0, 25.0, 32.0, 28.0, 65.0, 71.0, 89.0, 103.0, 127.0, 199.0, 225.0, 424.0, 890.0, 3219.0, 37967.0, 890569.0, 106641.0, 4976.0, 1249.0, 492.0, 267.0, 184.0, 145.0, 110.0, 103.0, 78.0, 47.0, 45.0, 45.0, 29.0, 21.0, 9.0, 11.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38232421875, -0.369842529296875, -0.35736083984375, -0.344879150390625, -0.3323974609375, -0.319915771484375, -0.30743408203125, -0.294952392578125, -0.282470703125, -0.269989013671875, -0.25750732421875, -0.245025634765625, -0.2325439453125, -0.220062255859375, -0.20758056640625, -0.195098876953125, -0.1826171875, -0.170135498046875, -0.15765380859375, -0.145172119140625, -0.1326904296875, -0.120208740234375, -0.10772705078125, -0.095245361328125, -0.082763671875, -0.070281982421875, -0.05780029296875, -0.045318603515625, -0.0328369140625, -0.020355224609375, -0.00787353515625, 0.004608154296875, 0.01708984375, 0.029571533203125, 0.04205322265625, 0.054534912109375, 0.0670166015625, 0.079498291015625, 0.09197998046875, 0.104461669921875, 0.116943359375, 0.129425048828125, 0.14190673828125, 0.154388427734375, 0.1668701171875, 0.179351806640625, 0.19183349609375, 0.204315185546875, 0.216796875, 0.229278564453125, 0.24176025390625, 0.254241943359375, 0.2667236328125, 0.279205322265625, 0.29168701171875, 0.304168701171875, 0.316650390625, 0.329132080078125, 0.34161376953125, 0.354095458984375, 0.3665771484375, 0.379058837890625, 0.39154052734375, 0.404022216796875, 0.41650390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 9.0, 9.0, 4.0, 9.0, 9.0, 12.0, 11.0, 18.0, 10.0, 18.0, 16.0, 22.0, 27.0, 29.0, 32.0, 30.0, 24.0, 36.0, 46.0, 38.0, 36.0, 23.0, 37.0, 20.0, 42.0, 50.0, 28.0, 37.0, 27.0, 29.0, 35.0, 27.0, 18.0, 22.0, 23.0, 18.0, 14.0, 24.0, 9.0, 10.0, 9.0, 10.0, 8.0, 10.0, 9.0, 5.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.2235107421875, -0.21585655212402344, -0.20820236206054688, -0.2005481719970703, -0.19289398193359375, -0.1852397918701172, -0.17758560180664062, -0.16993141174316406, -0.1622772216796875, -0.15462303161621094, -0.14696884155273438, -0.1393146514892578, -0.13166046142578125, -0.12400627136230469, -0.11635208129882812, -0.10869789123535156, -0.101043701171875, -0.09338951110839844, -0.08573532104492188, -0.07808113098144531, -0.07042694091796875, -0.06277275085449219, -0.055118560791015625, -0.04746437072753906, -0.0398101806640625, -0.03215599060058594, -0.024501800537109375, -0.016847610473632812, -0.00919342041015625, -0.0015392303466796875, 0.006114959716796875, 0.013769149780273438, 0.02142333984375, 0.029077529907226562, 0.036731719970703125, 0.04438591003417969, 0.05204010009765625, 0.05969429016113281, 0.06734848022460938, 0.07500267028808594, 0.0826568603515625, 0.09031105041503906, 0.09796524047851562, 0.10561943054199219, 0.11327362060546875, 0.12092781066894531, 0.12858200073242188, 0.13623619079589844, 0.143890380859375, 0.15154457092285156, 0.15919876098632812, 0.1668529510498047, 0.17450714111328125, 0.1821613311767578, 0.18981552124023438, 0.19746971130371094, 0.2051239013671875, 0.21277809143066406, 0.22043228149414062, 0.2280864715576172, 0.23574066162109375, 0.2433948516845703, 0.2510490417480469, 0.25870323181152344, 0.266357421875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 8.0, 11.0, 14.0, 22.0, 46.0, 54.0, 82.0, 152.0, 298.0, 629.0, 1537.0, 4294.0, 16043.0, 152088.0, 792943.0, 64713.0, 10294.0, 3104.0, 1097.0, 497.0, 247.0, 153.0, 85.0, 45.0, 34.0, 14.0, 18.0, 8.0, 6.0, 5.0, 4.0, 5.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0777587890625, -0.07510948181152344, -0.07246017456054688, -0.06981086730957031, -0.06716156005859375, -0.06451225280761719, -0.061862945556640625, -0.05921363830566406, -0.0565643310546875, -0.05391502380371094, -0.051265716552734375, -0.04861640930175781, -0.04596710205078125, -0.04331779479980469, -0.040668487548828125, -0.03801918029785156, -0.035369873046875, -0.03272056579589844, -0.030071258544921875, -0.027421951293945312, -0.02477264404296875, -0.022123336791992188, -0.019474029541015625, -0.016824722290039062, -0.0141754150390625, -0.011526107788085938, -0.008876800537109375, -0.0062274932861328125, -0.00357818603515625, -0.0009288787841796875, 0.001720428466796875, 0.0043697357177734375, 0.00701904296875, 0.009668350219726562, 0.012317657470703125, 0.014966964721679688, 0.01761627197265625, 0.020265579223632812, 0.022914886474609375, 0.025564193725585938, 0.0282135009765625, 0.030862808227539062, 0.033512115478515625, 0.03616142272949219, 0.03881072998046875, 0.04146003723144531, 0.044109344482421875, 0.04675865173339844, 0.049407958984375, 0.05205726623535156, 0.054706573486328125, 0.05735588073730469, 0.06000518798828125, 0.06265449523925781, 0.06530380249023438, 0.06795310974121094, 0.0706024169921875, 0.07325172424316406, 0.07590103149414062, 0.07855033874511719, 0.08119964599609375, 0.08384895324707031, 0.08649826049804688, 0.08914756774902344, 0.091796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 11.0, 9.0, 15.0, 26.0, 23.0, 50.0, 72.0, 80.0, 116.0, 107.0, 122.0, 88.0, 81.0, 48.0, 25.0, 30.0, 23.0, 13.0, 5.0, 11.0, 4.0, 9.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.953975677490234e-06, -9.547919034957886e-06, -9.141862392425537e-06, -8.735805749893188e-06, -8.32974910736084e-06, -7.923692464828491e-06, -7.517635822296143e-06, -7.111579179763794e-06, -6.705522537231445e-06, -6.299465894699097e-06, -5.893409252166748e-06, -5.487352609634399e-06, -5.081295967102051e-06, -4.675239324569702e-06, -4.2691826820373535e-06, -3.863126039505005e-06, -3.4570693969726562e-06, -3.0510127544403076e-06, -2.644956111907959e-06, -2.2388994693756104e-06, -1.8328428268432617e-06, -1.426786184310913e-06, -1.0207295417785645e-06, -6.146728992462158e-07, -2.086162567138672e-07, 1.9744038581848145e-07, 6.034970283508301e-07, 1.0095536708831787e-06, 1.4156103134155273e-06, 1.821666955947876e-06, 2.2277235984802246e-06, 2.6337802410125732e-06, 3.039836883544922e-06, 3.4458935260772705e-06, 3.851950168609619e-06, 4.258006811141968e-06, 4.664063453674316e-06, 5.070120096206665e-06, 5.476176738739014e-06, 5.882233381271362e-06, 6.288290023803711e-06, 6.6943466663360596e-06, 7.100403308868408e-06, 7.506459951400757e-06, 7.912516593933105e-06, 8.318573236465454e-06, 8.724629878997803e-06, 9.130686521530151e-06, 9.5367431640625e-06, 9.942799806594849e-06, 1.0348856449127197e-05, 1.0754913091659546e-05, 1.1160969734191895e-05, 1.1567026376724243e-05, 1.1973083019256592e-05, 1.237913966178894e-05, 1.2785196304321289e-05, 1.3191252946853638e-05, 1.3597309589385986e-05, 1.4003366231918335e-05, 1.4409422874450684e-05, 1.4815479516983032e-05, 1.5221536159515381e-05, 1.562759280204773e-05, 1.6033649444580078e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 8.0, 11.0, 11.0, 21.0, 22.0, 22.0, 54.0, 79.0, 129.0, 206.0, 348.0, 699.0, 1510.0, 4514.0, 18324.0, 172801.0, 764736.0, 68580.0, 10916.0, 3134.0, 1101.0, 534.0, 290.0, 166.0, 119.0, 64.0, 50.0, 33.0, 15.0, 12.0, 12.0, 11.0, 4.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08599853515625, -0.08316326141357422, -0.08032798767089844, -0.07749271392822266, -0.07465744018554688, -0.0718221664428711, -0.06898689270019531, -0.06615161895751953, -0.06331634521484375, -0.06048107147216797, -0.05764579772949219, -0.054810523986816406, -0.051975250244140625, -0.049139976501464844, -0.04630470275878906, -0.04346942901611328, -0.0406341552734375, -0.03779888153076172, -0.03496360778808594, -0.032128334045410156, -0.029293060302734375, -0.026457786560058594, -0.023622512817382812, -0.02078723907470703, -0.01795196533203125, -0.015116691589355469, -0.012281417846679688, -0.009446144104003906, -0.006610870361328125, -0.0037755966186523438, -0.0009403228759765625, 0.0018949508666992188, 0.004730224609375, 0.007565498352050781, 0.010400772094726562, 0.013236045837402344, 0.016071319580078125, 0.018906593322753906, 0.021741867065429688, 0.02457714080810547, 0.02741241455078125, 0.03024768829345703, 0.03308296203613281, 0.035918235778808594, 0.038753509521484375, 0.041588783264160156, 0.04442405700683594, 0.04725933074951172, 0.0500946044921875, 0.05292987823486328, 0.05576515197753906, 0.058600425720214844, 0.061435699462890625, 0.0642709732055664, 0.06710624694824219, 0.06994152069091797, 0.07277679443359375, 0.07561206817626953, 0.07844734191894531, 0.0812826156616211, 0.08411788940429688, 0.08695316314697266, 0.08978843688964844, 0.09262371063232422, 0.095458984375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 11.0, 16.0, 19.0, 23.0, 27.0, 37.0, 57.0, 74.0, 107.0, 113.0, 131.0, 103.0, 79.0, 61.0, 39.0, 20.0, 16.0, 10.0, 11.0, 11.0, 5.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09417724609375, -0.09139823913574219, -0.08861923217773438, -0.08584022521972656, -0.08306121826171875, -0.08028221130371094, -0.07750320434570312, -0.07472419738769531, -0.0719451904296875, -0.06916618347167969, -0.06638717651367188, -0.06360816955566406, -0.06082916259765625, -0.05805015563964844, -0.055271148681640625, -0.05249214172363281, -0.049713134765625, -0.04693412780761719, -0.044155120849609375, -0.04137611389160156, -0.03859710693359375, -0.03581809997558594, -0.033039093017578125, -0.030260086059570312, -0.0274810791015625, -0.024702072143554688, -0.021923065185546875, -0.019144058227539062, -0.01636505126953125, -0.013586044311523438, -0.010807037353515625, -0.008028030395507812, -0.0052490234375, -0.0024700164794921875, 0.000308990478515625, 0.0030879974365234375, 0.00586700439453125, 0.008646011352539062, 0.011425018310546875, 0.014204025268554688, 0.0169830322265625, 0.019762039184570312, 0.022541046142578125, 0.025320053100585938, 0.02809906005859375, 0.030878067016601562, 0.033657073974609375, 0.03643608093261719, 0.039215087890625, 0.04199409484863281, 0.044773101806640625, 0.04755210876464844, 0.05033111572265625, 0.05311012268066406, 0.055889129638671875, 0.05866813659667969, 0.0614471435546875, 0.06422615051269531, 0.06700515747070312, 0.06978416442871094, 0.07256317138671875, 0.07534217834472656, 0.07812118530273438, 0.08090019226074219, 0.08367919921875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 17.0, 865.0, 124.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.909315586090088, -2.6805007457733154, -2.451686143875122, -2.2228713035583496, -1.9940565824508667, -1.7652418613433838, -1.5364270210266113, -1.3076122999191284, -1.0787975788116455, -0.8499828577041626, -0.6211680769920349, -0.3923532962799072, -0.16353857517242432, 0.0652761459350586, 0.29409098625183105, 0.522905707359314, 0.7517204284667969, 0.9805351495742798, 1.2093498706817627, 1.4381647109985352, 1.666979432106018, 1.895794153213501, 2.1246089935302734, 2.353423595428467, 2.5822384357452393, 2.8110532760620117, 3.039867877960205, 3.2686827182769775, 3.49749755859375, 3.7263121604919434, 3.955127000808716, 4.183941841125488, 4.41275691986084, 4.641571521759033, 4.870386600494385, 5.099201202392578, 5.3280158042907715, 5.556830406188965, 5.785645484924316, 6.01446008682251, 6.243274688720703, 6.4720892906188965, 6.700904369354248, 6.929718971252441, 7.158533573150635, 7.387348175048828, 7.61616325378418, 7.844977855682373, 8.073793411254883, 8.302608489990234, 8.53142261505127, 8.760237693786621, 8.989052772521973, 9.217866897583008, 9.44668197631836, 9.675497055053711, 9.904311180114746, 10.133126258850098, 10.361940383911133, 10.590755462646484, 10.819570541381836, 11.048384666442871, 11.277199745178223, 11.506014823913574, 11.73482894897461]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 7.0, 6.0, 5.0, 9.0, 17.0, 13.0, 12.0, 14.0, 22.0, 23.0, 31.0, 31.0, 22.0, 27.0, 40.0, 44.0, 37.0, 46.0, 42.0, 37.0, 47.0, 55.0, 38.0, 40.0, 40.0, 39.0, 34.0, 27.0, 37.0, 22.0, 28.0, 10.0, 13.0, 15.0, 11.0, 13.0, 7.0, 11.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.6813184022903442, -1.628021240234375, -1.5747239589691162, -1.521426796913147, -1.4681295156478882, -1.414832353591919, -1.3615350723266602, -1.308237910270691, -1.2549407482147217, -1.2016435861587524, -1.1483463048934937, -1.0950491428375244, -1.0417518615722656, -0.9884546995162964, -0.9351574778556824, -0.8818602561950684, -0.8285629749298096, -0.7752657532691956, -0.7219685316085815, -0.6686713695526123, -0.6153740882873535, -0.5620769262313843, -0.5087797045707703, -0.45548248291015625, -0.40218526124954224, -0.3488880395889282, -0.2955908179283142, -0.24229362607002258, -0.18899640440940857, -0.13569918274879456, -0.08240199089050293, -0.029104769229888916, 0.02419257164001465, 0.07748978585004807, 0.13078700006008148, 0.1840842068195343, 0.23738142848014832, 0.29067865014076233, 0.34397584199905396, 0.39727306365966797, 0.450570285320282, 0.503867506980896, 0.55716472864151, 0.610461950302124, 0.6637591123580933, 0.717056393623352, 0.7703535556793213, 0.8236507773399353, 0.8769479990005493, 0.9302452206611633, 0.9835424423217773, 1.0368396043777466, 1.0901368856430054, 1.1434340476989746, 1.1967313289642334, 1.2500284910202026, 1.3033256530761719, 1.3566228151321411, 1.4099200963974, 1.4632172584533691, 1.516514539718628, 1.5698117017745972, 1.6231088638305664, 1.6764061450958252, 1.729703426361084]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 9.0, 6.0, 10.0, 12.0, 23.0, 24.0, 45.0, 65.0, 126.0, 196.0, 607.0, 6010.0, 4161903.0, 23406.0, 1089.0, 363.0, 146.0, 98.0, 44.0, 34.0, 20.0, 12.0, 10.0, 4.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53662109375, -0.5185165405273438, -0.5004119873046875, -0.48230743408203125, -0.464202880859375, -0.44609832763671875, -0.4279937744140625, -0.40988922119140625, -0.39178466796875, -0.37368011474609375, -0.3555755615234375, -0.33747100830078125, -0.319366455078125, -0.30126190185546875, -0.2831573486328125, -0.26505279541015625, -0.2469482421875, -0.22884368896484375, -0.2107391357421875, -0.19263458251953125, -0.174530029296875, -0.15642547607421875, -0.1383209228515625, -0.12021636962890625, -0.10211181640625, -0.08400726318359375, -0.0659027099609375, -0.04779815673828125, -0.029693603515625, -0.01158905029296875, 0.0065155029296875, 0.02462005615234375, 0.042724609375, 0.06082916259765625, 0.0789337158203125, 0.09703826904296875, 0.115142822265625, 0.13324737548828125, 0.1513519287109375, 0.16945648193359375, 0.18756103515625, 0.20566558837890625, 0.2237701416015625, 0.24187469482421875, 0.259979248046875, 0.27808380126953125, 0.2961883544921875, 0.31429290771484375, 0.3323974609375, 0.35050201416015625, 0.3686065673828125, 0.38671112060546875, 0.404815673828125, 0.42292022705078125, 0.4410247802734375, 0.45912933349609375, 0.47723388671875, 0.49533843994140625, 0.5134429931640625, 0.5315475463867188, 0.549652099609375, 0.5677566528320312, 0.5858612060546875, 0.6039657592773438, 0.6220703125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 3.0, 5.0, 5.0, 4.0, 15.0, 18.0, 22.0, 47.0, 166.0, 277.0, 236.0, 104.0, 31.0, 16.0, 10.0, 7.0, 13.0, 6.0, 6.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1314697265625, -0.1267242431640625, -0.121978759765625, -0.1172332763671875, -0.11248779296875, -0.1077423095703125, -0.102996826171875, -0.0982513427734375, -0.093505859375, -0.0887603759765625, -0.084014892578125, -0.0792694091796875, -0.07452392578125, -0.0697784423828125, -0.065032958984375, -0.0602874755859375, -0.0555419921875, -0.0507965087890625, -0.046051025390625, -0.0413055419921875, -0.03656005859375, -0.0318145751953125, -0.027069091796875, -0.0223236083984375, -0.017578125, -0.0128326416015625, -0.008087158203125, -0.0033416748046875, 0.00140380859375, 0.0061492919921875, 0.010894775390625, 0.0156402587890625, 0.0203857421875, 0.0251312255859375, 0.029876708984375, 0.0346221923828125, 0.03936767578125, 0.0441131591796875, 0.048858642578125, 0.0536041259765625, 0.058349609375, 0.0630950927734375, 0.067840576171875, 0.0725860595703125, 0.07733154296875, 0.0820770263671875, 0.086822509765625, 0.0915679931640625, 0.0963134765625, 0.1010589599609375, 0.105804443359375, 0.1105499267578125, 0.11529541015625, 0.1200408935546875, 0.124786376953125, 0.1295318603515625, 0.13427734375, 0.1390228271484375, 0.143768310546875, 0.1485137939453125, 0.15325927734375, 0.1580047607421875, 0.162750244140625, 0.1674957275390625, 0.1722412109375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 9.0, 25.0, 38.0, 88.0, 200.0, 692.0, 4064.0, 76753.0, 4062328.0, 46317.0, 2920.0, 496.0, 173.0, 79.0, 28.0, 17.0, 6.0, 10.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22607421875, -0.21718978881835938, -0.20830535888671875, -0.19942092895507812, -0.1905364990234375, -0.18165206909179688, -0.17276763916015625, -0.16388320922851562, -0.154998779296875, -0.14611434936523438, -0.13722991943359375, -0.12834548950195312, -0.1194610595703125, -0.11057662963867188, -0.10169219970703125, -0.09280776977539062, -0.08392333984375, -0.07503890991210938, -0.06615447998046875, -0.057270050048828125, -0.0483856201171875, -0.039501190185546875, -0.03061676025390625, -0.021732330322265625, -0.012847900390625, -0.003963470458984375, 0.00492095947265625, 0.013805389404296875, 0.0226898193359375, 0.031574249267578125, 0.04045867919921875, 0.049343109130859375, 0.0582275390625, 0.06711196899414062, 0.07599639892578125, 0.08488082885742188, 0.0937652587890625, 0.10264968872070312, 0.11153411865234375, 0.12041854858398438, 0.129302978515625, 0.13818740844726562, 0.14707183837890625, 0.15595626831054688, 0.1648406982421875, 0.17372512817382812, 0.18260955810546875, 0.19149398803710938, 0.20037841796875, 0.20926284790039062, 0.21814727783203125, 0.22703170776367188, 0.2359161376953125, 0.24480056762695312, 0.25368499755859375, 0.2625694274902344, 0.271453857421875, 0.2803382873535156, 0.28922271728515625, 0.2981071472167969, 0.3069915771484375, 0.3158760070800781, 0.32476043701171875, 0.3336448669433594, 0.342529296875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 9.0, 14.0, 19.0, 40.0, 56.0, 158.0, 368.0, 2099.0, 872.0, 242.0, 100.0, 44.0, 19.0, 9.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08087158203125, -0.07873249053955078, -0.07659339904785156, -0.07445430755615234, -0.07231521606445312, -0.0701761245727539, -0.06803703308105469, -0.06589794158935547, -0.06375885009765625, -0.06161975860595703, -0.05948066711425781, -0.057341575622558594, -0.055202484130859375, -0.053063392639160156, -0.05092430114746094, -0.04878520965576172, -0.0466461181640625, -0.04450702667236328, -0.04236793518066406, -0.040228843688964844, -0.038089752197265625, -0.035950660705566406, -0.03381156921386719, -0.03167247772216797, -0.02953338623046875, -0.02739429473876953, -0.025255203247070312, -0.023116111755371094, -0.020977020263671875, -0.018837928771972656, -0.016698837280273438, -0.014559745788574219, -0.012420654296875, -0.010281562805175781, -0.008142471313476562, -0.006003379821777344, -0.003864288330078125, -0.0017251968383789062, 0.0004138946533203125, 0.0025529861450195312, 0.00469207763671875, 0.006831169128417969, 0.008970260620117188, 0.011109352111816406, 0.013248443603515625, 0.015387535095214844, 0.017526626586914062, 0.01966571807861328, 0.0218048095703125, 0.02394390106201172, 0.026082992553710938, 0.028222084045410156, 0.030361175537109375, 0.032500267028808594, 0.03463935852050781, 0.03677845001220703, 0.03891754150390625, 0.04105663299560547, 0.04319572448730469, 0.045334815979003906, 0.047473907470703125, 0.049612998962402344, 0.05175209045410156, 0.05389118194580078, 0.0560302734375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 10.0, 29.0, 200.0, 512.0, 223.0, 25.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48881155252456665, -0.47044065594673157, -0.4520697593688965, -0.433698832988739, -0.41532793641090393, -0.39695703983306885, -0.3785861134529114, -0.3602152168750763, -0.3418443202972412, -0.32347342371940613, -0.30510252714157104, -0.2867316007614136, -0.2683607041835785, -0.2499898076057434, -0.23161889612674713, -0.21324798464775085, -0.19487708806991577, -0.1765061914920807, -0.1581352800130844, -0.13976436853408813, -0.12139347195625305, -0.10302256792783737, -0.08465166389942169, -0.06628075242042542, -0.04790985584259033, -0.029538951814174652, -0.011168047785758972, 0.007202856242656708, 0.025573760271072388, 0.04394466429948807, 0.06231556832790375, 0.08068647980690002, 0.09905737638473511, 0.11742828041315079, 0.13579918444156647, 0.15417009592056274, 0.17254099249839783, 0.1909118890762329, 0.2092828005552292, 0.22765371203422546, 0.24602460861206055, 0.26439550518989563, 0.2827664017677307, 0.3011373281478882, 0.31950822472572327, 0.33787912130355835, 0.3562500476837158, 0.3746209442615509, 0.392991840839386, 0.41136273741722107, 0.42973363399505615, 0.4481045603752136, 0.4664754569530487, 0.4848463535308838, 0.5032172799110413, 0.5215882062911987, 0.5399590730667114, 0.5583299994468689, 0.5767008662223816, 0.5950717926025391, 0.6134426593780518, 0.6318135857582092, 0.6501845121383667, 0.6685553789138794, 0.6869263052940369]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 10.0, 18.0, 14.0, 19.0, 16.0, 27.0, 28.0, 37.0, 32.0, 32.0, 42.0, 41.0, 32.0, 49.0, 54.0, 46.0, 52.0, 49.0, 35.0, 42.0, 32.0, 35.0, 32.0, 40.0, 16.0, 29.0, 24.0, 13.0, 13.0, 20.0, 9.0, 13.0, 14.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.13406014442443848, -0.12983031570911407, -0.12560047209262848, -0.12137063592672348, -0.11714079976081848, -0.11291097104549408, -0.10868113487958908, -0.10445129871368408, -0.10022146254777908, -0.09599162638187408, -0.09176179021596909, -0.08753195405006409, -0.08330212533473969, -0.07907228171825409, -0.07484245300292969, -0.07061261683702469, -0.06638278067111969, -0.06215294450521469, -0.05792310833930969, -0.05369327589869499, -0.04946343973278999, -0.045233603566884995, -0.041003771126270294, -0.036773934960365295, -0.0325440987944603, -0.028314262628555298, -0.02408442832529545, -0.0198545940220356, -0.0156247578561306, -0.011394921690225601, -0.007165087386965752, -0.002935253083705902, 0.0012945830821990967, 0.005524418316781521, 0.009754253551363945, 0.01398408878594637, 0.018213924020528793, 0.022443760186433792, 0.02667359448969364, 0.03090342879295349, 0.03513326495885849, 0.03936310112476349, 0.04359293729066849, 0.04782276973128319, 0.05205260589718819, 0.056282442063093185, 0.060512274503707886, 0.06474211066961288, 0.06897194683551788, 0.07320178300142288, 0.07743161916732788, 0.08166145533323288, 0.08589129149913788, 0.09012112021446228, 0.09435095638036728, 0.09858079254627228, 0.10281062871217728, 0.10704046487808228, 0.11127030104398727, 0.11550013720989227, 0.11972996592521667, 0.12395980954170227, 0.12818963825702667, 0.13241946697235107, 0.13664931058883667]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 13.0, 15.0, 21.0, 41.0, 39.0, 68.0, 130.0, 206.0, 456.0, 996.0, 2410.0, 7187.0, 33949.0, 661382.0, 311137.0, 21532.0, 5384.0, 1955.0, 797.0, 359.0, 175.0, 93.0, 69.0, 50.0, 27.0, 19.0, 11.0, 7.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.253662109375, -0.24570465087890625, -0.2377471923828125, -0.22978973388671875, -0.221832275390625, -0.21387481689453125, -0.2059173583984375, -0.19795989990234375, -0.19000244140625, -0.18204498291015625, -0.1740875244140625, -0.16613006591796875, -0.158172607421875, -0.15021514892578125, -0.1422576904296875, -0.13430023193359375, -0.1263427734375, -0.11838531494140625, -0.1104278564453125, -0.10247039794921875, -0.094512939453125, -0.08655548095703125, -0.0785980224609375, -0.07064056396484375, -0.06268310546875, -0.05472564697265625, -0.0467681884765625, -0.03881072998046875, -0.030853271484375, -0.02289581298828125, -0.0149383544921875, -0.00698089599609375, 0.0009765625, 0.00893402099609375, 0.0168914794921875, 0.02484893798828125, 0.032806396484375, 0.04076385498046875, 0.0487213134765625, 0.05667877197265625, 0.06463623046875, 0.07259368896484375, 0.0805511474609375, 0.08850860595703125, 0.096466064453125, 0.10442352294921875, 0.1123809814453125, 0.12033843994140625, 0.1282958984375, 0.13625335693359375, 0.1442108154296875, 0.15216827392578125, 0.160125732421875, 0.16808319091796875, 0.1760406494140625, 0.18399810791015625, 0.19195556640625, 0.19991302490234375, 0.2078704833984375, 0.21582794189453125, 0.223785400390625, 0.23174285888671875, 0.2397003173828125, 0.24765777587890625, 0.255615234375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 3.0, 5.0, 6.0, 8.0, 13.0, 18.0, 22.0, 65.0, 189.0, 273.0, 223.0, 85.0, 23.0, 17.0, 12.0, 9.0, 10.0, 4.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12939453125, -0.12469482421875, -0.1199951171875, -0.11529541015625, -0.110595703125, -0.10589599609375, -0.1011962890625, -0.09649658203125, -0.091796875, -0.08709716796875, -0.0823974609375, -0.07769775390625, -0.072998046875, -0.06829833984375, -0.0635986328125, -0.05889892578125, -0.05419921875, -0.04949951171875, -0.0447998046875, -0.04010009765625, -0.035400390625, -0.03070068359375, -0.0260009765625, -0.02130126953125, -0.0166015625, -0.01190185546875, -0.0072021484375, -0.00250244140625, 0.002197265625, 0.00689697265625, 0.0115966796875, 0.01629638671875, 0.02099609375, 0.02569580078125, 0.0303955078125, 0.03509521484375, 0.039794921875, 0.04449462890625, 0.0491943359375, 0.05389404296875, 0.05859375, 0.06329345703125, 0.0679931640625, 0.07269287109375, 0.077392578125, 0.08209228515625, 0.0867919921875, 0.09149169921875, 0.09619140625, 0.10089111328125, 0.1055908203125, 0.11029052734375, 0.114990234375, 0.11968994140625, 0.1243896484375, 0.12908935546875, 0.1337890625, 0.13848876953125, 0.1431884765625, 0.14788818359375, 0.152587890625, 0.15728759765625, 0.1619873046875, 0.16668701171875, 0.17138671875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 6.0, 14.0, 6.0, 11.0, 14.0, 22.0, 20.0, 20.0, 28.0, 32.0, 55.0, 48.0, 64.0, 81.0, 88.0, 166.0, 179.0, 339.0, 517.0, 1112.0, 3158.0, 20822.0, 591249.0, 409450.0, 15675.0, 2702.0, 997.0, 506.0, 318.0, 193.0, 112.0, 100.0, 86.0, 57.0, 63.0, 53.0, 37.0, 29.0, 25.0, 25.0, 25.0, 11.0, 10.0, 9.0, 7.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.283203125, -0.27460479736328125, -0.2660064697265625, -0.25740814208984375, -0.248809814453125, -0.24021148681640625, -0.2316131591796875, -0.22301483154296875, -0.21441650390625, -0.20581817626953125, -0.1972198486328125, -0.18862152099609375, -0.180023193359375, -0.17142486572265625, -0.1628265380859375, -0.15422821044921875, -0.1456298828125, -0.13703155517578125, -0.1284332275390625, -0.11983489990234375, -0.111236572265625, -0.10263824462890625, -0.0940399169921875, -0.08544158935546875, -0.07684326171875, -0.06824493408203125, -0.0596466064453125, -0.05104827880859375, -0.042449951171875, -0.03385162353515625, -0.0252532958984375, -0.01665496826171875, -0.008056640625, 0.00054168701171875, 0.0091400146484375, 0.01773834228515625, 0.026336669921875, 0.03493499755859375, 0.0435333251953125, 0.05213165283203125, 0.06072998046875, 0.06932830810546875, 0.0779266357421875, 0.08652496337890625, 0.095123291015625, 0.10372161865234375, 0.1123199462890625, 0.12091827392578125, 0.1295166015625, 0.13811492919921875, 0.1467132568359375, 0.15531158447265625, 0.163909912109375, 0.17250823974609375, 0.1811065673828125, 0.18970489501953125, 0.19830322265625, 0.20690155029296875, 0.2154998779296875, 0.22409820556640625, 0.232696533203125, 0.24129486083984375, 0.2498931884765625, 0.25849151611328125, 0.26708984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 5.0, 15.0, 17.0, 14.0, 13.0, 13.0, 21.0, 18.0, 25.0, 25.0, 33.0, 42.0, 40.0, 42.0, 40.0, 48.0, 42.0, 34.0, 51.0, 49.0, 47.0, 49.0, 39.0, 32.0, 23.0, 32.0, 30.0, 24.0, 27.0, 24.0, 14.0, 14.0, 12.0, 9.0, 10.0, 6.0, 2.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.326416015625, -0.31809425354003906, -0.3097724914550781, -0.3014507293701172, -0.29312896728515625, -0.2848072052001953, -0.2764854431152344, -0.26816368103027344, -0.2598419189453125, -0.25152015686035156, -0.24319839477539062, -0.2348766326904297, -0.22655487060546875, -0.2182331085205078, -0.20991134643554688, -0.20158958435058594, -0.193267822265625, -0.18494606018066406, -0.17662429809570312, -0.1683025360107422, -0.15998077392578125, -0.1516590118408203, -0.14333724975585938, -0.13501548767089844, -0.1266937255859375, -0.11837196350097656, -0.11005020141601562, -0.10172843933105469, -0.09340667724609375, -0.08508491516113281, -0.07676315307617188, -0.06844139099121094, -0.06011962890625, -0.05179786682128906, -0.043476104736328125, -0.03515434265136719, -0.02683258056640625, -0.018510818481445312, -0.010189056396484375, -0.0018672943115234375, 0.0064544677734375, 0.014776229858398438, 0.023097991943359375, 0.03141975402832031, 0.03974151611328125, 0.04806327819824219, 0.056385040283203125, 0.06470680236816406, 0.073028564453125, 0.08135032653808594, 0.08967208862304688, 0.09799385070800781, 0.10631561279296875, 0.11463737487792969, 0.12295913696289062, 0.13128089904785156, 0.1396026611328125, 0.14792442321777344, 0.15624618530273438, 0.1645679473876953, 0.17288970947265625, 0.1812114715576172, 0.18953323364257812, 0.19785499572753906, 0.2061767578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 2.0, 4.0, 11.0, 10.0, 12.0, 17.0, 23.0, 30.0, 37.0, 67.0, 106.0, 122.0, 243.0, 551.0, 1307.0, 3582.0, 14247.0, 169160.0, 811649.0, 36368.0, 7079.0, 2132.0, 859.0, 410.0, 201.0, 121.0, 67.0, 43.0, 23.0, 18.0, 18.0, 13.0, 6.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08673095703125, -0.08386421203613281, -0.08099746704101562, -0.07813072204589844, -0.07526397705078125, -0.07239723205566406, -0.06953048706054688, -0.06666374206542969, -0.0637969970703125, -0.06093025207519531, -0.058063507080078125, -0.05519676208496094, -0.05233001708984375, -0.04946327209472656, -0.046596527099609375, -0.04372978210449219, -0.040863037109375, -0.03799629211425781, -0.035129547119140625, -0.03226280212402344, -0.02939605712890625, -0.026529312133789062, -0.023662567138671875, -0.020795822143554688, -0.0179290771484375, -0.015062332153320312, -0.012195587158203125, -0.009328842163085938, -0.00646209716796875, -0.0035953521728515625, -0.000728607177734375, 0.0021381378173828125, 0.0050048828125, 0.007871627807617188, 0.010738372802734375, 0.013605117797851562, 0.01647186279296875, 0.019338607788085938, 0.022205352783203125, 0.025072097778320312, 0.0279388427734375, 0.030805587768554688, 0.033672332763671875, 0.03653907775878906, 0.03940582275390625, 0.04227256774902344, 0.045139312744140625, 0.04800605773925781, 0.050872802734375, 0.05373954772949219, 0.056606292724609375, 0.05947303771972656, 0.06233978271484375, 0.06520652770996094, 0.06807327270507812, 0.07094001770019531, 0.0738067626953125, 0.07667350769042969, 0.07954025268554688, 0.08240699768066406, 0.08527374267578125, 0.08814048767089844, 0.09100723266601562, 0.09387397766113281, 0.09674072265625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 9.0, 5.0, 8.0, 15.0, 38.0, 76.0, 129.0, 257.0, 190.0, 136.0, 56.0, 30.0, 11.0, 9.0, 14.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6808509826660156e-05, -1.6130506992340088e-05, -1.545250415802002e-05, -1.4774501323699951e-05, -1.4096498489379883e-05, -1.3418495655059814e-05, -1.2740492820739746e-05, -1.2062489986419678e-05, -1.138448715209961e-05, -1.0706484317779541e-05, -1.0028481483459473e-05, -9.350478649139404e-06, -8.672475814819336e-06, -7.994472980499268e-06, -7.316470146179199e-06, -6.638467311859131e-06, -5.9604644775390625e-06, -5.282461643218994e-06, -4.604458808898926e-06, -3.926455974578857e-06, -3.248453140258789e-06, -2.5704503059387207e-06, -1.8924474716186523e-06, -1.214444637298584e-06, -5.364418029785156e-07, 1.4156103134155273e-07, 8.195638656616211e-07, 1.4975666999816895e-06, 2.175569534301758e-06, 2.853572368621826e-06, 3.5315752029418945e-06, 4.209578037261963e-06, 4.887580871582031e-06, 5.5655837059021e-06, 6.243586540222168e-06, 6.921589374542236e-06, 7.599592208862305e-06, 8.277595043182373e-06, 8.955597877502441e-06, 9.63360071182251e-06, 1.0311603546142578e-05, 1.0989606380462646e-05, 1.1667609214782715e-05, 1.2345612049102783e-05, 1.3023614883422852e-05, 1.370161771774292e-05, 1.4379620552062988e-05, 1.5057623386383057e-05, 1.5735626220703125e-05, 1.6413629055023193e-05, 1.7091631889343262e-05, 1.776963472366333e-05, 1.84476375579834e-05, 1.9125640392303467e-05, 1.9803643226623535e-05, 2.0481646060943604e-05, 2.1159648895263672e-05, 2.183765172958374e-05, 2.251565456390381e-05, 2.3193657398223877e-05, 2.3871660232543945e-05, 2.4549663066864014e-05, 2.5227665901184082e-05, 2.590566873550415e-05, 2.658367156982422e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 9.0, 5.0, 4.0, 7.0, 11.0, 7.0, 14.0, 14.0, 13.0, 18.0, 29.0, 48.0, 64.0, 123.0, 204.0, 324.0, 632.0, 1488.0, 4218.0, 16477.0, 310267.0, 682828.0, 23062.0, 5095.0, 1861.0, 765.0, 360.0, 214.0, 125.0, 83.0, 49.0, 38.0, 22.0, 12.0, 15.0, 12.0, 14.0, 2.0, 6.0, 3.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.123291015625, -0.1196746826171875, -0.116058349609375, -0.1124420166015625, -0.10882568359375, -0.1052093505859375, -0.101593017578125, -0.0979766845703125, -0.0943603515625, -0.0907440185546875, -0.087127685546875, -0.0835113525390625, -0.07989501953125, -0.0762786865234375, -0.072662353515625, -0.0690460205078125, -0.0654296875, -0.0618133544921875, -0.058197021484375, -0.0545806884765625, -0.05096435546875, -0.0473480224609375, -0.043731689453125, -0.0401153564453125, -0.0364990234375, -0.0328826904296875, -0.029266357421875, -0.0256500244140625, -0.02203369140625, -0.0184173583984375, -0.014801025390625, -0.0111846923828125, -0.007568359375, -0.0039520263671875, -0.000335693359375, 0.0032806396484375, 0.00689697265625, 0.0105133056640625, 0.014129638671875, 0.0177459716796875, 0.0213623046875, 0.0249786376953125, 0.028594970703125, 0.0322113037109375, 0.03582763671875, 0.0394439697265625, 0.043060302734375, 0.0466766357421875, 0.05029296875, 0.0539093017578125, 0.057525634765625, 0.0611419677734375, 0.06475830078125, 0.0683746337890625, 0.071990966796875, 0.0756072998046875, 0.0792236328125, 0.0828399658203125, 0.086456298828125, 0.0900726318359375, 0.09368896484375, 0.0973052978515625, 0.100921630859375, 0.1045379638671875, 0.108154296875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 3.0, 2.0, 4.0, 7.0, 9.0, 15.0, 24.0, 33.0, 52.0, 100.0, 146.0, 170.0, 138.0, 100.0, 66.0, 44.0, 24.0, 17.0, 13.0, 7.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11541748046875, -0.11208629608154297, -0.10875511169433594, -0.1054239273071289, -0.10209274291992188, -0.09876155853271484, -0.09543037414550781, -0.09209918975830078, -0.08876800537109375, -0.08543682098388672, -0.08210563659667969, -0.07877445220947266, -0.07544326782226562, -0.0721120834350586, -0.06878089904785156, -0.06544971466064453, -0.0621185302734375, -0.05878734588623047, -0.05545616149902344, -0.052124977111816406, -0.048793792724609375, -0.045462608337402344, -0.04213142395019531, -0.03880023956298828, -0.03546905517578125, -0.03213787078857422, -0.028806686401367188, -0.025475502014160156, -0.022144317626953125, -0.018813133239746094, -0.015481948852539062, -0.012150764465332031, -0.008819580078125, -0.005488395690917969, -0.0021572113037109375, 0.0011739730834960938, 0.004505157470703125, 0.007836341857910156, 0.011167526245117188, 0.014498710632324219, 0.01782989501953125, 0.02116107940673828, 0.024492263793945312, 0.027823448181152344, 0.031154632568359375, 0.034485816955566406, 0.03781700134277344, 0.04114818572998047, 0.0444793701171875, 0.04781055450439453, 0.05114173889160156, 0.054472923278808594, 0.057804107666015625, 0.061135292053222656, 0.06446647644042969, 0.06779766082763672, 0.07112884521484375, 0.07446002960205078, 0.07779121398925781, 0.08112239837646484, 0.08445358276367188, 0.0877847671508789, 0.09111595153808594, 0.09444713592529297, 0.0977783203125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 5.0, 24.0, 674.0, 285.0, 17.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9732828736305237, -0.8057948350906372, -0.6383068561553955, -0.47081881761550903, -0.30333077907562256, -0.13584274053573608, 0.031645238399505615, 0.19913333654403687, 0.36662131547927856, 0.534109354019165, 0.7015973329544067, 0.8690853714942932, 1.0365734100341797, 1.204061508178711, 1.371549367904663, 1.5390374660491943, 1.7065255641937256, 1.8740135431289673, 2.041501522064209, 2.2089896202087402, 2.3764777183532715, 2.5439658164978027, 2.711453676223755, 2.878941774368286, 3.0464296340942383, 3.2139177322387695, 3.3814055919647217, 3.548893690109253, 3.716381788253784, 3.8838696479797363, 4.051357746124268, 4.218845844268799, 4.38633394241333, 4.553822040557861, 4.721310138702393, 4.888797760009766, 5.056285858154297, 5.223773956298828, 5.391262054443359, 5.558750152587891, 5.726238250732422, 5.893726348876953, 6.061214447021484, 6.228702545166016, 6.396190166473389, 6.56367826461792, 6.731166362762451, 6.898654460906982, 7.0661420822143555, 7.233630180358887, 7.401118278503418, 7.568606376647949, 7.736093997955322, 7.9035820960998535, 8.071069717407227, 8.238557815551758, 8.406046867370605, 8.573534965515137, 8.741023063659668, 8.9085111618042, 9.07599925994873, 9.243487358093262, 9.410974502563477, 9.578462600708008, 9.745950698852539]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 5.0, 8.0, 7.0, 8.0, 11.0, 14.0, 15.0, 20.0, 22.0, 18.0, 15.0, 37.0, 34.0, 29.0, 42.0, 33.0, 50.0, 45.0, 45.0, 49.0, 35.0, 45.0, 43.0, 42.0, 43.0, 33.0, 35.0, 34.0, 26.0, 23.0, 20.0, 19.0, 19.0, 19.0, 12.0, 8.0, 9.0, 6.0, 3.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.5177534818649292, -1.4698368310928345, -1.4219202995300293, -1.3740036487579346, -1.3260871171951294, -1.2781704664230347, -1.2302539348602295, -1.1823372840881348, -1.1344207525253296, -1.0865041017532349, -1.0385875701904297, -0.9906709790229797, -0.9427543878555298, -0.8948377966880798, -0.8469212055206299, -0.7990045547485352, -0.7510879635810852, -0.7031713724136353, -0.6552547812461853, -0.6073381900787354, -0.5594215989112854, -0.5115050077438354, -0.4635883867740631, -0.41567179560661316, -0.3677552044391632, -0.31983861327171326, -0.2719220221042633, -0.22400541603565216, -0.1760888248682022, -0.12817223370075226, -0.08025562763214111, -0.03233903646469116, 0.015577554702758789, 0.06349414587020874, 0.11141074448823929, 0.15932734310626984, 0.2072439342737198, 0.25516051054000854, 0.3030771315097809, 0.35099372267723083, 0.3989103138446808, 0.44682690501213074, 0.4947434961795807, 0.542660117149353, 0.590576708316803, 0.6384932994842529, 0.6864098906517029, 0.7343264818191528, 0.7822430729866028, 0.8301596641540527, 0.8780762553215027, 0.9259928464889526, 0.9739094376564026, 1.0218260288238525, 1.0697426795959473, 1.1176592111587524, 1.1655758619308472, 1.213492512702942, 1.261409044265747, 1.3093256950378418, 1.357242226600647, 1.4051588773727417, 1.4530754089355469, 1.5009920597076416, 1.5489085912704468]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 4.0, 2.0, 10.0, 11.0, 6.0, 27.0, 34.0, 41.0, 76.0, 136.0, 299.0, 753.0, 3385.0, 122140.0, 4049103.0, 15699.0, 1534.0, 522.0, 242.0, 114.0, 54.0, 29.0, 18.0, 13.0, 10.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.320068359375, -0.30913543701171875, -0.2982025146484375, -0.28726959228515625, -0.276336669921875, -0.26540374755859375, -0.2544708251953125, -0.24353790283203125, -0.23260498046875, -0.22167205810546875, -0.2107391357421875, -0.19980621337890625, -0.188873291015625, -0.17794036865234375, -0.1670074462890625, -0.15607452392578125, -0.1451416015625, -0.13420867919921875, -0.1232757568359375, -0.11234283447265625, -0.101409912109375, -0.09047698974609375, -0.0795440673828125, -0.06861114501953125, -0.05767822265625, -0.04674530029296875, -0.0358123779296875, -0.02487945556640625, -0.013946533203125, -0.00301361083984375, 0.0079193115234375, 0.01885223388671875, 0.02978515625, 0.04071807861328125, 0.0516510009765625, 0.06258392333984375, 0.073516845703125, 0.08444976806640625, 0.0953826904296875, 0.10631561279296875, 0.11724853515625, 0.12818145751953125, 0.1391143798828125, 0.15004730224609375, 0.160980224609375, 0.17191314697265625, 0.1828460693359375, 0.19377899169921875, 0.2047119140625, 0.21564483642578125, 0.2265777587890625, 0.23751068115234375, 0.248443603515625, 0.25937652587890625, 0.2703094482421875, 0.28124237060546875, 0.29217529296875, 0.30310821533203125, 0.3140411376953125, 0.32497406005859375, 0.335906982421875, 0.34683990478515625, 0.3577728271484375, 0.36870574951171875, 0.379638671875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 6.0, 20.0, 20.0, 49.0, 153.0, 248.0, 249.0, 118.0, 45.0, 22.0, 12.0, 11.0, 7.0, 9.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1304931640625, -0.1258087158203125, -0.121124267578125, -0.1164398193359375, -0.11175537109375, -0.1070709228515625, -0.102386474609375, -0.0977020263671875, -0.093017578125, -0.0883331298828125, -0.083648681640625, -0.0789642333984375, -0.07427978515625, -0.0695953369140625, -0.064910888671875, -0.0602264404296875, -0.0555419921875, -0.0508575439453125, -0.046173095703125, -0.0414886474609375, -0.03680419921875, -0.0321197509765625, -0.027435302734375, -0.0227508544921875, -0.01806640625, -0.0133819580078125, -0.008697509765625, -0.0040130615234375, 0.00067138671875, 0.0053558349609375, 0.010040283203125, 0.0147247314453125, 0.0194091796875, 0.0240936279296875, 0.028778076171875, 0.0334625244140625, 0.03814697265625, 0.0428314208984375, 0.047515869140625, 0.0522003173828125, 0.056884765625, 0.0615692138671875, 0.066253662109375, 0.0709381103515625, 0.07562255859375, 0.0803070068359375, 0.084991455078125, 0.0896759033203125, 0.0943603515625, 0.0990447998046875, 0.103729248046875, 0.1084136962890625, 0.11309814453125, 0.1177825927734375, 0.122467041015625, 0.1271514892578125, 0.1318359375, 0.1365203857421875, 0.141204833984375, 0.1458892822265625, 0.15057373046875, 0.1552581787109375, 0.159942626953125, 0.1646270751953125, 0.1693115234375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 10.0, 11.0, 21.0, 69.0, 158.0, 838.0, 12915.0, 4163371.0, 15687.0, 904.0, 163.0, 69.0, 29.0, 12.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50341796875, -0.4857635498046875, -0.468109130859375, -0.4504547119140625, -0.43280029296875, -0.4151458740234375, -0.397491455078125, -0.3798370361328125, -0.3621826171875, -0.3445281982421875, -0.326873779296875, -0.3092193603515625, -0.29156494140625, -0.2739105224609375, -0.256256103515625, -0.2386016845703125, -0.220947265625, -0.2032928466796875, -0.185638427734375, -0.1679840087890625, -0.15032958984375, -0.1326751708984375, -0.115020751953125, -0.0973663330078125, -0.0797119140625, -0.0620574951171875, -0.044403076171875, -0.0267486572265625, -0.00909423828125, 0.0085601806640625, 0.026214599609375, 0.0438690185546875, 0.0615234375, 0.0791778564453125, 0.096832275390625, 0.1144866943359375, 0.13214111328125, 0.1497955322265625, 0.167449951171875, 0.1851043701171875, 0.2027587890625, 0.2204132080078125, 0.238067626953125, 0.2557220458984375, 0.27337646484375, 0.2910308837890625, 0.308685302734375, 0.3263397216796875, 0.343994140625, 0.3616485595703125, 0.379302978515625, 0.3969573974609375, 0.41461181640625, 0.4322662353515625, 0.449920654296875, 0.4675750732421875, 0.4852294921875, 0.5028839111328125, 0.520538330078125, 0.5381927490234375, 0.55584716796875, 0.5735015869140625, 0.591156005859375, 0.6088104248046875, 0.62646484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 11.0, 23.0, 55.0, 314.0, 1911.0, 1375.0, 271.0, 66.0, 21.0, 14.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2156982421875, -0.2101573944091797, -0.20461654663085938, -0.19907569885253906, -0.19353485107421875, -0.18799400329589844, -0.18245315551757812, -0.1769123077392578, -0.1713714599609375, -0.1658306121826172, -0.16028976440429688, -0.15474891662597656, -0.14920806884765625, -0.14366722106933594, -0.13812637329101562, -0.1325855255126953, -0.127044677734375, -0.12150382995605469, -0.11596298217773438, -0.11042213439941406, -0.10488128662109375, -0.09934043884277344, -0.09379959106445312, -0.08825874328613281, -0.0827178955078125, -0.07717704772949219, -0.07163619995117188, -0.06609535217285156, -0.06055450439453125, -0.05501365661621094, -0.049472808837890625, -0.04393196105957031, -0.03839111328125, -0.03285026550292969, -0.027309417724609375, -0.021768569946289062, -0.01622772216796875, -0.010686874389648438, -0.005146026611328125, 0.0003948211669921875, 0.0059356689453125, 0.011476516723632812, 0.017017364501953125, 0.022558212280273438, 0.02809906005859375, 0.03363990783691406, 0.039180755615234375, 0.04472160339355469, 0.050262451171875, 0.05580329895019531, 0.061344146728515625, 0.06688499450683594, 0.07242584228515625, 0.07796669006347656, 0.08350753784179688, 0.08904838562011719, 0.0945892333984375, 0.10013008117675781, 0.10567092895507812, 0.11121177673339844, 0.11675262451171875, 0.12229347229003906, 0.12783432006835938, 0.1333751678466797, 0.138916015625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 87.0, 535.0, 344.0, 30.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.327150583267212, -1.2938041687011719, -1.2604578733444214, -1.2271114587783813, -1.1937651634216309, -1.1604187488555908, -1.1270723342895508, -1.0937260389328003, -1.0603796243667603, -1.0270332098007202, -0.9936869144439697, -0.9603404998779297, -0.9269941449165344, -0.8936477899551392, -0.8603013753890991, -0.8269550204277039, -0.7936086654663086, -0.7602623105049133, -0.7269159555435181, -0.693569540977478, -0.6602231860160828, -0.6268768310546875, -0.5935304164886475, -0.5601840615272522, -0.5268377065658569, -0.49349135160446167, -0.460144966840744, -0.42679858207702637, -0.3934522271156311, -0.36010587215423584, -0.3267594873905182, -0.29341310262680054, -0.2600668668746948, -0.22672049701213837, -0.1933741271495819, -0.16002775728702545, -0.126681387424469, -0.09333501756191254, -0.05998864769935608, -0.02664227783679962, 0.006704092025756836, 0.04005046188831329, 0.07339683175086975, 0.10674320161342621, 0.14008957147598267, 0.17343594133853912, 0.20678231120109558, 0.24012868106365204, 0.2734750509262085, 0.30682140588760376, 0.3401677906513214, 0.37351417541503906, 0.4068605303764343, 0.4402068853378296, 0.47355327010154724, 0.5068996548652649, 0.5402460098266602, 0.5735923647880554, 0.6069387197494507, 0.6402851343154907, 0.673631489276886, 0.7069778442382812, 0.7403242588043213, 0.7736706137657166, 0.8070169687271118]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 16.0, 19.0, 23.0, 27.0, 40.0, 44.0, 57.0, 65.0, 85.0, 86.0, 87.0, 81.0, 70.0, 70.0, 54.0, 50.0, 37.0, 35.0, 16.0, 23.0, 9.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3746042847633362, -0.3614467680454254, -0.34828925132751465, -0.3351317346096039, -0.3219742178916931, -0.30881667137145996, -0.2956591844558716, -0.2825016379356384, -0.26934412121772766, -0.2561866044998169, -0.24302908778190613, -0.22987157106399536, -0.2167140394449234, -0.20355652272701263, -0.19039900600910187, -0.1772414743900299, -0.16408397257328033, -0.15092645585536957, -0.1377689391374588, -0.12461141496896744, -0.11145389080047607, -0.09829637408256531, -0.08513885736465454, -0.07198133319616318, -0.05882381647825241, -0.045666296035051346, -0.03250877559185028, -0.019351258873939514, -0.006193738430738449, 0.006963782012462616, 0.020121298730373383, 0.033278822898864746, 0.04643633961677551, 0.05959386005997658, 0.07275138050317764, 0.08590889722108841, 0.09906642138957977, 0.11222393810749054, 0.1253814548254013, 0.13853898644447327, 0.15169650316238403, 0.1648540198802948, 0.17801153659820557, 0.19116905331611633, 0.2043265849351883, 0.21748410165309906, 0.23064161837100983, 0.2437991499900818, 0.25695663690567017, 0.27011415362358093, 0.2832716703414917, 0.29642918705940247, 0.30958670377731323, 0.3227442502975464, 0.33590173721313477, 0.3490592837333679, 0.3622168004512787, 0.37537431716918945, 0.3885318338871002, 0.401689350605011, 0.41484686732292175, 0.4280043840408325, 0.4411619305610657, 0.45431944727897644, 0.4674769639968872]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 8.0, 14.0, 16.0, 12.0, 20.0, 28.0, 33.0, 49.0, 50.0, 95.0, 124.0, 203.0, 346.0, 533.0, 963.0, 1852.0, 3677.0, 8785.0, 29467.0, 200742.0, 675228.0, 95510.0, 17939.0, 6506.0, 2758.0, 1416.0, 786.0, 476.0, 282.0, 183.0, 129.0, 90.0, 64.0, 43.0, 37.0, 22.0, 13.0, 9.0, 11.0, 7.0, 6.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.16259765625, -0.15771865844726562, -0.15283966064453125, -0.14796066284179688, -0.1430816650390625, -0.13820266723632812, -0.13332366943359375, -0.12844467163085938, -0.123565673828125, -0.11868667602539062, -0.11380767822265625, -0.10892868041992188, -0.1040496826171875, -0.09917068481445312, -0.09429168701171875, -0.08941268920898438, -0.08453369140625, -0.07965469360351562, -0.07477569580078125, -0.06989669799804688, -0.0650177001953125, -0.060138702392578125, -0.05525970458984375, -0.050380706787109375, -0.045501708984375, -0.040622711181640625, -0.03574371337890625, -0.030864715576171875, -0.0259857177734375, -0.021106719970703125, -0.01622772216796875, -0.011348724365234375, -0.0064697265625, -0.001590728759765625, 0.00328826904296875, 0.008167266845703125, 0.0130462646484375, 0.017925262451171875, 0.02280426025390625, 0.027683258056640625, 0.032562255859375, 0.037441253662109375, 0.04232025146484375, 0.047199249267578125, 0.0520782470703125, 0.056957244873046875, 0.06183624267578125, 0.06671524047851562, 0.07159423828125, 0.07647323608398438, 0.08135223388671875, 0.08623123168945312, 0.0911102294921875, 0.09598922729492188, 0.10086822509765625, 0.10574722290039062, 0.110626220703125, 0.11550521850585938, 0.12038421630859375, 0.12526321411132812, 0.1301422119140625, 0.13502120971679688, 0.13990020751953125, 0.14477920532226562, 0.149658203125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 3.0, 9.0, 9.0, 6.0, 18.0, 21.0, 63.0, 160.0, 252.0, 236.0, 114.0, 38.0, 20.0, 14.0, 7.0, 6.0, 10.0, 8.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1259765625, -0.12143516540527344, -0.11689376831054688, -0.11235237121582031, -0.10781097412109375, -0.10326957702636719, -0.09872817993164062, -0.09418678283691406, -0.0896453857421875, -0.08510398864746094, -0.08056259155273438, -0.07602119445800781, -0.07147979736328125, -0.06693840026855469, -0.062397003173828125, -0.05785560607910156, -0.053314208984375, -0.04877281188964844, -0.044231414794921875, -0.03969001770019531, -0.03514862060546875, -0.030607223510742188, -0.026065826416015625, -0.021524429321289062, -0.0169830322265625, -0.012441635131835938, -0.007900238037109375, -0.0033588409423828125, 0.00118255615234375, 0.0057239532470703125, 0.010265350341796875, 0.014806747436523438, 0.01934814453125, 0.023889541625976562, 0.028430938720703125, 0.03297233581542969, 0.03751373291015625, 0.04205513000488281, 0.046596527099609375, 0.05113792419433594, 0.0556793212890625, 0.06022071838378906, 0.06476211547851562, 0.06930351257324219, 0.07384490966796875, 0.07838630676269531, 0.08292770385742188, 0.08746910095214844, 0.092010498046875, 0.09655189514160156, 0.10109329223632812, 0.10563468933105469, 0.11017608642578125, 0.11471748352050781, 0.11925888061523438, 0.12380027770996094, 0.1283416748046875, 0.13288307189941406, 0.13742446899414062, 0.1419658660888672, 0.14650726318359375, 0.1510486602783203, 0.15559005737304688, 0.16013145446777344, 0.1646728515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 4.0, 7.0, 5.0, 8.0, 10.0, 16.0, 14.0, 18.0, 37.0, 25.0, 35.0, 47.0, 54.0, 76.0, 90.0, 114.0, 173.0, 236.0, 384.0, 802.0, 2247.0, 17118.0, 546279.0, 462386.0, 14203.0, 2022.0, 792.0, 397.0, 235.0, 170.0, 122.0, 87.0, 62.0, 57.0, 44.0, 42.0, 24.0, 18.0, 31.0, 15.0, 11.0, 15.0, 10.0, 5.0, 1.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.25927734375, -0.25141334533691406, -0.24354934692382812, -0.2356853485107422, -0.22782135009765625, -0.2199573516845703, -0.21209335327148438, -0.20422935485839844, -0.1963653564453125, -0.18850135803222656, -0.18063735961914062, -0.1727733612060547, -0.16490936279296875, -0.1570453643798828, -0.14918136596679688, -0.14131736755371094, -0.133453369140625, -0.12558937072753906, -0.11772537231445312, -0.10986137390136719, -0.10199737548828125, -0.09413337707519531, -0.08626937866210938, -0.07840538024902344, -0.0705413818359375, -0.06267738342285156, -0.054813385009765625, -0.04694938659667969, -0.03908538818359375, -0.031221389770507812, -0.023357391357421875, -0.015493392944335938, -0.00762939453125, 0.0002346038818359375, 0.008098602294921875, 0.015962600708007812, 0.02382659912109375, 0.03169059753417969, 0.039554595947265625, 0.04741859436035156, 0.0552825927734375, 0.06314659118652344, 0.07101058959960938, 0.07887458801269531, 0.08673858642578125, 0.09460258483886719, 0.10246658325195312, 0.11033058166503906, 0.118194580078125, 0.12605857849121094, 0.13392257690429688, 0.1417865753173828, 0.14965057373046875, 0.1575145721435547, 0.16537857055664062, 0.17324256896972656, 0.1811065673828125, 0.18897056579589844, 0.19683456420898438, 0.2046985626220703, 0.21256256103515625, 0.2204265594482422, 0.22829055786132812, 0.23615455627441406, 0.2440185546875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 4.0, 9.0, 8.0, 4.0, 9.0, 13.0, 12.0, 20.0, 29.0, 25.0, 15.0, 43.0, 33.0, 32.0, 28.0, 40.0, 40.0, 35.0, 54.0, 46.0, 40.0, 36.0, 29.0, 36.0, 37.0, 30.0, 37.0, 25.0, 35.0, 21.0, 23.0, 19.0, 23.0, 18.0, 10.0, 10.0, 10.0, 11.0, 9.0, 12.0, 3.0, 6.0, 2.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.232421875, -0.22567176818847656, -0.21892166137695312, -0.2121715545654297, -0.20542144775390625, -0.1986713409423828, -0.19192123413085938, -0.18517112731933594, -0.1784210205078125, -0.17167091369628906, -0.16492080688476562, -0.1581707000732422, -0.15142059326171875, -0.1446704864501953, -0.13792037963867188, -0.13117027282714844, -0.124420166015625, -0.11767005920410156, -0.11091995239257812, -0.10416984558105469, -0.09741973876953125, -0.09066963195800781, -0.08391952514648438, -0.07716941833496094, -0.0704193115234375, -0.06366920471191406, -0.056919097900390625, -0.05016899108886719, -0.04341888427734375, -0.03666877746582031, -0.029918670654296875, -0.023168563842773438, -0.01641845703125, -0.009668350219726562, -0.002918243408203125, 0.0038318634033203125, 0.01058197021484375, 0.017332077026367188, 0.024082183837890625, 0.030832290649414062, 0.0375823974609375, 0.04433250427246094, 0.051082611083984375, 0.05783271789550781, 0.06458282470703125, 0.07133293151855469, 0.07808303833007812, 0.08483314514160156, 0.091583251953125, 0.09833335876464844, 0.10508346557617188, 0.11183357238769531, 0.11858367919921875, 0.1253337860107422, 0.13208389282226562, 0.13883399963378906, 0.1455841064453125, 0.15233421325683594, 0.15908432006835938, 0.1658344268798828, 0.17258453369140625, 0.1793346405029297, 0.18608474731445312, 0.19283485412597656, 0.1995849609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 5.0, 3.0, 9.0, 14.0, 16.0, 36.0, 42.0, 72.0, 158.0, 273.0, 570.0, 1483.0, 5102.0, 26812.0, 298745.0, 661540.0, 43229.0, 7081.0, 1912.0, 712.0, 312.0, 181.0, 96.0, 46.0, 33.0, 24.0, 21.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0753173828125, -0.0730428695678711, -0.07076835632324219, -0.06849384307861328, -0.06621932983398438, -0.06394481658935547, -0.06167030334472656, -0.059395790100097656, -0.05712127685546875, -0.054846763610839844, -0.05257225036621094, -0.05029773712158203, -0.048023223876953125, -0.04574871063232422, -0.04347419738769531, -0.041199684143066406, -0.0389251708984375, -0.036650657653808594, -0.03437614440917969, -0.03210163116455078, -0.029827117919921875, -0.02755260467529297, -0.025278091430664062, -0.023003578186035156, -0.02072906494140625, -0.018454551696777344, -0.016180038452148438, -0.013905525207519531, -0.011631011962890625, -0.009356498718261719, -0.0070819854736328125, -0.004807472229003906, -0.002532958984375, -0.00025844573974609375, 0.0020160675048828125, 0.004290580749511719, 0.006565093994140625, 0.008839607238769531, 0.011114120483398438, 0.013388633728027344, 0.01566314697265625, 0.017937660217285156, 0.020212173461914062, 0.02248668670654297, 0.024761199951171875, 0.02703571319580078, 0.029310226440429688, 0.031584739685058594, 0.0338592529296875, 0.036133766174316406, 0.03840827941894531, 0.04068279266357422, 0.042957305908203125, 0.04523181915283203, 0.04750633239746094, 0.049780845642089844, 0.05205535888671875, 0.054329872131347656, 0.05660438537597656, 0.05887889862060547, 0.061153411865234375, 0.06342792510986328, 0.06570243835449219, 0.0679769515991211, 0.07025146484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 10.0, 7.0, 18.0, 12.0, 24.0, 23.0, 33.0, 50.0, 59.0, 91.0, 127.0, 121.0, 110.0, 96.0, 47.0, 51.0, 20.0, 18.0, 18.0, 9.0, 13.0, 7.0, 12.0, 5.0, 2.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.52346420288086e-06, -8.184462785720825e-06, -7.845461368560791e-06, -7.506459951400757e-06, -7.167458534240723e-06, -6.8284571170806885e-06, -6.489455699920654e-06, -6.15045428276062e-06, -5.811452865600586e-06, -5.472451448440552e-06, -5.133450031280518e-06, -4.794448614120483e-06, -4.455447196960449e-06, -4.116445779800415e-06, -3.777444362640381e-06, -3.4384429454803467e-06, -3.0994415283203125e-06, -2.7604401111602783e-06, -2.421438694000244e-06, -2.08243727684021e-06, -1.7434358596801758e-06, -1.4044344425201416e-06, -1.0654330253601074e-06, -7.264316082000732e-07, -3.8743019104003906e-07, -4.842877388000488e-08, 2.905726432800293e-07, 6.295740604400635e-07, 9.685754776000977e-07, 1.3075768947601318e-06, 1.646578311920166e-06, 1.9855797290802e-06, 2.3245811462402344e-06, 2.6635825634002686e-06, 3.0025839805603027e-06, 3.341585397720337e-06, 3.680586814880371e-06, 4.019588232040405e-06, 4.3585896492004395e-06, 4.697591066360474e-06, 5.036592483520508e-06, 5.375593900680542e-06, 5.714595317840576e-06, 6.05359673500061e-06, 6.3925981521606445e-06, 6.731599569320679e-06, 7.070600986480713e-06, 7.409602403640747e-06, 7.748603820800781e-06, 8.087605237960815e-06, 8.42660665512085e-06, 8.765608072280884e-06, 9.104609489440918e-06, 9.443610906600952e-06, 9.782612323760986e-06, 1.012161374092102e-05, 1.0460615158081055e-05, 1.0799616575241089e-05, 1.1138617992401123e-05, 1.1477619409561157e-05, 1.1816620826721191e-05, 1.2155622243881226e-05, 1.249462366104126e-05, 1.2833625078201294e-05, 1.3172626495361328e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 8.0, 5.0, 6.0, 4.0, 10.0, 14.0, 24.0, 25.0, 31.0, 42.0, 85.0, 130.0, 201.0, 378.0, 741.0, 1581.0, 4577.0, 18520.0, 137943.0, 783431.0, 81452.0, 12993.0, 3561.0, 1303.0, 635.0, 305.0, 192.0, 111.0, 77.0, 44.0, 26.0, 24.0, 19.0, 15.0, 9.0, 5.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.0765380859375, -0.07431221008300781, -0.07208633422851562, -0.06986045837402344, -0.06763458251953125, -0.06540870666503906, -0.06318283081054688, -0.06095695495605469, -0.0587310791015625, -0.05650520324707031, -0.054279327392578125, -0.05205345153808594, -0.04982757568359375, -0.04760169982910156, -0.045375823974609375, -0.04314994812011719, -0.040924072265625, -0.03869819641113281, -0.036472320556640625, -0.03424644470214844, -0.03202056884765625, -0.029794692993164062, -0.027568817138671875, -0.025342941284179688, -0.0231170654296875, -0.020891189575195312, -0.018665313720703125, -0.016439437866210938, -0.01421356201171875, -0.011987686157226562, -0.009761810302734375, -0.0075359344482421875, -0.00531005859375, -0.0030841827392578125, -0.000858306884765625, 0.0013675689697265625, 0.00359344482421875, 0.0058193206787109375, 0.008045196533203125, 0.010271072387695312, 0.0124969482421875, 0.014722824096679688, 0.016948699951171875, 0.019174575805664062, 0.02140045166015625, 0.023626327514648438, 0.025852203369140625, 0.028078079223632812, 0.030303955078125, 0.03252983093261719, 0.034755706787109375, 0.03698158264160156, 0.03920745849609375, 0.04143333435058594, 0.043659210205078125, 0.04588508605957031, 0.0481109619140625, 0.05033683776855469, 0.052562713623046875, 0.05478858947753906, 0.05701446533203125, 0.05924034118652344, 0.061466217041015625, 0.06369209289550781, 0.06591796875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 7.0, 8.0, 16.0, 26.0, 31.0, 27.0, 53.0, 84.0, 126.0, 180.0, 144.0, 85.0, 63.0, 49.0, 22.0, 22.0, 9.0, 9.0, 6.0, 7.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.09649658203125, -0.09412670135498047, -0.09175682067871094, -0.0893869400024414, -0.08701705932617188, -0.08464717864990234, -0.08227729797363281, -0.07990741729736328, -0.07753753662109375, -0.07516765594482422, -0.07279777526855469, -0.07042789459228516, -0.06805801391601562, -0.0656881332397461, -0.06331825256347656, -0.06094837188720703, -0.0585784912109375, -0.05620861053466797, -0.05383872985839844, -0.051468849182128906, -0.049098968505859375, -0.046729087829589844, -0.04435920715332031, -0.04198932647705078, -0.03961944580078125, -0.03724956512451172, -0.03487968444824219, -0.032509803771972656, -0.030139923095703125, -0.027770042419433594, -0.025400161743164062, -0.02303028106689453, -0.020660400390625, -0.01829051971435547, -0.015920639038085938, -0.013550758361816406, -0.011180877685546875, -0.008810997009277344, -0.0064411163330078125, -0.004071235656738281, -0.00170135498046875, 0.0006685256958007812, 0.0030384063720703125, 0.005408287048339844, 0.007778167724609375, 0.010148048400878906, 0.012517929077148438, 0.014887809753417969, 0.0172576904296875, 0.01962757110595703, 0.021997451782226562, 0.024367332458496094, 0.026737213134765625, 0.029107093811035156, 0.03147697448730469, 0.03384685516357422, 0.03621673583984375, 0.03858661651611328, 0.04095649719238281, 0.043326377868652344, 0.045696258544921875, 0.048066139221191406, 0.05043601989746094, 0.05280590057373047, 0.05517578125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 7.0, 15.0, 53.0, 199.0, 403.0, 229.0, 67.0, 20.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1133036613464355, -1.0641229152679443, -1.0149421691894531, -0.9657613635063171, -0.9165806174278259, -0.8673998117446899, -0.8182190656661987, -0.7690383195877075, -0.7198575735092163, -0.6706768274307251, -0.6214960217475891, -0.5723152756690979, -0.5231345295906067, -0.4739537537097931, -0.4247729778289795, -0.3755922317504883, -0.3264114260673523, -0.2772306501865387, -0.22804990410804749, -0.1788691282272339, -0.12968836724758148, -0.08050760626792908, -0.03132683038711548, 0.017853915691375732, 0.06703469157218933, 0.11621545255184174, 0.16539621353149414, 0.21457698941230774, 0.26375776529312134, 0.31293851137161255, 0.36211928725242615, 0.41130003333091736, 0.46048080921173096, 0.5096615552902222, 0.5588423609733582, 0.6080231070518494, 0.6572038531303406, 0.7063846588134766, 0.7555654048919678, 0.804746150970459, 0.8539268970489502, 0.9031076431274414, 0.9522884488105774, 1.0014691352844238, 1.0506500005722046, 1.0998307466506958, 1.149011492729187, 1.1981922388076782, 1.247373104095459, 1.2965538501739502, 1.3457345962524414, 1.3949153423309326, 1.4440962076187134, 1.4932769536972046, 1.5424576997756958, 1.591638445854187, 1.6408191919326782, 1.6899999380111694, 1.7391806840896606, 1.7883615493774414, 1.8375422954559326, 1.8867230415344238, 1.935903787612915, 1.9850845336914062, 2.0342652797698975]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 2.0, 6.0, 4.0, 7.0, 7.0, 20.0, 21.0, 20.0, 26.0, 20.0, 29.0, 34.0, 45.0, 45.0, 48.0, 42.0, 50.0, 49.0, 63.0, 61.0, 51.0, 45.0, 49.0, 35.0, 36.0, 30.0, 27.0, 23.0, 15.0, 13.0, 17.0, 12.0, 4.0, 9.0, 9.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0], "bins": [-1.693314552307129, -1.6472734212875366, -1.6012322902679443, -1.5551912784576416, -1.5091501474380493, -1.463109016418457, -1.4170678853988647, -1.3710267543792725, -1.3249857425689697, -1.2789446115493774, -1.2329034805297852, -1.1868624687194824, -1.1408213376998901, -1.0947802066802979, -1.0487390756607056, -1.0026979446411133, -0.9566568732261658, -0.9106157422065735, -0.864574670791626, -0.8185335397720337, -0.7724924683570862, -0.7264513373374939, -0.6804102659225464, -0.6343691349029541, -0.5883280038833618, -0.5422868728637695, -0.496245801448822, -0.45020467042922974, -0.4041635990142822, -0.35812246799468994, -0.31208136677742004, -0.26604026556015015, -0.21999919414520264, -0.17395809292793274, -0.12791699171066284, -0.08187587559223175, -0.03583477437496185, 0.010206326842308044, 0.056247442960739136, 0.10228854417800903, 0.14832964539527893, 0.19437074661254883, 0.24041184782981873, 0.2864529490470886, 0.3324940800666809, 0.3785351514816284, 0.4245762825012207, 0.4706173837184906, 0.5166584849357605, 0.5626996159553528, 0.6087406873703003, 0.6547818183898926, 0.7008228898048401, 0.7468640208244324, 0.7929050922393799, 0.8389462232589722, 0.8849873542785645, 0.9310284852981567, 0.9770695567131042, 1.0231106281280518, 1.069151759147644, 1.1151928901672363, 1.1612340211868286, 1.207275152206421, 1.2533161640167236]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 8.0, 4.0, 12.0, 3.0, 7.0, 13.0, 26.0, 43.0, 34.0, 99.0, 175.0, 405.0, 1386.0, 9916.0, 3658255.0, 514460.0, 7524.0, 1116.0, 353.0, 177.0, 102.0, 63.0, 24.0, 29.0, 15.0, 15.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2286376953125, -0.22124671936035156, -0.21385574340820312, -0.2064647674560547, -0.19907379150390625, -0.1916828155517578, -0.18429183959960938, -0.17690086364746094, -0.1695098876953125, -0.16211891174316406, -0.15472793579101562, -0.1473369598388672, -0.13994598388671875, -0.1325550079345703, -0.12516403198242188, -0.11777305603027344, -0.110382080078125, -0.10299110412597656, -0.09560012817382812, -0.08820915222167969, -0.08081817626953125, -0.07342720031738281, -0.06603622436523438, -0.05864524841308594, -0.0512542724609375, -0.04386329650878906, -0.036472320556640625, -0.029081344604492188, -0.02169036865234375, -0.014299392700195312, -0.006908416748046875, 0.0004825592041015625, 0.00787353515625, 0.015264511108398438, 0.022655487060546875, 0.030046463012695312, 0.03743743896484375, 0.04482841491699219, 0.052219390869140625, 0.05961036682128906, 0.0670013427734375, 0.07439231872558594, 0.08178329467773438, 0.08917427062988281, 0.09656524658203125, 0.10395622253417969, 0.11134719848632812, 0.11873817443847656, 0.126129150390625, 0.13352012634277344, 0.14091110229492188, 0.1483020782470703, 0.15569305419921875, 0.1630840301513672, 0.17047500610351562, 0.17786598205566406, 0.1852569580078125, 0.19264793395996094, 0.20003890991210938, 0.2074298858642578, 0.21482086181640625, 0.2222118377685547, 0.22960281372070312, 0.23699378967285156, 0.244384765625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 1.0, 8.0, 7.0, 9.0, 11.0, 16.0, 36.0, 107.0, 190.0, 273.0, 189.0, 61.0, 36.0, 15.0, 12.0, 6.0, 10.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.128662109375, -0.12412071228027344, -0.11957931518554688, -0.11503791809082031, -0.11049652099609375, -0.10595512390136719, -0.10141372680664062, -0.09687232971191406, -0.0923309326171875, -0.08778953552246094, -0.08324813842773438, -0.07870674133300781, -0.07416534423828125, -0.06962394714355469, -0.06508255004882812, -0.06054115295410156, -0.055999755859375, -0.05145835876464844, -0.046916961669921875, -0.04237556457519531, -0.03783416748046875, -0.03329277038574219, -0.028751373291015625, -0.024209976196289062, -0.0196685791015625, -0.015127182006835938, -0.010585784912109375, -0.0060443878173828125, -0.00150299072265625, 0.0030384063720703125, 0.007579803466796875, 0.012121200561523438, 0.01666259765625, 0.021203994750976562, 0.025745391845703125, 0.030286788940429688, 0.03482818603515625, 0.03936958312988281, 0.043910980224609375, 0.04845237731933594, 0.0529937744140625, 0.05753517150878906, 0.062076568603515625, 0.06661796569824219, 0.07115936279296875, 0.07570075988769531, 0.08024215698242188, 0.08478355407714844, 0.089324951171875, 0.09386634826660156, 0.09840774536132812, 0.10294914245605469, 0.10749053955078125, 0.11203193664550781, 0.11657333374023438, 0.12111473083496094, 0.1256561279296875, 0.13019752502441406, 0.13473892211914062, 0.1392803192138672, 0.14382171630859375, 0.1483631134033203, 0.15290451049804688, 0.15744590759277344, 0.1619873046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 9.0, 44.0, 70.0, 264.0, 1790.0, 32927.0, 4076474.0, 79475.0, 2649.0, 389.0, 105.0, 41.0, 14.0, 10.0, 6.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29638671875, -0.2882881164550781, -0.28018951416015625, -0.2720909118652344, -0.2639923095703125, -0.2558937072753906, -0.24779510498046875, -0.23969650268554688, -0.231597900390625, -0.22349929809570312, -0.21540069580078125, -0.20730209350585938, -0.1992034912109375, -0.19110488891601562, -0.18300628662109375, -0.17490768432617188, -0.16680908203125, -0.15871047973632812, -0.15061187744140625, -0.14251327514648438, -0.1344146728515625, -0.12631607055664062, -0.11821746826171875, -0.11011886596679688, -0.102020263671875, -0.09392166137695312, -0.08582305908203125, -0.07772445678710938, -0.0696258544921875, -0.061527252197265625, -0.05342864990234375, -0.045330047607421875, -0.0372314453125, -0.029132843017578125, -0.02103424072265625, -0.012935638427734375, -0.0048370361328125, 0.003261566162109375, 0.01136016845703125, 0.019458770751953125, 0.027557373046875, 0.035655975341796875, 0.04375457763671875, 0.051853179931640625, 0.0599517822265625, 0.06805038452148438, 0.07614898681640625, 0.08424758911132812, 0.09234619140625, 0.10044479370117188, 0.10854339599609375, 0.11664199829101562, 0.1247406005859375, 0.13283920288085938, 0.14093780517578125, 0.14903640747070312, 0.157135009765625, 0.16523361206054688, 0.17333221435546875, 0.18143081665039062, 0.1895294189453125, 0.19762802124023438, 0.20572662353515625, 0.21382522583007812, 0.221923828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 17.0, 25.0, 44.0, 113.0, 335.0, 2317.0, 807.0, 254.0, 89.0, 37.0, 23.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0645751953125, -0.062073707580566406, -0.05957221984863281, -0.05707073211669922, -0.054569244384765625, -0.05206775665283203, -0.04956626892089844, -0.047064781188964844, -0.04456329345703125, -0.042061805725097656, -0.03956031799316406, -0.03705883026123047, -0.034557342529296875, -0.03205585479736328, -0.029554367065429688, -0.027052879333496094, -0.0245513916015625, -0.022049903869628906, -0.019548416137695312, -0.01704692840576172, -0.014545440673828125, -0.012043952941894531, -0.009542465209960938, -0.007040977478027344, -0.00453948974609375, -0.0020380020141601562, 0.0004634857177734375, 0.0029649734497070312, 0.005466461181640625, 0.007967948913574219, 0.010469436645507812, 0.012970924377441406, 0.015472412109375, 0.017973899841308594, 0.020475387573242188, 0.02297687530517578, 0.025478363037109375, 0.02797985076904297, 0.030481338500976562, 0.032982826232910156, 0.03548431396484375, 0.037985801696777344, 0.04048728942871094, 0.04298877716064453, 0.045490264892578125, 0.04799175262451172, 0.05049324035644531, 0.052994728088378906, 0.0554962158203125, 0.057997703552246094, 0.06049919128417969, 0.06300067901611328, 0.06550216674804688, 0.06800365447998047, 0.07050514221191406, 0.07300662994384766, 0.07550811767578125, 0.07800960540771484, 0.08051109313964844, 0.08301258087158203, 0.08551406860351562, 0.08801555633544922, 0.09051704406738281, 0.0930185317993164, 0.09552001953125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 5.0, 27.0, 85.0, 246.0, 412.0, 172.0, 43.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3954436182975769, -0.38095805048942566, -0.3664724826812744, -0.35198691487312317, -0.3375013470649719, -0.3230157792568207, -0.30853021144866943, -0.2940446734428406, -0.27955907583236694, -0.2650735080242157, -0.25058794021606445, -0.2361023724079132, -0.22161680459976196, -0.20713123679161072, -0.19264568388462067, -0.17816011607646942, -0.16367456316947937, -0.14918899536132812, -0.13470342755317688, -0.12021786719560623, -0.10573229938745499, -0.09124673157930374, -0.0767611712217331, -0.06227560341358185, -0.0477900356054306, -0.03330446779727936, -0.01881890371441841, -0.004333339631557465, 0.01015222817659378, 0.024637795984745026, 0.039123356342315674, 0.05360892415046692, 0.06809449195861816, 0.08258005976676941, 0.09706562757492065, 0.1115511879324913, 0.12603676319122314, 0.1405223309993744, 0.15500788390636444, 0.16949345171451569, 0.18397901952266693, 0.19846458733081818, 0.21295015513896942, 0.22743570804595947, 0.24192127585411072, 0.25640684366226196, 0.2708924114704132, 0.28537797927856445, 0.2998635470867157, 0.31434911489486694, 0.3288346827030182, 0.34332025051116943, 0.3578058183193207, 0.3722913861274719, 0.3867769241333008, 0.4012625217437744, 0.41574805974960327, 0.4302336275577545, 0.44471919536590576, 0.459204763174057, 0.47369033098220825, 0.4881758987903595, 0.5026614665985107, 0.5171470046043396, 0.5316326022148132]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 9.0, 11.0, 15.0, 18.0, 27.0, 30.0, 42.0, 49.0, 52.0, 52.0, 68.0, 58.0, 65.0, 73.0, 65.0, 65.0, 56.0, 39.0, 37.0, 33.0, 34.0, 21.0, 22.0, 17.0, 14.0, 7.0, 9.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1941661238670349, -0.18874065577983856, -0.1833151876926422, -0.17788971960544586, -0.1724642515182495, -0.16703878343105316, -0.1616133153438568, -0.15618786215782166, -0.1507623791694641, -0.14533691108226776, -0.1399114429950714, -0.13448597490787506, -0.1290605068206787, -0.12363503873348236, -0.11820957809686661, -0.11278411000967026, -0.1073586493730545, -0.10193318128585815, -0.0965077131986618, -0.09108224511146545, -0.0856567770242691, -0.08023130893707275, -0.074805848300457, -0.06938038021326065, -0.0639549121260643, -0.05852944403886795, -0.0531039759516716, -0.04767851158976555, -0.0422530435025692, -0.03682757541537285, -0.0314021110534668, -0.025976642966270447, -0.020551174879074097, -0.015125707723200321, -0.009700240567326546, -0.004274774342775345, 0.0011506937444210052, 0.006576161831617355, 0.012001626193523407, 0.017427094280719757, 0.022852562367916107, 0.028278030455112457, 0.03370349854230881, 0.03912896290421486, 0.04455443099141121, 0.04997989907860756, 0.05540536344051361, 0.06083083152770996, 0.06625629961490631, 0.07168176770210266, 0.07710723578929901, 0.08253270387649536, 0.08795817196369171, 0.09338364005088806, 0.09880910068750381, 0.10423456877470016, 0.10966003686189651, 0.11508550494909286, 0.12051097303628922, 0.12593643367290497, 0.13136190176010132, 0.13678736984729767, 0.14221283793449402, 0.14763830602169037, 0.15306377410888672]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 5.0, 8.0, 18.0, 18.0, 26.0, 39.0, 51.0, 58.0, 102.0, 124.0, 222.0, 319.0, 492.0, 866.0, 1784.0, 3880.0, 10240.0, 36888.0, 224650.0, 637680.0, 98311.0, 19938.0, 6523.0, 2866.0, 1402.0, 751.0, 404.0, 244.0, 201.0, 130.0, 90.0, 50.0, 45.0, 34.0, 27.0, 8.0, 15.0, 12.0, 10.0, 3.0, 2.0, 4.0, 4.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.1422119140625, -0.13829326629638672, -0.13437461853027344, -0.13045597076416016, -0.12653732299804688, -0.1226186752319336, -0.11870002746582031, -0.11478137969970703, -0.11086273193359375, -0.10694408416748047, -0.10302543640136719, -0.0991067886352539, -0.09518814086914062, -0.09126949310302734, -0.08735084533691406, -0.08343219757080078, -0.0795135498046875, -0.07559490203857422, -0.07167625427246094, -0.06775760650634766, -0.06383895874023438, -0.059920310974121094, -0.05600166320800781, -0.05208301544189453, -0.04816436767578125, -0.04424571990966797, -0.04032707214355469, -0.036408424377441406, -0.032489776611328125, -0.028571128845214844, -0.024652481079101562, -0.02073383331298828, -0.016815185546875, -0.012896537780761719, -0.008977890014648438, -0.005059242248535156, -0.001140594482421875, 0.0027780532836914062, 0.0066967010498046875, 0.010615348815917969, 0.01453399658203125, 0.01845264434814453, 0.022371292114257812, 0.026289939880371094, 0.030208587646484375, 0.034127235412597656, 0.03804588317871094, 0.04196453094482422, 0.0458831787109375, 0.04980182647705078, 0.05372047424316406, 0.057639122009277344, 0.061557769775390625, 0.0654764175415039, 0.06939506530761719, 0.07331371307373047, 0.07723236083984375, 0.08115100860595703, 0.08506965637207031, 0.0889883041381836, 0.09290695190429688, 0.09682559967041016, 0.10074424743652344, 0.10466289520263672, 0.10858154296875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 7.0, 10.0, 6.0, 11.0, 17.0, 27.0, 109.0, 182.0, 269.0, 189.0, 82.0, 33.0, 15.0, 11.0, 5.0, 12.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1287841796875, -0.12425041198730469, -0.11971664428710938, -0.11518287658691406, -0.11064910888671875, -0.10611534118652344, -0.10158157348632812, -0.09704780578613281, -0.0925140380859375, -0.08798027038574219, -0.08344650268554688, -0.07891273498535156, -0.07437896728515625, -0.06984519958496094, -0.06531143188476562, -0.06077766418457031, -0.056243896484375, -0.05171012878417969, -0.047176361083984375, -0.04264259338378906, -0.03810882568359375, -0.03357505798339844, -0.029041290283203125, -0.024507522583007812, -0.0199737548828125, -0.015439987182617188, -0.010906219482421875, -0.0063724517822265625, -0.00183868408203125, 0.0026950836181640625, 0.007228851318359375, 0.011762619018554688, 0.01629638671875, 0.020830154418945312, 0.025363922119140625, 0.029897689819335938, 0.03443145751953125, 0.03896522521972656, 0.043498992919921875, 0.04803276062011719, 0.0525665283203125, 0.05710029602050781, 0.061634063720703125, 0.06616783142089844, 0.07070159912109375, 0.07523536682128906, 0.07976913452148438, 0.08430290222167969, 0.088836669921875, 0.09337043762207031, 0.09790420532226562, 0.10243797302246094, 0.10697174072265625, 0.11150550842285156, 0.11603927612304688, 0.12057304382324219, 0.1251068115234375, 0.1296405792236328, 0.13417434692382812, 0.13870811462402344, 0.14324188232421875, 0.14777565002441406, 0.15230941772460938, 0.1568431854248047, 0.161376953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 5.0, 14.0, 10.0, 23.0, 20.0, 18.0, 32.0, 36.0, 44.0, 53.0, 71.0, 79.0, 89.0, 140.0, 192.0, 322.0, 566.0, 1243.0, 4248.0, 71258.0, 908901.0, 54485.0, 3846.0, 1163.0, 530.0, 298.0, 189.0, 122.0, 95.0, 95.0, 71.0, 53.0, 54.0, 30.0, 27.0, 31.0, 18.0, 16.0, 12.0, 12.0, 9.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.2607421875, -0.25295066833496094, -0.24515914916992188, -0.2373676300048828, -0.22957611083984375, -0.2217845916748047, -0.21399307250976562, -0.20620155334472656, -0.1984100341796875, -0.19061851501464844, -0.18282699584960938, -0.1750354766845703, -0.16724395751953125, -0.1594524383544922, -0.15166091918945312, -0.14386940002441406, -0.136077880859375, -0.12828636169433594, -0.12049484252929688, -0.11270332336425781, -0.10491180419921875, -0.09712028503417969, -0.08932876586914062, -0.08153724670410156, -0.0737457275390625, -0.06595420837402344, -0.058162689208984375, -0.05037117004394531, -0.04257965087890625, -0.03478813171386719, -0.026996612548828125, -0.019205093383789062, -0.01141357421875, -0.0036220550537109375, 0.004169464111328125, 0.011960983276367188, 0.01975250244140625, 0.027544021606445312, 0.035335540771484375, 0.04312705993652344, 0.0509185791015625, 0.05871009826660156, 0.06650161743164062, 0.07429313659667969, 0.08208465576171875, 0.08987617492675781, 0.09766769409179688, 0.10545921325683594, 0.113250732421875, 0.12104225158691406, 0.12883377075195312, 0.1366252899169922, 0.14441680908203125, 0.1522083282470703, 0.15999984741210938, 0.16779136657714844, 0.1755828857421875, 0.18337440490722656, 0.19116592407226562, 0.1989574432373047, 0.20674896240234375, 0.2145404815673828, 0.22233200073242188, 0.23012351989746094, 0.2379150390625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 7.0, 7.0, 7.0, 8.0, 8.0, 18.0, 15.0, 18.0, 11.0, 30.0, 22.0, 24.0, 28.0, 31.0, 37.0, 44.0, 35.0, 42.0, 39.0, 34.0, 44.0, 35.0, 45.0, 32.0, 36.0, 39.0, 38.0, 42.0, 24.0, 19.0, 24.0, 22.0, 29.0, 18.0, 15.0, 12.0, 11.0, 10.0, 9.0, 13.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.217529296875, -0.2109394073486328, -0.20434951782226562, -0.19775962829589844, -0.19116973876953125, -0.18457984924316406, -0.17798995971679688, -0.1714000701904297, -0.1648101806640625, -0.1582202911376953, -0.15163040161132812, -0.14504051208496094, -0.13845062255859375, -0.13186073303222656, -0.12527084350585938, -0.11868095397949219, -0.112091064453125, -0.10550117492675781, -0.09891128540039062, -0.09232139587402344, -0.08573150634765625, -0.07914161682128906, -0.07255172729492188, -0.06596183776855469, -0.0593719482421875, -0.05278205871582031, -0.046192169189453125, -0.03960227966308594, -0.03301239013671875, -0.026422500610351562, -0.019832611083984375, -0.013242721557617188, -0.00665283203125, -6.29425048828125e-05, 0.006526947021484375, 0.013116836547851562, 0.01970672607421875, 0.026296615600585938, 0.032886505126953125, 0.03947639465332031, 0.0460662841796875, 0.05265617370605469, 0.059246063232421875, 0.06583595275878906, 0.07242584228515625, 0.07901573181152344, 0.08560562133789062, 0.09219551086425781, 0.098785400390625, 0.10537528991699219, 0.11196517944335938, 0.11855506896972656, 0.12514495849609375, 0.13173484802246094, 0.13832473754882812, 0.1449146270751953, 0.1515045166015625, 0.1580944061279297, 0.16468429565429688, 0.17127418518066406, 0.17786407470703125, 0.18445396423339844, 0.19104385375976562, 0.1976337432861328, 0.2042236328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 18.0, 14.0, 17.0, 27.0, 59.0, 81.0, 115.0, 177.0, 327.0, 626.0, 1409.0, 3867.0, 12870.0, 64822.0, 675488.0, 246966.0, 29757.0, 7298.0, 2461.0, 998.0, 468.0, 257.0, 141.0, 91.0, 55.0, 31.0, 34.0, 19.0, 9.0, 7.0, 9.0, 5.0, 6.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.05230712890625, -0.050711631774902344, -0.04911613464355469, -0.04752063751220703, -0.045925140380859375, -0.04432964324951172, -0.04273414611816406, -0.041138648986816406, -0.03954315185546875, -0.037947654724121094, -0.03635215759277344, -0.03475666046142578, -0.033161163330078125, -0.03156566619873047, -0.029970169067382812, -0.028374671936035156, -0.0267791748046875, -0.025183677673339844, -0.023588180541992188, -0.02199268341064453, -0.020397186279296875, -0.01880168914794922, -0.017206192016601562, -0.015610694885253906, -0.01401519775390625, -0.012419700622558594, -0.010824203491210938, -0.009228706359863281, -0.007633209228515625, -0.006037712097167969, -0.0044422149658203125, -0.0028467178344726562, -0.001251220703125, 0.00034427642822265625, 0.0019397735595703125, 0.0035352706909179688, 0.005130767822265625, 0.006726264953613281, 0.008321762084960938, 0.009917259216308594, 0.01151275634765625, 0.013108253479003906, 0.014703750610351562, 0.01629924774169922, 0.017894744873046875, 0.01949024200439453, 0.021085739135742188, 0.022681236267089844, 0.0242767333984375, 0.025872230529785156, 0.027467727661132812, 0.02906322479248047, 0.030658721923828125, 0.03225421905517578, 0.03384971618652344, 0.035445213317871094, 0.03704071044921875, 0.038636207580566406, 0.04023170471191406, 0.04182720184326172, 0.043422698974609375, 0.04501819610595703, 0.04661369323730469, 0.048209190368652344, 0.0498046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 9.0, 9.0, 18.0, 22.0, 38.0, 92.0, 141.0, 214.0, 195.0, 113.0, 56.0, 31.0, 14.0, 17.0, 11.0, 3.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8835067749023438e-05, -1.8259510397911072e-05, -1.7683953046798706e-05, -1.710839569568634e-05, -1.6532838344573975e-05, -1.595728099346161e-05, -1.5381723642349243e-05, -1.4806166291236877e-05, -1.4230608940124512e-05, -1.3655051589012146e-05, -1.307949423789978e-05, -1.2503936886787415e-05, -1.1928379535675049e-05, -1.1352822184562683e-05, -1.0777264833450317e-05, -1.0201707482337952e-05, -9.626150131225586e-06, -9.05059278011322e-06, -8.475035429000854e-06, -7.899478077888489e-06, -7.323920726776123e-06, -6.748363375663757e-06, -6.172806024551392e-06, -5.597248673439026e-06, -5.02169132232666e-06, -4.4461339712142944e-06, -3.870576620101929e-06, -3.295019268989563e-06, -2.7194619178771973e-06, -2.1439045667648315e-06, -1.5683472156524658e-06, -9.927898645401e-07, -4.172325134277344e-07, 1.5832483768463135e-07, 7.338821887969971e-07, 1.3094395399093628e-06, 1.8849968910217285e-06, 2.4605542421340942e-06, 3.03611159324646e-06, 3.6116689443588257e-06, 4.187226295471191e-06, 4.762783646583557e-06, 5.338340997695923e-06, 5.9138983488082886e-06, 6.489455699920654e-06, 7.06501305103302e-06, 7.640570402145386e-06, 8.216127753257751e-06, 8.791685104370117e-06, 9.367242455482483e-06, 9.942799806594849e-06, 1.0518357157707214e-05, 1.109391450881958e-05, 1.1669471859931946e-05, 1.2245029211044312e-05, 1.2820586562156677e-05, 1.3396143913269043e-05, 1.3971701264381409e-05, 1.4547258615493774e-05, 1.512281596660614e-05, 1.5698373317718506e-05, 1.627393066883087e-05, 1.6849488019943237e-05, 1.7425045371055603e-05, 1.800060272216797e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 4.0, 4.0, 4.0, 8.0, 17.0, 26.0, 43.0, 61.0, 95.0, 201.0, 398.0, 1064.0, 3545.0, 21744.0, 551554.0, 444494.0, 19856.0, 3569.0, 1001.0, 412.0, 187.0, 101.0, 63.0, 31.0, 30.0, 15.0, 10.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0921630859375, -0.08945083618164062, -0.08673858642578125, -0.08402633666992188, -0.0813140869140625, -0.07860183715820312, -0.07588958740234375, -0.07317733764648438, -0.070465087890625, -0.06775283813476562, -0.06504058837890625, -0.062328338623046875, -0.0596160888671875, -0.056903839111328125, -0.05419158935546875, -0.051479339599609375, -0.04876708984375, -0.046054840087890625, -0.04334259033203125, -0.040630340576171875, -0.0379180908203125, -0.035205841064453125, -0.03249359130859375, -0.029781341552734375, -0.027069091796875, -0.024356842041015625, -0.02164459228515625, -0.018932342529296875, -0.0162200927734375, -0.013507843017578125, -0.01079559326171875, -0.008083343505859375, -0.00537109375, -0.002658843994140625, 5.340576171875e-05, 0.002765655517578125, 0.0054779052734375, 0.008190155029296875, 0.01090240478515625, 0.013614654541015625, 0.016326904296875, 0.019039154052734375, 0.02175140380859375, 0.024463653564453125, 0.0271759033203125, 0.029888153076171875, 0.03260040283203125, 0.035312652587890625, 0.03802490234375, 0.040737152099609375, 0.04344940185546875, 0.046161651611328125, 0.0488739013671875, 0.051586151123046875, 0.05429840087890625, 0.057010650634765625, 0.059722900390625, 0.062435150146484375, 0.06514739990234375, 0.06785964965820312, 0.0705718994140625, 0.07328414916992188, 0.07599639892578125, 0.07870864868164062, 0.0814208984375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 8.0, 10.0, 20.0, 21.0, 30.0, 49.0, 61.0, 92.0, 92.0, 95.0, 111.0, 97.0, 80.0, 58.0, 38.0, 28.0, 34.0, 17.0, 13.0, 8.0, 8.0, 9.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041748046875, -0.04001331329345703, -0.03827857971191406, -0.036543846130371094, -0.034809112548828125, -0.033074378967285156, -0.03133964538574219, -0.02960491180419922, -0.02787017822265625, -0.02613544464111328, -0.024400711059570312, -0.022665977478027344, -0.020931243896484375, -0.019196510314941406, -0.017461776733398438, -0.01572704315185547, -0.0139923095703125, -0.012257575988769531, -0.010522842407226562, -0.008788108825683594, -0.007053375244140625, -0.005318641662597656, -0.0035839080810546875, -0.0018491744995117188, -0.00011444091796875, 0.0016202926635742188, 0.0033550262451171875, 0.005089759826660156, 0.006824493408203125, 0.008559226989746094, 0.010293960571289062, 0.012028694152832031, 0.013763427734375, 0.015498161315917969, 0.017232894897460938, 0.018967628479003906, 0.020702362060546875, 0.022437095642089844, 0.024171829223632812, 0.02590656280517578, 0.02764129638671875, 0.02937602996826172, 0.031110763549804688, 0.032845497131347656, 0.034580230712890625, 0.036314964294433594, 0.03804969787597656, 0.03978443145751953, 0.0415191650390625, 0.04325389862060547, 0.04498863220214844, 0.046723365783691406, 0.048458099365234375, 0.050192832946777344, 0.05192756652832031, 0.05366230010986328, 0.05539703369140625, 0.05713176727294922, 0.05886650085449219, 0.060601234436035156, 0.062335968017578125, 0.0640707015991211, 0.06580543518066406, 0.06754016876220703, 0.06927490234375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 9.0, 32.0, 60.0, 141.0, 259.0, 264.0, 124.0, 57.0, 20.0, 10.0, 7.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8826207518577576, -0.8521865606307983, -0.8217523694038391, -0.7913181781768799, -0.7608839273452759, -0.7304497361183167, -0.7000155448913574, -0.6695813536643982, -0.639147162437439, -0.6087129712104797, -0.5782787799835205, -0.5478445291519165, -0.5174103379249573, -0.48697614669799805, -0.4565419554710388, -0.4261077642440796, -0.3956735134124756, -0.36523932218551636, -0.33480510115623474, -0.3043709099292755, -0.2739366888999939, -0.24350249767303467, -0.21306830644607544, -0.18263410031795502, -0.1521998941898346, -0.12176568806171417, -0.09133148938417435, -0.06089729070663452, -0.0304630845785141, -2.8878450393676758e-05, 0.030405312776565552, 0.060839518904685974, 0.09127366542816162, 0.12170787155628204, 0.15214207768440247, 0.1825762689113617, 0.21301047503948212, 0.24344468116760254, 0.27387887239456177, 0.304313063621521, 0.3347472846508026, 0.36518147587776184, 0.39561569690704346, 0.4260498881340027, 0.4564840793609619, 0.48691830039024353, 0.5173524618148804, 0.5477867126464844, 0.5782209038734436, 0.6086550951004028, 0.6390892863273621, 0.6695234775543213, 0.6999577283859253, 0.7303919196128845, 0.7608261108398438, 0.791260302066803, 0.8216944932937622, 0.8521286845207214, 0.8825628757476807, 0.9129971265792847, 0.9434313178062439, 0.9738655090332031, 1.0042996406555176, 1.0347338914871216, 1.0651681423187256]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 8.0, 3.0, 8.0, 9.0, 13.0, 13.0, 7.0, 17.0, 16.0, 19.0, 18.0, 25.0, 20.0, 27.0, 32.0, 38.0, 31.0, 60.0, 45.0, 42.0, 47.0, 40.0, 36.0, 40.0, 36.0, 36.0, 39.0, 27.0, 36.0, 23.0, 27.0, 26.0, 25.0, 23.0, 19.0, 13.0, 10.0, 9.0, 10.0, 7.0, 2.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.2642877101898193, -1.2248338460922241, -1.185379981994629, -1.1459261178970337, -1.1064722537994385, -1.0670185089111328, -1.0275646448135376, -0.9881107807159424, -0.9486569166183472, -0.909203052520752, -0.8697491884231567, -0.8302953839302063, -0.7908415198326111, -0.7513876557350159, -0.7119338512420654, -0.6724799871444702, -0.633026123046875, -0.5935722589492798, -0.5541183948516846, -0.5146645903587341, -0.4752107262611389, -0.4357568621635437, -0.3963030278682709, -0.35684919357299805, -0.31739532947540283, -0.2779414653778076, -0.2384876310825348, -0.19903378188610077, -0.15957993268966675, -0.12012608349323273, -0.0806722342967987, -0.04121840000152588, -0.0017644166946411133, 0.03768943250179291, 0.07714328169822693, 0.11659713089466095, 0.15605098009109497, 0.195504829287529, 0.234958678483963, 0.27441251277923584, 0.31386637687683105, 0.35332024097442627, 0.3927740752696991, 0.4322279095649719, 0.47168177366256714, 0.5111356377601624, 0.5505894422531128, 0.590043306350708, 0.6294971704483032, 0.6689510345458984, 0.7084048986434937, 0.7478587031364441, 0.7873125672340393, 0.8267664313316345, 0.866220235824585, 0.9056740999221802, 0.9451279640197754, 0.9845818281173706, 1.0240356922149658, 1.063489556312561, 1.1029434204101562, 1.142397165298462, 1.1818510293960571, 1.2213048934936523, 1.2607587575912476]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 1.0, 10.0, 11.0, 14.0, 6.0, 18.0, 32.0, 41.0, 105.0, 341.0, 4208.0, 4148399.0, 39851.0, 877.0, 174.0, 64.0, 37.0, 23.0, 21.0, 13.0, 8.0, 8.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.431884765625, -0.41782379150390625, -0.4037628173828125, -0.38970184326171875, -0.375640869140625, -0.36157989501953125, -0.3475189208984375, -0.33345794677734375, -0.31939697265625, -0.30533599853515625, -0.2912750244140625, -0.27721405029296875, -0.263153076171875, -0.24909210205078125, -0.2350311279296875, -0.22097015380859375, -0.2069091796875, -0.19284820556640625, -0.1787872314453125, -0.16472625732421875, -0.150665283203125, -0.13660430908203125, -0.1225433349609375, -0.10848236083984375, -0.09442138671875, -0.08036041259765625, -0.0662994384765625, -0.05223846435546875, -0.038177490234375, -0.02411651611328125, -0.0100555419921875, 0.00400543212890625, 0.01806640625, 0.03212738037109375, 0.0461883544921875, 0.06024932861328125, 0.074310302734375, 0.08837127685546875, 0.1024322509765625, 0.11649322509765625, 0.13055419921875, 0.14461517333984375, 0.1586761474609375, 0.17273712158203125, 0.186798095703125, 0.20085906982421875, 0.2149200439453125, 0.22898101806640625, 0.2430419921875, 0.25710296630859375, 0.2711639404296875, 0.28522491455078125, 0.299285888671875, 0.31334686279296875, 0.3274078369140625, 0.34146881103515625, 0.35552978515625, 0.36959075927734375, 0.3836517333984375, 0.39771270751953125, 0.411773681640625, 0.42583465576171875, 0.4398956298828125, 0.45395660400390625, 0.468017578125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 1.0, 1.0, 4.0, 5.0, 15.0, 11.0, 13.0, 30.0, 96.0, 187.0, 260.0, 201.0, 84.0, 30.0, 23.0, 11.0, 8.0, 10.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1290283203125, -0.12449836730957031, -0.11996841430664062, -0.11543846130371094, -0.11090850830078125, -0.10637855529785156, -0.10184860229492188, -0.09731864929199219, -0.0927886962890625, -0.08825874328613281, -0.08372879028320312, -0.07919883728027344, -0.07466888427734375, -0.07013893127441406, -0.06560897827148438, -0.06107902526855469, -0.056549072265625, -0.05201911926269531, -0.047489166259765625, -0.04295921325683594, -0.03842926025390625, -0.03389930725097656, -0.029369354248046875, -0.024839401245117188, -0.0203094482421875, -0.015779495239257812, -0.011249542236328125, -0.0067195892333984375, -0.00218963623046875, 0.0023403167724609375, 0.006870269775390625, 0.011400222778320312, 0.01593017578125, 0.020460128784179688, 0.024990081787109375, 0.029520034790039062, 0.03404998779296875, 0.03857994079589844, 0.043109893798828125, 0.04763984680175781, 0.0521697998046875, 0.05669975280761719, 0.061229705810546875, 0.06575965881347656, 0.07028961181640625, 0.07481956481933594, 0.07934951782226562, 0.08387947082519531, 0.088409423828125, 0.09293937683105469, 0.09746932983398438, 0.10199928283691406, 0.10652923583984375, 0.11105918884277344, 0.11558914184570312, 0.12011909484863281, 0.1246490478515625, 0.1291790008544922, 0.13370895385742188, 0.13823890686035156, 0.14276885986328125, 0.14729881286621094, 0.15182876586914062, 0.1563587188720703, 0.160888671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 10.0, 10.0, 18.0, 41.0, 63.0, 89.0, 203.0, 404.0, 895.0, 1931.0, 5915.0, 25661.0, 194190.0, 3628444.0, 291037.0, 33834.0, 7209.0, 2417.0, 947.0, 456.0, 221.0, 109.0, 57.0, 32.0, 24.0, 14.0, 10.0, 8.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.10223388671875, -0.09943866729736328, -0.09664344787597656, -0.09384822845458984, -0.09105300903320312, -0.0882577896118164, -0.08546257019042969, -0.08266735076904297, -0.07987213134765625, -0.07707691192626953, -0.07428169250488281, -0.0714864730834961, -0.06869125366210938, -0.06589603424072266, -0.06310081481933594, -0.06030559539794922, -0.0575103759765625, -0.05471515655517578, -0.05191993713378906, -0.049124717712402344, -0.046329498291015625, -0.043534278869628906, -0.04073905944824219, -0.03794384002685547, -0.03514862060546875, -0.03235340118408203, -0.029558181762695312, -0.026762962341308594, -0.023967742919921875, -0.021172523498535156, -0.018377304077148438, -0.015582084655761719, -0.012786865234375, -0.009991645812988281, -0.0071964263916015625, -0.004401206970214844, -0.001605987548828125, 0.0011892318725585938, 0.0039844512939453125, 0.006779670715332031, 0.00957489013671875, 0.012370109558105469, 0.015165328979492188, 0.017960548400878906, 0.020755767822265625, 0.023550987243652344, 0.026346206665039062, 0.02914142608642578, 0.0319366455078125, 0.03473186492919922, 0.03752708435058594, 0.040322303771972656, 0.043117523193359375, 0.045912742614746094, 0.04870796203613281, 0.05150318145751953, 0.05429840087890625, 0.05709362030029297, 0.05988883972167969, 0.0626840591430664, 0.06547927856445312, 0.06827449798583984, 0.07106971740722656, 0.07386493682861328, 0.07666015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 11.0, 9.0, 12.0, 20.0, 45.0, 66.0, 97.0, 121.0, 207.0, 362.0, 1589.0, 664.0, 309.0, 188.0, 119.0, 68.0, 58.0, 30.0, 30.0, 17.0, 15.0, 7.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.036468505859375, -0.035282135009765625, -0.03409576416015625, -0.032909393310546875, -0.0317230224609375, -0.030536651611328125, -0.02935028076171875, -0.028163909912109375, -0.0269775390625, -0.025791168212890625, -0.02460479736328125, -0.023418426513671875, -0.0222320556640625, -0.021045684814453125, -0.01985931396484375, -0.018672943115234375, -0.017486572265625, -0.016300201416015625, -0.01511383056640625, -0.013927459716796875, -0.0127410888671875, -0.011554718017578125, -0.01036834716796875, -0.009181976318359375, -0.00799560546875, -0.006809234619140625, -0.00562286376953125, -0.004436492919921875, -0.0032501220703125, -0.002063751220703125, -0.00087738037109375, 0.000308990478515625, 0.001495361328125, 0.002681732177734375, 0.00386810302734375, 0.005054473876953125, 0.0062408447265625, 0.007427215576171875, 0.00861358642578125, 0.009799957275390625, 0.010986328125, 0.012172698974609375, 0.01335906982421875, 0.014545440673828125, 0.0157318115234375, 0.016918182373046875, 0.01810455322265625, 0.019290924072265625, 0.020477294921875, 0.021663665771484375, 0.02285003662109375, 0.024036407470703125, 0.0252227783203125, 0.026409149169921875, 0.02759552001953125, 0.028781890869140625, 0.02996826171875, 0.031154632568359375, 0.03234100341796875, 0.033527374267578125, 0.0347137451171875, 0.035900115966796875, 0.03708648681640625, 0.038272857666015625, 0.039459228515625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 8.0, 76.0, 548.0, 339.0, 27.0, 8.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16194187104701996, -0.133729487657547, -0.10551711916923523, -0.07730473577976227, -0.049092359840869904, -0.02087998390197754, 0.007332399487495422, 0.03554476797580719, 0.06375715136528015, 0.09196952730417252, 0.12018190324306488, 0.14839428663253784, 0.1766066551208496, 0.20481903851032257, 0.23303142189979553, 0.2612437903881073, 0.28945618867874146, 0.3176685571670532, 0.3458809554576874, 0.37409332394599915, 0.4023056924343109, 0.43051809072494507, 0.45873045921325684, 0.4869428277015686, 0.5151551961898804, 0.5433675646781921, 0.5715799331665039, 0.5997923612594604, 0.6280047297477722, 0.656217098236084, 0.6844294667243958, 0.7126418352127075, 0.7408542037010193, 0.769066572189331, 0.7972789406776428, 0.8254913091659546, 0.8537037372589111, 0.8819161057472229, 0.9101284742355347, 0.9383408427238464, 0.9665532112121582, 0.99476557970047, 1.0229779481887817, 1.0511903762817383, 1.0794026851654053, 1.1076151132583618, 1.1358275413513184, 1.1640398502349854, 1.192252278327942, 1.2204647064208984, 1.2486770153045654, 1.276889443397522, 1.305101752281189, 1.3333141803741455, 1.3615264892578125, 1.389738917350769, 1.417951226234436, 1.4461636543273926, 1.4743759632110596, 1.5025883913040161, 1.530800700187683, 1.5590131282806396, 1.5872254371643066, 1.6154378652572632, 1.6436502933502197]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 4.0, 7.0, 8.0, 6.0, 14.0, 18.0, 18.0, 19.0, 23.0, 31.0, 29.0, 38.0, 23.0, 36.0, 42.0, 40.0, 46.0, 41.0, 46.0, 42.0, 40.0, 47.0, 29.0, 36.0, 34.0, 36.0, 37.0, 20.0, 30.0, 28.0, 18.0, 22.0, 19.0, 19.0, 7.0, 16.0, 9.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.11557602882385254, -0.11183465272188187, -0.1080932691693306, -0.10435189306735992, -0.10061050951480865, -0.09686913341283798, -0.09312775731086731, -0.08938637375831604, -0.08564499765634537, -0.0819036215543747, -0.07816223800182343, -0.07442086189985275, -0.07067948579788208, -0.06693810224533081, -0.06319672614336014, -0.05945534631609917, -0.055713966488838196, -0.051972586661577225, -0.048231206834316254, -0.04448983073234558, -0.04074845090508461, -0.03700707107782364, -0.033265694975852966, -0.029524315148591995, -0.025782935321331024, -0.022041555494070053, -0.01830017752945423, -0.014558798633515835, -0.010817419737577438, -0.007076039910316467, -0.0033346619457006454, 0.0004067160189151764, 0.0041480958461761475, 0.007889474742114544, 0.01163085363805294, 0.015372232533991337, 0.019113611429929733, 0.022854991257190704, 0.026596369221806526, 0.030337747186422348, 0.03407912701368332, 0.03782050684094429, 0.04156188666820526, 0.045303262770175934, 0.049044642597436905, 0.052786022424697876, 0.05652739852666855, 0.06026877835392952, 0.06401015818119049, 0.06775153428316116, 0.07149291783571243, 0.0752342939376831, 0.07897567749023438, 0.08271705359220505, 0.08645842969417572, 0.09019981324672699, 0.09394118934869766, 0.09768256545066833, 0.1014239490032196, 0.10516532510519028, 0.10890670120716095, 0.11264808475971222, 0.11638946086168289, 0.12013083696365356, 0.12387222051620483]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 4.0, 12.0, 16.0, 20.0, 30.0, 65.0, 103.0, 172.0, 308.0, 669.0, 1691.0, 5921.0, 44961.0, 880958.0, 100018.0, 9577.0, 2312.0, 885.0, 378.0, 169.0, 109.0, 54.0, 39.0, 25.0, 21.0, 11.0, 3.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1927490234375, -0.1855144500732422, -0.17827987670898438, -0.17104530334472656, -0.16381072998046875, -0.15657615661621094, -0.14934158325195312, -0.1421070098876953, -0.1348724365234375, -0.1276378631591797, -0.12040328979492188, -0.11316871643066406, -0.10593414306640625, -0.09869956970214844, -0.09146499633789062, -0.08423042297363281, -0.076995849609375, -0.06976127624511719, -0.06252670288085938, -0.05529212951660156, -0.04805755615234375, -0.04082298278808594, -0.033588409423828125, -0.026353836059570312, -0.0191192626953125, -0.011884689331054688, -0.004650115966796875, 0.0025844573974609375, 0.00981903076171875, 0.017053604125976562, 0.024288177490234375, 0.03152275085449219, 0.03875732421875, 0.04599189758300781, 0.053226470947265625, 0.06046104431152344, 0.06769561767578125, 0.07493019104003906, 0.08216476440429688, 0.08939933776855469, 0.0966339111328125, 0.10386848449707031, 0.11110305786132812, 0.11833763122558594, 0.12557220458984375, 0.13280677795410156, 0.14004135131835938, 0.1472759246826172, 0.154510498046875, 0.1617450714111328, 0.16897964477539062, 0.17621421813964844, 0.18344879150390625, 0.19068336486816406, 0.19791793823242188, 0.2051525115966797, 0.2123870849609375, 0.2196216583251953, 0.22685623168945312, 0.23409080505371094, 0.24132537841796875, 0.24855995178222656, 0.2557945251464844, 0.2630290985107422, 0.270263671875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 1.0, 2.0, 4.0, 4.0, 15.0, 9.0, 18.0, 29.0, 80.0, 194.0, 256.0, 201.0, 96.0, 27.0, 24.0, 12.0, 7.0, 8.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12841796875, -0.12391471862792969, -0.11941146850585938, -0.11490821838378906, -0.11040496826171875, -0.10590171813964844, -0.10139846801757812, -0.09689521789550781, -0.0923919677734375, -0.08788871765136719, -0.08338546752929688, -0.07888221740722656, -0.07437896728515625, -0.06987571716308594, -0.06537246704101562, -0.06086921691894531, -0.056365966796875, -0.05186271667480469, -0.047359466552734375, -0.04285621643066406, -0.03835296630859375, -0.03384971618652344, -0.029346466064453125, -0.024843215942382812, -0.0203399658203125, -0.015836715698242188, -0.011333465576171875, -0.0068302154541015625, -0.00232696533203125, 0.0021762847900390625, 0.006679534912109375, 0.011182785034179688, 0.01568603515625, 0.020189285278320312, 0.024692535400390625, 0.029195785522460938, 0.03369903564453125, 0.03820228576660156, 0.042705535888671875, 0.04720878601074219, 0.0517120361328125, 0.05621528625488281, 0.060718536376953125, 0.06522178649902344, 0.06972503662109375, 0.07422828674316406, 0.07873153686523438, 0.08323478698730469, 0.087738037109375, 0.09224128723144531, 0.09674453735351562, 0.10124778747558594, 0.10575103759765625, 0.11025428771972656, 0.11475753784179688, 0.11926078796386719, 0.1237640380859375, 0.1282672882080078, 0.13277053833007812, 0.13727378845214844, 0.14177703857421875, 0.14628028869628906, 0.15078353881835938, 0.1552867889404297, 0.1597900390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 9.0, 9.0, 3.0, 13.0, 24.0, 18.0, 28.0, 43.0, 39.0, 55.0, 92.0, 118.0, 176.0, 248.0, 380.0, 747.0, 1865.0, 8625.0, 120433.0, 827099.0, 78377.0, 6646.0, 1617.0, 693.0, 350.0, 227.0, 151.0, 120.0, 88.0, 65.0, 50.0, 31.0, 32.0, 21.0, 13.0, 14.0, 10.0, 14.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12237548828125, -0.11774539947509766, -0.11311531066894531, -0.10848522186279297, -0.10385513305664062, -0.09922504425048828, -0.09459495544433594, -0.0899648666381836, -0.08533477783203125, -0.0807046890258789, -0.07607460021972656, -0.07144451141357422, -0.06681442260742188, -0.06218433380126953, -0.05755424499511719, -0.052924156188964844, -0.0482940673828125, -0.043663978576660156, -0.03903388977050781, -0.03440380096435547, -0.029773712158203125, -0.02514362335205078, -0.020513534545898438, -0.015883445739746094, -0.01125335693359375, -0.006623268127441406, -0.0019931793212890625, 0.0026369094848632812, 0.007266998291015625, 0.011897087097167969, 0.016527175903320312, 0.021157264709472656, 0.025787353515625, 0.030417442321777344, 0.03504753112792969, 0.03967761993408203, 0.044307708740234375, 0.04893779754638672, 0.05356788635253906, 0.058197975158691406, 0.06282806396484375, 0.0674581527709961, 0.07208824157714844, 0.07671833038330078, 0.08134841918945312, 0.08597850799560547, 0.09060859680175781, 0.09523868560791016, 0.0998687744140625, 0.10449886322021484, 0.10912895202636719, 0.11375904083251953, 0.11838912963867188, 0.12301921844482422, 0.12764930725097656, 0.1322793960571289, 0.13690948486328125, 0.1415395736694336, 0.14616966247558594, 0.15079975128173828, 0.15542984008789062, 0.16005992889404297, 0.1646900177001953, 0.16932010650634766, 0.1739501953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 10.0, 4.0, 5.0, 11.0, 12.0, 12.0, 16.0, 17.0, 24.0, 19.0, 19.0, 31.0, 16.0, 28.0, 27.0, 32.0, 38.0, 41.0, 32.0, 34.0, 46.0, 33.0, 37.0, 32.0, 42.0, 38.0, 29.0, 41.0, 32.0, 33.0, 17.0, 27.0, 36.0, 16.0, 16.0, 12.0, 15.0, 8.0, 12.0, 13.0, 10.0, 9.0, 5.0, 3.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.2015380859375, -0.19568634033203125, -0.1898345947265625, -0.18398284912109375, -0.178131103515625, -0.17227935791015625, -0.1664276123046875, -0.16057586669921875, -0.15472412109375, -0.14887237548828125, -0.1430206298828125, -0.13716888427734375, -0.131317138671875, -0.12546539306640625, -0.1196136474609375, -0.11376190185546875, -0.10791015625, -0.10205841064453125, -0.0962066650390625, -0.09035491943359375, -0.084503173828125, -0.07865142822265625, -0.0727996826171875, -0.06694793701171875, -0.06109619140625, -0.05524444580078125, -0.0493927001953125, -0.04354095458984375, -0.037689208984375, -0.03183746337890625, -0.0259857177734375, -0.02013397216796875, -0.0142822265625, -0.00843048095703125, -0.0025787353515625, 0.00327301025390625, 0.009124755859375, 0.01497650146484375, 0.0208282470703125, 0.02667999267578125, 0.03253173828125, 0.03838348388671875, 0.0442352294921875, 0.05008697509765625, 0.055938720703125, 0.06179046630859375, 0.0676422119140625, 0.07349395751953125, 0.079345703125, 0.08519744873046875, 0.0910491943359375, 0.09690093994140625, 0.102752685546875, 0.10860443115234375, 0.1144561767578125, 0.12030792236328125, 0.12615966796875, 0.13201141357421875, 0.1378631591796875, 0.14371490478515625, 0.149566650390625, 0.15541839599609375, 0.1612701416015625, 0.16712188720703125, 0.1729736328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 4.0, 12.0, 11.0, 14.0, 22.0, 39.0, 62.0, 82.0, 150.0, 239.0, 417.0, 853.0, 2209.0, 6639.0, 27953.0, 178850.0, 769373.0, 46235.0, 10108.0, 2925.0, 1067.0, 550.0, 292.0, 164.0, 85.0, 58.0, 38.0, 31.0, 21.0, 18.0, 13.0, 3.0, 3.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05987548828125, -0.05817222595214844, -0.056468963623046875, -0.05476570129394531, -0.05306243896484375, -0.05135917663574219, -0.049655914306640625, -0.04795265197753906, -0.0462493896484375, -0.04454612731933594, -0.042842864990234375, -0.04113960266113281, -0.03943634033203125, -0.03773307800292969, -0.036029815673828125, -0.03432655334472656, -0.032623291015625, -0.030920028686523438, -0.029216766357421875, -0.027513504028320312, -0.02581024169921875, -0.024106979370117188, -0.022403717041015625, -0.020700454711914062, -0.0189971923828125, -0.017293930053710938, -0.015590667724609375, -0.013887405395507812, -0.01218414306640625, -0.010480880737304688, -0.008777618408203125, -0.0070743560791015625, -0.00537109375, -0.0036678314208984375, -0.001964569091796875, -0.0002613067626953125, 0.00144195556640625, 0.0031452178955078125, 0.004848480224609375, 0.0065517425537109375, 0.0082550048828125, 0.009958267211914062, 0.011661529541015625, 0.013364791870117188, 0.01506805419921875, 0.016771316528320312, 0.018474578857421875, 0.020177841186523438, 0.021881103515625, 0.023584365844726562, 0.025287628173828125, 0.026990890502929688, 0.02869415283203125, 0.030397415161132812, 0.032100677490234375, 0.03380393981933594, 0.0355072021484375, 0.03721046447753906, 0.038913726806640625, 0.04061698913574219, 0.04232025146484375, 0.04402351379394531, 0.045726776123046875, 0.04743003845214844, 0.04913330078125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 9.0, 4.0, 13.0, 5.0, 10.0, 22.0, 30.0, 57.0, 111.0, 152.0, 186.0, 140.0, 88.0, 55.0, 44.0, 11.0, 8.0, 12.0, 8.0, 11.0, 7.0, 4.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5974044799804688e-05, -1.556985080242157e-05, -1.5165656805038452e-05, -1.4761462807655334e-05, -1.4357268810272217e-05, -1.3953074812889099e-05, -1.3548880815505981e-05, -1.3144686818122864e-05, -1.2740492820739746e-05, -1.2336298823356628e-05, -1.193210482597351e-05, -1.1527910828590393e-05, -1.1123716831207275e-05, -1.0719522833824158e-05, -1.031532883644104e-05, -9.911134839057922e-06, -9.506940841674805e-06, -9.102746844291687e-06, -8.69855284690857e-06, -8.294358849525452e-06, -7.890164852142334e-06, -7.485970854759216e-06, -7.081776857376099e-06, -6.677582859992981e-06, -6.273388862609863e-06, -5.869194865226746e-06, -5.465000867843628e-06, -5.06080687046051e-06, -4.656612873077393e-06, -4.252418875694275e-06, -3.848224878311157e-06, -3.4440308809280396e-06, -3.039836883544922e-06, -2.635642886161804e-06, -2.2314488887786865e-06, -1.8272548913955688e-06, -1.4230608940124512e-06, -1.0188668966293335e-06, -6.146728992462158e-07, -2.1047890186309814e-07, 1.9371509552001953e-07, 5.979090929031372e-07, 1.0021030902862549e-06, 1.4062970876693726e-06, 1.8104910850524902e-06, 2.214685082435608e-06, 2.6188790798187256e-06, 3.0230730772018433e-06, 3.427267074584961e-06, 3.831461071968079e-06, 4.235655069351196e-06, 4.639849066734314e-06, 5.044043064117432e-06, 5.448237061500549e-06, 5.852431058883667e-06, 6.256625056266785e-06, 6.660819053649902e-06, 7.06501305103302e-06, 7.469207048416138e-06, 7.873401045799255e-06, 8.277595043182373e-06, 8.68178904056549e-06, 9.085983037948608e-06, 9.490177035331726e-06, 9.894371032714844e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 10.0, 10.0, 16.0, 23.0, 33.0, 54.0, 69.0, 90.0, 177.0, 313.0, 489.0, 1054.0, 2917.0, 10110.0, 52153.0, 836752.0, 117651.0, 18779.0, 4678.0, 1567.0, 705.0, 309.0, 209.0, 116.0, 74.0, 61.0, 46.0, 36.0, 19.0, 17.0, 7.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0665283203125, -0.064361572265625, -0.06219482421875, -0.060028076171875, -0.057861328125, -0.055694580078125, -0.05352783203125, -0.051361083984375, -0.0491943359375, -0.047027587890625, -0.04486083984375, -0.042694091796875, -0.04052734375, -0.038360595703125, -0.03619384765625, -0.034027099609375, -0.0318603515625, -0.029693603515625, -0.02752685546875, -0.025360107421875, -0.023193359375, -0.021026611328125, -0.01885986328125, -0.016693115234375, -0.0145263671875, -0.012359619140625, -0.01019287109375, -0.008026123046875, -0.005859375, -0.003692626953125, -0.00152587890625, 0.000640869140625, 0.0028076171875, 0.004974365234375, 0.00714111328125, 0.009307861328125, 0.011474609375, 0.013641357421875, 0.01580810546875, 0.017974853515625, 0.0201416015625, 0.022308349609375, 0.02447509765625, 0.026641845703125, 0.02880859375, 0.030975341796875, 0.03314208984375, 0.035308837890625, 0.0374755859375, 0.039642333984375, 0.04180908203125, 0.043975830078125, 0.046142578125, 0.048309326171875, 0.05047607421875, 0.052642822265625, 0.0548095703125, 0.056976318359375, 0.05914306640625, 0.061309814453125, 0.0634765625, 0.065643310546875, 0.06781005859375, 0.069976806640625, 0.0721435546875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 10.0, 11.0, 7.0, 8.0, 9.0, 15.0, 13.0, 28.0, 21.0, 29.0, 67.0, 155.0, 234.0, 150.0, 52.0, 30.0, 24.0, 15.0, 16.0, 17.0, 5.0, 14.0, 6.0, 11.0, 3.0, 10.0, 9.0, 5.0, 2.0, 6.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.055450439453125, -0.05356645584106445, -0.051682472229003906, -0.04979848861694336, -0.04791450500488281, -0.046030521392822266, -0.04414653778076172, -0.04226255416870117, -0.040378570556640625, -0.03849458694458008, -0.03661060333251953, -0.034726619720458984, -0.03284263610839844, -0.03095865249633789, -0.029074668884277344, -0.027190685272216797, -0.02530670166015625, -0.023422718048095703, -0.021538734436035156, -0.01965475082397461, -0.017770767211914062, -0.015886783599853516, -0.014002799987792969, -0.012118816375732422, -0.010234832763671875, -0.008350849151611328, -0.006466865539550781, -0.004582881927490234, -0.0026988983154296875, -0.0008149147033691406, 0.0010690689086914062, 0.002953052520751953, 0.0048370361328125, 0.006721019744873047, 0.008605003356933594, 0.01048898696899414, 0.012372970581054688, 0.014256954193115234, 0.01614093780517578, 0.018024921417236328, 0.019908905029296875, 0.021792888641357422, 0.02367687225341797, 0.025560855865478516, 0.027444839477539062, 0.02932882308959961, 0.031212806701660156, 0.0330967903137207, 0.03498077392578125, 0.0368647575378418, 0.038748741149902344, 0.04063272476196289, 0.04251670837402344, 0.044400691986083984, 0.04628467559814453, 0.04816865921020508, 0.050052642822265625, 0.05193662643432617, 0.05382061004638672, 0.055704593658447266, 0.05758857727050781, 0.05947256088256836, 0.061356544494628906, 0.06324052810668945, 0.06512451171875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 12.0, 139.0, 778.0, 68.0, 11.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5541019439697266, -2.4397695064544678, -2.325437068939209, -2.21110463142395, -2.0967721939086914, -1.9824398756027222, -1.8681074380874634, -1.7537751197814941, -1.6394426822662354, -1.5251102447509766, -1.4107778072357178, -1.296445369720459, -1.1821130514144897, -1.067780613899231, -0.9534481763839722, -0.8391157984733582, -0.7247833013534546, -0.6104508638381958, -0.4961184859275818, -0.381786048412323, -0.2674536406993866, -0.1531212329864502, -0.038788795471191406, 0.07554358243942261, 0.1898760199546814, 0.3042084276676178, 0.4185408353805542, 0.532873272895813, 0.6472057104110718, 0.7615380883216858, 0.8758705258369446, 0.9902029037475586, 1.1045353412628174, 1.2188677787780762, 1.333200216293335, 1.4475326538085938, 1.561864972114563, 1.6761974096298218, 1.7905298471450806, 1.9048621654510498, 2.0191946029663086, 2.1335270404815674, 2.247859477996826, 2.362191915512085, 2.4765243530273438, 2.5908565521240234, 2.7051892280578613, 2.819521427154541, 2.933854103088379, 3.0481865406036377, 3.1625189781188965, 3.2768514156341553, 3.391183853149414, 3.5055160522460938, 3.6198487281799316, 3.7341809272766113, 3.84851336479187, 3.962845802307129, 4.077178001403809, 4.1915106773376465, 4.305842876434326, 4.420175552368164, 4.534507751464844, 4.648840427398682, 4.763172626495361]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 5.0, 3.0, 6.0, 5.0, 5.0, 17.0, 11.0, 19.0, 20.0, 15.0, 25.0, 20.0, 26.0, 30.0, 29.0, 44.0, 32.0, 36.0, 39.0, 40.0, 54.0, 44.0, 49.0, 38.0, 44.0, 42.0, 34.0, 36.0, 29.0, 33.0, 19.0, 24.0, 28.0, 12.0, 15.0, 12.0, 6.0, 9.0, 8.0, 7.0, 5.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.0003173351287842, -0.9699167013168335, -0.9395160675048828, -0.9091154336929321, -0.8787147998809814, -0.8483141660690308, -0.8179135322570801, -0.7875128984451294, -0.7571122646331787, -0.726711630821228, -0.6963109970092773, -0.6659103631973267, -0.635509729385376, -0.6051090955734253, -0.5747084617614746, -0.5443078279495239, -0.513907253742218, -0.48350661993026733, -0.45310598611831665, -0.42270535230636597, -0.3923047184944153, -0.3619040846824646, -0.3315034806728363, -0.3011028468608856, -0.27070221304893494, -0.24030157923698425, -0.20990094542503357, -0.17950032651424408, -0.1490996927022934, -0.11869905889034271, -0.08829843997955322, -0.05789780616760254, -0.02749711275100708, 0.002903517335653305, 0.03330414742231369, 0.06370477378368378, 0.09410540759563446, 0.12450604140758514, 0.15490666031837463, 0.18530729413032532, 0.215707927942276, 0.24610856175422668, 0.27650919556617737, 0.30690979957580566, 0.33731043338775635, 0.36771106719970703, 0.3981117010116577, 0.4285123348236084, 0.4589129686355591, 0.48931360244750977, 0.5197142362594604, 0.5501148700714111, 0.5805155038833618, 0.6109161376953125, 0.6413167715072632, 0.6717174053192139, 0.7021180391311646, 0.7325186729431152, 0.7629193067550659, 0.7933199405670166, 0.8237205743789673, 0.854121208190918, 0.8845218420028687, 0.9149224758148193, 0.9453230500221252]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 1.0, 6.0, 1.0, 3.0, 9.0, 10.0, 15.0, 16.0, 41.0, 192.0, 5710.0, 4187191.0, 897.0, 107.0, 30.0, 12.0, 10.0, 10.0, 8.0, 7.0, 6.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89306640625, -0.8626022338867188, -0.8321380615234375, -0.8016738891601562, -0.771209716796875, -0.7407455444335938, -0.7102813720703125, -0.6798171997070312, -0.64935302734375, -0.6188888549804688, -0.5884246826171875, -0.5579605102539062, -0.527496337890625, -0.49703216552734375, -0.4665679931640625, -0.43610382080078125, -0.4056396484375, -0.37517547607421875, -0.3447113037109375, -0.31424713134765625, -0.283782958984375, -0.25331878662109375, -0.2228546142578125, -0.19239044189453125, -0.16192626953125, -0.13146209716796875, -0.1009979248046875, -0.07053375244140625, -0.040069580078125, -0.00960540771484375, 0.0208587646484375, 0.05132293701171875, 0.081787109375, 0.11225128173828125, 0.1427154541015625, 0.17317962646484375, 0.203643798828125, 0.23410797119140625, 0.2645721435546875, 0.29503631591796875, 0.32550048828125, 0.35596466064453125, 0.3864288330078125, 0.41689300537109375, 0.447357177734375, 0.47782135009765625, 0.5082855224609375, 0.5387496948242188, 0.5692138671875, 0.5996780395507812, 0.6301422119140625, 0.6606063842773438, 0.691070556640625, 0.7215347290039062, 0.7519989013671875, 0.7824630737304688, 0.81292724609375, 0.8433914184570312, 0.8738555908203125, 0.9043197631835938, 0.934783935546875, 0.9652481079101562, 0.9957122802734375, 1.0261764526367188, 1.056640625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 2.0, 2.0, 5.0, 12.0, 10.0, 16.0, 29.0, 73.0, 168.0, 240.0, 224.0, 117.0, 37.0, 22.0, 12.0, 9.0, 6.0, 11.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12890625, -0.12441062927246094, -0.11991500854492188, -0.11541938781738281, -0.11092376708984375, -0.10642814636230469, -0.10193252563476562, -0.09743690490722656, -0.0929412841796875, -0.08844566345214844, -0.08395004272460938, -0.07945442199707031, -0.07495880126953125, -0.07046318054199219, -0.06596755981445312, -0.06147193908691406, -0.056976318359375, -0.05248069763183594, -0.047985076904296875, -0.04348945617675781, -0.03899383544921875, -0.03449821472167969, -0.030002593994140625, -0.025506973266601562, -0.0210113525390625, -0.016515731811523438, -0.012020111083984375, -0.0075244903564453125, -0.00302886962890625, 0.0014667510986328125, 0.005962371826171875, 0.010457992553710938, 0.01495361328125, 0.019449234008789062, 0.023944854736328125, 0.028440475463867188, 0.03293609619140625, 0.03743171691894531, 0.041927337646484375, 0.04642295837402344, 0.0509185791015625, 0.05541419982910156, 0.059909820556640625, 0.06440544128417969, 0.06890106201171875, 0.07339668273925781, 0.07789230346679688, 0.08238792419433594, 0.086883544921875, 0.09137916564941406, 0.09587478637695312, 0.10037040710449219, 0.10486602783203125, 0.10936164855957031, 0.11385726928710938, 0.11835289001464844, 0.1228485107421875, 0.12734413146972656, 0.13183975219726562, 0.1363353729248047, 0.14083099365234375, 0.1453266143798828, 0.14982223510742188, 0.15431785583496094, 0.1588134765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 14.0, 27.0, 55.0, 121.0, 378.0, 1175.0, 5557.0, 44650.0, 3614194.0, 501758.0, 21924.0, 3243.0, 788.0, 235.0, 83.0, 48.0, 13.0, 9.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12646484375, -0.12175559997558594, -0.11704635620117188, -0.11233711242675781, -0.10762786865234375, -0.10291862487792969, -0.09820938110351562, -0.09350013732910156, -0.0887908935546875, -0.08408164978027344, -0.07937240600585938, -0.07466316223144531, -0.06995391845703125, -0.06524467468261719, -0.060535430908203125, -0.05582618713378906, -0.051116943359375, -0.04640769958496094, -0.041698455810546875, -0.03698921203613281, -0.03227996826171875, -0.027570724487304688, -0.022861480712890625, -0.018152236938476562, -0.0134429931640625, -0.008733749389648438, -0.004024505615234375, 0.0006847381591796875, 0.00539398193359375, 0.010103225708007812, 0.014812469482421875, 0.019521713256835938, 0.02423095703125, 0.028940200805664062, 0.033649444580078125, 0.03835868835449219, 0.04306793212890625, 0.04777717590332031, 0.052486419677734375, 0.05719566345214844, 0.0619049072265625, 0.06661415100097656, 0.07132339477539062, 0.07603263854980469, 0.08074188232421875, 0.08545112609863281, 0.09016036987304688, 0.09486961364746094, 0.099578857421875, 0.10428810119628906, 0.10899734497070312, 0.11370658874511719, 0.11841583251953125, 0.12312507629394531, 0.12783432006835938, 0.13254356384277344, 0.1372528076171875, 0.14196205139160156, 0.14667129516601562, 0.1513805389404297, 0.15608978271484375, 0.1607990264892578, 0.16550827026367188, 0.17021751403808594, 0.1749267578125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 3.0, 9.0, 11.0, 9.0, 17.0, 33.0, 52.0, 83.0, 140.0, 235.0, 655.0, 2050.0, 341.0, 180.0, 86.0, 52.0, 32.0, 29.0, 18.0, 15.0, 8.0, 5.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05609130859375, -0.05469703674316406, -0.053302764892578125, -0.05190849304199219, -0.05051422119140625, -0.04911994934082031, -0.047725677490234375, -0.04633140563964844, -0.0449371337890625, -0.04354286193847656, -0.042148590087890625, -0.04075431823730469, -0.03936004638671875, -0.03796577453613281, -0.036571502685546875, -0.03517723083496094, -0.033782958984375, -0.03238868713378906, -0.030994415283203125, -0.029600143432617188, -0.02820587158203125, -0.026811599731445312, -0.025417327880859375, -0.024023056030273438, -0.0226287841796875, -0.021234512329101562, -0.019840240478515625, -0.018445968627929688, -0.01705169677734375, -0.015657424926757812, -0.014263153076171875, -0.012868881225585938, -0.011474609375, -0.010080337524414062, -0.008686065673828125, -0.0072917938232421875, -0.00589752197265625, -0.0045032501220703125, -0.003108978271484375, -0.0017147064208984375, -0.0003204345703125, 0.0010738372802734375, 0.002468109130859375, 0.0038623809814453125, 0.00525665283203125, 0.0066509246826171875, 0.008045196533203125, 0.009439468383789062, 0.010833740234375, 0.012228012084960938, 0.013622283935546875, 0.015016555786132812, 0.01641082763671875, 0.017805099487304688, 0.019199371337890625, 0.020593643188476562, 0.0219879150390625, 0.023382186889648438, 0.024776458740234375, 0.026170730590820312, 0.02756500244140625, 0.028959274291992188, 0.030353546142578125, 0.03174781799316406, 0.03314208984375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 13.0, 24.0, 74.0, 150.0, 260.0, 261.0, 126.0, 56.0, 17.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5612211227416992, -0.5504186749458313, -0.5396162867546082, -0.5288138389587402, -0.5180113911628723, -0.5072090029716492, -0.49640655517578125, -0.48560410737991333, -0.4748016893863678, -0.46399927139282227, -0.45319682359695435, -0.4423944056034088, -0.4315919876098633, -0.42078953981399536, -0.40998712182044983, -0.3991847038269043, -0.3883822560310364, -0.37757983803749084, -0.3667773902416229, -0.3559749722480774, -0.3451725244522095, -0.33437010645866394, -0.3235676884651184, -0.3127652406692505, -0.30196282267570496, -0.2911604046821594, -0.2803579568862915, -0.26955553889274597, -0.25875312089920044, -0.24795067310333252, -0.237148255109787, -0.22634582221508026, -0.21554335951805115, -0.20474092662334442, -0.1939384937286377, -0.18313607573509216, -0.17233364284038544, -0.1615312099456787, -0.15072879195213318, -0.13992635905742645, -0.12912392616271973, -0.118321493268013, -0.10751906782388687, -0.09671664237976074, -0.08591420948505402, -0.07511177659034729, -0.06430935114622116, -0.05350692570209503, -0.042704492807388306, -0.03190206363797188, -0.02109963446855545, -0.010297205299139023, 0.0005052238702774048, 0.011307653039693832, 0.02211008220911026, 0.03291250765323639, 0.043714940547943115, 0.05451736971735954, 0.06531979888677597, 0.0761222243309021, 0.08692465722560883, 0.09772709012031555, 0.10852951556444168, 0.11933194100856781, 0.13013437390327454]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 3.0, 5.0, 7.0, 6.0, 14.0, 9.0, 14.0, 20.0, 14.0, 27.0, 29.0, 21.0, 26.0, 32.0, 38.0, 42.0, 37.0, 43.0, 44.0, 43.0, 48.0, 43.0, 40.0, 48.0, 48.0, 38.0, 29.0, 37.0, 32.0, 22.0, 12.0, 22.0, 24.0, 18.0, 12.0, 15.0, 13.0, 11.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10800290107727051, -0.10456464439630508, -0.10112638771533966, -0.09768813848495483, -0.09424988180398941, -0.09081162512302399, -0.08737337589263916, -0.08393511921167374, -0.08049686253070831, -0.07705860584974289, -0.07362034916877747, -0.07018209993839264, -0.06674384325742722, -0.06330558657646179, -0.05986733362078667, -0.05642908066511154, -0.05299082398414612, -0.049552567303180695, -0.04611431434750557, -0.042676061391830444, -0.03923780471086502, -0.0357995480298996, -0.03236129507422447, -0.028923040255904198, -0.025484785437583923, -0.02204653061926365, -0.018608275800943375, -0.0151700209826231, -0.011731766164302826, -0.008293511345982552, -0.004855256527662277, -0.0014170017093420029, 0.0020212531089782715, 0.005459507927298546, 0.00889776274561882, 0.012336017563939095, 0.01577427238225937, 0.019212527200579643, 0.022650782018899918, 0.026089036837220192, 0.029527291655540466, 0.03296554833650589, 0.036403801292181015, 0.03984205424785614, 0.043280310928821564, 0.04671856760978699, 0.05015682056546211, 0.05359507352113724, 0.05703333020210266, 0.060471586883068085, 0.06390984356403351, 0.06734809279441833, 0.07078634947538376, 0.07422460615634918, 0.07766285538673401, 0.08110111206769943, 0.08453936874866486, 0.08797762542963028, 0.0914158821105957, 0.09485413134098053, 0.09829238802194595, 0.10173064470291138, 0.1051688939332962, 0.10860715061426163, 0.11204540729522705]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 6.0, 5.0, 11.0, 25.0, 20.0, 30.0, 65.0, 86.0, 124.0, 245.0, 482.0, 898.0, 2093.0, 6632.0, 30876.0, 299466.0, 645917.0, 47571.0, 8958.0, 2687.0, 1141.0, 497.0, 252.0, 188.0, 99.0, 69.0, 29.0, 29.0, 20.0, 11.0, 10.0, 6.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.147216796875, -0.1431407928466797, -0.13906478881835938, -0.13498878479003906, -0.13091278076171875, -0.12683677673339844, -0.12276077270507812, -0.11868476867675781, -0.1146087646484375, -0.11053276062011719, -0.10645675659179688, -0.10238075256347656, -0.09830474853515625, -0.09422874450683594, -0.09015274047851562, -0.08607673645019531, -0.082000732421875, -0.07792472839355469, -0.07384872436523438, -0.06977272033691406, -0.06569671630859375, -0.06162071228027344, -0.057544708251953125, -0.05346870422363281, -0.0493927001953125, -0.04531669616699219, -0.041240692138671875, -0.03716468811035156, -0.03308868408203125, -0.029012680053710938, -0.024936676025390625, -0.020860671997070312, -0.01678466796875, -0.012708663940429688, -0.008632659912109375, -0.0045566558837890625, -0.00048065185546875, 0.0035953521728515625, 0.007671356201171875, 0.011747360229492188, 0.0158233642578125, 0.019899368286132812, 0.023975372314453125, 0.028051376342773438, 0.03212738037109375, 0.03620338439941406, 0.040279388427734375, 0.04435539245605469, 0.048431396484375, 0.05250740051269531, 0.056583404541015625, 0.06065940856933594, 0.06473541259765625, 0.06881141662597656, 0.07288742065429688, 0.07696342468261719, 0.0810394287109375, 0.08511543273925781, 0.08919143676757812, 0.09326744079589844, 0.09734344482421875, 0.10141944885253906, 0.10549545288085938, 0.10957145690917969, 0.1136474609375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 2.0, 0.0, 5.0, 6.0, 10.0, 10.0, 19.0, 29.0, 68.0, 169.0, 246.0, 206.0, 122.0, 47.0, 20.0, 11.0, 9.0, 9.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1275634765625, -0.12311553955078125, -0.1186676025390625, -0.11421966552734375, -0.109771728515625, -0.10532379150390625, -0.1008758544921875, -0.09642791748046875, -0.09197998046875, -0.08753204345703125, -0.0830841064453125, -0.07863616943359375, -0.074188232421875, -0.06974029541015625, -0.0652923583984375, -0.06084442138671875, -0.056396484375, -0.05194854736328125, -0.0475006103515625, -0.04305267333984375, -0.038604736328125, -0.03415679931640625, -0.0297088623046875, -0.02526092529296875, -0.02081298828125, -0.01636505126953125, -0.0119171142578125, -0.00746917724609375, -0.003021240234375, 0.00142669677734375, 0.0058746337890625, 0.01032257080078125, 0.0147705078125, 0.01921844482421875, 0.0236663818359375, 0.02811431884765625, 0.032562255859375, 0.03701019287109375, 0.0414581298828125, 0.04590606689453125, 0.05035400390625, 0.05480194091796875, 0.0592498779296875, 0.06369781494140625, 0.068145751953125, 0.07259368896484375, 0.0770416259765625, 0.08148956298828125, 0.0859375, 0.09038543701171875, 0.0948333740234375, 0.09928131103515625, 0.103729248046875, 0.10817718505859375, 0.1126251220703125, 0.11707305908203125, 0.12152099609375, 0.12596893310546875, 0.1304168701171875, 0.13486480712890625, 0.139312744140625, 0.14376068115234375, 0.1482086181640625, 0.15265655517578125, 0.1571044921875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 7.0, 14.0, 6.0, 7.0, 13.0, 14.0, 27.0, 29.0, 38.0, 44.0, 64.0, 77.0, 94.0, 179.0, 245.0, 367.0, 705.0, 1749.0, 6974.0, 46168.0, 498185.0, 442503.0, 41257.0, 6280.0, 1594.0, 664.0, 404.0, 216.0, 163.0, 117.0, 73.0, 58.0, 52.0, 42.0, 29.0, 20.0, 8.0, 18.0, 16.0, 8.0, 6.0, 4.0, 6.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10888671875, -0.1052541732788086, -0.10162162780761719, -0.09798908233642578, -0.09435653686523438, -0.09072399139404297, -0.08709144592285156, -0.08345890045166016, -0.07982635498046875, -0.07619380950927734, -0.07256126403808594, -0.06892871856689453, -0.06529617309570312, -0.06166362762451172, -0.05803108215332031, -0.054398536682128906, -0.0507659912109375, -0.047133445739746094, -0.04350090026855469, -0.03986835479736328, -0.036235809326171875, -0.03260326385498047, -0.028970718383789062, -0.025338172912597656, -0.02170562744140625, -0.018073081970214844, -0.014440536499023438, -0.010807991027832031, -0.007175445556640625, -0.0035429000854492188, 8.96453857421875e-05, 0.0037221908569335938, 0.007354736328125, 0.010987281799316406, 0.014619827270507812, 0.01825237274169922, 0.021884918212890625, 0.02551746368408203, 0.029150009155273438, 0.032782554626464844, 0.03641510009765625, 0.040047645568847656, 0.04368019104003906, 0.04731273651123047, 0.050945281982421875, 0.05457782745361328, 0.05821037292480469, 0.061842918395996094, 0.0654754638671875, 0.0691080093383789, 0.07274055480957031, 0.07637310028076172, 0.08000564575195312, 0.08363819122314453, 0.08727073669433594, 0.09090328216552734, 0.09453582763671875, 0.09816837310791016, 0.10180091857910156, 0.10543346405029297, 0.10906600952148438, 0.11269855499267578, 0.11633110046386719, 0.1199636459350586, 0.12359619140625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 11.0, 4.0, 4.0, 8.0, 9.0, 12.0, 13.0, 14.0, 18.0, 12.0, 17.0, 33.0, 33.0, 38.0, 39.0, 38.0, 43.0, 47.0, 46.0, 38.0, 36.0, 39.0, 47.0, 30.0, 39.0, 32.0, 30.0, 33.0, 22.0, 34.0, 28.0, 24.0, 25.0, 21.0, 9.0, 16.0, 11.0, 8.0, 3.0, 9.0, 2.0, 4.0, 8.0, 0.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.185546875, -0.17955970764160156, -0.17357254028320312, -0.1675853729248047, -0.16159820556640625, -0.1556110382080078, -0.14962387084960938, -0.14363670349121094, -0.1376495361328125, -0.13166236877441406, -0.12567520141601562, -0.11968803405761719, -0.11370086669921875, -0.10771369934082031, -0.10172653198242188, -0.09573936462402344, -0.089752197265625, -0.08376502990722656, -0.07777786254882812, -0.07179069519042969, -0.06580352783203125, -0.05981636047363281, -0.053829193115234375, -0.04784202575683594, -0.0418548583984375, -0.03586769104003906, -0.029880523681640625, -0.023893356323242188, -0.01790618896484375, -0.011919021606445312, -0.005931854248046875, 5.53131103515625e-05, 0.00604248046875, 0.012029647827148438, 0.018016815185546875, 0.024003982543945312, 0.02999114990234375, 0.03597831726074219, 0.041965484619140625, 0.04795265197753906, 0.0539398193359375, 0.05992698669433594, 0.06591415405273438, 0.07190132141113281, 0.07788848876953125, 0.08387565612792969, 0.08986282348632812, 0.09584999084472656, 0.101837158203125, 0.10782432556152344, 0.11381149291992188, 0.11979866027832031, 0.12578582763671875, 0.1317729949951172, 0.13776016235351562, 0.14374732971191406, 0.1497344970703125, 0.15572166442871094, 0.16170883178710938, 0.1676959991455078, 0.17368316650390625, 0.1796703338623047, 0.18565750122070312, 0.19164466857910156, 0.1976318359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 7.0, 2.0, 3.0, 6.0, 10.0, 6.0, 22.0, 25.0, 24.0, 52.0, 66.0, 126.0, 207.0, 401.0, 777.0, 2015.0, 5728.0, 18295.0, 65147.0, 751391.0, 155255.0, 33347.0, 9872.0, 3253.0, 1241.0, 528.0, 268.0, 176.0, 88.0, 58.0, 44.0, 43.0, 19.0, 11.0, 12.0, 13.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035980224609375, -0.03491401672363281, -0.033847808837890625, -0.03278160095214844, -0.03171539306640625, -0.030649185180664062, -0.029582977294921875, -0.028516769409179688, -0.0274505615234375, -0.026384353637695312, -0.025318145751953125, -0.024251937866210938, -0.02318572998046875, -0.022119522094726562, -0.021053314208984375, -0.019987106323242188, -0.0189208984375, -0.017854690551757812, -0.016788482666015625, -0.015722274780273438, -0.01465606689453125, -0.013589859008789062, -0.012523651123046875, -0.011457443237304688, -0.0103912353515625, -0.009325027465820312, -0.008258819580078125, -0.0071926116943359375, -0.00612640380859375, -0.0050601959228515625, -0.003993988037109375, -0.0029277801513671875, -0.001861572265625, -0.0007953643798828125, 0.000270843505859375, 0.0013370513916015625, 0.00240325927734375, 0.0034694671630859375, 0.004535675048828125, 0.0056018829345703125, 0.0066680908203125, 0.0077342987060546875, 0.008800506591796875, 0.009866714477539062, 0.01093292236328125, 0.011999130249023438, 0.013065338134765625, 0.014131546020507812, 0.01519775390625, 0.016263961791992188, 0.017330169677734375, 0.018396377563476562, 0.01946258544921875, 0.020528793334960938, 0.021595001220703125, 0.022661209106445312, 0.0237274169921875, 0.024793624877929688, 0.025859832763671875, 0.026926040649414062, 0.02799224853515625, 0.029058456420898438, 0.030124664306640625, 0.031190872192382812, 0.032257080078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 8.0, 7.0, 8.0, 12.0, 7.0, 7.0, 22.0, 19.0, 48.0, 62.0, 108.0, 132.0, 123.0, 137.0, 92.0, 51.0, 39.0, 29.0, 24.0, 5.0, 11.0, 9.0, 6.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.357929229736328e-06, -9.085983037948608e-06, -8.814036846160889e-06, -8.542090654373169e-06, -8.27014446258545e-06, -7.99819827079773e-06, -7.72625207901001e-06, -7.45430588722229e-06, -7.18235969543457e-06, -6.910413503646851e-06, -6.638467311859131e-06, -6.366521120071411e-06, -6.094574928283691e-06, -5.822628736495972e-06, -5.550682544708252e-06, -5.278736352920532e-06, -5.0067901611328125e-06, -4.734843969345093e-06, -4.462897777557373e-06, -4.190951585769653e-06, -3.919005393981934e-06, -3.647059202194214e-06, -3.375113010406494e-06, -3.1031668186187744e-06, -2.8312206268310547e-06, -2.559274435043335e-06, -2.2873282432556152e-06, -2.0153820514678955e-06, -1.7434358596801758e-06, -1.471489667892456e-06, -1.1995434761047363e-06, -9.275972843170166e-07, -6.556510925292969e-07, -3.8370490074157715e-07, -1.1175870895385742e-07, 1.601874828338623e-07, 4.3213367462158203e-07, 7.040798664093018e-07, 9.760260581970215e-07, 1.2479722499847412e-06, 1.519918441772461e-06, 1.7918646335601807e-06, 2.0638108253479004e-06, 2.33575701713562e-06, 2.60770320892334e-06, 2.8796494007110596e-06, 3.1515955924987793e-06, 3.423541784286499e-06, 3.6954879760742188e-06, 3.9674341678619385e-06, 4.239380359649658e-06, 4.511326551437378e-06, 4.783272743225098e-06, 5.055218935012817e-06, 5.327165126800537e-06, 5.599111318588257e-06, 5.8710575103759766e-06, 6.143003702163696e-06, 6.414949893951416e-06, 6.686896085739136e-06, 6.9588422775268555e-06, 7.230788469314575e-06, 7.502734661102295e-06, 7.774680852890015e-06, 8.046627044677734e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 7.0, 7.0, 4.0, 13.0, 16.0, 14.0, 27.0, 39.0, 43.0, 55.0, 95.0, 159.0, 230.0, 403.0, 752.0, 1439.0, 3662.0, 10760.0, 39579.0, 401239.0, 530059.0, 41534.0, 11237.0, 3736.0, 1529.0, 705.0, 438.0, 253.0, 170.0, 112.0, 64.0, 45.0, 36.0, 24.0, 15.0, 15.0, 11.0, 7.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.045318603515625, -0.04402446746826172, -0.04273033142089844, -0.041436195373535156, -0.040142059326171875, -0.038847923278808594, -0.03755378723144531, -0.03625965118408203, -0.03496551513671875, -0.03367137908935547, -0.03237724304199219, -0.031083106994628906, -0.029788970947265625, -0.028494834899902344, -0.027200698852539062, -0.02590656280517578, -0.0246124267578125, -0.02331829071044922, -0.022024154663085938, -0.020730018615722656, -0.019435882568359375, -0.018141746520996094, -0.016847610473632812, -0.015553474426269531, -0.01425933837890625, -0.012965202331542969, -0.011671066284179688, -0.010376930236816406, -0.009082794189453125, -0.007788658142089844, -0.0064945220947265625, -0.005200386047363281, -0.00390625, -0.0026121139526367188, -0.0013179779052734375, -2.384185791015625e-05, 0.001270294189453125, 0.0025644302368164062, 0.0038585662841796875, 0.005152702331542969, 0.00644683837890625, 0.007740974426269531, 0.009035110473632812, 0.010329246520996094, 0.011623382568359375, 0.012917518615722656, 0.014211654663085938, 0.015505790710449219, 0.0167999267578125, 0.01809406280517578, 0.019388198852539062, 0.020682334899902344, 0.021976470947265625, 0.023270606994628906, 0.024564743041992188, 0.02585887908935547, 0.02715301513671875, 0.02844715118408203, 0.029741287231445312, 0.031035423278808594, 0.032329559326171875, 0.033623695373535156, 0.03491783142089844, 0.03621196746826172, 0.037506103515625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 9.0, 7.0, 4.0, 7.0, 9.0, 5.0, 16.0, 25.0, 22.0, 39.0, 37.0, 64.0, 105.0, 132.0, 147.0, 103.0, 77.0, 45.0, 27.0, 35.0, 16.0, 12.0, 10.0, 15.0, 6.0, 6.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.04986572265625, -0.0484461784362793, -0.047026634216308594, -0.04560708999633789, -0.04418754577636719, -0.042768001556396484, -0.04134845733642578, -0.03992891311645508, -0.038509368896484375, -0.03708982467651367, -0.03567028045654297, -0.034250736236572266, -0.03283119201660156, -0.03141164779663086, -0.029992103576660156, -0.028572559356689453, -0.02715301513671875, -0.025733470916748047, -0.024313926696777344, -0.02289438247680664, -0.021474838256835938, -0.020055294036865234, -0.01863574981689453, -0.017216205596923828, -0.015796661376953125, -0.014377117156982422, -0.012957572937011719, -0.011538028717041016, -0.010118484497070312, -0.00869894027709961, -0.007279396057128906, -0.005859851837158203, -0.0044403076171875, -0.003020763397216797, -0.0016012191772460938, -0.00018167495727539062, 0.0012378692626953125, 0.0026574134826660156, 0.004076957702636719, 0.005496501922607422, 0.006916046142578125, 0.008335590362548828, 0.009755134582519531, 0.011174678802490234, 0.012594223022460938, 0.01401376724243164, 0.015433311462402344, 0.016852855682373047, 0.01827239990234375, 0.019691944122314453, 0.021111488342285156, 0.02253103256225586, 0.023950576782226562, 0.025370121002197266, 0.02678966522216797, 0.028209209442138672, 0.029628753662109375, 0.031048297882080078, 0.03246784210205078, 0.033887386322021484, 0.03530693054199219, 0.03672647476196289, 0.038146018981933594, 0.0395655632019043, 0.040985107421875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 11.0, 317.0, 683.0, 5.0, 2.0, 2.0], "bins": [-11.232830047607422, -11.04603385925293, -10.859237670898438, -10.672442436218262, -10.48564624786377, -10.298850059509277, -10.112053871154785, -9.92525863647461, -9.738462448120117, -9.551666259765625, -9.364870071411133, -9.178074836730957, -8.991278648376465, -8.804482460021973, -8.61768627166748, -8.430891036987305, -8.244094848632812, -8.05729866027832, -7.870502948760986, -7.683706760406494, -7.49691104888916, -7.310114860534668, -7.123319149017334, -6.936522960662842, -6.74972677230835, -6.562930583953857, -6.376134872436523, -6.189338684082031, -6.002542972564697, -5.815746784210205, -5.628951072692871, -5.442154884338379, -5.255359172821045, -5.068562984466553, -4.881767272949219, -4.694971084594727, -4.508175373077393, -4.3213791847229, -4.134583473205566, -3.947787284851074, -3.7609915733337402, -3.574195623397827, -3.387399673461914, -3.200603723526001, -3.013807773590088, -2.827011823654175, -2.6402158737182617, -2.4534196853637695, -2.2666237354278564, -2.0798277854919434, -1.8930318355560303, -1.7062358856201172, -1.519439935684204, -1.332643985748291, -1.1458479166030884, -0.9590519666671753, -0.7722560167312622, -0.5854600667953491, -0.39866408705711365, -0.21186810731887817, -0.025072157382965088, 0.161723792552948, 0.34851980209350586, 0.535315752029419, 0.722111701965332]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 3.0, 2.0, 13.0, 6.0, 17.0, 19.0, 18.0, 16.0, 25.0, 37.0, 28.0, 40.0, 51.0, 43.0, 41.0, 38.0, 41.0, 33.0, 50.0, 37.0, 47.0, 45.0, 40.0, 39.0, 38.0, 36.0, 29.0, 28.0, 25.0, 19.0, 13.0, 16.0, 6.0, 13.0, 12.0, 7.0, 6.0, 8.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9799671769142151, -0.9492667317390442, -0.9185662865638733, -0.8878658413887024, -0.8571653962135315, -0.8264649510383606, -0.7957645654678345, -0.7650641202926636, -0.7343636751174927, -0.7036632299423218, -0.6729627847671509, -0.64226233959198, -0.6115618944168091, -0.5808614492416382, -0.5501610040664673, -0.5194605588912964, -0.4887601137161255, -0.4580596685409546, -0.4273592233657837, -0.3966587781906128, -0.3659583330154419, -0.335257887840271, -0.3045574724674225, -0.2738570272922516, -0.2431565821170807, -0.2124561369419098, -0.1817556917667389, -0.1510552614927292, -0.12035481631755829, -0.08965437114238739, -0.058953940868377686, -0.028253495693206787, 0.002446889877319336, 0.033147331327199936, 0.06384777277708054, 0.09454821050167084, 0.12524865567684174, 0.15594910085201263, 0.18664953112602234, 0.21734997630119324, 0.24805042147636414, 0.27875086665153503, 0.30945131182670593, 0.34015172719955444, 0.37085217237472534, 0.40155261754989624, 0.43225306272506714, 0.46295350790023804, 0.49365395307540894, 0.5243543982505798, 0.5550548434257507, 0.5857552886009216, 0.6164557337760925, 0.6471561789512634, 0.6778565645217896, 0.7085570096969604, 0.7392574548721313, 0.7699579000473022, 0.8006583452224731, 0.831358790397644, 0.8620592355728149, 0.8927596807479858, 0.9234601259231567, 0.9541605710983276, 0.9848610162734985]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 7.0, 9.0, 7.0, 12.0, 13.0, 8.0, 25.0, 119.0, 24291.0, 4169471.0, 196.0, 36.0, 22.0, 15.0, 12.0, 10.0, 6.0, 5.0, 6.0, 7.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.646484375, -1.591796875, -1.537109375, -1.482421875, -1.427734375, -1.373046875, -1.318359375, -1.263671875, -1.208984375, -1.154296875, -1.099609375, -1.044921875, -0.990234375, -0.935546875, -0.880859375, -0.826171875, -0.771484375, -0.716796875, -0.662109375, -0.607421875, -0.552734375, -0.498046875, -0.443359375, -0.388671875, -0.333984375, -0.279296875, -0.224609375, -0.169921875, -0.115234375, -0.060546875, -0.005859375, 0.048828125, 0.103515625, 0.158203125, 0.212890625, 0.267578125, 0.322265625, 0.376953125, 0.431640625, 0.486328125, 0.541015625, 0.595703125, 0.650390625, 0.705078125, 0.759765625, 0.814453125, 0.869140625, 0.923828125, 0.978515625, 1.033203125, 1.087890625, 1.142578125, 1.197265625, 1.251953125, 1.306640625, 1.361328125, 1.416015625, 1.470703125, 1.525390625, 1.580078125, 1.634765625, 1.689453125, 1.744140625, 1.798828125, 1.853515625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 1.0, 6.0, 9.0, 16.0, 18.0, 28.0, 64.0, 183.0, 243.0, 198.0, 119.0, 54.0, 21.0, 7.0, 12.0, 9.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12841796875, -0.12394142150878906, -0.11946487426757812, -0.11498832702636719, -0.11051177978515625, -0.10603523254394531, -0.10155868530273438, -0.09708213806152344, -0.0926055908203125, -0.08812904357910156, -0.08365249633789062, -0.07917594909667969, -0.07469940185546875, -0.07022285461425781, -0.06574630737304688, -0.06126976013183594, -0.056793212890625, -0.05231666564941406, -0.047840118408203125, -0.04336357116699219, -0.03888702392578125, -0.03441047668457031, -0.029933929443359375, -0.025457382202148438, -0.0209808349609375, -0.016504287719726562, -0.012027740478515625, -0.0075511932373046875, -0.00307464599609375, 0.0014019012451171875, 0.005878448486328125, 0.010354995727539062, 0.01483154296875, 0.019308090209960938, 0.023784637451171875, 0.028261184692382812, 0.03273773193359375, 0.03721427917480469, 0.041690826416015625, 0.04616737365722656, 0.0506439208984375, 0.05512046813964844, 0.059597015380859375, 0.06407356262207031, 0.06855010986328125, 0.07302665710449219, 0.07750320434570312, 0.08197975158691406, 0.086456298828125, 0.09093284606933594, 0.09540939331054688, 0.09988594055175781, 0.10436248779296875, 0.10883903503417969, 0.11331558227539062, 0.11779212951660156, 0.1222686767578125, 0.12674522399902344, 0.13122177124023438, 0.1356983184814453, 0.14017486572265625, 0.1446514129638672, 0.14912796020507812, 0.15360450744628906, 0.1580810546875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 19.0, 31.0, 67.0, 97.0, 162.0, 310.0, 548.0, 1115.0, 2623.0, 7604.0, 28534.0, 181671.0, 3668709.0, 253224.0, 35193.0, 8688.0, 2974.0, 1275.0, 642.0, 366.0, 185.0, 96.0, 55.0, 28.0, 17.0, 12.0, 14.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.11968994140625, -0.11641693115234375, -0.1131439208984375, -0.10987091064453125, -0.106597900390625, -0.10332489013671875, -0.1000518798828125, -0.09677886962890625, -0.093505859375, -0.09023284912109375, -0.0869598388671875, -0.08368682861328125, -0.080413818359375, -0.07714080810546875, -0.0738677978515625, -0.07059478759765625, -0.06732177734375, -0.06404876708984375, -0.0607757568359375, -0.05750274658203125, -0.054229736328125, -0.05095672607421875, -0.0476837158203125, -0.04441070556640625, -0.0411376953125, -0.03786468505859375, -0.0345916748046875, -0.03131866455078125, -0.028045654296875, -0.02477264404296875, -0.0214996337890625, -0.01822662353515625, -0.01495361328125, -0.01168060302734375, -0.0084075927734375, -0.00513458251953125, -0.001861572265625, 0.00141143798828125, 0.0046844482421875, 0.00795745849609375, 0.01123046875, 0.01450347900390625, 0.0177764892578125, 0.02104949951171875, 0.024322509765625, 0.02759552001953125, 0.0308685302734375, 0.03414154052734375, 0.03741455078125, 0.04068756103515625, 0.0439605712890625, 0.04723358154296875, 0.050506591796875, 0.05377960205078125, 0.0570526123046875, 0.06032562255859375, 0.0635986328125, 0.06687164306640625, 0.0701446533203125, 0.07341766357421875, 0.076690673828125, 0.07996368408203125, 0.0832366943359375, 0.08650970458984375, 0.08978271484375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 6.0, 10.0, 17.0, 27.0, 24.0, 50.0, 44.0, 77.0, 123.0, 234.0, 790.0, 1939.0, 278.0, 173.0, 99.0, 58.0, 32.0, 23.0, 18.0, 14.0, 6.0, 10.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038330078125, -0.03705739974975586, -0.03578472137451172, -0.03451204299926758, -0.03323936462402344, -0.0319666862487793, -0.030694007873535156, -0.029421329498291016, -0.028148651123046875, -0.026875972747802734, -0.025603294372558594, -0.024330615997314453, -0.023057937622070312, -0.021785259246826172, -0.02051258087158203, -0.01923990249633789, -0.01796722412109375, -0.01669454574584961, -0.015421867370605469, -0.014149188995361328, -0.012876510620117188, -0.011603832244873047, -0.010331153869628906, -0.009058475494384766, -0.007785797119140625, -0.006513118743896484, -0.005240440368652344, -0.003967761993408203, -0.0026950836181640625, -0.0014224052429199219, -0.00014972686767578125, 0.0011229515075683594, 0.0023956298828125, 0.0036683082580566406, 0.004940986633300781, 0.006213665008544922, 0.0074863433837890625, 0.008759021759033203, 0.010031700134277344, 0.011304378509521484, 0.012577056884765625, 0.013849735260009766, 0.015122413635253906, 0.016395092010498047, 0.017667770385742188, 0.018940448760986328, 0.02021312713623047, 0.02148580551147461, 0.02275848388671875, 0.02403116226196289, 0.02530384063720703, 0.026576519012451172, 0.027849197387695312, 0.029121875762939453, 0.030394554138183594, 0.031667232513427734, 0.032939910888671875, 0.034212589263916016, 0.035485267639160156, 0.0367579460144043, 0.03803062438964844, 0.03930330276489258, 0.04057598114013672, 0.04184865951538086, 0.043121337890625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 5.0, 7.0, 29.0, 174.0, 500.0, 240.0, 40.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1107993125915527, -1.0869327783584595, -1.0630662441253662, -1.0391998291015625, -1.0153332948684692, -0.991466760635376, -0.9676002264022827, -0.9437336921691895, -0.9198671579360962, -0.8960006237030029, -0.8721341490745544, -0.8482676148414612, -0.8244010806083679, -0.8005346059799194, -0.7766680717468262, -0.7528015375137329, -0.7289350628852844, -0.7050685286521912, -0.6812020540237427, -0.6573355197906494, -0.6334689855575562, -0.6096024513244629, -0.5857359766960144, -0.5618694424629211, -0.5380029678344727, -0.5141364336013794, -0.4902699291706085, -0.46640342473983765, -0.4425368905067444, -0.4186703860759735, -0.39480388164520264, -0.3709373474121094, -0.3470707833766937, -0.32320427894592285, -0.2993377447128296, -0.2754712402820587, -0.25160473585128784, -0.22773820161819458, -0.2038716971874237, -0.18000517785549164, -0.15613865852355957, -0.1322721391916275, -0.10840562731027603, -0.08453911542892456, -0.06067259609699249, -0.036806076765060425, -0.01293957233428955, 0.010926946997642517, 0.034793466329574585, 0.058659981936216354, 0.08252649754285812, 0.1063930094242096, 0.13025952875614166, 0.15412604808807373, 0.1779925525188446, 0.20185907185077667, 0.22572559118270874, 0.2495921105146408, 0.2734586298465729, 0.29732513427734375, 0.321191668510437, 0.3450581729412079, 0.36892467737197876, 0.392791211605072, 0.4166577160358429]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 10.0, 4.0, 3.0, 13.0, 14.0, 10.0, 14.0, 13.0, 12.0, 18.0, 15.0, 35.0, 20.0, 33.0, 25.0, 27.0, 37.0, 41.0, 33.0, 41.0, 39.0, 47.0, 37.0, 44.0, 32.0, 34.0, 36.0, 35.0, 21.0, 30.0, 27.0, 31.0, 22.0, 14.0, 17.0, 13.0, 16.0, 21.0, 16.0, 14.0, 10.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.10096240043640137, -0.0977456271648407, -0.09452885389328003, -0.09131207317113876, -0.0880952998995781, -0.08487852662801743, -0.08166174590587616, -0.07844497263431549, -0.07522819936275482, -0.07201142609119415, -0.06879465281963348, -0.06557787209749222, -0.06236109882593155, -0.05914432555437088, -0.05592754855751991, -0.052710771560668945, -0.049493998289108276, -0.04627722501754761, -0.04306044802069664, -0.03984367102384567, -0.036626897752285004, -0.033410124480724335, -0.030193347483873367, -0.02697657234966755, -0.02375979721546173, -0.020543022081255913, -0.017326246947050095, -0.014109471812844276, -0.010892696678638458, -0.00767592154443264, -0.004459146410226822, -0.0012423712760210037, 0.0019744038581848145, 0.005191178992390633, 0.00840795412659645, 0.011624729260802269, 0.014841504395008087, 0.018058279529213905, 0.021275054663419724, 0.02449182979762554, 0.02770860493183136, 0.030925380066037178, 0.034142155200242996, 0.037358932197093964, 0.04057570546865463, 0.0437924787402153, 0.04700925573706627, 0.050226032733917236, 0.053442806005477905, 0.056659579277038574, 0.05987635627388954, 0.06309313327074051, 0.06630990654230118, 0.06952667981386185, 0.07274346053600311, 0.07596023380756378, 0.07917700707912445, 0.08239378035068512, 0.08561055362224579, 0.08882733434438705, 0.09204410761594772, 0.09526088088750839, 0.09847766160964966, 0.10169443488121033, 0.104911208152771]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 10.0, 9.0, 17.0, 12.0, 31.0, 33.0, 45.0, 58.0, 102.0, 122.0, 187.0, 299.0, 513.0, 829.0, 1673.0, 3682.0, 9564.0, 36823.0, 224283.0, 623425.0, 112638.0, 21683.0, 6553.0, 2745.0, 1287.0, 725.0, 411.0, 261.0, 167.0, 105.0, 81.0, 53.0, 40.0, 29.0, 13.0, 13.0, 15.0, 8.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1312255859375, -0.12689781188964844, -0.12257003784179688, -0.11824226379394531, -0.11391448974609375, -0.10958671569824219, -0.10525894165039062, -0.10093116760253906, -0.0966033935546875, -0.09227561950683594, -0.08794784545898438, -0.08362007141113281, -0.07929229736328125, -0.07496452331542969, -0.07063674926757812, -0.06630897521972656, -0.061981201171875, -0.05765342712402344, -0.053325653076171875, -0.04899787902832031, -0.04467010498046875, -0.04034233093261719, -0.036014556884765625, -0.03168678283691406, -0.0273590087890625, -0.023031234741210938, -0.018703460693359375, -0.014375686645507812, -0.01004791259765625, -0.0057201385498046875, -0.001392364501953125, 0.0029354095458984375, 0.00726318359375, 0.011590957641601562, 0.015918731689453125, 0.020246505737304688, 0.02457427978515625, 0.028902053833007812, 0.033229827880859375, 0.03755760192871094, 0.0418853759765625, 0.04621315002441406, 0.050540924072265625, 0.05486869812011719, 0.05919647216796875, 0.06352424621582031, 0.06785202026367188, 0.07217979431152344, 0.076507568359375, 0.08083534240722656, 0.08516311645507812, 0.08949089050292969, 0.09381866455078125, 0.09814643859863281, 0.10247421264648438, 0.10680198669433594, 0.1111297607421875, 0.11545753479003906, 0.11978530883789062, 0.12411308288574219, 0.12844085693359375, 0.1327686309814453, 0.13709640502929688, 0.14142417907714844, 0.145751953125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 1.0, 6.0, 8.0, 13.0, 19.0, 25.0, 70.0, 154.0, 229.0, 215.0, 124.0, 64.0, 29.0, 10.0, 11.0, 7.0, 8.0, 3.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12841796875, -0.12396430969238281, -0.11951065063476562, -0.11505699157714844, -0.11060333251953125, -0.10614967346191406, -0.10169601440429688, -0.09724235534667969, -0.0927886962890625, -0.08833503723144531, -0.08388137817382812, -0.07942771911621094, -0.07497406005859375, -0.07052040100097656, -0.06606674194335938, -0.06161308288574219, -0.057159423828125, -0.05270576477050781, -0.048252105712890625, -0.04379844665527344, -0.03934478759765625, -0.03489112854003906, -0.030437469482421875, -0.025983810424804688, -0.0215301513671875, -0.017076492309570312, -0.012622833251953125, -0.008169174194335938, -0.00371551513671875, 0.0007381439208984375, 0.005191802978515625, 0.009645462036132812, 0.01409912109375, 0.018552780151367188, 0.023006439208984375, 0.027460098266601562, 0.03191375732421875, 0.03636741638183594, 0.040821075439453125, 0.04527473449707031, 0.0497283935546875, 0.05418205261230469, 0.058635711669921875, 0.06308937072753906, 0.06754302978515625, 0.07199668884277344, 0.07645034790039062, 0.08090400695800781, 0.085357666015625, 0.08981132507324219, 0.09426498413085938, 0.09871864318847656, 0.10317230224609375, 0.10762596130371094, 0.11207962036132812, 0.11653327941894531, 0.1209869384765625, 0.1254405975341797, 0.12989425659179688, 0.13434791564941406, 0.13880157470703125, 0.14325523376464844, 0.14770889282226562, 0.1521625518798828, 0.1566162109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 8.0, 10.0, 16.0, 16.0, 19.0, 25.0, 45.0, 59.0, 90.0, 130.0, 223.0, 379.0, 711.0, 1893.0, 16006.0, 816541.0, 204691.0, 5098.0, 1227.0, 513.0, 270.0, 181.0, 100.0, 77.0, 67.0, 38.0, 23.0, 18.0, 19.0, 9.0, 11.0, 8.0, 6.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.314697265625, -0.3053855895996094, -0.29607391357421875, -0.2867622375488281, -0.2774505615234375, -0.2681388854980469, -0.25882720947265625, -0.24951553344726562, -0.240203857421875, -0.23089218139648438, -0.22158050537109375, -0.21226882934570312, -0.2029571533203125, -0.19364547729492188, -0.18433380126953125, -0.17502212524414062, -0.16571044921875, -0.15639877319335938, -0.14708709716796875, -0.13777542114257812, -0.1284637451171875, -0.11915206909179688, -0.10984039306640625, -0.10052871704101562, -0.091217041015625, -0.08190536499023438, -0.07259368896484375, -0.06328201293945312, -0.0539703369140625, -0.044658660888671875, -0.03534698486328125, -0.026035308837890625, -0.0167236328125, -0.007411956787109375, 0.00189971923828125, 0.011211395263671875, 0.0205230712890625, 0.029834747314453125, 0.03914642333984375, 0.048458099365234375, 0.057769775390625, 0.06708145141601562, 0.07639312744140625, 0.08570480346679688, 0.0950164794921875, 0.10432815551757812, 0.11363983154296875, 0.12295150756835938, 0.13226318359375, 0.14157485961914062, 0.15088653564453125, 0.16019821166992188, 0.1695098876953125, 0.17882156372070312, 0.18813323974609375, 0.19744491577148438, 0.206756591796875, 0.21606826782226562, 0.22537994384765625, 0.23469161987304688, 0.2440032958984375, 0.2533149719238281, 0.26262664794921875, 0.2719383239746094, 0.28125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 2.0, 5.0, 6.0, 11.0, 9.0, 17.0, 20.0, 17.0, 34.0, 24.0, 27.0, 18.0, 37.0, 35.0, 34.0, 37.0, 49.0, 41.0, 47.0, 48.0, 52.0, 38.0, 40.0, 33.0, 32.0, 40.0, 31.0, 21.0, 34.0, 20.0, 17.0, 25.0, 21.0, 11.0, 12.0, 15.0, 5.0, 6.0, 6.0, 7.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.2369384765625, -0.23050308227539062, -0.22406768798828125, -0.21763229370117188, -0.2111968994140625, -0.20476150512695312, -0.19832611083984375, -0.19189071655273438, -0.185455322265625, -0.17901992797851562, -0.17258453369140625, -0.16614913940429688, -0.1597137451171875, -0.15327835083007812, -0.14684295654296875, -0.14040756225585938, -0.13397216796875, -0.12753677368164062, -0.12110137939453125, -0.11466598510742188, -0.1082305908203125, -0.10179519653320312, -0.09535980224609375, -0.08892440795898438, -0.082489013671875, -0.07605361938476562, -0.06961822509765625, -0.06318283081054688, -0.0567474365234375, -0.050312042236328125, -0.04387664794921875, -0.037441253662109375, -0.031005859375, -0.024570465087890625, -0.01813507080078125, -0.011699676513671875, -0.0052642822265625, 0.001171112060546875, 0.00760650634765625, 0.014041900634765625, 0.020477294921875, 0.026912689208984375, 0.03334808349609375, 0.039783477783203125, 0.0462188720703125, 0.052654266357421875, 0.05908966064453125, 0.06552505493164062, 0.07196044921875, 0.07839584350585938, 0.08483123779296875, 0.09126663208007812, 0.0977020263671875, 0.10413742065429688, 0.11057281494140625, 0.11700820922851562, 0.123443603515625, 0.12987899780273438, 0.13631439208984375, 0.14274978637695312, 0.1491851806640625, 0.15562057495117188, 0.16205596923828125, 0.16849136352539062, 0.1749267578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 11.0, 10.0, 12.0, 21.0, 30.0, 41.0, 67.0, 102.0, 196.0, 375.0, 848.0, 2412.0, 9202.0, 54092.0, 762712.0, 192191.0, 19129.0, 4409.0, 1398.0, 573.0, 280.0, 131.0, 108.0, 68.0, 33.0, 26.0, 14.0, 15.0, 16.0, 6.0, 5.0, 6.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.06640625, -0.06409549713134766, -0.06178474426269531, -0.05947399139404297, -0.057163238525390625, -0.05485248565673828, -0.05254173278808594, -0.050230979919433594, -0.04792022705078125, -0.045609474182128906, -0.04329872131347656, -0.04098796844482422, -0.038677215576171875, -0.03636646270751953, -0.03405570983886719, -0.031744956970214844, -0.0294342041015625, -0.027123451232910156, -0.024812698364257812, -0.02250194549560547, -0.020191192626953125, -0.01788043975830078, -0.015569686889648438, -0.013258934020996094, -0.01094818115234375, -0.008637428283691406, -0.0063266754150390625, -0.004015922546386719, -0.001705169677734375, 0.0006055831909179688, 0.0029163360595703125, 0.005227088928222656, 0.007537841796875, 0.009848594665527344, 0.012159347534179688, 0.014470100402832031, 0.016780853271484375, 0.01909160614013672, 0.021402359008789062, 0.023713111877441406, 0.02602386474609375, 0.028334617614746094, 0.030645370483398438, 0.03295612335205078, 0.035266876220703125, 0.03757762908935547, 0.03988838195800781, 0.042199134826660156, 0.0445098876953125, 0.046820640563964844, 0.04913139343261719, 0.05144214630126953, 0.053752899169921875, 0.05606365203857422, 0.05837440490722656, 0.060685157775878906, 0.06299591064453125, 0.0653066635131836, 0.06761741638183594, 0.06992816925048828, 0.07223892211914062, 0.07454967498779297, 0.07686042785644531, 0.07917118072509766, 0.08148193359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 10.0, 8.0, 17.0, 21.0, 30.0, 75.0, 116.0, 173.0, 176.0, 121.0, 95.0, 41.0, 31.0, 22.0, 12.0, 7.0, 5.0, 8.0, 3.0, 5.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.5556812286376953e-05, -1.5004537999629974e-05, -1.4452263712882996e-05, -1.3899989426136017e-05, -1.3347715139389038e-05, -1.279544085264206e-05, -1.224316656589508e-05, -1.1690892279148102e-05, -1.1138617992401123e-05, -1.0586343705654144e-05, -1.0034069418907166e-05, -9.481795132160187e-06, -8.929520845413208e-06, -8.37724655866623e-06, -7.82497227191925e-06, -7.272697985172272e-06, -6.720423698425293e-06, -6.168149411678314e-06, -5.6158751249313354e-06, -5.063600838184357e-06, -4.511326551437378e-06, -3.959052264690399e-06, -3.4067779779434204e-06, -2.8545036911964417e-06, -2.302229404449463e-06, -1.7499551177024841e-06, -1.1976808309555054e-06, -6.454065442085266e-07, -9.313225746154785e-08, 4.591420292854309e-07, 1.0114163160324097e-06, 1.5636906027793884e-06, 2.115964889526367e-06, 2.668239176273346e-06, 3.2205134630203247e-06, 3.7727877497673035e-06, 4.325062036514282e-06, 4.877336323261261e-06, 5.42961061000824e-06, 5.9818848967552185e-06, 6.534159183502197e-06, 7.086433470249176e-06, 7.638707756996155e-06, 8.190982043743134e-06, 8.743256330490112e-06, 9.295530617237091e-06, 9.84780490398407e-06, 1.0400079190731049e-05, 1.0952353477478027e-05, 1.1504627764225006e-05, 1.2056902050971985e-05, 1.2609176337718964e-05, 1.3161450624465942e-05, 1.3713724911212921e-05, 1.42659991979599e-05, 1.4818273484706879e-05, 1.5370547771453857e-05, 1.5922822058200836e-05, 1.6475096344947815e-05, 1.7027370631694794e-05, 1.7579644918441772e-05, 1.813191920518875e-05, 1.868419349193573e-05, 1.923646777868271e-05, 1.9788742065429688e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 9.0, 7.0, 14.0, 19.0, 35.0, 64.0, 89.0, 138.0, 275.0, 512.0, 1363.0, 5115.0, 32513.0, 704583.0, 279616.0, 18677.0, 3339.0, 1120.0, 452.0, 235.0, 152.0, 82.0, 38.0, 28.0, 32.0, 23.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.107177734375, -0.10401344299316406, -0.10084915161132812, -0.09768486022949219, -0.09452056884765625, -0.09135627746582031, -0.08819198608398438, -0.08502769470214844, -0.0818634033203125, -0.07869911193847656, -0.07553482055664062, -0.07237052917480469, -0.06920623779296875, -0.06604194641113281, -0.06287765502929688, -0.05971336364746094, -0.056549072265625, -0.05338478088378906, -0.050220489501953125, -0.04705619812011719, -0.04389190673828125, -0.04072761535644531, -0.037563323974609375, -0.03439903259277344, -0.0312347412109375, -0.028070449829101562, -0.024906158447265625, -0.021741867065429688, -0.01857757568359375, -0.015413284301757812, -0.012248992919921875, -0.009084701538085938, -0.00592041015625, -0.0027561187744140625, 0.000408172607421875, 0.0035724639892578125, 0.00673675537109375, 0.009901046752929688, 0.013065338134765625, 0.016229629516601562, 0.0193939208984375, 0.022558212280273438, 0.025722503662109375, 0.028886795043945312, 0.03205108642578125, 0.03521537780761719, 0.038379669189453125, 0.04154396057128906, 0.044708251953125, 0.04787254333496094, 0.051036834716796875, 0.05420112609863281, 0.05736541748046875, 0.06052970886230469, 0.06369400024414062, 0.06685829162597656, 0.0700225830078125, 0.07318687438964844, 0.07635116577148438, 0.07951545715332031, 0.08267974853515625, 0.08584403991699219, 0.08900833129882812, 0.09217262268066406, 0.0953369140625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 5.0, 6.0, 6.0, 12.0, 15.0, 19.0, 29.0, 45.0, 57.0, 63.0, 87.0, 97.0, 128.0, 118.0, 94.0, 71.0, 35.0, 30.0, 21.0, 17.0, 14.0, 3.0, 5.0, 10.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051483154296875, -0.049364566802978516, -0.04724597930908203, -0.04512739181518555, -0.04300880432128906, -0.04089021682739258, -0.038771629333496094, -0.03665304183959961, -0.034534454345703125, -0.03241586685180664, -0.030297279357910156, -0.028178691864013672, -0.026060104370117188, -0.023941516876220703, -0.02182292938232422, -0.019704341888427734, -0.01758575439453125, -0.015467166900634766, -0.013348579406738281, -0.011229991912841797, -0.009111404418945312, -0.006992816925048828, -0.004874229431152344, -0.0027556419372558594, -0.000637054443359375, 0.0014815330505371094, 0.0036001205444335938, 0.005718708038330078, 0.007837295532226562, 0.009955883026123047, 0.012074470520019531, 0.014193058013916016, 0.0163116455078125, 0.018430233001708984, 0.02054882049560547, 0.022667407989501953, 0.024785995483398438, 0.026904582977294922, 0.029023170471191406, 0.03114175796508789, 0.033260345458984375, 0.03537893295288086, 0.037497520446777344, 0.03961610794067383, 0.04173469543457031, 0.0438532829284668, 0.04597187042236328, 0.048090457916259766, 0.05020904541015625, 0.052327632904052734, 0.05444622039794922, 0.0565648078918457, 0.05868339538574219, 0.06080198287963867, 0.06292057037353516, 0.06503915786743164, 0.06715774536132812, 0.06927633285522461, 0.0713949203491211, 0.07351350784301758, 0.07563209533691406, 0.07775068283081055, 0.07986927032470703, 0.08198785781860352, 0.0841064453125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 9.0, 30.0, 101.0, 285.0, 348.0, 162.0, 44.0, 8.0, 5.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4760022163391113, -1.4173980951309204, -1.358794093132019, -1.3001899719238281, -1.2415859699249268, -1.1829818487167358, -1.124377727508545, -1.0657737255096436, -1.0071697235107422, -0.948565661907196, -0.8899616003036499, -0.831357479095459, -0.7727534770965576, -0.7141493558883667, -0.6555452942848206, -0.5969412326812744, -0.5383371114730835, -0.47973304986953735, -0.4211289882659912, -0.3625248968601227, -0.30392083525657654, -0.2453167736530304, -0.18671268224716187, -0.12810862064361572, -0.06950455904006958, -0.01090048998594284, 0.0477035790681839, 0.10630765557289124, 0.16491171717643738, 0.22351577877998352, 0.28211987018585205, 0.3407239317893982, 0.39932799339294434, 0.4579320549964905, 0.5165361166000366, 0.5751402378082275, 0.6337442398071289, 0.6923483610153198, 0.750952422618866, 0.8095564842224121, 0.8681605458259583, 0.9267646074295044, 0.9853686690330505, 1.0439727306365967, 1.1025768518447876, 1.161180853843689, 1.2197849750518799, 1.2783889770507812, 1.3369930982589722, 1.395597219467163, 1.4542012214660645, 1.5128053426742554, 1.5714093446731567, 1.6300134658813477, 1.688617467880249, 1.74722158908844, 1.8058257102966309, 1.8644298315048218, 1.9230338335037231, 1.981637954711914, 2.0402419567108154, 2.098845958709717, 2.1574501991271973, 2.2160542011260986, 2.274658203125]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 4.0, 5.0, 15.0, 18.0, 17.0, 22.0, 30.0, 27.0, 30.0, 27.0, 21.0, 32.0, 34.0, 47.0, 46.0, 45.0, 48.0, 62.0, 59.0, 34.0, 37.0, 41.0, 34.0, 42.0, 30.0, 31.0, 21.0, 20.0, 10.0, 20.0, 13.0, 14.0, 8.0, 5.0, 7.0, 3.0, 7.0, 6.0, 8.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.124292254447937, -1.0891640186309814, -1.0540356636047363, -1.0189074277877808, -0.9837791323661804, -0.9486508369445801, -0.9135226011276245, -0.8783943057060242, -0.8432660102844238, -0.8081377148628235, -0.7730094194412231, -0.7378811836242676, -0.7027528882026672, -0.6676245927810669, -0.6324963569641113, -0.597368061542511, -0.5622397661209106, -0.5271114706993103, -0.49198320508003235, -0.4568549394607544, -0.42172664403915405, -0.3865983486175537, -0.35147008299827576, -0.3163418173789978, -0.28121352195739746, -0.2460852414369583, -0.21095696091651917, -0.17582868039608002, -0.14070039987564087, -0.10557211935520172, -0.07044383883476257, -0.035315558314323425, -0.00018715858459472656, 0.03494112193584442, 0.07006940245628357, 0.10519768297672272, 0.14032596349716187, 0.175454244017601, 0.21058252453804016, 0.2457108050584793, 0.28083908557891846, 0.3159673810005188, 0.35109564661979675, 0.3862239122390747, 0.42135220766067505, 0.4564805030822754, 0.49160876870155334, 0.5267370343208313, 0.5618653297424316, 0.596993625164032, 0.6321219205856323, 0.6672501564025879, 0.7023784518241882, 0.7375067472457886, 0.7726349830627441, 0.8077632784843445, 0.8428915739059448, 0.8780198693275452, 0.9131481647491455, 0.9482764005661011, 0.9834046959877014, 1.0185329914093018, 1.0536612272262573, 1.0887895822525024, 1.123917818069458]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 4.0, 12.0, 13.0, 20.0, 38.0, 39.0, 79.0, 126.0, 220.0, 472.0, 1394.0, 6543.0, 79268.0, 4018983.0, 77771.0, 6876.0, 1383.0, 495.0, 220.0, 124.0, 75.0, 38.0, 29.0, 18.0, 11.0, 4.0, 11.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1640625, -0.15850067138671875, -0.1529388427734375, -0.14737701416015625, -0.141815185546875, -0.13625335693359375, -0.1306915283203125, -0.12512969970703125, -0.11956787109375, -0.11400604248046875, -0.1084442138671875, -0.10288238525390625, -0.097320556640625, -0.09175872802734375, -0.0861968994140625, -0.08063507080078125, -0.0750732421875, -0.06951141357421875, -0.0639495849609375, -0.05838775634765625, -0.052825927734375, -0.04726409912109375, -0.0417022705078125, -0.03614044189453125, -0.03057861328125, -0.02501678466796875, -0.0194549560546875, -0.01389312744140625, -0.008331298828125, -0.00276947021484375, 0.0027923583984375, 0.00835418701171875, 0.013916015625, 0.01947784423828125, 0.0250396728515625, 0.03060150146484375, 0.036163330078125, 0.04172515869140625, 0.0472869873046875, 0.05284881591796875, 0.05841064453125, 0.06397247314453125, 0.0695343017578125, 0.07509613037109375, 0.080657958984375, 0.08621978759765625, 0.0917816162109375, 0.09734344482421875, 0.1029052734375, 0.10846710205078125, 0.1140289306640625, 0.11959075927734375, 0.125152587890625, 0.13071441650390625, 0.1362762451171875, 0.14183807373046875, 0.14739990234375, 0.15296173095703125, 0.1585235595703125, 0.16408538818359375, 0.169647216796875, 0.17520904541015625, 0.1807708740234375, 0.18633270263671875, 0.19189453125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 5.0, 6.0, 9.0, 19.0, 16.0, 69.0, 116.0, 221.0, 231.0, 150.0, 78.0, 29.0, 20.0, 8.0, 8.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13037109375, -0.12589073181152344, -0.12141036987304688, -0.11693000793457031, -0.11244964599609375, -0.10796928405761719, -0.10348892211914062, -0.09900856018066406, -0.0945281982421875, -0.09004783630371094, -0.08556747436523438, -0.08108711242675781, -0.07660675048828125, -0.07212638854980469, -0.06764602661132812, -0.06316566467285156, -0.058685302734375, -0.05420494079589844, -0.049724578857421875, -0.04524421691894531, -0.04076385498046875, -0.03628349304199219, -0.031803131103515625, -0.027322769165039062, -0.0228424072265625, -0.018362045288085938, -0.013881683349609375, -0.009401321411132812, -0.00492095947265625, -0.0004405975341796875, 0.004039764404296875, 0.008520126342773438, 0.01300048828125, 0.017480850219726562, 0.021961212158203125, 0.026441574096679688, 0.03092193603515625, 0.03540229797363281, 0.039882659912109375, 0.04436302185058594, 0.0488433837890625, 0.05332374572753906, 0.057804107666015625, 0.06228446960449219, 0.06676483154296875, 0.07124519348144531, 0.07572555541992188, 0.08020591735839844, 0.084686279296875, 0.08916664123535156, 0.09364700317382812, 0.09812736511230469, 0.10260772705078125, 0.10708808898925781, 0.11156845092773438, 0.11604881286621094, 0.1205291748046875, 0.12500953674316406, 0.12948989868164062, 0.1339702606201172, 0.13845062255859375, 0.1429309844970703, 0.14741134643554688, 0.15189170837402344, 0.1563720703125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 4.0, 15.0, 23.0, 50.0, 101.0, 160.0, 315.0, 621.0, 1324.0, 3002.0, 8849.0, 36460.0, 346227.0, 3658107.0, 111288.0, 18482.0, 5402.0, 2019.0, 909.0, 450.0, 215.0, 109.0, 62.0, 43.0, 13.0, 16.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.135009765625, -0.13118362426757812, -0.12735748291015625, -0.12353134155273438, -0.1197052001953125, -0.11587905883789062, -0.11205291748046875, -0.10822677612304688, -0.104400634765625, -0.10057449340820312, -0.09674835205078125, -0.09292221069335938, -0.0890960693359375, -0.08526992797851562, -0.08144378662109375, -0.07761764526367188, -0.07379150390625, -0.06996536254882812, -0.06613922119140625, -0.062313079833984375, -0.0584869384765625, -0.054660797119140625, -0.05083465576171875, -0.047008514404296875, -0.043182373046875, -0.039356231689453125, -0.03553009033203125, -0.031703948974609375, -0.0278778076171875, -0.024051666259765625, -0.02022552490234375, -0.016399383544921875, -0.0125732421875, -0.008747100830078125, -0.00492095947265625, -0.001094818115234375, 0.0027313232421875, 0.006557464599609375, 0.01038360595703125, 0.014209747314453125, 0.018035888671875, 0.021862030029296875, 0.02568817138671875, 0.029514312744140625, 0.0333404541015625, 0.037166595458984375, 0.04099273681640625, 0.044818878173828125, 0.04864501953125, 0.052471160888671875, 0.05629730224609375, 0.060123443603515625, 0.0639495849609375, 0.06777572631835938, 0.07160186767578125, 0.07542800903320312, 0.079254150390625, 0.08308029174804688, 0.08690643310546875, 0.09073257446289062, 0.0945587158203125, 0.09838485717773438, 0.10221099853515625, 0.10603713989257812, 0.10986328125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 3.0, 13.0, 9.0, 15.0, 27.0, 30.0, 51.0, 69.0, 110.0, 229.0, 492.0, 2127.0, 408.0, 159.0, 103.0, 55.0, 41.0, 20.0, 33.0, 20.0, 10.0, 8.0, 2.0, 7.0, 1.0, 4.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04974365234375, -0.04820871353149414, -0.04667377471923828, -0.04513883590698242, -0.04360389709472656, -0.0420689582824707, -0.040534019470214844, -0.038999080657958984, -0.037464141845703125, -0.035929203033447266, -0.034394264221191406, -0.03285932540893555, -0.03132438659667969, -0.029789447784423828, -0.02825450897216797, -0.02671957015991211, -0.02518463134765625, -0.02364969253540039, -0.02211475372314453, -0.020579814910888672, -0.019044876098632812, -0.017509937286376953, -0.015974998474121094, -0.014440059661865234, -0.012905120849609375, -0.011370182037353516, -0.009835243225097656, -0.008300304412841797, -0.0067653656005859375, -0.005230426788330078, -0.0036954879760742188, -0.0021605491638183594, -0.0006256103515625, 0.0009093284606933594, 0.0024442672729492188, 0.003979206085205078, 0.0055141448974609375, 0.007049083709716797, 0.008584022521972656, 0.010118961334228516, 0.011653900146484375, 0.013188838958740234, 0.014723777770996094, 0.016258716583251953, 0.017793655395507812, 0.019328594207763672, 0.02086353302001953, 0.02239847183227539, 0.02393341064453125, 0.02546834945678711, 0.02700328826904297, 0.028538227081298828, 0.030073165893554688, 0.03160810470581055, 0.033143043518066406, 0.034677982330322266, 0.036212921142578125, 0.037747859954833984, 0.039282798767089844, 0.0408177375793457, 0.04235267639160156, 0.04388761520385742, 0.04542255401611328, 0.04695749282836914, 0.048492431640625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 9.0, 20.0, 49.0, 117.0, 284.0, 306.0, 160.0, 41.0, 10.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33423781394958496, -0.3136671781539917, -0.2930965721607208, -0.27252593636512756, -0.2519553303718567, -0.23138469457626343, -0.21081405878067017, -0.1902434378862381, -0.16967281699180603, -0.14910219609737396, -0.1285315752029419, -0.10796093940734863, -0.08739031851291656, -0.0668196976184845, -0.04624906927347183, -0.025678440928459167, -0.0051078200340271, 0.015462804585695267, 0.03603342920541763, 0.05660405382514, 0.07717467844486237, 0.09774529933929443, 0.1183159276843071, 0.13888655602931976, 0.15945717692375183, 0.1800277978181839, 0.20059841871261597, 0.22116905450820923, 0.2417396754026413, 0.26231029629707336, 0.2828809320926666, 0.3034515380859375, 0.32402217388153076, 0.344592809677124, 0.3651634156703949, 0.38573405146598816, 0.40630465745925903, 0.4268752932548523, 0.44744592905044556, 0.4680165648460388, 0.4885871708393097, 0.5091577768325806, 0.5297284126281738, 0.5502990484237671, 0.5708696842193604, 0.5914403200149536, 0.6120108962059021, 0.6325815320014954, 0.6531521677970886, 0.6737228035926819, 0.6942934393882751, 0.7148640155792236, 0.7354346513748169, 0.7560052871704102, 0.7765759229660034, 0.7971465587615967, 0.8177171945571899, 0.8382878303527832, 0.8588584661483765, 0.879429042339325, 0.8999996781349182, 0.9205703139305115, 0.9411409497261047, 0.961711585521698, 0.9822821617126465]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 5.0, 2.0, 9.0, 4.0, 11.0, 12.0, 11.0, 14.0, 15.0, 19.0, 24.0, 27.0, 25.0, 40.0, 27.0, 22.0, 39.0, 33.0, 33.0, 34.0, 36.0, 57.0, 32.0, 40.0, 42.0, 31.0, 38.0, 31.0, 33.0, 40.0, 33.0, 23.0, 27.0, 21.0, 11.0, 16.0, 15.0, 15.0, 16.0, 9.0, 6.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1309802532196045, -0.12680184841156006, -0.12262345850467682, -0.11844506114721298, -0.11426666378974915, -0.11008826643228531, -0.10590986907482147, -0.10173147171735764, -0.0975530743598938, -0.09337467700242996, -0.08919627964496613, -0.08501788228750229, -0.08083948493003845, -0.07666108757257462, -0.07248269021511078, -0.06830429285764694, -0.0641258955001831, -0.05994749814271927, -0.05576910078525543, -0.051590703427791595, -0.04741230607032776, -0.04323390871286392, -0.039055511355400085, -0.03487711399793625, -0.030698716640472412, -0.026520319283008575, -0.02234192192554474, -0.018163524568080902, -0.013985127210617065, -0.009806729853153229, -0.005628332495689392, -0.0014499351382255554, 0.0027284622192382812, 0.006906859576702118, 0.011085256934165955, 0.015263654291629791, 0.019442051649093628, 0.023620449006557465, 0.0277988463640213, 0.03197724372148514, 0.036155641078948975, 0.04033403843641281, 0.04451243579387665, 0.048690833151340485, 0.05286923050880432, 0.05704762786626816, 0.061226025223731995, 0.06540442258119583, 0.06958281993865967, 0.0737612172961235, 0.07793961465358734, 0.08211801201105118, 0.08629640936851501, 0.09047480672597885, 0.09465320408344269, 0.09883160144090652, 0.10300999879837036, 0.1071883961558342, 0.11136679351329803, 0.11554519087076187, 0.11972358822822571, 0.12390198558568954, 0.12808038294315338, 0.13225877285003662, 0.13643717765808105]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 6.0, 10.0, 13.0, 28.0, 54.0, 69.0, 149.0, 208.0, 448.0, 966.0, 2478.0, 9549.0, 81217.0, 813399.0, 122772.0, 12037.0, 2984.0, 1041.0, 493.0, 255.0, 149.0, 77.0, 38.0, 45.0, 19.0, 14.0, 4.0, 7.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.19921875, -0.19345664978027344, -0.18769454956054688, -0.1819324493408203, -0.17617034912109375, -0.1704082489013672, -0.16464614868164062, -0.15888404846191406, -0.1531219482421875, -0.14735984802246094, -0.14159774780273438, -0.1358356475830078, -0.13007354736328125, -0.12431144714355469, -0.11854934692382812, -0.11278724670410156, -0.107025146484375, -0.10126304626464844, -0.09550094604492188, -0.08973884582519531, -0.08397674560546875, -0.07821464538574219, -0.07245254516601562, -0.06669044494628906, -0.0609283447265625, -0.05516624450683594, -0.049404144287109375, -0.04364204406738281, -0.03787994384765625, -0.03211784362792969, -0.026355743408203125, -0.020593643188476562, -0.01483154296875, -0.009069442749023438, -0.003307342529296875, 0.0024547576904296875, 0.00821685791015625, 0.013978958129882812, 0.019741058349609375, 0.025503158569335938, 0.0312652587890625, 0.03702735900878906, 0.042789459228515625, 0.04855155944824219, 0.05431365966796875, 0.06007575988769531, 0.06583786010742188, 0.07159996032714844, 0.077362060546875, 0.08312416076660156, 0.08888626098632812, 0.09464836120605469, 0.10041046142578125, 0.10617256164550781, 0.11193466186523438, 0.11769676208496094, 0.1234588623046875, 0.12922096252441406, 0.13498306274414062, 0.1407451629638672, 0.14650726318359375, 0.1522693634033203, 0.15803146362304688, 0.16379356384277344, 0.1695556640625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 2.0, 9.0, 12.0, 16.0, 20.0, 64.0, 129.0, 216.0, 217.0, 158.0, 73.0, 35.0, 12.0, 15.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1298828125, -0.12541961669921875, -0.1209564208984375, -0.11649322509765625, -0.112030029296875, -0.10756683349609375, -0.1031036376953125, -0.09864044189453125, -0.09417724609375, -0.08971405029296875, -0.0852508544921875, -0.08078765869140625, -0.076324462890625, -0.07186126708984375, -0.0673980712890625, -0.06293487548828125, -0.0584716796875, -0.05400848388671875, -0.0495452880859375, -0.04508209228515625, -0.040618896484375, -0.03615570068359375, -0.0316925048828125, -0.02722930908203125, -0.02276611328125, -0.01830291748046875, -0.0138397216796875, -0.00937652587890625, -0.004913330078125, -0.00045013427734375, 0.0040130615234375, 0.00847625732421875, 0.012939453125, 0.01740264892578125, 0.0218658447265625, 0.02632904052734375, 0.030792236328125, 0.03525543212890625, 0.0397186279296875, 0.04418182373046875, 0.04864501953125, 0.05310821533203125, 0.0575714111328125, 0.06203460693359375, 0.066497802734375, 0.07096099853515625, 0.0754241943359375, 0.07988739013671875, 0.0843505859375, 0.08881378173828125, 0.0932769775390625, 0.09774017333984375, 0.102203369140625, 0.10666656494140625, 0.1111297607421875, 0.11559295654296875, 0.12005615234375, 0.12451934814453125, 0.1289825439453125, 0.13344573974609375, 0.137908935546875, 0.14237213134765625, 0.1468353271484375, 0.15129852294921875, 0.15576171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 8.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 10.0, 10.0, 10.0, 17.0, 26.0, 23.0, 46.0, 47.0, 67.0, 112.0, 110.0, 247.0, 518.0, 1332.0, 6186.0, 120447.0, 871739.0, 42213.0, 3412.0, 903.0, 388.0, 193.0, 118.0, 74.0, 54.0, 57.0, 35.0, 30.0, 24.0, 12.0, 16.0, 12.0, 10.0, 9.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.2264404296875, -0.22021102905273438, -0.21398162841796875, -0.20775222778320312, -0.2015228271484375, -0.19529342651367188, -0.18906402587890625, -0.18283462524414062, -0.176605224609375, -0.17037582397460938, -0.16414642333984375, -0.15791702270507812, -0.1516876220703125, -0.14545822143554688, -0.13922882080078125, -0.13299942016601562, -0.12677001953125, -0.12054061889648438, -0.11431121826171875, -0.10808181762695312, -0.1018524169921875, -0.09562301635742188, -0.08939361572265625, -0.08316421508789062, -0.076934814453125, -0.07070541381835938, -0.06447601318359375, -0.058246612548828125, -0.0520172119140625, -0.045787811279296875, -0.03955841064453125, -0.033329010009765625, -0.027099609375, -0.020870208740234375, -0.01464080810546875, -0.008411407470703125, -0.0021820068359375, 0.004047393798828125, 0.01027679443359375, 0.016506195068359375, 0.022735595703125, 0.028964996337890625, 0.03519439697265625, 0.041423797607421875, 0.0476531982421875, 0.053882598876953125, 0.06011199951171875, 0.06634140014648438, 0.07257080078125, 0.07880020141601562, 0.08502960205078125, 0.09125900268554688, 0.0974884033203125, 0.10371780395507812, 0.10994720458984375, 0.11617660522460938, 0.122406005859375, 0.12863540649414062, 0.13486480712890625, 0.14109420776367188, 0.1473236083984375, 0.15355300903320312, 0.15978240966796875, 0.16601181030273438, 0.1722412109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 9.0, 8.0, 16.0, 18.0, 25.0, 23.0, 22.0, 21.0, 25.0, 29.0, 33.0, 39.0, 37.0, 46.0, 38.0, 39.0, 57.0, 48.0, 37.0, 27.0, 50.0, 30.0, 41.0, 28.0, 31.0, 29.0, 26.0, 20.0, 19.0, 19.0, 17.0, 18.0, 12.0, 6.0, 7.0, 6.0, 4.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.2034912109375, -0.19748878479003906, -0.19148635864257812, -0.1854839324951172, -0.17948150634765625, -0.1734790802001953, -0.16747665405273438, -0.16147422790527344, -0.1554718017578125, -0.14946937561035156, -0.14346694946289062, -0.1374645233154297, -0.13146209716796875, -0.1254596710205078, -0.11945724487304688, -0.11345481872558594, -0.107452392578125, -0.10144996643066406, -0.09544754028320312, -0.08944511413574219, -0.08344268798828125, -0.07744026184082031, -0.07143783569335938, -0.06543540954589844, -0.0594329833984375, -0.05343055725097656, -0.047428131103515625, -0.04142570495605469, -0.03542327880859375, -0.029420852661132812, -0.023418426513671875, -0.017416000366210938, -0.01141357421875, -0.0054111480712890625, 0.000591278076171875, 0.0065937042236328125, 0.01259613037109375, 0.018598556518554688, 0.024600982666015625, 0.030603408813476562, 0.0366058349609375, 0.04260826110839844, 0.048610687255859375, 0.05461311340332031, 0.06061553955078125, 0.06661796569824219, 0.07262039184570312, 0.07862281799316406, 0.084625244140625, 0.09062767028808594, 0.09663009643554688, 0.10263252258300781, 0.10863494873046875, 0.11463737487792969, 0.12063980102539062, 0.12664222717285156, 0.1326446533203125, 0.13864707946777344, 0.14464950561523438, 0.1506519317626953, 0.15665435791015625, 0.1626567840576172, 0.16865921020507812, 0.17466163635253906, 0.1806640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 8.0, 6.0, 14.0, 24.0, 26.0, 23.0, 47.0, 56.0, 99.0, 152.0, 299.0, 570.0, 1378.0, 3474.0, 10603.0, 44366.0, 433330.0, 488107.0, 48352.0, 11048.0, 3752.0, 1377.0, 616.0, 301.0, 149.0, 109.0, 60.0, 38.0, 38.0, 31.0, 20.0, 15.0, 18.0, 9.0, 6.0, 9.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.049713134765625, -0.048207759857177734, -0.04670238494873047, -0.0451970100402832, -0.04369163513183594, -0.04218626022338867, -0.040680885314941406, -0.03917551040649414, -0.037670135498046875, -0.03616476058959961, -0.034659385681152344, -0.03315401077270508, -0.03164863586425781, -0.030143260955810547, -0.02863788604736328, -0.027132511138916016, -0.02562713623046875, -0.024121761322021484, -0.02261638641357422, -0.021111011505126953, -0.019605636596679688, -0.018100261688232422, -0.016594886779785156, -0.01508951187133789, -0.013584136962890625, -0.01207876205444336, -0.010573387145996094, -0.009068012237548828, -0.0075626373291015625, -0.006057262420654297, -0.004551887512207031, -0.0030465126037597656, -0.0015411376953125, -3.5762786865234375e-05, 0.0014696121215820312, 0.002974987030029297, 0.0044803619384765625, 0.005985736846923828, 0.007491111755371094, 0.00899648666381836, 0.010501861572265625, 0.01200723648071289, 0.013512611389160156, 0.015017986297607422, 0.016523361206054688, 0.018028736114501953, 0.01953411102294922, 0.021039485931396484, 0.02254486083984375, 0.024050235748291016, 0.02555561065673828, 0.027060985565185547, 0.028566360473632812, 0.030071735382080078, 0.031577110290527344, 0.03308248519897461, 0.034587860107421875, 0.03609323501586914, 0.037598609924316406, 0.03910398483276367, 0.04060935974121094, 0.0421147346496582, 0.04362010955810547, 0.045125484466552734, 0.046630859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 5.0, 4.0, 2.0, 3.0, 3.0, 6.0, 9.0, 6.0, 12.0, 24.0, 20.0, 35.0, 36.0, 32.0, 80.0, 95.0, 114.0, 111.0, 94.0, 83.0, 57.0, 45.0, 34.0, 28.0, 12.0, 16.0, 8.0, 4.0, 8.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.049041748046875e-05, -1.0190531611442566e-05, -9.890645742416382e-06, -9.590759873390198e-06, -9.290874004364014e-06, -8.99098813533783e-06, -8.691102266311646e-06, -8.391216397285461e-06, -8.091330528259277e-06, -7.791444659233093e-06, -7.491558790206909e-06, -7.191672921180725e-06, -6.891787052154541e-06, -6.591901183128357e-06, -6.292015314102173e-06, -5.992129445075989e-06, -5.692243576049805e-06, -5.392357707023621e-06, -5.0924718379974365e-06, -4.7925859689712524e-06, -4.492700099945068e-06, -4.192814230918884e-06, -3.8929283618927e-06, -3.593042492866516e-06, -3.293156623840332e-06, -2.993270754814148e-06, -2.693384885787964e-06, -2.3934990167617798e-06, -2.0936131477355957e-06, -1.7937272787094116e-06, -1.4938414096832275e-06, -1.1939555406570435e-06, -8.940696716308594e-07, -5.941838026046753e-07, -2.942979335784912e-07, 5.587935447692871e-09, 3.0547380447387695e-07, 6.05359673500061e-07, 9.052455425262451e-07, 1.2051314115524292e-06, 1.5050172805786133e-06, 1.8049031496047974e-06, 2.1047890186309814e-06, 2.4046748876571655e-06, 2.7045607566833496e-06, 3.0044466257095337e-06, 3.3043324947357178e-06, 3.604218363761902e-06, 3.904104232788086e-06, 4.20399010181427e-06, 4.503875970840454e-06, 4.803761839866638e-06, 5.103647708892822e-06, 5.403533577919006e-06, 5.7034194469451904e-06, 6.0033053159713745e-06, 6.303191184997559e-06, 6.603077054023743e-06, 6.902962923049927e-06, 7.202848792076111e-06, 7.502734661102295e-06, 7.802620530128479e-06, 8.102506399154663e-06, 8.402392268180847e-06, 8.702278137207031e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 4.0, 18.0, 34.0, 44.0, 94.0, 177.0, 451.0, 1546.0, 7173.0, 83555.0, 908736.0, 40053.0, 4807.0, 1136.0, 415.0, 130.0, 62.0, 39.0, 24.0, 16.0, 11.0, 7.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12225341796875, -0.11889362335205078, -0.11553382873535156, -0.11217403411865234, -0.10881423950195312, -0.1054544448852539, -0.10209465026855469, -0.09873485565185547, -0.09537506103515625, -0.09201526641845703, -0.08865547180175781, -0.0852956771850586, -0.08193588256835938, -0.07857608795166016, -0.07521629333496094, -0.07185649871826172, -0.0684967041015625, -0.06513690948486328, -0.06177711486816406, -0.058417320251464844, -0.055057525634765625, -0.051697731018066406, -0.04833793640136719, -0.04497814178466797, -0.04161834716796875, -0.03825855255126953, -0.03489875793457031, -0.031538963317871094, -0.028179168701171875, -0.024819374084472656, -0.021459579467773438, -0.01809978485107422, -0.014739990234375, -0.011380195617675781, -0.008020401000976562, -0.004660606384277344, -0.001300811767578125, 0.0020589828491210938, 0.0054187774658203125, 0.008778572082519531, 0.01213836669921875, 0.015498161315917969, 0.018857955932617188, 0.022217750549316406, 0.025577545166015625, 0.028937339782714844, 0.03229713439941406, 0.03565692901611328, 0.0390167236328125, 0.04237651824951172, 0.04573631286621094, 0.049096107482910156, 0.052455902099609375, 0.055815696716308594, 0.05917549133300781, 0.06253528594970703, 0.06589508056640625, 0.06925487518310547, 0.07261466979980469, 0.0759744644165039, 0.07933425903320312, 0.08269405364990234, 0.08605384826660156, 0.08941364288330078, 0.0927734375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 15.0, 15.0, 44.0, 57.0, 113.0, 206.0, 239.0, 139.0, 66.0, 51.0, 22.0, 19.0, 12.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12548828125, -0.12220191955566406, -0.11891555786132812, -0.11562919616699219, -0.11234283447265625, -0.10905647277832031, -0.10577011108398438, -0.10248374938964844, -0.0991973876953125, -0.09591102600097656, -0.09262466430664062, -0.08933830261230469, -0.08605194091796875, -0.08276557922363281, -0.07947921752929688, -0.07619285583496094, -0.072906494140625, -0.06962013244628906, -0.06633377075195312, -0.06304740905761719, -0.05976104736328125, -0.05647468566894531, -0.053188323974609375, -0.04990196228027344, -0.0466156005859375, -0.04332923889160156, -0.040042877197265625, -0.03675651550292969, -0.03347015380859375, -0.030183792114257812, -0.026897430419921875, -0.023611068725585938, -0.02032470703125, -0.017038345336914062, -0.013751983642578125, -0.010465621948242188, -0.00717926025390625, -0.0038928985595703125, -0.000606536865234375, 0.0026798248291015625, 0.0059661865234375, 0.009252548217773438, 0.012538909912109375, 0.015825271606445312, 0.01911163330078125, 0.022397994995117188, 0.025684356689453125, 0.028970718383789062, 0.032257080078125, 0.03554344177246094, 0.038829803466796875, 0.04211616516113281, 0.04540252685546875, 0.04868888854980469, 0.051975250244140625, 0.05526161193847656, 0.0585479736328125, 0.06183433532714844, 0.06512069702148438, 0.06840705871582031, 0.07169342041015625, 0.07497978210449219, 0.07826614379882812, 0.08155250549316406, 0.0848388671875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 129.0, 855.0, 22.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8728519678115845, -1.6714962720870972, -1.4701405763626099, -1.2687848806381226, -1.0674291849136353, -0.866073489189148, -0.6647177934646606, -0.46336209774017334, -0.26200640201568604, -0.06065070629119873, 0.14070498943328857, 0.3420606851577759, 0.5434163808822632, 0.7447720766067505, 0.9461277723312378, 1.147483468055725, 1.3488391637802124, 1.5501948595046997, 1.751550555229187, 1.9529062509536743, 2.154262065887451, 2.3556175231933594, 2.556973457336426, 2.758328914642334, 2.9596848487854004, 3.1610405445098877, 3.362396240234375, 3.5637519359588623, 3.7651076316833496, 3.966463327407837, 4.167819023132324, 4.369174957275391, 4.570529937744141, 4.771885871887207, 4.973241329193115, 5.174596786499023, 5.37595272064209, 5.577308654785156, 5.7786641120910645, 5.980019569396973, 6.181375503540039, 6.3827314376831055, 6.584086894989014, 6.785442352294922, 6.986798286437988, 7.188154220581055, 7.389509677886963, 7.590865135192871, 7.7922210693359375, 7.993577003479004, 8.19493293762207, 8.39628791809082, 8.597643852233887, 8.798999786376953, 9.000354766845703, 9.20171070098877, 9.403066635131836, 9.604422569274902, 9.805778503417969, 10.007133483886719, 10.208489418029785, 10.409845352172852, 10.611200332641602, 10.812556266784668, 11.013912200927734]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 3.0, 6.0, 4.0, 6.0, 7.0, 11.0, 13.0, 8.0, 15.0, 27.0, 19.0, 20.0, 26.0, 29.0, 27.0, 36.0, 40.0, 45.0, 40.0, 38.0, 38.0, 42.0, 46.0, 43.0, 34.0, 47.0, 33.0, 29.0, 43.0, 28.0, 38.0, 33.0, 24.0, 13.0, 20.0, 12.0, 6.0, 12.0, 4.0, 10.0, 9.0, 3.0, 4.0, 5.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9678308367729187, -0.9374896287918091, -0.9071483612060547, -0.8768071532249451, -0.8464658856391907, -0.816124677658081, -0.7857834100723267, -0.755442202091217, -0.7251009941101074, -0.6947597861289978, -0.6644185185432434, -0.6340773105621338, -0.6037360429763794, -0.5733948349952698, -0.5430536270141602, -0.5127123594284058, -0.48237109184265137, -0.45202985405921936, -0.42168861627578735, -0.39134740829467773, -0.36100614070892334, -0.3306649327278137, -0.3003236949443817, -0.2699824571609497, -0.2396412193775177, -0.2092999815940857, -0.1789587438106537, -0.14861752092838287, -0.11827628314495087, -0.08793504536151886, -0.05759382247924805, -0.02725258469581604, 0.003088712692260742, 0.03342994675040245, 0.06377118080854416, 0.09411241114139557, 0.12445364892482758, 0.15479488670825958, 0.1851361095905304, 0.2154773473739624, 0.2458185851573944, 0.2761598229408264, 0.3065010607242584, 0.33684229850769043, 0.36718350648880005, 0.39752477407455444, 0.42786598205566406, 0.45820721983909607, 0.4885484576225281, 0.5188896656036377, 0.5492309331893921, 0.5795721411705017, 0.6099134087562561, 0.6402546167373657, 0.6705958843231201, 0.7009370923042297, 0.7312783002853394, 0.761619508266449, 0.7919607758522034, 0.822301983833313, 0.8526432514190674, 0.882984459400177, 0.9133256673812866, 0.943666934967041, 0.9740082025527954]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 4.0, 4.0, 8.0, 4.0, 5.0, 6.0, 11.0, 15.0, 26.0, 33.0, 59.0, 129.0, 272.0, 600.0, 1441.0, 4157.0, 14717.0, 228267.0, 3919925.0, 17094.0, 4518.0, 1658.0, 634.0, 339.0, 152.0, 78.0, 51.0, 26.0, 11.0, 9.0, 7.0, 7.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.17138671875, -0.16649627685546875, -0.1616058349609375, -0.15671539306640625, -0.151824951171875, -0.14693450927734375, -0.1420440673828125, -0.13715362548828125, -0.13226318359375, -0.12737274169921875, -0.1224822998046875, -0.11759185791015625, -0.112701416015625, -0.10781097412109375, -0.1029205322265625, -0.09803009033203125, -0.0931396484375, -0.08824920654296875, -0.0833587646484375, -0.07846832275390625, -0.073577880859375, -0.06868743896484375, -0.0637969970703125, -0.05890655517578125, -0.05401611328125, -0.04912567138671875, -0.0442352294921875, -0.03934478759765625, -0.034454345703125, -0.02956390380859375, -0.0246734619140625, -0.01978302001953125, -0.014892578125, -0.01000213623046875, -0.0051116943359375, -0.00022125244140625, 0.004669189453125, 0.00955963134765625, 0.0144500732421875, 0.01934051513671875, 0.02423095703125, 0.02912139892578125, 0.0340118408203125, 0.03890228271484375, 0.043792724609375, 0.04868316650390625, 0.0535736083984375, 0.05846405029296875, 0.0633544921875, 0.06824493408203125, 0.0731353759765625, 0.07802581787109375, 0.082916259765625, 0.08780670166015625, 0.0926971435546875, 0.09758758544921875, 0.10247802734375, 0.10736846923828125, 0.1122589111328125, 0.11714935302734375, 0.122039794921875, 0.12693023681640625, 0.1318206787109375, 0.13671112060546875, 0.1416015625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 10.0, 20.0, 21.0, 74.0, 144.0, 219.0, 221.0, 126.0, 79.0, 27.0, 21.0, 9.0, 7.0, 7.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1298828125, -0.125396728515625, -0.12091064453125, -0.116424560546875, -0.1119384765625, -0.107452392578125, -0.10296630859375, -0.098480224609375, -0.093994140625, -0.089508056640625, -0.08502197265625, -0.080535888671875, -0.0760498046875, -0.071563720703125, -0.06707763671875, -0.062591552734375, -0.05810546875, -0.053619384765625, -0.04913330078125, -0.044647216796875, -0.0401611328125, -0.035675048828125, -0.03118896484375, -0.026702880859375, -0.022216796875, -0.017730712890625, -0.01324462890625, -0.008758544921875, -0.0042724609375, 0.000213623046875, 0.00469970703125, 0.009185791015625, 0.013671875, 0.018157958984375, 0.02264404296875, 0.027130126953125, 0.0316162109375, 0.036102294921875, 0.04058837890625, 0.045074462890625, 0.049560546875, 0.054046630859375, 0.05853271484375, 0.063018798828125, 0.0675048828125, 0.071990966796875, 0.07647705078125, 0.080963134765625, 0.08544921875, 0.089935302734375, 0.09442138671875, 0.098907470703125, 0.1033935546875, 0.107879638671875, 0.11236572265625, 0.116851806640625, 0.121337890625, 0.125823974609375, 0.13031005859375, 0.134796142578125, 0.1392822265625, 0.143768310546875, 0.14825439453125, 0.152740478515625, 0.1572265625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 10.0, 7.0, 10.0, 25.0, 23.0, 44.0, 61.0, 114.0, 175.0, 296.0, 405.0, 764.0, 1402.0, 3074.0, 10813.0, 306358.0, 3851066.0, 12774.0, 3227.0, 1488.0, 872.0, 475.0, 302.0, 160.0, 113.0, 77.0, 52.0, 34.0, 19.0, 15.0, 12.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255126953125, -0.24602890014648438, -0.23693084716796875, -0.22783279418945312, -0.2187347412109375, -0.20963668823242188, -0.20053863525390625, -0.19144058227539062, -0.182342529296875, -0.17324447631835938, -0.16414642333984375, -0.15504837036132812, -0.1459503173828125, -0.13685226440429688, -0.12775421142578125, -0.11865615844726562, -0.10955810546875, -0.10046005249023438, -0.09136199951171875, -0.08226394653320312, -0.0731658935546875, -0.06406784057617188, -0.05496978759765625, -0.045871734619140625, -0.036773681640625, -0.027675628662109375, -0.01857757568359375, -0.009479522705078125, -0.0003814697265625, 0.008716583251953125, 0.01781463623046875, 0.026912689208984375, 0.0360107421875, 0.045108795166015625, 0.05420684814453125, 0.06330490112304688, 0.0724029541015625, 0.08150100708007812, 0.09059906005859375, 0.09969711303710938, 0.108795166015625, 0.11789321899414062, 0.12699127197265625, 0.13608932495117188, 0.1451873779296875, 0.15428543090820312, 0.16338348388671875, 0.17248153686523438, 0.18157958984375, 0.19067764282226562, 0.19977569580078125, 0.20887374877929688, 0.2179718017578125, 0.22706985473632812, 0.23616790771484375, 0.24526596069335938, 0.254364013671875, 0.2634620666503906, 0.27256011962890625, 0.2816581726074219, 0.2907562255859375, 0.2998542785644531, 0.30895233154296875, 0.3180503845214844, 0.3271484375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 22.0, 23.0, 38.0, 96.0, 622.0, 3069.0, 88.0, 45.0, 24.0, 16.0, 8.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03662109375, -0.035314083099365234, -0.03400707244873047, -0.0327000617980957, -0.03139305114746094, -0.030086040496826172, -0.028779029846191406, -0.02747201919555664, -0.026165008544921875, -0.02485799789428711, -0.023550987243652344, -0.022243976593017578, -0.020936965942382812, -0.019629955291748047, -0.01832294464111328, -0.017015933990478516, -0.01570892333984375, -0.014401912689208984, -0.013094902038574219, -0.011787891387939453, -0.010480880737304688, -0.009173870086669922, -0.007866859436035156, -0.006559848785400391, -0.005252838134765625, -0.003945827484130859, -0.0026388168334960938, -0.0013318061828613281, -2.47955322265625e-05, 0.0012822151184082031, 0.0025892257690429688, 0.0038962364196777344, 0.0052032470703125, 0.006510257720947266, 0.007817268371582031, 0.009124279022216797, 0.010431289672851562, 0.011738300323486328, 0.013045310974121094, 0.01435232162475586, 0.015659332275390625, 0.01696634292602539, 0.018273353576660156, 0.019580364227294922, 0.020887374877929688, 0.022194385528564453, 0.02350139617919922, 0.024808406829833984, 0.02611541748046875, 0.027422428131103516, 0.02872943878173828, 0.030036449432373047, 0.03134346008300781, 0.03265047073364258, 0.033957481384277344, 0.03526449203491211, 0.036571502685546875, 0.03787851333618164, 0.039185523986816406, 0.04049253463745117, 0.04179954528808594, 0.0431065559387207, 0.04441356658935547, 0.045720577239990234, 0.047027587890625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 15.0, 18.0, 27.0, 82.0, 143.0, 212.0, 225.0, 140.0, 72.0, 34.0, 11.0, 10.0, 10.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36155495047569275, -0.35292932391166687, -0.344303697347641, -0.3356780707836151, -0.32705244421958923, -0.31842681765556335, -0.3098011910915375, -0.3011755347251892, -0.29254990816116333, -0.28392428159713745, -0.2752986550331116, -0.2666730284690857, -0.2580474019050598, -0.24942177534103394, -0.24079613387584686, -0.23217050731182098, -0.2235448956489563, -0.21491926908493042, -0.20629364252090454, -0.19766801595687866, -0.18904238939285278, -0.1804167628288269, -0.17179112136363983, -0.16316549479961395, -0.15453986823558807, -0.1459142416715622, -0.13728861510753632, -0.12866298854351044, -0.12003735452890396, -0.11141172796487808, -0.1027860939502716, -0.09416046738624573, -0.08553485572338104, -0.07690922915935516, -0.06828360259532928, -0.05965796858072281, -0.05103234201669693, -0.04240671545267105, -0.033781085163354874, -0.025155454874038696, -0.016529828310012817, -0.00790419988334179, 0.0007214285433292389, 0.009347056970000267, 0.017972685396671295, 0.026598311960697174, 0.03522394225001335, 0.04384957253932953, 0.05247519910335541, 0.06110082566738129, 0.06972645223140717, 0.07835208624601364, 0.08697771281003952, 0.0956033393740654, 0.10422897338867188, 0.11285459995269775, 0.12148022651672363, 0.1301058530807495, 0.1387314796447754, 0.14735710620880127, 0.15598273277282715, 0.16460835933685303, 0.1732340008020401, 0.18185962736606598, 0.19048525393009186]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 1.0, 7.0, 16.0, 4.0, 4.0, 9.0, 8.0, 11.0, 17.0, 17.0, 22.0, 22.0, 24.0, 28.0, 28.0, 41.0, 27.0, 43.0, 46.0, 39.0, 34.0, 30.0, 34.0, 41.0, 40.0, 41.0, 35.0, 26.0, 36.0, 33.0, 33.0, 28.0, 31.0, 21.0, 18.0, 10.0, 19.0, 19.0, 10.0, 6.0, 14.0, 4.0, 5.0, 4.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06788229942321777, -0.06577342748641968, -0.06366455554962158, -0.06155569106340408, -0.05944681912660599, -0.05733794718980789, -0.055229078978300095, -0.0531202107667923, -0.0510113388299942, -0.048902466893196106, -0.04679359868168831, -0.04468473047018051, -0.042575858533382416, -0.04046698659658432, -0.03835811838507652, -0.036249250173568726, -0.03414037823677063, -0.032031506299972534, -0.029922638088464737, -0.02781376801431179, -0.025704897940158844, -0.023596027866005898, -0.02148715779185295, -0.019378287717700005, -0.017269417643547058, -0.015160547569394112, -0.013051677495241165, -0.010942807421088219, -0.008833937346935272, -0.006725067272782326, -0.004616197198629379, -0.002507327124476433, -0.00039845705032348633, 0.0017104130238294601, 0.0038192830979824066, 0.005928153172135353, 0.0080370232462883, 0.010145893320441246, 0.012254763394594193, 0.014363633468747139, 0.016472503542900085, 0.018581373617053032, 0.02069024369120598, 0.022799113765358925, 0.02490798383951187, 0.027016853913664818, 0.029125723987817764, 0.03123459406197071, 0.03334346413612366, 0.03545233607292175, 0.03756120428442955, 0.03967007249593735, 0.04177894443273544, 0.04388781636953354, 0.045996684581041336, 0.04810555279254913, 0.05021442472934723, 0.052323296666145325, 0.05443216487765312, 0.05654103308916092, 0.058649905025959015, 0.06075877696275711, 0.06286764144897461, 0.0649765133857727, 0.0670853853225708]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 16.0, 23.0, 28.0, 59.0, 68.0, 130.0, 222.0, 476.0, 1064.0, 3149.0, 15241.0, 187999.0, 756856.0, 71324.0, 8163.0, 2060.0, 813.0, 423.0, 160.0, 89.0, 61.0, 42.0, 30.0, 16.0, 17.0, 13.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2039794921875, -0.19820594787597656, -0.19243240356445312, -0.1866588592529297, -0.18088531494140625, -0.1751117706298828, -0.16933822631835938, -0.16356468200683594, -0.1577911376953125, -0.15201759338378906, -0.14624404907226562, -0.1404705047607422, -0.13469696044921875, -0.1289234161376953, -0.12314987182617188, -0.11737632751464844, -0.111602783203125, -0.10582923889160156, -0.10005569458007812, -0.09428215026855469, -0.08850860595703125, -0.08273506164550781, -0.07696151733398438, -0.07118797302246094, -0.0654144287109375, -0.05964088439941406, -0.053867340087890625, -0.04809379577636719, -0.04232025146484375, -0.03654670715332031, -0.030773162841796875, -0.024999618530273438, -0.01922607421875, -0.013452529907226562, -0.007678985595703125, -0.0019054412841796875, 0.00386810302734375, 0.009641647338867188, 0.015415191650390625, 0.021188735961914062, 0.0269622802734375, 0.03273582458496094, 0.038509368896484375, 0.04428291320800781, 0.05005645751953125, 0.05583000183105469, 0.061603546142578125, 0.06737709045410156, 0.073150634765625, 0.07892417907714844, 0.08469772338867188, 0.09047126770019531, 0.09624481201171875, 0.10201835632324219, 0.10779190063476562, 0.11356544494628906, 0.1193389892578125, 0.12511253356933594, 0.13088607788085938, 0.1366596221923828, 0.14243316650390625, 0.1482067108154297, 0.15398025512695312, 0.15975379943847656, 0.16552734375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 4.0, 7.0, 9.0, 23.0, 33.0, 78.0, 160.0, 195.0, 189.0, 135.0, 88.0, 32.0, 15.0, 14.0, 6.0, 6.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1302490234375, -0.12574386596679688, -0.12123870849609375, -0.11673355102539062, -0.1122283935546875, -0.10772323608398438, -0.10321807861328125, -0.09871292114257812, -0.094207763671875, -0.08970260620117188, -0.08519744873046875, -0.08069229125976562, -0.0761871337890625, -0.07168197631835938, -0.06717681884765625, -0.06267166137695312, -0.05816650390625, -0.053661346435546875, -0.04915618896484375, -0.044651031494140625, -0.0401458740234375, -0.035640716552734375, -0.03113555908203125, -0.026630401611328125, -0.022125244140625, -0.017620086669921875, -0.01311492919921875, -0.008609771728515625, -0.0041046142578125, 0.000400543212890625, 0.00490570068359375, 0.009410858154296875, 0.013916015625, 0.018421173095703125, 0.02292633056640625, 0.027431488037109375, 0.0319366455078125, 0.036441802978515625, 0.04094696044921875, 0.045452117919921875, 0.049957275390625, 0.054462432861328125, 0.05896759033203125, 0.06347274780273438, 0.0679779052734375, 0.07248306274414062, 0.07698822021484375, 0.08149337768554688, 0.08599853515625, 0.09050369262695312, 0.09500885009765625, 0.09951400756835938, 0.1040191650390625, 0.10852432250976562, 0.11302947998046875, 0.11753463745117188, 0.122039794921875, 0.12654495239257812, 0.13105010986328125, 0.13555526733398438, 0.1400604248046875, 0.14456558227539062, 0.14907073974609375, 0.15357589721679688, 0.1580810546875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 8.0, 2.0, 4.0, 8.0, 11.0, 15.0, 7.0, 25.0, 20.0, 29.0, 39.0, 52.0, 70.0, 105.0, 136.0, 261.0, 497.0, 945.0, 3206.0, 37961.0, 802301.0, 191638.0, 8088.0, 1479.0, 632.0, 345.0, 195.0, 116.0, 94.0, 65.0, 50.0, 33.0, 31.0, 18.0, 11.0, 8.0, 6.0, 11.0, 4.0, 10.0, 13.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.202392578125, -0.19639205932617188, -0.19039154052734375, -0.18439102172851562, -0.1783905029296875, -0.17238998413085938, -0.16638946533203125, -0.16038894653320312, -0.154388427734375, -0.14838790893554688, -0.14238739013671875, -0.13638687133789062, -0.1303863525390625, -0.12438583374023438, -0.11838531494140625, -0.11238479614257812, -0.10638427734375, -0.10038375854492188, -0.09438323974609375, -0.08838272094726562, -0.0823822021484375, -0.07638168334960938, -0.07038116455078125, -0.06438064575195312, -0.058380126953125, -0.052379608154296875, -0.04637908935546875, -0.040378570556640625, -0.0343780517578125, -0.028377532958984375, -0.02237701416015625, -0.016376495361328125, -0.0103759765625, -0.004375457763671875, 0.00162506103515625, 0.007625579833984375, 0.0136260986328125, 0.019626617431640625, 0.02562713623046875, 0.031627655029296875, 0.037628173828125, 0.043628692626953125, 0.04962921142578125, 0.055629730224609375, 0.0616302490234375, 0.06763076782226562, 0.07363128662109375, 0.07963180541992188, 0.08563232421875, 0.09163284301757812, 0.09763336181640625, 0.10363388061523438, 0.1096343994140625, 0.11563491821289062, 0.12163543701171875, 0.12763595581054688, 0.133636474609375, 0.13963699340820312, 0.14563751220703125, 0.15163803100585938, 0.1576385498046875, 0.16363906860351562, 0.16963958740234375, 0.17564010620117188, 0.181640625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 10.0, 7.0, 8.0, 13.0, 10.0, 16.0, 19.0, 19.0, 18.0, 27.0, 40.0, 31.0, 22.0, 33.0, 44.0, 35.0, 49.0, 39.0, 44.0, 38.0, 51.0, 33.0, 53.0, 46.0, 30.0, 41.0, 26.0, 35.0, 22.0, 21.0, 21.0, 14.0, 18.0, 15.0, 7.0, 10.0, 6.0, 8.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2021484375, -0.19599151611328125, -0.1898345947265625, -0.18367767333984375, -0.177520751953125, -0.17136383056640625, -0.1652069091796875, -0.15904998779296875, -0.15289306640625, -0.14673614501953125, -0.1405792236328125, -0.13442230224609375, -0.128265380859375, -0.12210845947265625, -0.1159515380859375, -0.10979461669921875, -0.1036376953125, -0.09748077392578125, -0.0913238525390625, -0.08516693115234375, -0.079010009765625, -0.07285308837890625, -0.0666961669921875, -0.06053924560546875, -0.05438232421875, -0.04822540283203125, -0.0420684814453125, -0.03591156005859375, -0.029754638671875, -0.02359771728515625, -0.0174407958984375, -0.01128387451171875, -0.005126953125, 0.00102996826171875, 0.0071868896484375, 0.01334381103515625, 0.019500732421875, 0.02565765380859375, 0.0318145751953125, 0.03797149658203125, 0.04412841796875, 0.05028533935546875, 0.0564422607421875, 0.06259918212890625, 0.068756103515625, 0.07491302490234375, 0.0810699462890625, 0.08722686767578125, 0.0933837890625, 0.09954071044921875, 0.1056976318359375, 0.11185455322265625, 0.118011474609375, 0.12416839599609375, 0.1303253173828125, 0.13648223876953125, 0.14263916015625, 0.14879608154296875, 0.1549530029296875, 0.16110992431640625, 0.167266845703125, 0.17342376708984375, 0.1795806884765625, 0.18573760986328125, 0.19189453125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 5.0, 8.0, 16.0, 18.0, 43.0, 50.0, 71.0, 132.0, 229.0, 508.0, 1094.0, 2771.0, 11426.0, 266220.0, 738220.0, 20977.0, 3999.0, 1465.0, 604.0, 295.0, 148.0, 90.0, 60.0, 25.0, 22.0, 20.0, 15.0, 5.0, 2.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06658935546875, -0.0642232894897461, -0.06185722351074219, -0.05949115753173828, -0.057125091552734375, -0.05475902557373047, -0.05239295959472656, -0.050026893615722656, -0.04766082763671875, -0.045294761657714844, -0.04292869567871094, -0.04056262969970703, -0.038196563720703125, -0.03583049774169922, -0.03346443176269531, -0.031098365783691406, -0.0287322998046875, -0.026366233825683594, -0.024000167846679688, -0.02163410186767578, -0.019268035888671875, -0.01690196990966797, -0.014535903930664062, -0.012169837951660156, -0.00980377197265625, -0.007437705993652344, -0.0050716400146484375, -0.0027055740356445312, -0.000339508056640625, 0.0020265579223632812, 0.0043926239013671875, 0.006758689880371094, 0.009124755859375, 0.011490821838378906, 0.013856887817382812, 0.01622295379638672, 0.018589019775390625, 0.02095508575439453, 0.023321151733398438, 0.025687217712402344, 0.02805328369140625, 0.030419349670410156, 0.03278541564941406, 0.03515148162841797, 0.037517547607421875, 0.03988361358642578, 0.04224967956542969, 0.044615745544433594, 0.0469818115234375, 0.049347877502441406, 0.05171394348144531, 0.05408000946044922, 0.056446075439453125, 0.05881214141845703, 0.06117820739746094, 0.06354427337646484, 0.06591033935546875, 0.06827640533447266, 0.07064247131347656, 0.07300853729248047, 0.07537460327148438, 0.07774066925048828, 0.08010673522949219, 0.0824728012084961, 0.0848388671875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 25.0, 59.0, 120.0, 283.0, 256.0, 163.0, 55.0, 21.0, 11.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1425228118896484e-05, -4.057958722114563e-05, -3.9733946323394775e-05, -3.888830542564392e-05, -3.8042664527893066e-05, -3.719702363014221e-05, -3.635138273239136e-05, -3.55057418346405e-05, -3.466010093688965e-05, -3.3814460039138794e-05, -3.296881914138794e-05, -3.2123178243637085e-05, -3.127753734588623e-05, -3.0431896448135376e-05, -2.958625555038452e-05, -2.8740614652633667e-05, -2.7894973754882812e-05, -2.7049332857131958e-05, -2.6203691959381104e-05, -2.535805106163025e-05, -2.4512410163879395e-05, -2.366676926612854e-05, -2.2821128368377686e-05, -2.197548747062683e-05, -2.1129846572875977e-05, -2.0284205675125122e-05, -1.9438564777374268e-05, -1.8592923879623413e-05, -1.774728298187256e-05, -1.6901642084121704e-05, -1.605600118637085e-05, -1.5210360288619995e-05, -1.436471939086914e-05, -1.3519078493118286e-05, -1.2673437595367432e-05, -1.1827796697616577e-05, -1.0982155799865723e-05, -1.0136514902114868e-05, -9.290874004364014e-06, -8.44523310661316e-06, -7.599592208862305e-06, -6.75395131111145e-06, -5.908310413360596e-06, -5.062669515609741e-06, -4.217028617858887e-06, -3.3713877201080322e-06, -2.5257468223571777e-06, -1.6801059246063232e-06, -8.344650268554688e-07, 1.1175870895385742e-08, 8.568167686462402e-07, 1.7024576663970947e-06, 2.5480985641479492e-06, 3.3937394618988037e-06, 4.239380359649658e-06, 5.085021257400513e-06, 5.930662155151367e-06, 6.776303052902222e-06, 7.621943950653076e-06, 8.46758484840393e-06, 9.313225746154785e-06, 1.015886664390564e-05, 1.1004507541656494e-05, 1.1850148439407349e-05, 1.2695789337158203e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 7.0, 12.0, 11.0, 17.0, 25.0, 33.0, 54.0, 86.0, 118.0, 180.0, 322.0, 611.0, 1368.0, 3516.0, 15830.0, 248643.0, 727886.0, 40039.0, 6015.0, 1851.0, 809.0, 407.0, 246.0, 150.0, 103.0, 62.0, 46.0, 28.0, 24.0, 17.0, 9.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06915283203125, -0.06713104248046875, -0.0651092529296875, -0.06308746337890625, -0.061065673828125, -0.05904388427734375, -0.0570220947265625, -0.05500030517578125, -0.052978515625, -0.05095672607421875, -0.0489349365234375, -0.04691314697265625, -0.044891357421875, -0.04286956787109375, -0.0408477783203125, -0.03882598876953125, -0.03680419921875, -0.03478240966796875, -0.0327606201171875, -0.03073883056640625, -0.028717041015625, -0.02669525146484375, -0.0246734619140625, -0.02265167236328125, -0.0206298828125, -0.01860809326171875, -0.0165863037109375, -0.01456451416015625, -0.012542724609375, -0.01052093505859375, -0.0084991455078125, -0.00647735595703125, -0.00445556640625, -0.00243377685546875, -0.0004119873046875, 0.00160980224609375, 0.003631591796875, 0.00565338134765625, 0.0076751708984375, 0.00969696044921875, 0.01171875, 0.01374053955078125, 0.0157623291015625, 0.01778411865234375, 0.019805908203125, 0.02182769775390625, 0.0238494873046875, 0.02587127685546875, 0.02789306640625, 0.02991485595703125, 0.0319366455078125, 0.03395843505859375, 0.035980224609375, 0.03800201416015625, 0.0400238037109375, 0.04204559326171875, 0.0440673828125, 0.04608917236328125, 0.0481109619140625, 0.05013275146484375, 0.052154541015625, 0.05417633056640625, 0.0561981201171875, 0.05821990966796875, 0.06024169921875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 0.0, 4.0, 5.0, 8.0, 8.0, 7.0, 9.0, 12.0, 11.0, 21.0, 29.0, 26.0, 37.0, 46.0, 60.0, 65.0, 59.0, 57.0, 75.0, 73.0, 76.0, 58.0, 49.0, 38.0, 30.0, 25.0, 21.0, 17.0, 20.0, 12.0, 11.0, 11.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.034942626953125, -0.03388500213623047, -0.03282737731933594, -0.031769752502441406, -0.030712127685546875, -0.029654502868652344, -0.028596878051757812, -0.02753925323486328, -0.02648162841796875, -0.02542400360107422, -0.024366378784179688, -0.023308753967285156, -0.022251129150390625, -0.021193504333496094, -0.020135879516601562, -0.01907825469970703, -0.0180206298828125, -0.01696300506591797, -0.015905380249023438, -0.014847755432128906, -0.013790130615234375, -0.012732505798339844, -0.011674880981445312, -0.010617256164550781, -0.00955963134765625, -0.008502006530761719, -0.0074443817138671875, -0.006386756896972656, -0.005329132080078125, -0.004271507263183594, -0.0032138824462890625, -0.0021562576293945312, -0.0010986328125, -4.100799560546875e-05, 0.0010166168212890625, 0.0020742416381835938, 0.003131866455078125, 0.004189491271972656, 0.0052471160888671875, 0.006304740905761719, 0.00736236572265625, 0.008419990539550781, 0.009477615356445312, 0.010535240173339844, 0.011592864990234375, 0.012650489807128906, 0.013708114624023438, 0.014765739440917969, 0.0158233642578125, 0.01688098907470703, 0.017938613891601562, 0.018996238708496094, 0.020053863525390625, 0.021111488342285156, 0.022169113159179688, 0.02322673797607422, 0.02428436279296875, 0.02534198760986328, 0.026399612426757812, 0.027457237243652344, 0.028514862060546875, 0.029572486877441406, 0.030630111694335938, 0.03168773651123047, 0.032745361328125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 21.0, 65.0, 207.0, 357.0, 243.0, 81.0, 22.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0293564796447754, -1.9689313173294067, -1.9085060358047485, -1.8480808734893799, -1.7876555919647217, -1.727230429649353, -1.6668052673339844, -1.6063799858093262, -1.545954704284668, -1.4855295419692993, -1.4251042604446411, -1.3646790981292725, -1.3042538166046143, -1.2438286542892456, -1.183403491973877, -1.1229782104492188, -1.06255304813385, -1.0021278858184814, -0.9417026042938232, -0.8812774419784546, -0.8208521604537964, -0.7604269981384277, -0.7000017762184143, -0.6395765542984009, -0.5791513323783875, -0.518726110458374, -0.4583008885383606, -0.39787569642066956, -0.33745047450065613, -0.2770252525806427, -0.21660006046295166, -0.15617483854293823, -0.0957496166229248, -0.035324402153491974, 0.025100812315940857, 0.08552601933479309, 0.14595124125480652, 0.20637646317481995, 0.266801655292511, 0.3272268772125244, 0.38765209913253784, 0.44807732105255127, 0.5085025429725647, 0.5689277648925781, 0.6293529272079468, 0.689778208732605, 0.7502033710479736, 0.8106285929679871, 0.8710538148880005, 0.9314790368080139, 0.9919042587280273, 1.052329421043396, 1.1127547025680542, 1.1731798648834229, 1.233605146408081, 1.2940303087234497, 1.3544554710388184, 1.414880633354187, 1.4753059148788452, 1.5357310771942139, 1.596156358718872, 1.6565815210342407, 1.7170066833496094, 1.7774319648742676, 1.8378572463989258]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 8.0, 12.0, 6.0, 7.0, 9.0, 17.0, 19.0, 9.0, 20.0, 18.0, 24.0, 27.0, 33.0, 33.0, 33.0, 46.0, 49.0, 42.0, 49.0, 45.0, 52.0, 57.0, 41.0, 44.0, 41.0, 30.0, 38.0, 36.0, 19.0, 13.0, 18.0, 17.0, 12.0, 26.0, 8.0, 4.0, 7.0, 11.0, 4.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.940723717212677, -0.9100852012634277, -0.8794466257095337, -0.8488081097602844, -0.8181695342063904, -0.7875310182571411, -0.7568924427032471, -0.7262539267539978, -0.6956154108047485, -0.6649768948554993, -0.6343383193016052, -0.603699803352356, -0.5730612277984619, -0.5424227118492126, -0.5117841958999634, -0.48114562034606934, -0.4505070447921753, -0.41986849904060364, -0.389229953289032, -0.3585914373397827, -0.32795286178588867, -0.2973143458366394, -0.26667580008506775, -0.2360372543334961, -0.20539870858192444, -0.17476016283035278, -0.14412161707878113, -0.11348308622837067, -0.08284454047679901, -0.052205994725227356, -0.021567463874816895, 0.00907108187675476, 0.03970968723297119, 0.07034823298454285, 0.1009867712855339, 0.13162530958652496, 0.16226385533809662, 0.19290240108966827, 0.22354093194007874, 0.2541794776916504, 0.28481802344322205, 0.3154565691947937, 0.34609511494636536, 0.376733660697937, 0.4073721766471863, 0.4380107522010803, 0.4686492681503296, 0.49928781390190125, 0.5299263596534729, 0.5605648756027222, 0.5912034511566162, 0.6218419671058655, 0.6524805426597595, 0.6831190586090088, 0.7137576341629028, 0.7443961501121521, 0.7750346660614014, 0.8056731820106506, 0.8363117575645447, 0.866950273513794, 0.897588849067688, 0.9282273650169373, 0.9588658809661865, 0.9895044565200806, 1.0201430320739746]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 4.0, 6.0, 6.0, 14.0, 22.0, 38.0, 66.0, 107.0, 179.0, 298.0, 609.0, 1149.0, 2335.0, 5673.0, 20931.0, 4067665.0, 76207.0, 11430.0, 3896.0, 1663.0, 862.0, 470.0, 267.0, 141.0, 79.0, 62.0, 36.0, 23.0, 13.0, 9.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12188720703125, -0.11828041076660156, -0.11467361450195312, -0.11106681823730469, -0.10746002197265625, -0.10385322570800781, -0.10024642944335938, -0.09663963317871094, -0.0930328369140625, -0.08942604064941406, -0.08581924438476562, -0.08221244812011719, -0.07860565185546875, -0.07499885559082031, -0.07139205932617188, -0.06778526306152344, -0.064178466796875, -0.06057167053222656, -0.056964874267578125, -0.05335807800292969, -0.04975128173828125, -0.04614448547363281, -0.042537689208984375, -0.03893089294433594, -0.0353240966796875, -0.03171730041503906, -0.028110504150390625, -0.024503707885742188, -0.02089691162109375, -0.017290115356445312, -0.013683319091796875, -0.010076522827148438, -0.0064697265625, -0.0028629302978515625, 0.000743865966796875, 0.0043506622314453125, 0.00795745849609375, 0.011564254760742188, 0.015171051025390625, 0.018777847290039062, 0.0223846435546875, 0.025991439819335938, 0.029598236083984375, 0.03320503234863281, 0.03681182861328125, 0.04041862487792969, 0.044025421142578125, 0.04763221740722656, 0.051239013671875, 0.05484580993652344, 0.058452606201171875, 0.06205940246582031, 0.06566619873046875, 0.06927299499511719, 0.07287979125976562, 0.07648658752441406, 0.0800933837890625, 0.08370018005371094, 0.08730697631835938, 0.09091377258300781, 0.09452056884765625, 0.09812736511230469, 0.10173416137695312, 0.10534095764160156, 0.10894775390625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 7.0, 13.0, 11.0, 40.0, 78.0, 156.0, 182.0, 203.0, 145.0, 76.0, 40.0, 15.0, 14.0, 4.0, 10.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1302490234375, -0.1257476806640625, -0.121246337890625, -0.1167449951171875, -0.11224365234375, -0.1077423095703125, -0.103240966796875, -0.0987396240234375, -0.09423828125, -0.0897369384765625, -0.085235595703125, -0.0807342529296875, -0.07623291015625, -0.0717315673828125, -0.067230224609375, -0.0627288818359375, -0.0582275390625, -0.0537261962890625, -0.049224853515625, -0.0447235107421875, -0.04022216796875, -0.0357208251953125, -0.031219482421875, -0.0267181396484375, -0.022216796875, -0.0177154541015625, -0.013214111328125, -0.0087127685546875, -0.00421142578125, 0.0002899169921875, 0.004791259765625, 0.0092926025390625, 0.0137939453125, 0.0182952880859375, 0.022796630859375, 0.0272979736328125, 0.03179931640625, 0.0363006591796875, 0.040802001953125, 0.0453033447265625, 0.0498046875, 0.0543060302734375, 0.058807373046875, 0.0633087158203125, 0.06781005859375, 0.0723114013671875, 0.076812744140625, 0.0813140869140625, 0.0858154296875, 0.0903167724609375, 0.094818115234375, 0.0993194580078125, 0.10382080078125, 0.1083221435546875, 0.112823486328125, 0.1173248291015625, 0.121826171875, 0.1263275146484375, 0.130828857421875, 0.1353302001953125, 0.13983154296875, 0.1443328857421875, 0.148834228515625, 0.1533355712890625, 0.1578369140625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 9.0, 10.0, 12.0, 15.0, 30.0, 28.0, 23.0, 44.0, 76.0, 108.0, 150.0, 202.0, 313.0, 519.0, 801.0, 1468.0, 2826.0, 7123.0, 31738.0, 4055663.0, 73639.0, 11125.0, 3852.0, 1765.0, 941.0, 587.0, 368.0, 239.0, 198.0, 114.0, 82.0, 48.0, 44.0, 29.0, 32.0, 19.0, 12.0, 8.0, 6.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1666259765625, -0.16167831420898438, -0.15673065185546875, -0.15178298950195312, -0.1468353271484375, -0.14188766479492188, -0.13694000244140625, -0.13199234008789062, -0.127044677734375, -0.12209701538085938, -0.11714935302734375, -0.11220169067382812, -0.1072540283203125, -0.10230636596679688, -0.09735870361328125, -0.09241104125976562, -0.08746337890625, -0.08251571655273438, -0.07756805419921875, -0.07262039184570312, -0.0676727294921875, -0.06272506713867188, -0.05777740478515625, -0.052829742431640625, -0.047882080078125, -0.042934417724609375, -0.03798675537109375, -0.033039093017578125, -0.0280914306640625, -0.023143768310546875, -0.01819610595703125, -0.013248443603515625, -0.00830078125, -0.003353118896484375, 0.00159454345703125, 0.006542205810546875, 0.0114898681640625, 0.016437530517578125, 0.02138519287109375, 0.026332855224609375, 0.031280517578125, 0.036228179931640625, 0.04117584228515625, 0.046123504638671875, 0.0510711669921875, 0.056018829345703125, 0.06096649169921875, 0.06591415405273438, 0.07086181640625, 0.07580947875976562, 0.08075714111328125, 0.08570480346679688, 0.0906524658203125, 0.09560012817382812, 0.10054779052734375, 0.10549545288085938, 0.110443115234375, 0.11539077758789062, 0.12033843994140625, 0.12528610229492188, 0.1302337646484375, 0.13518142700195312, 0.14012908935546875, 0.14507675170898438, 0.1500244140625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 12.0, 15.0, 21.0, 56.0, 164.0, 3641.0, 74.0, 32.0, 19.0, 11.0, 5.0, 8.0, 4.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0394287109375, -0.03807878494262695, -0.036728858947753906, -0.03537893295288086, -0.03402900695800781, -0.032679080963134766, -0.03132915496826172, -0.029979228973388672, -0.028629302978515625, -0.027279376983642578, -0.02592945098876953, -0.024579524993896484, -0.023229598999023438, -0.02187967300415039, -0.020529747009277344, -0.019179821014404297, -0.01782989501953125, -0.016479969024658203, -0.015130043029785156, -0.01378011703491211, -0.012430191040039062, -0.011080265045166016, -0.009730339050292969, -0.008380413055419922, -0.007030487060546875, -0.005680561065673828, -0.004330635070800781, -0.0029807090759277344, -0.0016307830810546875, -0.0002808570861816406, 0.0010690689086914062, 0.002418994903564453, 0.0037689208984375, 0.005118846893310547, 0.006468772888183594, 0.00781869888305664, 0.009168624877929688, 0.010518550872802734, 0.011868476867675781, 0.013218402862548828, 0.014568328857421875, 0.015918254852294922, 0.01726818084716797, 0.018618106842041016, 0.019968032836914062, 0.02131795883178711, 0.022667884826660156, 0.024017810821533203, 0.02536773681640625, 0.026717662811279297, 0.028067588806152344, 0.02941751480102539, 0.030767440795898438, 0.032117366790771484, 0.03346729278564453, 0.03481721878051758, 0.036167144775390625, 0.03751707077026367, 0.03886699676513672, 0.040216922760009766, 0.04156684875488281, 0.04291677474975586, 0.044266700744628906, 0.04561662673950195, 0.046966552734375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 8.0, 15.0, 18.0, 20.0, 35.0, 57.0, 87.0, 105.0, 127.0, 117.0, 97.0, 88.0, 61.0, 49.0, 30.0, 24.0, 15.0, 14.0, 8.0, 4.0, 4.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08543664216995239, -0.08130544424057007, -0.07717424631118774, -0.07304304838180542, -0.0689118504524231, -0.06478065252304077, -0.060649458318948746, -0.05651826038956642, -0.0523870624601841, -0.04825586453080177, -0.04412466660141945, -0.03999347239732742, -0.0358622744679451, -0.031731076538562775, -0.02759987860918045, -0.023468680679798126, -0.019337482750415802, -0.015206284821033478, -0.011075087822973728, -0.006943890824913979, -0.0028126928955316544, 0.0013185050338506699, 0.005449701100587845, 0.009580899029970169, 0.013712096959352493, 0.017843294888734818, 0.02197449281811714, 0.026105688884854317, 0.03023688681423664, 0.034368082880973816, 0.03849928081035614, 0.042630478739738464, 0.04676167666912079, 0.05089287459850311, 0.05502407252788544, 0.05915527045726776, 0.06328646838665009, 0.06741766631603241, 0.07154886424541473, 0.07568006217479706, 0.07981126010417938, 0.0839424580335617, 0.08807365596294403, 0.09220485389232635, 0.09633605182170868, 0.100467249751091, 0.10459844768047333, 0.10872964560985565, 0.11286083608865738, 0.1169920340180397, 0.12112323194742203, 0.12525442242622375, 0.12938562035560608, 0.1335168182849884, 0.13764801621437073, 0.14177921414375305, 0.14591041207313538, 0.1500416100025177, 0.15417280793190002, 0.15830400586128235, 0.16243520379066467, 0.166566401720047, 0.17069759964942932, 0.17482879757881165, 0.17895999550819397]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 1.0, 7.0, 5.0, 4.0, 6.0, 11.0, 5.0, 7.0, 10.0, 19.0, 19.0, 17.0, 19.0, 29.0, 24.0, 27.0, 28.0, 37.0, 37.0, 34.0, 49.0, 37.0, 42.0, 32.0, 42.0, 35.0, 30.0, 37.0, 39.0, 36.0, 32.0, 23.0, 17.0, 33.0, 22.0, 31.0, 15.0, 21.0, 13.0, 24.0, 11.0, 10.0, 9.0, 6.0, 3.0, 2.0, 8.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05700498819351196, -0.05497797578573227, -0.052950967103242874, -0.05092395842075348, -0.048896946012973785, -0.04686993360519409, -0.0448429249227047, -0.0428159162402153, -0.04078890383243561, -0.038761891424655914, -0.03673488274216652, -0.034707874059677124, -0.03268086165189743, -0.030653851106762886, -0.02862684056162834, -0.026599830016493797, -0.024572819471359253, -0.02254580892622471, -0.020518798381090164, -0.01849178783595562, -0.016464777290821075, -0.014437766745686531, -0.012410756200551987, -0.010383745655417442, -0.008356735110282898, -0.006329724565148354, -0.004302714020013809, -0.002275703474879265, -0.00024869292974472046, 0.001778317615389824, 0.0038053281605243683, 0.005832338705658913, 0.007859349250793457, 0.009886359795928001, 0.011913370341062546, 0.01394038088619709, 0.015967391431331635, 0.01799440197646618, 0.020021412521600723, 0.022048423066735268, 0.024075433611869812, 0.026102444157004356, 0.0281294547021389, 0.030156465247273445, 0.03218347579240799, 0.03421048820018768, 0.03623749688267708, 0.03826450556516647, 0.04029151797294617, 0.04231853038072586, 0.044345539063215256, 0.04637254774570465, 0.048399560153484344, 0.05042657256126404, 0.05245358124375343, 0.05448058992624283, 0.05650760233402252, 0.058534614741802216, 0.06056162342429161, 0.062588632106781, 0.0646156445145607, 0.0666426569223404, 0.06866966187953949, 0.07069667428731918, 0.07272368669509888]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 1.0, 19.0, 22.0, 39.0, 61.0, 146.0, 331.0, 886.0, 3224.0, 26065.0, 848568.0, 159440.0, 7200.0, 1545.0, 529.0, 239.0, 104.0, 54.0, 24.0, 21.0, 12.0, 4.0, 2.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306396484375, -0.2964286804199219, -0.28646087646484375, -0.2764930725097656, -0.2665252685546875, -0.2565574645996094, -0.24658966064453125, -0.23662185668945312, -0.226654052734375, -0.21668624877929688, -0.20671844482421875, -0.19675064086914062, -0.1867828369140625, -0.17681503295898438, -0.16684722900390625, -0.15687942504882812, -0.14691162109375, -0.13694381713867188, -0.12697601318359375, -0.11700820922851562, -0.1070404052734375, -0.09707260131835938, -0.08710479736328125, -0.07713699340820312, -0.067169189453125, -0.057201385498046875, -0.04723358154296875, -0.037265777587890625, -0.0272979736328125, -0.017330169677734375, -0.00736236572265625, 0.002605438232421875, 0.0125732421875, 0.022541046142578125, 0.03250885009765625, 0.042476654052734375, 0.0524444580078125, 0.062412261962890625, 0.07238006591796875, 0.08234786987304688, 0.092315673828125, 0.10228347778320312, 0.11225128173828125, 0.12221908569335938, 0.1321868896484375, 0.14215469360351562, 0.15212249755859375, 0.16209030151367188, 0.17205810546875, 0.18202590942382812, 0.19199371337890625, 0.20196151733398438, 0.2119293212890625, 0.22189712524414062, 0.23186492919921875, 0.24183273315429688, 0.251800537109375, 0.2617683410644531, 0.27173614501953125, 0.2817039489746094, 0.2916717529296875, 0.3016395568847656, 0.31160736083984375, 0.3215751647949219, 0.33154296875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 11.0, 18.0, 42.0, 82.0, 149.0, 162.0, 197.0, 146.0, 89.0, 46.0, 15.0, 14.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1307373046875, -0.12623023986816406, -0.12172317504882812, -0.11721611022949219, -0.11270904541015625, -0.10820198059082031, -0.10369491577148438, -0.09918785095214844, -0.0946807861328125, -0.09017372131347656, -0.08566665649414062, -0.08115959167480469, -0.07665252685546875, -0.07214546203613281, -0.06763839721679688, -0.06313133239746094, -0.058624267578125, -0.05411720275878906, -0.049610137939453125, -0.04510307312011719, -0.04059600830078125, -0.03608894348144531, -0.031581878662109375, -0.027074813842773438, -0.0225677490234375, -0.018060684204101562, -0.013553619384765625, -0.009046554565429688, -0.00453948974609375, -3.24249267578125e-05, 0.004474639892578125, 0.008981704711914062, 0.01348876953125, 0.017995834350585938, 0.022502899169921875, 0.027009963989257812, 0.03151702880859375, 0.03602409362792969, 0.040531158447265625, 0.04503822326660156, 0.0495452880859375, 0.05405235290527344, 0.058559417724609375, 0.06306648254394531, 0.06757354736328125, 0.07208061218261719, 0.07658767700195312, 0.08109474182128906, 0.085601806640625, 0.09010887145996094, 0.09461593627929688, 0.09912300109863281, 0.10363006591796875, 0.10813713073730469, 0.11264419555664062, 0.11715126037597656, 0.1216583251953125, 0.12616539001464844, 0.13067245483398438, 0.1351795196533203, 0.13968658447265625, 0.1441936492919922, 0.14870071411132812, 0.15320777893066406, 0.15771484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 3.0, 6.0, 5.0, 14.0, 14.0, 18.0, 16.0, 30.0, 41.0, 43.0, 53.0, 80.0, 113.0, 146.0, 277.0, 481.0, 1006.0, 2676.0, 20019.0, 748233.0, 262887.0, 8649.0, 1848.0, 761.0, 417.0, 241.0, 134.0, 83.0, 58.0, 48.0, 36.0, 24.0, 18.0, 14.0, 17.0, 4.0, 12.0, 7.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.250244140625, -0.24306106567382812, -0.23587799072265625, -0.22869491577148438, -0.2215118408203125, -0.21432876586914062, -0.20714569091796875, -0.19996261596679688, -0.192779541015625, -0.18559646606445312, -0.17841339111328125, -0.17123031616210938, -0.1640472412109375, -0.15686416625976562, -0.14968109130859375, -0.14249801635742188, -0.13531494140625, -0.12813186645507812, -0.12094879150390625, -0.11376571655273438, -0.1065826416015625, -0.09939956665039062, -0.09221649169921875, -0.08503341674804688, -0.077850341796875, -0.07066726684570312, -0.06348419189453125, -0.056301116943359375, -0.0491180419921875, -0.041934967041015625, -0.03475189208984375, -0.027568817138671875, -0.0203857421875, -0.013202667236328125, -0.00601959228515625, 0.001163482666015625, 0.0083465576171875, 0.015529632568359375, 0.02271270751953125, 0.029895782470703125, 0.037078857421875, 0.044261932373046875, 0.05144500732421875, 0.058628082275390625, 0.0658111572265625, 0.07299423217773438, 0.08017730712890625, 0.08736038208007812, 0.09454345703125, 0.10172653198242188, 0.10890960693359375, 0.11609268188476562, 0.1232757568359375, 0.13045883178710938, 0.13764190673828125, 0.14482498168945312, 0.152008056640625, 0.15919113159179688, 0.16637420654296875, 0.17355728149414062, 0.1807403564453125, 0.18792343139648438, 0.19510650634765625, 0.20228958129882812, 0.20947265625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 8.0, 9.0, 7.0, 14.0, 12.0, 23.0, 26.0, 29.0, 23.0, 37.0, 40.0, 47.0, 36.0, 49.0, 41.0, 44.0, 42.0, 43.0, 33.0, 55.0, 36.0, 42.0, 50.0, 36.0, 27.0, 24.0, 29.0, 11.0, 11.0, 16.0, 19.0, 19.0, 8.0, 9.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1973876953125, -0.19134140014648438, -0.18529510498046875, -0.17924880981445312, -0.1732025146484375, -0.16715621948242188, -0.16110992431640625, -0.15506362915039062, -0.149017333984375, -0.14297103881835938, -0.13692474365234375, -0.13087844848632812, -0.1248321533203125, -0.11878585815429688, -0.11273956298828125, -0.10669326782226562, -0.10064697265625, -0.09460067749023438, -0.08855438232421875, -0.08250808715820312, -0.0764617919921875, -0.07041549682617188, -0.06436920166015625, -0.058322906494140625, -0.052276611328125, -0.046230316162109375, -0.04018402099609375, -0.034137725830078125, -0.0280914306640625, -0.022045135498046875, -0.01599884033203125, -0.009952545166015625, -0.00390625, 0.002140045166015625, 0.00818634033203125, 0.014232635498046875, 0.0202789306640625, 0.026325225830078125, 0.03237152099609375, 0.038417816162109375, 0.044464111328125, 0.050510406494140625, 0.05655670166015625, 0.06260299682617188, 0.0686492919921875, 0.07469558715820312, 0.08074188232421875, 0.08678817749023438, 0.09283447265625, 0.09888076782226562, 0.10492706298828125, 0.11097335815429688, 0.1170196533203125, 0.12306594848632812, 0.12911224365234375, 0.13515853881835938, 0.141204833984375, 0.14725112915039062, 0.15329742431640625, 0.15934371948242188, 0.1653900146484375, 0.17143630981445312, 0.17748260498046875, 0.18352890014648438, 0.1895751953125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 9.0, 13.0, 12.0, 19.0, 40.0, 58.0, 86.0, 162.0, 354.0, 817.0, 4050.0, 99543.0, 921743.0, 18671.0, 1844.0, 532.0, 211.0, 131.0, 85.0, 62.0, 21.0, 23.0, 19.0, 8.0, 7.0, 6.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1134033203125, -0.10953140258789062, -0.10565948486328125, -0.10178756713867188, -0.0979156494140625, -0.09404373168945312, -0.09017181396484375, -0.08629989624023438, -0.082427978515625, -0.07855606079101562, -0.07468414306640625, -0.07081222534179688, -0.0669403076171875, -0.06306838989257812, -0.05919647216796875, -0.055324554443359375, -0.05145263671875, -0.047580718994140625, -0.04370880126953125, -0.039836883544921875, -0.0359649658203125, -0.032093048095703125, -0.02822113037109375, -0.024349212646484375, -0.020477294921875, -0.016605377197265625, -0.01273345947265625, -0.008861541748046875, -0.0049896240234375, -0.001117706298828125, 0.00275421142578125, 0.006626129150390625, 0.010498046875, 0.014369964599609375, 0.01824188232421875, 0.022113800048828125, 0.0259857177734375, 0.029857635498046875, 0.03372955322265625, 0.037601470947265625, 0.041473388671875, 0.045345306396484375, 0.04921722412109375, 0.053089141845703125, 0.0569610595703125, 0.060832977294921875, 0.06470489501953125, 0.06857681274414062, 0.07244873046875, 0.07632064819335938, 0.08019256591796875, 0.08406448364257812, 0.0879364013671875, 0.09180831909179688, 0.09568023681640625, 0.09955215454101562, 0.103424072265625, 0.10729598999023438, 0.11116790771484375, 0.11503982543945312, 0.1189117431640625, 0.12278366088867188, 0.12665557861328125, 0.13052749633789062, 0.1343994140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 3.0, 2.0, 8.0, 8.0, 11.0, 11.0, 16.0, 21.0, 32.0, 38.0, 45.0, 48.0, 62.0, 81.0, 87.0, 80.0, 80.0, 59.0, 48.0, 59.0, 42.0, 33.0, 33.0, 20.0, 12.0, 11.0, 16.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.059906005859375e-06, -8.804723620414734e-06, -8.549541234970093e-06, -8.294358849525452e-06, -8.03917646408081e-06, -7.78399407863617e-06, -7.528811693191528e-06, -7.273629307746887e-06, -7.018446922302246e-06, -6.763264536857605e-06, -6.508082151412964e-06, -6.252899765968323e-06, -5.997717380523682e-06, -5.7425349950790405e-06, -5.487352609634399e-06, -5.232170224189758e-06, -4.976987838745117e-06, -4.721805453300476e-06, -4.466623067855835e-06, -4.211440682411194e-06, -3.956258296966553e-06, -3.7010759115219116e-06, -3.4458935260772705e-06, -3.1907111406326294e-06, -2.9355287551879883e-06, -2.680346369743347e-06, -2.425163984298706e-06, -2.169981598854065e-06, -1.914799213409424e-06, -1.6596168279647827e-06, -1.4044344425201416e-06, -1.1492520570755005e-06, -8.940696716308594e-07, -6.388872861862183e-07, -3.8370490074157715e-07, -1.2852251529693604e-07, 1.2665987014770508e-07, 3.818422555923462e-07, 6.370246410369873e-07, 8.922070264816284e-07, 1.1473894119262695e-06, 1.4025717973709106e-06, 1.6577541828155518e-06, 1.912936568260193e-06, 2.168118953704834e-06, 2.423301339149475e-06, 2.678483724594116e-06, 2.9336661100387573e-06, 3.1888484954833984e-06, 3.4440308809280396e-06, 3.6992132663726807e-06, 3.954395651817322e-06, 4.209578037261963e-06, 4.464760422706604e-06, 4.719942808151245e-06, 4.975125193595886e-06, 5.230307579040527e-06, 5.4854899644851685e-06, 5.7406723499298096e-06, 5.995854735374451e-06, 6.251037120819092e-06, 6.506219506263733e-06, 6.761401891708374e-06, 7.016584277153015e-06, 7.271766662597656e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 12.0, 26.0, 20.0, 46.0, 104.0, 259.0, 591.0, 2122.0, 18897.0, 943204.0, 77915.0, 3799.0, 882.0, 350.0, 144.0, 73.0, 44.0, 21.0, 8.0, 5.0, 3.0, 3.0, 4.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1494140625, -0.1446971893310547, -0.13998031616210938, -0.13526344299316406, -0.13054656982421875, -0.12582969665527344, -0.12111282348632812, -0.11639595031738281, -0.1116790771484375, -0.10696220397949219, -0.10224533081054688, -0.09752845764160156, -0.09281158447265625, -0.08809471130371094, -0.08337783813476562, -0.07866096496582031, -0.073944091796875, -0.06922721862792969, -0.06451034545898438, -0.05979347229003906, -0.05507659912109375, -0.05035972595214844, -0.045642852783203125, -0.04092597961425781, -0.0362091064453125, -0.03149223327636719, -0.026775360107421875, -0.022058486938476562, -0.01734161376953125, -0.012624740600585938, -0.007907867431640625, -0.0031909942626953125, 0.00152587890625, 0.0062427520751953125, 0.010959625244140625, 0.015676498413085938, 0.02039337158203125, 0.025110244750976562, 0.029827117919921875, 0.03454399108886719, 0.0392608642578125, 0.04397773742675781, 0.048694610595703125, 0.05341148376464844, 0.05812835693359375, 0.06284523010253906, 0.06756210327148438, 0.07227897644042969, 0.076995849609375, 0.08171272277832031, 0.08642959594726562, 0.09114646911621094, 0.09586334228515625, 0.10058021545410156, 0.10529708862304688, 0.11001396179199219, 0.1147308349609375, 0.11944770812988281, 0.12416458129882812, 0.12888145446777344, 0.13359832763671875, 0.13831520080566406, 0.14303207397460938, 0.1477489471435547, 0.1524658203125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 6.0, 9.0, 18.0, 19.0, 47.0, 109.0, 221.0, 262.0, 173.0, 69.0, 28.0, 16.0, 10.0, 2.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.24169921875, -0.23678970336914062, -0.23188018798828125, -0.22697067260742188, -0.2220611572265625, -0.21715164184570312, -0.21224212646484375, -0.20733261108398438, -0.202423095703125, -0.19751358032226562, -0.19260406494140625, -0.18769454956054688, -0.1827850341796875, -0.17787551879882812, -0.17296600341796875, -0.16805648803710938, -0.16314697265625, -0.15823745727539062, -0.15332794189453125, -0.14841842651367188, -0.1435089111328125, -0.13859939575195312, -0.13368988037109375, -0.12878036499023438, -0.123870849609375, -0.11896133422851562, -0.11405181884765625, -0.10914230346679688, -0.1042327880859375, -0.09932327270507812, -0.09441375732421875, -0.08950424194335938, -0.0845947265625, -0.07968521118164062, -0.07477569580078125, -0.06986618041992188, -0.0649566650390625, -0.060047149658203125, -0.05513763427734375, -0.050228118896484375, -0.045318603515625, -0.040409088134765625, -0.03549957275390625, -0.030590057373046875, -0.0256805419921875, -0.020771026611328125, -0.01586151123046875, -0.010951995849609375, -0.00604248046875, -0.001132965087890625, 0.00377655029296875, 0.008686065673828125, 0.0135955810546875, 0.018505096435546875, 0.02341461181640625, 0.028324127197265625, 0.033233642578125, 0.038143157958984375, 0.04305267333984375, 0.047962188720703125, 0.0528717041015625, 0.057781219482421875, 0.06269073486328125, 0.06760025024414062, 0.072509765625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 25.0, 151.0, 347.0, 337.0, 100.0, 27.0, 11.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2232409715652466, -1.1460566520690918, -1.0688724517822266, -0.9916881918907166, -0.9145039319992065, -0.8373196721076965, -0.7601354122161865, -0.6829511523246765, -0.6057668924331665, -0.5285826325416565, -0.4513983726501465, -0.3742141127586365, -0.29702985286712646, -0.21984559297561646, -0.14266133308410645, -0.06547707319259644, 0.011707186698913574, 0.08889144659042358, 0.1660757064819336, 0.2432599663734436, 0.3204442262649536, 0.3976284861564636, 0.47481274604797363, 0.5519970059394836, 0.6291812658309937, 0.7063655257225037, 0.7835497856140137, 0.8607340455055237, 0.9379183053970337, 1.0151026248931885, 1.0922868251800537, 1.169471025466919, 1.2466554641723633, 1.3238396644592285, 1.4010239839553833, 1.478208303451538, 1.5553925037384033, 1.6325767040252686, 1.7097610235214233, 1.7869453430175781, 1.8641295433044434, 1.9413137435913086, 2.018497943878174, 2.095682382583618, 2.1728665828704834, 2.2500507831573486, 2.327235221862793, 2.404419422149658, 2.4816036224365234, 2.5587878227233887, 2.635972023010254, 2.7131564617156982, 2.7903406620025635, 2.8675248622894287, 2.944709300994873, 3.0218935012817383, 3.0990777015686035, 3.1762619018554688, 3.253446102142334, 3.3306305408477783, 3.4078147411346436, 3.484998941421509, 3.562183380126953, 3.6393675804138184, 3.7165517807006836]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 2.0, 6.0, 5.0, 5.0, 18.0, 18.0, 15.0, 17.0, 16.0, 23.0, 33.0, 27.0, 33.0, 36.0, 38.0, 48.0, 60.0, 49.0, 35.0, 55.0, 51.0, 40.0, 48.0, 43.0, 34.0, 39.0, 26.0, 32.0, 20.0, 20.0, 23.0, 13.0, 9.0, 7.0, 9.0, 8.0, 12.0, 4.0, 8.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8718730807304382, -0.8419447541236877, -0.8120164275169373, -0.782088041305542, -0.7521597146987915, -0.722231388092041, -0.6923030614852905, -0.66237473487854, -0.6324464082717896, -0.6025180816650391, -0.5725897550582886, -0.5426614284515381, -0.5127330422401428, -0.48280471563339233, -0.45287638902664185, -0.42294806241989136, -0.3930196762084961, -0.3630913496017456, -0.33316299319267273, -0.30323466658592224, -0.27330631017684937, -0.24337798357009888, -0.2134496569633484, -0.1835213154554367, -0.15359297394752502, -0.12366463243961334, -0.09373629838228226, -0.06380796432495117, -0.03387962281703949, -0.003951281309127808, 0.02597704529762268, 0.05590538680553436, 0.08583378791809082, 0.1157621294260025, 0.14569047093391418, 0.17561879754066467, 0.20554713904857635, 0.23547548055648804, 0.2654038071632385, 0.295332133769989, 0.3252604901790619, 0.3551888167858124, 0.38511717319488525, 0.41504549980163574, 0.44497382640838623, 0.4749021828174591, 0.5048304796218872, 0.5347588658332825, 0.564687192440033, 0.5946155190467834, 0.6245438456535339, 0.6544722318649292, 0.6844005584716797, 0.7143288850784302, 0.7442572116851807, 0.7741855382919312, 0.8041138648986816, 0.8340421915054321, 0.8639705181121826, 0.8938988447189331, 0.9238272309303284, 0.9537555575370789, 0.9836838841438293, 1.0136122703552246, 1.043540596961975]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 10.0, 14.0, 21.0, 28.0, 30.0, 72.0, 118.0, 182.0, 281.0, 583.0, 1205.0, 2943.0, 8987.0, 43848.0, 4101456.0, 23843.0, 6382.0, 2209.0, 975.0, 435.0, 258.0, 138.0, 111.0, 52.0, 36.0, 17.0, 18.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.141845703125, -0.13771533966064453, -0.13358497619628906, -0.1294546127319336, -0.12532424926757812, -0.12119388580322266, -0.11706352233886719, -0.11293315887451172, -0.10880279541015625, -0.10467243194580078, -0.10054206848144531, -0.09641170501708984, -0.09228134155273438, -0.0881509780883789, -0.08402061462402344, -0.07989025115966797, -0.0757598876953125, -0.07162952423095703, -0.06749916076660156, -0.0633687973022461, -0.059238433837890625, -0.055108070373535156, -0.05097770690917969, -0.04684734344482422, -0.04271697998046875, -0.03858661651611328, -0.03445625305175781, -0.030325889587402344, -0.026195526123046875, -0.022065162658691406, -0.017934799194335938, -0.013804435729980469, -0.009674072265625, -0.005543708801269531, -0.0014133453369140625, 0.0027170181274414062, 0.006847381591796875, 0.010977745056152344, 0.015108108520507812, 0.01923847198486328, 0.02336883544921875, 0.02749919891357422, 0.03162956237792969, 0.035759925842285156, 0.039890289306640625, 0.044020652770996094, 0.04815101623535156, 0.05228137969970703, 0.0564117431640625, 0.06054210662841797, 0.06467247009277344, 0.0688028335571289, 0.07293319702148438, 0.07706356048583984, 0.08119392395019531, 0.08532428741455078, 0.08945465087890625, 0.09358501434326172, 0.09771537780761719, 0.10184574127197266, 0.10597610473632812, 0.1101064682006836, 0.11423683166503906, 0.11836719512939453, 0.12249755859375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 12.0, 24.0, 41.0, 84.0, 151.0, 153.0, 206.0, 127.0, 95.0, 52.0, 14.0, 12.0, 10.0, 7.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.131103515625, -0.12658309936523438, -0.12206268310546875, -0.11754226684570312, -0.1130218505859375, -0.10850143432617188, -0.10398101806640625, -0.09946060180664062, -0.094940185546875, -0.09041976928710938, -0.08589935302734375, -0.08137893676757812, -0.0768585205078125, -0.07233810424804688, -0.06781768798828125, -0.06329727172851562, -0.05877685546875, -0.054256439208984375, -0.04973602294921875, -0.045215606689453125, -0.0406951904296875, -0.036174774169921875, -0.03165435791015625, -0.027133941650390625, -0.022613525390625, -0.018093109130859375, -0.01357269287109375, -0.009052276611328125, -0.0045318603515625, -1.1444091796875e-05, 0.00450897216796875, 0.009029388427734375, 0.0135498046875, 0.018070220947265625, 0.02259063720703125, 0.027111053466796875, 0.0316314697265625, 0.036151885986328125, 0.04067230224609375, 0.045192718505859375, 0.049713134765625, 0.054233551025390625, 0.05875396728515625, 0.06327438354492188, 0.0677947998046875, 0.07231521606445312, 0.07683563232421875, 0.08135604858398438, 0.08587646484375, 0.09039688110351562, 0.09491729736328125, 0.09943771362304688, 0.1039581298828125, 0.10847854614257812, 0.11299896240234375, 0.11751937866210938, 0.122039794921875, 0.12656021118164062, 0.13108062744140625, 0.13560104370117188, 0.1401214599609375, 0.14464187622070312, 0.14916229248046875, 0.15368270874023438, 0.158203125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 4.0, 12.0, 9.0, 20.0, 30.0, 36.0, 69.0, 77.0, 137.0, 162.0, 230.0, 306.0, 499.0, 885.0, 1346.0, 2388.0, 4807.0, 11203.0, 39259.0, 4060094.0, 48513.0, 12389.0, 5164.0, 2588.0, 1474.0, 888.0, 551.0, 325.0, 219.0, 168.0, 101.0, 79.0, 63.0, 64.0, 44.0, 18.0, 14.0, 11.0, 8.0, 9.0, 5.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.14599609375, -0.1415119171142578, -0.13702774047851562, -0.13254356384277344, -0.12805938720703125, -0.12357521057128906, -0.11909103393554688, -0.11460685729980469, -0.1101226806640625, -0.10563850402832031, -0.10115432739257812, -0.09667015075683594, -0.09218597412109375, -0.08770179748535156, -0.08321762084960938, -0.07873344421386719, -0.074249267578125, -0.06976509094238281, -0.06528091430664062, -0.06079673767089844, -0.05631256103515625, -0.05182838439941406, -0.047344207763671875, -0.04286003112792969, -0.0383758544921875, -0.03389167785644531, -0.029407501220703125, -0.024923324584960938, -0.02043914794921875, -0.015954971313476562, -0.011470794677734375, -0.0069866180419921875, -0.00250244140625, 0.0019817352294921875, 0.006465911865234375, 0.010950088500976562, 0.01543426513671875, 0.019918441772460938, 0.024402618408203125, 0.028886795043945312, 0.0333709716796875, 0.03785514831542969, 0.042339324951171875, 0.04682350158691406, 0.05130767822265625, 0.05579185485839844, 0.060276031494140625, 0.06476020812988281, 0.069244384765625, 0.07372856140136719, 0.07821273803710938, 0.08269691467285156, 0.08718109130859375, 0.09166526794433594, 0.09614944458007812, 0.10063362121582031, 0.1051177978515625, 0.10960197448730469, 0.11408615112304688, 0.11857032775878906, 0.12305450439453125, 0.12753868103027344, 0.13202285766601562, 0.1365070343017578, 0.1409912109375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 5.0, 10.0, 5.0, 7.0, 10.0, 14.0, 22.0, 38.0, 92.0, 3733.0, 61.0, 23.0, 14.0, 10.0, 7.0, 3.0, 3.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027984619140625, -0.02688455581665039, -0.02578449249267578, -0.024684429168701172, -0.023584365844726562, -0.022484302520751953, -0.021384239196777344, -0.020284175872802734, -0.019184112548828125, -0.018084049224853516, -0.016983985900878906, -0.015883922576904297, -0.014783859252929688, -0.013683795928955078, -0.012583732604980469, -0.01148366928100586, -0.01038360595703125, -0.00928354263305664, -0.008183479309082031, -0.007083415985107422, -0.0059833526611328125, -0.004883289337158203, -0.0037832260131835938, -0.0026831626892089844, -0.001583099365234375, -0.0004830360412597656, 0.0006170272827148438, 0.0017170906066894531, 0.0028171539306640625, 0.003917217254638672, 0.005017280578613281, 0.006117343902587891, 0.0072174072265625, 0.00831747055053711, 0.009417533874511719, 0.010517597198486328, 0.011617660522460938, 0.012717723846435547, 0.013817787170410156, 0.014917850494384766, 0.016017913818359375, 0.017117977142333984, 0.018218040466308594, 0.019318103790283203, 0.020418167114257812, 0.021518230438232422, 0.02261829376220703, 0.02371835708618164, 0.02481842041015625, 0.02591848373413086, 0.02701854705810547, 0.028118610382080078, 0.029218673706054688, 0.030318737030029297, 0.031418800354003906, 0.032518863677978516, 0.033618927001953125, 0.034718990325927734, 0.035819053649902344, 0.03691911697387695, 0.03801918029785156, 0.03911924362182617, 0.04021930694580078, 0.04131937026977539, 0.04241943359375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 5.0, 4.0, 8.0, 18.0, 26.0, 68.0, 77.0, 89.0, 136.0, 153.0, 146.0, 78.0, 72.0, 46.0, 25.0, 19.0, 9.0, 7.0, 6.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1490519791841507, -0.14411598443984985, -0.13917997479438782, -0.13424398005008698, -0.12930798530578613, -0.1243719831109047, -0.11943598091602325, -0.11449998617172241, -0.10956399142742157, -0.10462798923254013, -0.09969199448823929, -0.09475599229335785, -0.089819997549057, -0.08488399535417557, -0.07994799315929413, -0.07501199841499329, -0.07007599622011185, -0.06513999402523041, -0.060203999280929565, -0.055267997086048126, -0.050332002341747284, -0.045396000146865845, -0.040460001677274704, -0.03552400320768356, -0.030588004738092422, -0.025652006268501282, -0.02071600779891014, -0.01578000746667385, -0.01084400899708271, -0.0059080105274915695, -0.0009720101952552795, 0.003963988274335861, 0.008899986743927002, 0.013835985213518143, 0.018771983683109283, 0.023707984015345573, 0.028643982484936714, 0.033579982817173004, 0.038515981286764145, 0.043451979756355286, 0.048387978225946426, 0.05332397669553757, 0.05825997516512871, 0.06319597363471985, 0.06813197582960129, 0.07306797057390213, 0.07800397276878357, 0.08293996751308441, 0.08787596970796585, 0.09281197190284729, 0.09774796664714813, 0.10268396884202957, 0.10761996358633041, 0.11255596578121185, 0.1174919605255127, 0.12242796272039413, 0.12736396491527557, 0.13229995965957642, 0.13723596930503845, 0.1421719640493393, 0.14710795879364014, 0.15204395353794098, 0.15697996318340302, 0.16191595792770386, 0.1668519526720047]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 5.0, 8.0, 13.0, 12.0, 15.0, 11.0, 26.0, 26.0, 29.0, 26.0, 35.0, 35.0, 48.0, 43.0, 56.0, 37.0, 48.0, 54.0, 40.0, 48.0, 49.0, 44.0, 43.0, 33.0, 33.0, 35.0, 30.0, 17.0, 22.0, 17.0, 11.0, 11.0, 8.0, 7.0, 9.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07425451278686523, -0.071880042552948, -0.06950556486845016, -0.06713109463453293, -0.0647566169500351, -0.06238214671611786, -0.06000767648220062, -0.05763320252299309, -0.05525872856378555, -0.05288425460457802, -0.05050978064537048, -0.04813531041145325, -0.04576083645224571, -0.04338636249303818, -0.04101189225912094, -0.038637418299913406, -0.03626294434070587, -0.03388847038149834, -0.0315139964222908, -0.029139526188373566, -0.02676505222916603, -0.024390578269958496, -0.02201610617339611, -0.019641634076833725, -0.01726716011762619, -0.01489268708974123, -0.01251821406185627, -0.01014374103397131, -0.0077692680060863495, -0.005394794978201389, -0.003020321950316429, -0.0006458498537540436, 0.0017286241054534912, 0.004103097133338451, 0.0064775701612234116, 0.008852043189108372, 0.011226516216993332, 0.013600989244878292, 0.015975462272763252, 0.018349934369325638, 0.020724408328533173, 0.023098882287740707, 0.025473354384303093, 0.02784782648086548, 0.030222300440073013, 0.03259677439928055, 0.034971244633197784, 0.03734571859240532, 0.039720192551612854, 0.04209466651082039, 0.044469140470027924, 0.04684361070394516, 0.049218084663152695, 0.05159255862236023, 0.053967028856277466, 0.056341502815485, 0.058715976774692535, 0.06109045073390007, 0.0634649246931076, 0.06583939492702484, 0.06821386516094208, 0.07058834284543991, 0.07296281307935715, 0.07533729076385498, 0.07771176099777222]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 9.0, 7.0, 8.0, 14.0, 37.0, 76.0, 213.0, 883.0, 5974.0, 542430.0, 491918.0, 5726.0, 885.0, 199.0, 78.0, 23.0, 16.0, 16.0, 14.0, 7.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.470703125, -0.45685577392578125, -0.4430084228515625, -0.42916107177734375, -0.415313720703125, -0.40146636962890625, -0.3876190185546875, -0.37377166748046875, -0.35992431640625, -0.34607696533203125, -0.3322296142578125, -0.31838226318359375, -0.304534912109375, -0.29068756103515625, -0.2768402099609375, -0.26299285888671875, -0.2491455078125, -0.23529815673828125, -0.2214508056640625, -0.20760345458984375, -0.193756103515625, -0.17990875244140625, -0.1660614013671875, -0.15221405029296875, -0.13836669921875, -0.12451934814453125, -0.1106719970703125, -0.09682464599609375, -0.082977294921875, -0.06912994384765625, -0.0552825927734375, -0.04143524169921875, -0.027587890625, -0.01374053955078125, 0.0001068115234375, 0.01395416259765625, 0.027801513671875, 0.04164886474609375, 0.0554962158203125, 0.06934356689453125, 0.08319091796875, 0.09703826904296875, 0.1108856201171875, 0.12473297119140625, 0.138580322265625, 0.15242767333984375, 0.1662750244140625, 0.18012237548828125, 0.1939697265625, 0.20781707763671875, 0.2216644287109375, 0.23551177978515625, 0.249359130859375, 0.26320648193359375, 0.2770538330078125, 0.29090118408203125, 0.30474853515625, 0.31859588623046875, 0.3324432373046875, 0.34629058837890625, 0.360137939453125, 0.37398529052734375, 0.3878326416015625, 0.40167999267578125, 0.41552734375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 9.0, 32.0, 30.0, 95.0, 136.0, 160.0, 171.0, 151.0, 80.0, 65.0, 32.0, 10.0, 7.0, 5.0, 9.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.132080078125, -0.12754440307617188, -0.12300872802734375, -0.11847305297851562, -0.1139373779296875, -0.10940170288085938, -0.10486602783203125, -0.10033035278320312, -0.095794677734375, -0.09125900268554688, -0.08672332763671875, -0.08218765258789062, -0.0776519775390625, -0.07311630249023438, -0.06858062744140625, -0.06404495239257812, -0.05950927734375, -0.054973602294921875, -0.05043792724609375, -0.045902252197265625, -0.0413665771484375, -0.036830902099609375, -0.03229522705078125, -0.027759552001953125, -0.023223876953125, -0.018688201904296875, -0.01415252685546875, -0.009616851806640625, -0.0050811767578125, -0.000545501708984375, 0.00399017333984375, 0.008525848388671875, 0.0130615234375, 0.017597198486328125, 0.02213287353515625, 0.026668548583984375, 0.0312042236328125, 0.035739898681640625, 0.04027557373046875, 0.044811248779296875, 0.049346923828125, 0.053882598876953125, 0.05841827392578125, 0.06295394897460938, 0.0674896240234375, 0.07202529907226562, 0.07656097412109375, 0.08109664916992188, 0.08563232421875, 0.09016799926757812, 0.09470367431640625, 0.09923934936523438, 0.1037750244140625, 0.10831069946289062, 0.11284637451171875, 0.11738204956054688, 0.121917724609375, 0.12645339965820312, 0.13098907470703125, 0.13552474975585938, 0.1400604248046875, 0.14459609985351562, 0.14913177490234375, 0.15366744995117188, 0.158203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 3.0, 2.0, 7.0, 4.0, 4.0, 3.0, 10.0, 10.0, 10.0, 12.0, 15.0, 19.0, 21.0, 39.0, 48.0, 42.0, 78.0, 139.0, 242.0, 451.0, 1039.0, 3402.0, 28652.0, 833350.0, 169347.0, 8281.0, 1733.0, 653.0, 330.0, 172.0, 123.0, 55.0, 58.0, 42.0, 30.0, 22.0, 16.0, 15.0, 10.0, 14.0, 9.0, 13.0, 8.0, 3.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1806640625, -0.174591064453125, -0.16851806640625, -0.162445068359375, -0.1563720703125, -0.150299072265625, -0.14422607421875, -0.138153076171875, -0.132080078125, -0.126007080078125, -0.11993408203125, -0.113861083984375, -0.1077880859375, -0.101715087890625, -0.09564208984375, -0.089569091796875, -0.08349609375, -0.077423095703125, -0.07135009765625, -0.065277099609375, -0.0592041015625, -0.053131103515625, -0.04705810546875, -0.040985107421875, -0.034912109375, -0.028839111328125, -0.02276611328125, -0.016693115234375, -0.0106201171875, -0.004547119140625, 0.00152587890625, 0.007598876953125, 0.013671875, 0.019744873046875, 0.02581787109375, 0.031890869140625, 0.0379638671875, 0.044036865234375, 0.05010986328125, 0.056182861328125, 0.062255859375, 0.068328857421875, 0.07440185546875, 0.080474853515625, 0.0865478515625, 0.092620849609375, 0.09869384765625, 0.104766845703125, 0.11083984375, 0.116912841796875, 0.12298583984375, 0.129058837890625, 0.1351318359375, 0.141204833984375, 0.14727783203125, 0.153350830078125, 0.159423828125, 0.165496826171875, 0.17156982421875, 0.177642822265625, 0.1837158203125, 0.189788818359375, 0.19586181640625, 0.201934814453125, 0.2080078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 11.0, 11.0, 14.0, 10.0, 26.0, 26.0, 20.0, 20.0, 39.0, 35.0, 41.0, 44.0, 55.0, 57.0, 50.0, 42.0, 61.0, 48.0, 42.0, 52.0, 46.0, 35.0, 41.0, 28.0, 31.0, 23.0, 23.0, 12.0, 12.0, 10.0, 8.0, 8.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.224853515625, -0.2179241180419922, -0.21099472045898438, -0.20406532287597656, -0.19713592529296875, -0.19020652770996094, -0.18327713012695312, -0.1763477325439453, -0.1694183349609375, -0.1624889373779297, -0.15555953979492188, -0.14863014221191406, -0.14170074462890625, -0.13477134704589844, -0.12784194946289062, -0.12091255187988281, -0.113983154296875, -0.10705375671386719, -0.10012435913085938, -0.09319496154785156, -0.08626556396484375, -0.07933616638183594, -0.07240676879882812, -0.06547737121582031, -0.0585479736328125, -0.05161857604980469, -0.044689178466796875, -0.03775978088378906, -0.03083038330078125, -0.023900985717773438, -0.016971588134765625, -0.010042190551757812, -0.00311279296875, 0.0038166046142578125, 0.010746002197265625, 0.017675399780273438, 0.02460479736328125, 0.03153419494628906, 0.038463592529296875, 0.04539299011230469, 0.0523223876953125, 0.05925178527832031, 0.06618118286132812, 0.07311058044433594, 0.08003997802734375, 0.08696937561035156, 0.09389877319335938, 0.10082817077636719, 0.107757568359375, 0.11468696594238281, 0.12161636352539062, 0.12854576110839844, 0.13547515869140625, 0.14240455627441406, 0.14933395385742188, 0.1562633514404297, 0.1631927490234375, 0.1701221466064453, 0.17705154418945312, 0.18398094177246094, 0.19091033935546875, 0.19783973693847656, 0.20476913452148438, 0.2116985321044922, 0.2186279296875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 7.0, 16.0, 11.0, 17.0, 37.0, 40.0, 66.0, 112.0, 230.0, 583.0, 2005.0, 11169.0, 599948.0, 421391.0, 10014.0, 1722.0, 623.0, 243.0, 118.0, 69.0, 35.0, 28.0, 18.0, 14.0, 8.0, 5.0, 9.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08013916015625, -0.0767965316772461, -0.07345390319824219, -0.07011127471923828, -0.06676864624023438, -0.06342601776123047, -0.06008338928222656, -0.056740760803222656, -0.05339813232421875, -0.050055503845214844, -0.04671287536621094, -0.04337024688720703, -0.040027618408203125, -0.03668498992919922, -0.03334236145019531, -0.029999732971191406, -0.0266571044921875, -0.023314476013183594, -0.019971847534179688, -0.01662921905517578, -0.013286590576171875, -0.009943962097167969, -0.0066013336181640625, -0.0032587051391601562, 8.392333984375e-05, 0.0034265518188476562, 0.0067691802978515625, 0.010111808776855469, 0.013454437255859375, 0.01679706573486328, 0.020139694213867188, 0.023482322692871094, 0.026824951171875, 0.030167579650878906, 0.03351020812988281, 0.03685283660888672, 0.040195465087890625, 0.04353809356689453, 0.04688072204589844, 0.050223350524902344, 0.05356597900390625, 0.056908607482910156, 0.06025123596191406, 0.06359386444091797, 0.06693649291992188, 0.07027912139892578, 0.07362174987792969, 0.0769643783569336, 0.0803070068359375, 0.0836496353149414, 0.08699226379394531, 0.09033489227294922, 0.09367752075195312, 0.09702014923095703, 0.10036277770996094, 0.10370540618896484, 0.10704803466796875, 0.11039066314697266, 0.11373329162597656, 0.11707592010498047, 0.12041854858398438, 0.12376117706298828, 0.1271038055419922, 0.1304464340209961, 0.1337890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 14.0, 15.0, 29.0, 82.0, 140.0, 224.0, 209.0, 126.0, 69.0, 41.0, 15.0, 15.0, 9.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1682510375976562e-05, -1.1033378541469574e-05, -1.0384246706962585e-05, -9.735114872455597e-06, -9.085983037948608e-06, -8.43685120344162e-06, -7.787719368934631e-06, -7.138587534427643e-06, -6.489455699920654e-06, -5.840323865413666e-06, -5.191192030906677e-06, -4.542060196399689e-06, -3.8929283618927e-06, -3.2437965273857117e-06, -2.594664692878723e-06, -1.9455328583717346e-06, -1.296401023864746e-06, -6.472691893577576e-07, 1.862645149230957e-09, 6.509944796562195e-07, 1.300126314163208e-06, 1.9492581486701965e-06, 2.598389983177185e-06, 3.2475218176841736e-06, 3.896653652191162e-06, 4.545785486698151e-06, 5.194917321205139e-06, 5.844049155712128e-06, 6.493180990219116e-06, 7.142312824726105e-06, 7.791444659233093e-06, 8.440576493740082e-06, 9.08970832824707e-06, 9.738840162754059e-06, 1.0387971997261047e-05, 1.1037103831768036e-05, 1.1686235666275024e-05, 1.2335367500782013e-05, 1.2984499335289001e-05, 1.363363116979599e-05, 1.4282763004302979e-05, 1.4931894838809967e-05, 1.5581026673316956e-05, 1.6230158507823944e-05, 1.6879290342330933e-05, 1.752842217683792e-05, 1.817755401134491e-05, 1.8826685845851898e-05, 1.9475817680358887e-05, 2.0124949514865875e-05, 2.0774081349372864e-05, 2.1423213183879852e-05, 2.207234501838684e-05, 2.272147685289383e-05, 2.3370608687400818e-05, 2.4019740521907806e-05, 2.4668872356414795e-05, 2.5318004190921783e-05, 2.5967136025428772e-05, 2.661626785993576e-05, 2.726539969444275e-05, 2.7914531528949738e-05, 2.8563663363456726e-05, 2.9212795197963715e-05, 2.9861927032470703e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 7.0, 19.0, 24.0, 30.0, 43.0, 93.0, 149.0, 292.0, 618.0, 1708.0, 6254.0, 48960.0, 887898.0, 89849.0, 8850.0, 2184.0, 734.0, 340.0, 177.0, 101.0, 63.0, 52.0, 35.0, 18.0, 15.0, 8.0, 3.0, 2.0, 7.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12188720703125, -0.11864566802978516, -0.11540412902832031, -0.11216259002685547, -0.10892105102539062, -0.10567951202392578, -0.10243797302246094, -0.0991964340209961, -0.09595489501953125, -0.0927133560180664, -0.08947181701660156, -0.08623027801513672, -0.08298873901367188, -0.07974720001220703, -0.07650566101074219, -0.07326412200927734, -0.0700225830078125, -0.06678104400634766, -0.06353950500488281, -0.06029796600341797, -0.057056427001953125, -0.05381488800048828, -0.05057334899902344, -0.047331809997558594, -0.04409027099609375, -0.040848731994628906, -0.03760719299316406, -0.03436565399169922, -0.031124114990234375, -0.02788257598876953, -0.024641036987304688, -0.021399497985839844, -0.018157958984375, -0.014916419982910156, -0.011674880981445312, -0.008433341979980469, -0.005191802978515625, -0.0019502639770507812, 0.0012912750244140625, 0.004532814025878906, 0.00777435302734375, 0.011015892028808594, 0.014257431030273438, 0.01749897003173828, 0.020740509033203125, 0.02398204803466797, 0.027223587036132812, 0.030465126037597656, 0.0337066650390625, 0.036948204040527344, 0.04018974304199219, 0.04343128204345703, 0.046672821044921875, 0.04991436004638672, 0.05315589904785156, 0.056397438049316406, 0.05963897705078125, 0.0628805160522461, 0.06612205505371094, 0.06936359405517578, 0.07260513305664062, 0.07584667205810547, 0.07908821105957031, 0.08232975006103516, 0.0855712890625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 8.0, 7.0, 2.0, 6.0, 13.0, 29.0, 45.0, 63.0, 78.0, 145.0, 154.0, 109.0, 119.0, 57.0, 44.0, 28.0, 29.0, 27.0, 11.0, 5.0, 5.0, 0.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.10894775390625, -0.10612106323242188, -0.10329437255859375, -0.10046768188476562, -0.0976409912109375, -0.09481430053710938, -0.09198760986328125, -0.08916091918945312, -0.086334228515625, -0.08350753784179688, -0.08068084716796875, -0.07785415649414062, -0.0750274658203125, -0.07220077514648438, -0.06937408447265625, -0.06654739379882812, -0.063720703125, -0.060894012451171875, -0.05806732177734375, -0.055240631103515625, -0.0524139404296875, -0.049587249755859375, -0.04676055908203125, -0.043933868408203125, -0.041107177734375, -0.038280487060546875, -0.03545379638671875, -0.032627105712890625, -0.0298004150390625, -0.026973724365234375, -0.02414703369140625, -0.021320343017578125, -0.01849365234375, -0.015666961669921875, -0.01284027099609375, -0.010013580322265625, -0.0071868896484375, -0.004360198974609375, -0.00153350830078125, 0.001293182373046875, 0.004119873046875, 0.006946563720703125, 0.00977325439453125, 0.012599945068359375, 0.0154266357421875, 0.018253326416015625, 0.02108001708984375, 0.023906707763671875, 0.0267333984375, 0.029560089111328125, 0.03238677978515625, 0.035213470458984375, 0.0380401611328125, 0.040866851806640625, 0.04369354248046875, 0.046520233154296875, 0.049346923828125, 0.052173614501953125, 0.05500030517578125, 0.057826995849609375, 0.0606536865234375, 0.06348037719726562, 0.06630706787109375, 0.06913375854492188, 0.07196044921875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 8.0, 92.0, 560.0, 305.0, 32.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8584301471710205, -1.7330029010772705, -1.6075756549835205, -1.4821484088897705, -1.3567211627960205, -1.2312939167022705, -1.1058666706085205, -0.9804394245147705, -0.8550121784210205, -0.7295849323272705, -0.6041576862335205, -0.4787304401397705, -0.3533031940460205, -0.2278759479522705, -0.10244870185852051, 0.022978544235229492, 0.1484057903289795, 0.2738330364227295, 0.3992602825164795, 0.5246875286102295, 0.6501147747039795, 0.7755420207977295, 0.9009692668914795, 1.0263965129852295, 1.1518237590789795, 1.2772510051727295, 1.4026782512664795, 1.5281054973602295, 1.6535327434539795, 1.7789599895477295, 1.9043872356414795, 2.0298144817352295, 2.1552419662475586, 2.2806692123413086, 2.4060964584350586, 2.5315237045288086, 2.6569509506225586, 2.7823781967163086, 2.9078054428100586, 3.0332326889038086, 3.1586599349975586, 3.2840871810913086, 3.4095144271850586, 3.5349416732788086, 3.6603689193725586, 3.7857961654663086, 3.9112234115600586, 4.036650657653809, 4.162077903747559, 4.287505149841309, 4.412932395935059, 4.538359642028809, 4.663786888122559, 4.789214134216309, 4.914641380310059, 5.040068626403809, 5.165495872497559, 5.290923118591309, 5.416350364685059, 5.541777610778809, 5.667204856872559, 5.792632102966309, 5.918059349060059, 6.043486595153809, 6.168913841247559]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 3.0, 5.0, 8.0, 5.0, 3.0, 9.0, 2.0, 4.0, 16.0, 18.0, 5.0, 18.0, 31.0, 22.0, 28.0, 28.0, 42.0, 40.0, 47.0, 47.0, 57.0, 51.0, 45.0, 61.0, 54.0, 47.0, 36.0, 33.0, 33.0, 32.0, 29.0, 20.0, 20.0, 22.0, 17.0, 12.0, 21.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.871202290058136, -0.8424568772315979, -0.8137115240097046, -0.7849661111831665, -0.7562206983566284, -0.7274753451347351, -0.698729932308197, -0.6699845790863037, -0.6412391662597656, -0.6124937534332275, -0.5837484002113342, -0.5550029873847961, -0.5262576341629028, -0.49751222133636475, -0.46876680850982666, -0.44002142548561096, -0.41127604246139526, -0.38253065943717957, -0.35378527641296387, -0.3250398635864258, -0.2962944805622101, -0.2675490975379944, -0.2388036996126175, -0.2100583016872406, -0.1813129186630249, -0.1525675356388092, -0.12382213771343231, -0.09507674723863602, -0.06633135676383972, -0.03758597373962402, -0.008840575814247131, 0.01990482211112976, 0.04865020513534546, 0.07739559561014175, 0.10614098608493805, 0.13488638401031494, 0.16363176703453064, 0.19237715005874634, 0.22112254798412323, 0.24986794590950012, 0.2786133289337158, 0.3073587119579315, 0.3361040949821472, 0.3648495078086853, 0.393594890832901, 0.4223402738571167, 0.4510856866836548, 0.4798310697078705, 0.5085764527320862, 0.5373218655586243, 0.5660672187805176, 0.5948126316070557, 0.6235580444335938, 0.6523033976554871, 0.6810488104820251, 0.7097941637039185, 0.7385395765304565, 0.7672849893569946, 0.7960303425788879, 0.824775755405426, 0.8535211086273193, 0.8822665214538574, 0.9110119342803955, 0.9397573471069336, 0.9685027003288269]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 12.0, 22.0, 22.0, 23.0, 35.0, 44.0, 84.0, 120.0, 170.0, 256.0, 442.0, 825.0, 1741.0, 3977.0, 11626.0, 48075.0, 4022822.0, 79675.0, 14914.0, 4999.0, 2061.0, 949.0, 484.0, 295.0, 169.0, 136.0, 92.0, 66.0, 43.0, 28.0, 19.0, 12.0, 11.0, 10.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1363525390625, -0.132171630859375, -0.12799072265625, -0.123809814453125, -0.11962890625, -0.115447998046875, -0.11126708984375, -0.107086181640625, -0.1029052734375, -0.098724365234375, -0.09454345703125, -0.090362548828125, -0.086181640625, -0.082000732421875, -0.07781982421875, -0.073638916015625, -0.0694580078125, -0.065277099609375, -0.06109619140625, -0.056915283203125, -0.052734375, -0.048553466796875, -0.04437255859375, -0.040191650390625, -0.0360107421875, -0.031829833984375, -0.02764892578125, -0.023468017578125, -0.019287109375, -0.015106201171875, -0.01092529296875, -0.006744384765625, -0.0025634765625, 0.001617431640625, 0.00579833984375, 0.009979248046875, 0.01416015625, 0.018341064453125, 0.02252197265625, 0.026702880859375, 0.0308837890625, 0.035064697265625, 0.03924560546875, 0.043426513671875, 0.047607421875, 0.051788330078125, 0.05596923828125, 0.060150146484375, 0.0643310546875, 0.068511962890625, 0.07269287109375, 0.076873779296875, 0.0810546875, 0.085235595703125, 0.08941650390625, 0.093597412109375, 0.0977783203125, 0.101959228515625, 0.10614013671875, 0.110321044921875, 0.114501953125, 0.118682861328125, 0.12286376953125, 0.127044677734375, 0.1312255859375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 12.0, 9.0, 23.0, 58.0, 91.0, 145.0, 152.0, 178.0, 137.0, 89.0, 45.0, 33.0, 11.0, 5.0, 8.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.132080078125, -0.1275196075439453, -0.12295913696289062, -0.11839866638183594, -0.11383819580078125, -0.10927772521972656, -0.10471725463867188, -0.10015678405761719, -0.0955963134765625, -0.09103584289550781, -0.08647537231445312, -0.08191490173339844, -0.07735443115234375, -0.07279396057128906, -0.06823348999023438, -0.06367301940917969, -0.059112548828125, -0.05455207824707031, -0.049991607666015625, -0.04543113708496094, -0.04087066650390625, -0.03631019592285156, -0.031749725341796875, -0.027189254760742188, -0.0226287841796875, -0.018068313598632812, -0.013507843017578125, -0.008947372436523438, -0.00438690185546875, 0.0001735687255859375, 0.004734039306640625, 0.009294509887695312, 0.01385498046875, 0.018415451049804688, 0.022975921630859375, 0.027536392211914062, 0.03209686279296875, 0.03665733337402344, 0.041217803955078125, 0.04577827453613281, 0.0503387451171875, 0.05489921569824219, 0.059459686279296875, 0.06402015686035156, 0.06858062744140625, 0.07314109802246094, 0.07770156860351562, 0.08226203918457031, 0.086822509765625, 0.09138298034667969, 0.09594345092773438, 0.10050392150878906, 0.10506439208984375, 0.10962486267089844, 0.11418533325195312, 0.11874580383300781, 0.1233062744140625, 0.1278667449951172, 0.13242721557617188, 0.13698768615722656, 0.14154815673828125, 0.14610862731933594, 0.15066909790039062, 0.1552295684814453, 0.1597900390625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 7.0, 10.0, 15.0, 12.0, 25.0, 30.0, 42.0, 67.0, 134.0, 158.0, 234.0, 432.0, 656.0, 1193.0, 2665.0, 6599.0, 21583.0, 139704.0, 3943316.0, 55870.0, 12838.0, 4288.0, 1898.0, 979.0, 506.0, 353.0, 217.0, 133.0, 84.0, 66.0, 44.0, 30.0, 23.0, 13.0, 11.0, 12.0, 10.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.16845703125, -0.1638164520263672, -0.15917587280273438, -0.15453529357910156, -0.14989471435546875, -0.14525413513183594, -0.14061355590820312, -0.1359729766845703, -0.1313323974609375, -0.1266918182373047, -0.12205123901367188, -0.11741065979003906, -0.11277008056640625, -0.10812950134277344, -0.10348892211914062, -0.09884834289550781, -0.094207763671875, -0.08956718444824219, -0.08492660522460938, -0.08028602600097656, -0.07564544677734375, -0.07100486755371094, -0.06636428833007812, -0.06172370910644531, -0.0570831298828125, -0.05244255065917969, -0.047801971435546875, -0.04316139221191406, -0.03852081298828125, -0.03388023376464844, -0.029239654541015625, -0.024599075317382812, -0.01995849609375, -0.015317916870117188, -0.010677337646484375, -0.0060367584228515625, -0.00139617919921875, 0.0032444000244140625, 0.007884979248046875, 0.012525558471679688, 0.0171661376953125, 0.021806716918945312, 0.026447296142578125, 0.031087875366210938, 0.03572845458984375, 0.04036903381347656, 0.045009613037109375, 0.04965019226074219, 0.054290771484375, 0.05893135070800781, 0.06357192993164062, 0.06821250915527344, 0.07285308837890625, 0.07749366760253906, 0.08213424682617188, 0.08677482604980469, 0.0914154052734375, 0.09605598449707031, 0.10069656372070312, 0.10533714294433594, 0.10997772216796875, 0.11461830139160156, 0.11925888061523438, 0.12389945983886719, 0.1285400390625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 9.0, 9.0, 21.0, 15.0, 14.0, 31.0, 39.0, 91.0, 344.0, 3159.0, 144.0, 79.0, 34.0, 19.0, 18.0, 14.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0396728515625, -0.037888526916503906, -0.03610420227050781, -0.03431987762451172, -0.032535552978515625, -0.03075122833251953, -0.028966903686523438, -0.027182579040527344, -0.02539825439453125, -0.023613929748535156, -0.021829605102539062, -0.02004528045654297, -0.018260955810546875, -0.01647663116455078, -0.014692306518554688, -0.012907981872558594, -0.0111236572265625, -0.009339332580566406, -0.0075550079345703125, -0.005770683288574219, -0.003986358642578125, -0.0022020339965820312, -0.0004177093505859375, 0.0013666152954101562, 0.00315093994140625, 0.004935264587402344, 0.0067195892333984375, 0.008503913879394531, 0.010288238525390625, 0.012072563171386719, 0.013856887817382812, 0.015641212463378906, 0.017425537109375, 0.019209861755371094, 0.020994186401367188, 0.02277851104736328, 0.024562835693359375, 0.02634716033935547, 0.028131484985351562, 0.029915809631347656, 0.03170013427734375, 0.033484458923339844, 0.03526878356933594, 0.03705310821533203, 0.038837432861328125, 0.04062175750732422, 0.04240608215332031, 0.044190406799316406, 0.0459747314453125, 0.047759056091308594, 0.04954338073730469, 0.05132770538330078, 0.053112030029296875, 0.05489635467529297, 0.05668067932128906, 0.058465003967285156, 0.06024932861328125, 0.062033653259277344, 0.06381797790527344, 0.06560230255126953, 0.06738662719726562, 0.06917095184326172, 0.07095527648925781, 0.0727396011352539, 0.07452392578125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 5.0, 11.0, 16.0, 39.0, 66.0, 115.0, 170.0, 215.0, 127.0, 103.0, 59.0, 31.0, 14.0, 13.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3768138885498047, -0.3651999831199646, -0.3535860478878021, -0.34197214245796204, -0.33035820722579956, -0.3187443017959595, -0.307130366563797, -0.2955164611339569, -0.28390252590179443, -0.27228862047195435, -0.26067468523979187, -0.2490607649087906, -0.2374468445777893, -0.22583292424678802, -0.21421900391578674, -0.20260509848594666, -0.19099117815494537, -0.1793772578239441, -0.1677633374929428, -0.15614941716194153, -0.14453549683094025, -0.13292157649993896, -0.12130766361951828, -0.109693743288517, -0.09807982295751572, -0.08646590262651443, -0.07485198229551315, -0.06323806941509247, -0.05162414535880089, -0.040010225027799606, -0.028396308422088623, -0.01678238809108734, -0.00516846776008606, 0.0064454516395926476, 0.018059371039271355, 0.029673289507627487, 0.04128720983862877, 0.05290113016963005, 0.06451504677534103, 0.07612896710634232, 0.0877428874373436, 0.09935680776834488, 0.11097072809934616, 0.12258464097976685, 0.13419856131076813, 0.1458124816417694, 0.1574264019727707, 0.16904032230377197, 0.18065424263477325, 0.19226816296577454, 0.20388208329677582, 0.2154960036277771, 0.22710992395877838, 0.23872384428977966, 0.25033774971961975, 0.2619516849517822, 0.2735655903816223, 0.2851794958114624, 0.2967934310436249, 0.30840733647346497, 0.32002127170562744, 0.33163517713546753, 0.34324911236763, 0.3548630177974701, 0.36647695302963257]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 8.0, 6.0, 16.0, 16.0, 21.0, 25.0, 11.0, 21.0, 35.0, 41.0, 22.0, 43.0, 35.0, 35.0, 52.0, 50.0, 50.0, 52.0, 54.0, 42.0, 53.0, 52.0, 37.0, 34.0, 29.0, 27.0, 30.0, 19.0, 19.0, 24.0, 9.0, 5.0, 12.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16601133346557617, -0.1615161895751953, -0.15702106058597565, -0.1525259166955948, -0.14803077280521393, -0.14353564381599426, -0.1390404999256134, -0.13454535603523254, -0.13005021214485168, -0.12555506825447083, -0.12105993181467056, -0.1165647953748703, -0.11206965148448944, -0.10757451504468918, -0.10307937860488892, -0.09858423471450806, -0.09408910572528839, -0.08959396928548813, -0.08509882539510727, -0.080603688955307, -0.07610854506492615, -0.07161340862512589, -0.06711827218532562, -0.06262312829494476, -0.0581279918551445, -0.05363285169005394, -0.04913771152496338, -0.044642575085163116, -0.040147434920072556, -0.035652294754981995, -0.031157156452536583, -0.02666201815009117, -0.02216687798500061, -0.01767173781991005, -0.013176599517464638, -0.008681460283696651, -0.004186321049928665, 0.00030881911516189575, 0.0048039574176073074, 0.009299095720052719, 0.01379423588514328, 0.01828937605023384, 0.022784514352679253, 0.027279652655124664, 0.031774792820215225, 0.036269932985305786, 0.04076506942510605, 0.04526020959019661, 0.04975534975528717, 0.05425048992037773, 0.05874563008546829, 0.06324076652526855, 0.06773591041564941, 0.07223104685544968, 0.07672618329524994, 0.0812213271856308, 0.08571646362543106, 0.09021160006523132, 0.09470674395561218, 0.09920188039541245, 0.10369701683521271, 0.10819216072559357, 0.11268729716539383, 0.11718243360519409, 0.12167757749557495]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 7.0, 5.0, 16.0, 21.0, 38.0, 41.0, 82.0, 179.0, 363.0, 941.0, 3189.0, 20872.0, 447316.0, 544877.0, 25216.0, 3534.0, 1004.0, 409.0, 181.0, 94.0, 56.0, 36.0, 19.0, 22.0, 10.0, 12.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.266845703125, -0.2576560974121094, -0.24846649169921875, -0.23927688598632812, -0.2300872802734375, -0.22089767456054688, -0.21170806884765625, -0.20251846313476562, -0.193328857421875, -0.18413925170898438, -0.17494964599609375, -0.16576004028320312, -0.1565704345703125, -0.14738082885742188, -0.13819122314453125, -0.12900161743164062, -0.11981201171875, -0.11062240600585938, -0.10143280029296875, -0.09224319458007812, -0.0830535888671875, -0.07386398315429688, -0.06467437744140625, -0.055484771728515625, -0.046295166015625, -0.037105560302734375, -0.02791595458984375, -0.018726348876953125, -0.0095367431640625, -0.000347137451171875, 0.00884246826171875, 0.018032073974609375, 0.0272216796875, 0.036411285400390625, 0.04560089111328125, 0.054790496826171875, 0.0639801025390625, 0.07316970825195312, 0.08235931396484375, 0.09154891967773438, 0.100738525390625, 0.10992813110351562, 0.11911773681640625, 0.12830734252929688, 0.1374969482421875, 0.14668655395507812, 0.15587615966796875, 0.16506576538085938, 0.17425537109375, 0.18344497680664062, 0.19263458251953125, 0.20182418823242188, 0.2110137939453125, 0.22020339965820312, 0.22939300537109375, 0.23858261108398438, 0.247772216796875, 0.2569618225097656, 0.26615142822265625, 0.2753410339355469, 0.2845306396484375, 0.2937202453613281, 0.30290985107421875, 0.3120994567871094, 0.3212890625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 1.0, 10.0, 13.0, 17.0, 41.0, 84.0, 132.0, 142.0, 163.0, 149.0, 101.0, 64.0, 43.0, 20.0, 6.0, 9.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1331787109375, -0.128631591796875, -0.12408447265625, -0.119537353515625, -0.114990234375, -0.110443115234375, -0.10589599609375, -0.101348876953125, -0.0968017578125, -0.092254638671875, -0.08770751953125, -0.083160400390625, -0.07861328125, -0.074066162109375, -0.06951904296875, -0.064971923828125, -0.0604248046875, -0.055877685546875, -0.05133056640625, -0.046783447265625, -0.042236328125, -0.037689208984375, -0.03314208984375, -0.028594970703125, -0.0240478515625, -0.019500732421875, -0.01495361328125, -0.010406494140625, -0.005859375, -0.001312255859375, 0.00323486328125, 0.007781982421875, 0.0123291015625, 0.016876220703125, 0.02142333984375, 0.025970458984375, 0.030517578125, 0.035064697265625, 0.03961181640625, 0.044158935546875, 0.0487060546875, 0.053253173828125, 0.05780029296875, 0.062347412109375, 0.06689453125, 0.071441650390625, 0.07598876953125, 0.080535888671875, 0.0850830078125, 0.089630126953125, 0.09417724609375, 0.098724365234375, 0.103271484375, 0.107818603515625, 0.11236572265625, 0.116912841796875, 0.1214599609375, 0.126007080078125, 0.13055419921875, 0.135101318359375, 0.1396484375, 0.144195556640625, 0.14874267578125, 0.153289794921875, 0.1578369140625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 5.0, 4.0, 8.0, 6.0, 12.0, 12.0, 25.0, 21.0, 32.0, 59.0, 86.0, 122.0, 258.0, 605.0, 1651.0, 7577.0, 128499.0, 856895.0, 45967.0, 4489.0, 1146.0, 459.0, 224.0, 121.0, 90.0, 46.0, 32.0, 26.0, 24.0, 12.0, 6.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.265380859375, -0.2569160461425781, -0.24845123291015625, -0.23998641967773438, -0.2315216064453125, -0.22305679321289062, -0.21459197998046875, -0.20612716674804688, -0.197662353515625, -0.18919754028320312, -0.18073272705078125, -0.17226791381835938, -0.1638031005859375, -0.15533828735351562, -0.14687347412109375, -0.13840866088867188, -0.12994384765625, -0.12147903442382812, -0.11301422119140625, -0.10454940795898438, -0.0960845947265625, -0.08761978149414062, -0.07915496826171875, -0.07069015502929688, -0.062225341796875, -0.053760528564453125, -0.04529571533203125, -0.036830902099609375, -0.0283660888671875, -0.019901275634765625, -0.01143646240234375, -0.002971649169921875, 0.0054931640625, 0.013957977294921875, 0.02242279052734375, 0.030887603759765625, 0.0393524169921875, 0.047817230224609375, 0.05628204345703125, 0.06474685668945312, 0.073211669921875, 0.08167648315429688, 0.09014129638671875, 0.09860610961914062, 0.1070709228515625, 0.11553573608398438, 0.12400054931640625, 0.13246536254882812, 0.14093017578125, 0.14939498901367188, 0.15785980224609375, 0.16632461547851562, 0.1747894287109375, 0.18325424194335938, 0.19171905517578125, 0.20018386840820312, 0.208648681640625, 0.21711349487304688, 0.22557830810546875, 0.23404312133789062, 0.2425079345703125, 0.2509727478027344, 0.25943756103515625, 0.2679023742675781, 0.2763671875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 0.0, 2.0, 6.0, 5.0, 10.0, 9.0, 15.0, 23.0, 16.0, 17.0, 24.0, 23.0, 35.0, 37.0, 31.0, 28.0, 38.0, 38.0, 34.0, 47.0, 48.0, 46.0, 42.0, 43.0, 36.0, 55.0, 41.0, 32.0, 33.0, 36.0, 35.0, 25.0, 16.0, 19.0, 10.0, 9.0, 10.0, 7.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15869140625, -0.15230751037597656, -0.14592361450195312, -0.1395397186279297, -0.13315582275390625, -0.1267719268798828, -0.12038803100585938, -0.11400413513183594, -0.1076202392578125, -0.10123634338378906, -0.09485244750976562, -0.08846855163574219, -0.08208465576171875, -0.07570075988769531, -0.06931686401367188, -0.06293296813964844, -0.056549072265625, -0.05016517639160156, -0.043781280517578125, -0.03739738464355469, -0.03101348876953125, -0.024629592895507812, -0.018245697021484375, -0.011861801147460938, -0.0054779052734375, 0.0009059906005859375, 0.007289886474609375, 0.013673782348632812, 0.02005767822265625, 0.026441574096679688, 0.032825469970703125, 0.03920936584472656, 0.04559326171875, 0.05197715759277344, 0.058361053466796875, 0.06474494934082031, 0.07112884521484375, 0.07751274108886719, 0.08389663696289062, 0.09028053283691406, 0.0966644287109375, 0.10304832458496094, 0.10943222045898438, 0.11581611633300781, 0.12220001220703125, 0.1285839080810547, 0.13496780395507812, 0.14135169982910156, 0.147735595703125, 0.15411949157714844, 0.16050338745117188, 0.1668872833251953, 0.17327117919921875, 0.1796550750732422, 0.18603897094726562, 0.19242286682128906, 0.1988067626953125, 0.20519065856933594, 0.21157455444335938, 0.2179584503173828, 0.22434234619140625, 0.2307262420654297, 0.23711013793945312, 0.24349403381347656, 0.2498779296875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 10.0, 17.0, 33.0, 70.0, 111.0, 326.0, 1229.0, 10972.0, 932960.0, 98471.0, 3264.0, 651.0, 219.0, 99.0, 49.0, 15.0, 12.0, 8.0, 9.0, 7.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1729736328125, -0.1679973602294922, -0.16302108764648438, -0.15804481506347656, -0.15306854248046875, -0.14809226989746094, -0.14311599731445312, -0.1381397247314453, -0.1331634521484375, -0.1281871795654297, -0.12321090698242188, -0.11823463439941406, -0.11325836181640625, -0.10828208923339844, -0.10330581665039062, -0.09832954406738281, -0.093353271484375, -0.08837699890136719, -0.08340072631835938, -0.07842445373535156, -0.07344818115234375, -0.06847190856933594, -0.06349563598632812, -0.05851936340332031, -0.0535430908203125, -0.04856681823730469, -0.043590545654296875, -0.03861427307128906, -0.03363800048828125, -0.028661727905273438, -0.023685455322265625, -0.018709182739257812, -0.01373291015625, -0.008756637573242188, -0.003780364990234375, 0.0011959075927734375, 0.00617218017578125, 0.011148452758789062, 0.016124725341796875, 0.021100997924804688, 0.0260772705078125, 0.031053543090820312, 0.036029815673828125, 0.04100608825683594, 0.04598236083984375, 0.05095863342285156, 0.055934906005859375, 0.06091117858886719, 0.065887451171875, 0.07086372375488281, 0.07583999633789062, 0.08081626892089844, 0.08579254150390625, 0.09076881408691406, 0.09574508666992188, 0.10072135925292969, 0.1056976318359375, 0.11067390441894531, 0.11565017700195312, 0.12062644958496094, 0.12560272216796875, 0.13057899475097656, 0.13555526733398438, 0.1405315399169922, 0.1455078125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 9.0, 6.0, 10.0, 9.0, 16.0, 9.0, 18.0, 23.0, 47.0, 27.0, 45.0, 58.0, 84.0, 65.0, 89.0, 74.0, 74.0, 69.0, 38.0, 42.0, 32.0, 26.0, 26.0, 23.0, 11.0, 16.0, 9.0, 6.0, 5.0, 11.0, 5.0, 8.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0192394256591797e-05, -9.862706065177917e-06, -9.533017873764038e-06, -9.203329682350159e-06, -8.87364149093628e-06, -8.5439532995224e-06, -8.21426510810852e-06, -7.884576916694641e-06, -7.554888725280762e-06, -7.225200533866882e-06, -6.895512342453003e-06, -6.5658241510391235e-06, -6.236135959625244e-06, -5.906447768211365e-06, -5.576759576797485e-06, -5.247071385383606e-06, -4.9173831939697266e-06, -4.587695002555847e-06, -4.258006811141968e-06, -3.928318619728088e-06, -3.598630428314209e-06, -3.2689422369003296e-06, -2.93925404548645e-06, -2.609565854072571e-06, -2.2798776626586914e-06, -1.950189471244812e-06, -1.6205012798309326e-06, -1.2908130884170532e-06, -9.611248970031738e-07, -6.314367055892944e-07, -3.0174851417541504e-07, 2.7939677238464355e-08, 3.5762786865234375e-07, 6.873160600662231e-07, 1.0170042514801025e-06, 1.346692442893982e-06, 1.6763806343078613e-06, 2.0060688257217407e-06, 2.33575701713562e-06, 2.6654452085494995e-06, 2.995133399963379e-06, 3.3248215913772583e-06, 3.6545097827911377e-06, 3.984197974205017e-06, 4.3138861656188965e-06, 4.643574357032776e-06, 4.973262548446655e-06, 5.302950739860535e-06, 5.632638931274414e-06, 5.9623271226882935e-06, 6.292015314102173e-06, 6.621703505516052e-06, 6.951391696929932e-06, 7.281079888343811e-06, 7.6107680797576904e-06, 7.94045627117157e-06, 8.27014446258545e-06, 8.599832653999329e-06, 8.929520845413208e-06, 9.259209036827087e-06, 9.588897228240967e-06, 9.918585419654846e-06, 1.0248273611068726e-05, 1.0577961802482605e-05, 1.0907649993896484e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 8.0, 22.0, 27.0, 38.0, 73.0, 114.0, 242.0, 522.0, 1486.0, 5509.0, 52258.0, 912633.0, 66574.0, 6220.0, 1592.0, 618.0, 270.0, 129.0, 67.0, 48.0, 31.0, 14.0, 9.0, 10.0, 6.0, 6.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1319580078125, -0.1280231475830078, -0.12408828735351562, -0.12015342712402344, -0.11621856689453125, -0.11228370666503906, -0.10834884643554688, -0.10441398620605469, -0.1004791259765625, -0.09654426574707031, -0.09260940551757812, -0.08867454528808594, -0.08473968505859375, -0.08080482482910156, -0.07686996459960938, -0.07293510437011719, -0.069000244140625, -0.06506538391113281, -0.061130523681640625, -0.05719566345214844, -0.05326080322265625, -0.04932594299316406, -0.045391082763671875, -0.04145622253417969, -0.0375213623046875, -0.03358650207519531, -0.029651641845703125, -0.025716781616210938, -0.02178192138671875, -0.017847061157226562, -0.013912200927734375, -0.009977340698242188, -0.00604248046875, -0.0021076202392578125, 0.001827239990234375, 0.0057621002197265625, 0.00969696044921875, 0.013631820678710938, 0.017566680908203125, 0.021501541137695312, 0.0254364013671875, 0.029371261596679688, 0.033306121826171875, 0.03724098205566406, 0.04117584228515625, 0.04511070251464844, 0.049045562744140625, 0.05298042297363281, 0.056915283203125, 0.06085014343261719, 0.06478500366210938, 0.06871986389160156, 0.07265472412109375, 0.07658958435058594, 0.08052444458007812, 0.08445930480957031, 0.0883941650390625, 0.09232902526855469, 0.09626388549804688, 0.10019874572753906, 0.10413360595703125, 0.10806846618652344, 0.11200332641601562, 0.11593818664550781, 0.119873046875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 8.0, 3.0, 15.0, 13.0, 11.0, 14.0, 32.0, 37.0, 52.0, 82.0, 117.0, 145.0, 143.0, 104.0, 70.0, 45.0, 40.0, 20.0, 13.0, 12.0, 8.0, 3.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10260009765625, -0.09938812255859375, -0.0961761474609375, -0.09296417236328125, -0.089752197265625, -0.08654022216796875, -0.0833282470703125, -0.08011627197265625, -0.076904296875, -0.07369232177734375, -0.0704803466796875, -0.06726837158203125, -0.064056396484375, -0.06084442138671875, -0.0576324462890625, -0.05442047119140625, -0.05120849609375, -0.04799652099609375, -0.0447845458984375, -0.04157257080078125, -0.038360595703125, -0.03514862060546875, -0.0319366455078125, -0.02872467041015625, -0.0255126953125, -0.02230072021484375, -0.0190887451171875, -0.01587677001953125, -0.012664794921875, -0.00945281982421875, -0.0062408447265625, -0.00302886962890625, 0.00018310546875, 0.00339508056640625, 0.0066070556640625, 0.00981903076171875, 0.013031005859375, 0.01624298095703125, 0.0194549560546875, 0.02266693115234375, 0.02587890625, 0.02909088134765625, 0.0323028564453125, 0.03551483154296875, 0.038726806640625, 0.04193878173828125, 0.0451507568359375, 0.04836273193359375, 0.05157470703125, 0.05478668212890625, 0.0579986572265625, 0.06121063232421875, 0.064422607421875, 0.06763458251953125, 0.0708465576171875, 0.07405853271484375, 0.0772705078125, 0.08048248291015625, 0.0836944580078125, 0.08690643310546875, 0.090118408203125, 0.09333038330078125, 0.0965423583984375, 0.09975433349609375, 0.10296630859375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 19.0, 59.0, 181.0, 322.0, 265.0, 99.0, 34.0, 10.0, 6.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3284640312194824, -3.2503602504730225, -3.1722564697265625, -3.0941529273986816, -3.0160491466522217, -2.9379453659057617, -2.8598415851593018, -2.781737804412842, -2.703634262084961, -2.625530481338501, -2.547426700592041, -2.46932315826416, -2.3912193775177, -2.3131155967712402, -2.2350118160247803, -2.1569080352783203, -2.0788044929504395, -2.0007007122039795, -1.922597050666809, -1.8444932699203491, -1.7663896083831787, -1.6882858276367188, -1.6101820468902588, -1.5320783853530884, -1.4539744853973389, -1.375870704650879, -1.2977670431137085, -1.2196632623672485, -1.1415596008300781, -1.0634558200836182, -0.985352098941803, -0.9072483777999878, -0.8291447162628174, -0.7510409951210022, -0.672937273979187, -0.594833493232727, -0.5167298316955566, -0.43862608075141907, -0.3605223298072815, -0.2824186086654663, -0.20431488752365112, -0.12621116638183594, -0.04810743033885956, 0.02999630570411682, 0.108100026845932, 0.1862037479877472, 0.26430749893188477, 0.34241122007369995, 0.42051494121551514, 0.4986186623573303, 0.5767223834991455, 0.6548261642456055, 0.7329298257827759, 0.8110336065292358, 0.889137327671051, 0.9672410488128662, 1.0453448295593262, 1.1234486103057861, 1.2015522718429565, 1.2796560525894165, 1.357759714126587, 1.4358634948730469, 1.5139672756195068, 1.5920709371566772, 1.6701745986938477]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 6.0, 5.0, 9.0, 11.0, 10.0, 14.0, 22.0, 14.0, 14.0, 20.0, 18.0, 29.0, 23.0, 25.0, 25.0, 31.0, 34.0, 39.0, 33.0, 29.0, 31.0, 40.0, 42.0, 45.0, 42.0, 30.0, 43.0, 33.0, 39.0, 29.0, 28.0, 28.0, 16.0, 22.0, 20.0, 20.0, 14.0, 16.0, 6.0, 7.0, 6.0, 3.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.7534415125846863, -0.7289000153541565, -0.7043585181236267, -0.6798170208930969, -0.6552755832672119, -0.6307340860366821, -0.6061925888061523, -0.5816510915756226, -0.5571095943450928, -0.532568097114563, -0.5080265998840332, -0.4834851324558258, -0.458943635225296, -0.43440213799476624, -0.40986067056655884, -0.38531917333602905, -0.36077767610549927, -0.3362361788749695, -0.3116946816444397, -0.2871532142162323, -0.2626117169857025, -0.23807021975517273, -0.21352873742580414, -0.18898725509643555, -0.16444575786590576, -0.13990426063537598, -0.11536277830600739, -0.0908212885260582, -0.06627979874610901, -0.04173830896615982, -0.017196819186210632, 0.007344663143157959, 0.03188621997833252, 0.05642770975828171, 0.0809691995382309, 0.10551068931818008, 0.13005217909812927, 0.15459367632865906, 0.17913515865802765, 0.20367664098739624, 0.22821813821792603, 0.2527596354484558, 0.2773011326789856, 0.301842600107193, 0.3263840973377228, 0.35092559456825256, 0.37546706199645996, 0.40000855922698975, 0.42455005645751953, 0.4490915536880493, 0.4736330509185791, 0.4981745183467865, 0.5227160453796387, 0.5472574830055237, 0.5717989802360535, 0.5963404774665833, 0.620881974697113, 0.6454234719276428, 0.6699649691581726, 0.6945064663887024, 0.7190479040145874, 0.7435894012451172, 0.768130898475647, 0.7926723957061768, 0.8172138929367065]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 8.0, 12.0, 15.0, 27.0, 37.0, 38.0, 66.0, 98.0, 184.0, 392.0, 2536.0, 4177105.0, 12604.0, 589.0, 228.0, 117.0, 72.0, 47.0, 32.0, 26.0, 12.0, 12.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99609375, -0.9636077880859375, -0.931121826171875, -0.8986358642578125, -0.86614990234375, -0.8336639404296875, -0.801177978515625, -0.7686920166015625, -0.7362060546875, -0.7037200927734375, -0.671234130859375, -0.6387481689453125, -0.60626220703125, -0.5737762451171875, -0.541290283203125, -0.5088043212890625, -0.476318359375, -0.4438323974609375, -0.411346435546875, -0.3788604736328125, -0.34637451171875, -0.3138885498046875, -0.281402587890625, -0.2489166259765625, -0.2164306640625, -0.1839447021484375, -0.151458740234375, -0.1189727783203125, -0.08648681640625, -0.0540008544921875, -0.021514892578125, 0.0109710693359375, 0.04345703125, 0.0759429931640625, 0.108428955078125, 0.1409149169921875, 0.17340087890625, 0.2058868408203125, 0.238372802734375, 0.2708587646484375, 0.3033447265625, 0.3358306884765625, 0.368316650390625, 0.4008026123046875, 0.43328857421875, 0.4657745361328125, 0.498260498046875, 0.5307464599609375, 0.563232421875, 0.5957183837890625, 0.628204345703125, 0.6606903076171875, 0.69317626953125, 0.7256622314453125, 0.758148193359375, 0.7906341552734375, 0.8231201171875, 0.8556060791015625, 0.888092041015625, 0.9205780029296875, 0.95306396484375, 0.9855499267578125, 1.018035888671875, 1.0505218505859375, 1.0830078125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 11.0, 24.0, 36.0, 74.0, 112.0, 151.0, 155.0, 155.0, 132.0, 61.0, 33.0, 29.0, 12.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1331787109375, -0.1286602020263672, -0.12414169311523438, -0.11962318420410156, -0.11510467529296875, -0.11058616638183594, -0.10606765747070312, -0.10154914855957031, -0.0970306396484375, -0.09251213073730469, -0.08799362182617188, -0.08347511291503906, -0.07895660400390625, -0.07443809509277344, -0.06991958618164062, -0.06540107727050781, -0.060882568359375, -0.05636405944824219, -0.051845550537109375, -0.04732704162597656, -0.04280853271484375, -0.03829002380371094, -0.033771514892578125, -0.029253005981445312, -0.0247344970703125, -0.020215988159179688, -0.015697479248046875, -0.011178970336914062, -0.00666046142578125, -0.0021419525146484375, 0.002376556396484375, 0.0068950653076171875, 0.01141357421875, 0.015932083129882812, 0.020450592041015625, 0.024969100952148438, 0.02948760986328125, 0.03400611877441406, 0.038524627685546875, 0.04304313659667969, 0.0475616455078125, 0.05208015441894531, 0.056598663330078125, 0.06111717224121094, 0.06563568115234375, 0.07015419006347656, 0.07467269897460938, 0.07919120788574219, 0.083709716796875, 0.08822822570800781, 0.09274673461914062, 0.09726524353027344, 0.10178375244140625, 0.10630226135253906, 0.11082077026367188, 0.11533927917480469, 0.1198577880859375, 0.12437629699707031, 0.12889480590820312, 0.13341331481933594, 0.13793182373046875, 0.14245033264160156, 0.14696884155273438, 0.1514873504638672, 0.156005859375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 4.0, 2.0, 5.0, 6.0, 7.0, 3.0, 14.0, 12.0, 12.0, 16.0, 26.0, 29.0, 50.0, 86.0, 151.0, 420.0, 1328.0, 6164.0, 65434.0, 3748386.0, 352143.0, 16113.0, 2555.0, 663.0, 283.0, 128.0, 67.0, 43.0, 30.0, 23.0, 19.0, 19.0, 7.0, 7.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2318115234375, -0.2247295379638672, -0.21764755249023438, -0.21056556701660156, -0.20348358154296875, -0.19640159606933594, -0.18931961059570312, -0.1822376251220703, -0.1751556396484375, -0.1680736541748047, -0.16099166870117188, -0.15390968322753906, -0.14682769775390625, -0.13974571228027344, -0.13266372680664062, -0.1255817413330078, -0.118499755859375, -0.11141777038574219, -0.10433578491210938, -0.09725379943847656, -0.09017181396484375, -0.08308982849121094, -0.07600784301757812, -0.06892585754394531, -0.0618438720703125, -0.05476188659667969, -0.047679901123046875, -0.04059791564941406, -0.03351593017578125, -0.026433944702148438, -0.019351959228515625, -0.012269973754882812, -0.00518798828125, 0.0018939971923828125, 0.008975982666015625, 0.016057968139648438, 0.02313995361328125, 0.030221939086914062, 0.037303924560546875, 0.04438591003417969, 0.0514678955078125, 0.05854988098144531, 0.06563186645507812, 0.07271385192871094, 0.07979583740234375, 0.08687782287597656, 0.09395980834960938, 0.10104179382324219, 0.108123779296875, 0.11520576477050781, 0.12228775024414062, 0.12936973571777344, 0.13645172119140625, 0.14353370666503906, 0.15061569213867188, 0.1576976776123047, 0.1647796630859375, 0.1718616485595703, 0.17894363403320312, 0.18602561950683594, 0.19310760498046875, 0.20018959045410156, 0.20727157592773438, 0.2143535614013672, 0.221435546875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 10.0, 3.0, 11.0, 9.0, 13.0, 20.0, 28.0, 36.0, 50.0, 55.0, 89.0, 166.0, 276.0, 510.0, 876.0, 793.0, 471.0, 232.0, 145.0, 75.0, 59.0, 32.0, 30.0, 13.0, 19.0, 7.0, 11.0, 11.0, 3.0, 5.0, 7.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.120849609375, -0.11694145202636719, -0.11303329467773438, -0.10912513732910156, -0.10521697998046875, -0.10130882263183594, -0.09740066528320312, -0.09349250793457031, -0.0895843505859375, -0.08567619323730469, -0.08176803588867188, -0.07785987854003906, -0.07395172119140625, -0.07004356384277344, -0.06613540649414062, -0.06222724914550781, -0.058319091796875, -0.05441093444824219, -0.050502777099609375, -0.04659461975097656, -0.04268646240234375, -0.03877830505371094, -0.034870147705078125, -0.030961990356445312, -0.0270538330078125, -0.023145675659179688, -0.019237518310546875, -0.015329360961914062, -0.01142120361328125, -0.0075130462646484375, -0.003604888916015625, 0.0003032684326171875, 0.00421142578125, 0.008119583129882812, 0.012027740478515625, 0.015935897827148438, 0.01984405517578125, 0.023752212524414062, 0.027660369873046875, 0.03156852722167969, 0.0354766845703125, 0.03938484191894531, 0.043292999267578125, 0.04720115661621094, 0.05110931396484375, 0.05501747131347656, 0.058925628662109375, 0.06283378601074219, 0.066741943359375, 0.07065010070800781, 0.07455825805664062, 0.07846641540527344, 0.08237457275390625, 0.08628273010253906, 0.09019088745117188, 0.09409904479980469, 0.0980072021484375, 0.10191535949707031, 0.10582351684570312, 0.10973167419433594, 0.11363983154296875, 0.11754798889160156, 0.12145614624023438, 0.1253643035888672, 0.1292724609375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 1.0, 7.0, 6.0, 10.0, 34.0, 70.0, 162.0, 212.0, 245.0, 142.0, 59.0, 26.0, 8.0, 5.0, 0.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1750646829605103, -1.1261309385299683, -1.0771971940994263, -1.0282633304595947, -0.9793295860290527, -0.9303958415985107, -0.8814620971679688, -0.8325283527374268, -0.78359454870224, -0.734660804271698, -0.6857270002365112, -0.6367932558059692, -0.5878595113754272, -0.5389257073402405, -0.4899919629096985, -0.4410581886768341, -0.3921244144439697, -0.34319064021110535, -0.29425686597824097, -0.24532312154769897, -0.1963893473148346, -0.14745557308197021, -0.09852182865142822, -0.04958805441856384, -0.0006542801856994629, 0.04827948659658432, 0.0972132533788681, 0.1461470127105713, 0.19508078694343567, 0.24401456117630005, 0.29294830560684204, 0.3418820798397064, 0.39081573486328125, 0.43974950909614563, 0.48868328332901, 0.537617027759552, 0.5865508317947388, 0.6354845762252808, 0.6844183206558228, 0.7333520650863647, 0.7822858691215515, 0.8312196135520935, 0.8801534175872803, 0.9290871620178223, 0.9780209064483643, 1.0269546508789062, 1.0758883953094482, 1.1248222589492798, 1.1737560033798218, 1.2226897478103638, 1.2716234922409058, 1.3205573558807373, 1.3694911003112793, 1.4184248447418213, 1.4673585891723633, 1.5162923336029053, 1.5652260780334473, 1.6141598224639893, 1.6630935668945312, 1.7120273113250732, 1.7609611749649048, 1.8098949193954468, 1.8588286638259888, 1.9077624082565308, 1.9566962718963623]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 7.0, 8.0, 10.0, 8.0, 15.0, 20.0, 20.0, 17.0, 25.0, 25.0, 29.0, 30.0, 25.0, 38.0, 38.0, 44.0, 40.0, 41.0, 55.0, 49.0, 48.0, 53.0, 51.0, 29.0, 42.0, 34.0, 30.0, 20.0, 34.0, 20.0, 14.0, 17.0, 12.0, 12.0, 8.0, 11.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47909897565841675, -0.46196699142456055, -0.44483500719070435, -0.42770302295684814, -0.41057103872299194, -0.39343905448913574, -0.37630707025527954, -0.35917508602142334, -0.34204310178756714, -0.32491111755371094, -0.30777913331985474, -0.29064714908599854, -0.27351516485214233, -0.25638318061828613, -0.23925121128559113, -0.22211922705173492, -0.20498725771903992, -0.18785527348518372, -0.17072328925132751, -0.1535913050174713, -0.1364593207836151, -0.11932734400033951, -0.1021953672170639, -0.0850633829832077, -0.0679313987493515, -0.0507994145154953, -0.0336674340069294, -0.016535453498363495, 0.0005965307354927063, 0.017728514969348907, 0.03486049175262451, 0.05199247598648071, 0.06912446022033691, 0.08625644445419312, 0.10338842868804932, 0.12052040547132492, 0.13765239715576172, 0.15478438138961792, 0.17191635072231293, 0.18904833495616913, 0.20618031919002533, 0.22331230342388153, 0.24044428765773773, 0.25757625699043274, 0.27470824122428894, 0.29184022545814514, 0.30897220969200134, 0.32610419392585754, 0.34323617815971375, 0.36036816239356995, 0.37750014662742615, 0.39463213086128235, 0.41176411509513855, 0.42889609932899475, 0.44602805376052856, 0.46316003799438477, 0.48029202222824097, 0.49742400646209717, 0.5145559906959534, 0.5316879749298096, 0.5488199591636658, 0.565951943397522, 0.5830839276313782, 0.6002159118652344, 0.6173478960990906]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 10.0, 11.0, 12.0, 25.0, 16.0, 36.0, 39.0, 54.0, 91.0, 124.0, 196.0, 271.0, 520.0, 939.0, 1761.0, 3949.0, 15030.0, 225632.0, 748315.0, 39538.0, 6572.0, 2459.0, 1221.0, 668.0, 387.0, 219.0, 129.0, 102.0, 54.0, 41.0, 26.0, 27.0, 16.0, 11.0, 13.0, 10.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.410400390625, -0.3976631164550781, -0.38492584228515625, -0.3721885681152344, -0.3594512939453125, -0.3467140197753906, -0.33397674560546875, -0.3212394714355469, -0.308502197265625, -0.2957649230957031, -0.28302764892578125, -0.2702903747558594, -0.2575531005859375, -0.24481582641601562, -0.23207855224609375, -0.21934127807617188, -0.20660400390625, -0.19386672973632812, -0.18112945556640625, -0.16839218139648438, -0.1556549072265625, -0.14291763305664062, -0.13018035888671875, -0.11744308471679688, -0.104705810546875, -0.09196853637695312, -0.07923126220703125, -0.06649398803710938, -0.0537567138671875, -0.041019439697265625, -0.02828216552734375, -0.015544891357421875, -0.0028076171875, 0.009929656982421875, 0.02266693115234375, 0.035404205322265625, 0.0481414794921875, 0.060878753662109375, 0.07361602783203125, 0.08635330200195312, 0.099090576171875, 0.11182785034179688, 0.12456512451171875, 0.13730239868164062, 0.1500396728515625, 0.16277694702148438, 0.17551422119140625, 0.18825149536132812, 0.20098876953125, 0.21372604370117188, 0.22646331787109375, 0.23920059204101562, 0.2519378662109375, 0.2646751403808594, 0.27741241455078125, 0.2901496887207031, 0.302886962890625, 0.3156242370605469, 0.32836151123046875, 0.3410987854003906, 0.3538360595703125, 0.3665733337402344, 0.37931060791015625, 0.3920478820800781, 0.40478515625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 6.0, 14.0, 17.0, 45.0, 73.0, 96.0, 150.0, 169.0, 163.0, 102.0, 70.0, 44.0, 25.0, 9.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134765625, -0.13019943237304688, -0.12563323974609375, -0.12106704711914062, -0.1165008544921875, -0.11193466186523438, -0.10736846923828125, -0.10280227661132812, -0.098236083984375, -0.09366989135742188, -0.08910369873046875, -0.08453750610351562, -0.0799713134765625, -0.07540512084960938, -0.07083892822265625, -0.06627273559570312, -0.06170654296875, -0.057140350341796875, -0.05257415771484375, -0.048007965087890625, -0.0434417724609375, -0.038875579833984375, -0.03430938720703125, -0.029743194580078125, -0.025177001953125, -0.020610809326171875, -0.01604461669921875, -0.011478424072265625, -0.0069122314453125, -0.002346038818359375, 0.00222015380859375, 0.006786346435546875, 0.0113525390625, 0.015918731689453125, 0.02048492431640625, 0.025051116943359375, 0.0296173095703125, 0.034183502197265625, 0.03874969482421875, 0.043315887451171875, 0.047882080078125, 0.052448272705078125, 0.05701446533203125, 0.061580657958984375, 0.0661468505859375, 0.07071304321289062, 0.07527923583984375, 0.07984542846679688, 0.08441162109375, 0.08897781372070312, 0.09354400634765625, 0.09811019897460938, 0.1026763916015625, 0.10724258422851562, 0.11180877685546875, 0.11637496948242188, 0.120941162109375, 0.12550735473632812, 0.13007354736328125, 0.13463973999023438, 0.1392059326171875, 0.14377212524414062, 0.14833831787109375, 0.15290451049804688, 0.157470703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 11.0, 6.0, 16.0, 22.0, 30.0, 34.0, 48.0, 58.0, 91.0, 103.0, 177.0, 267.0, 481.0, 990.0, 2312.0, 9298.0, 117508.0, 855384.0, 51731.0, 6180.0, 1824.0, 800.0, 391.0, 224.0, 170.0, 88.0, 74.0, 57.0, 43.0, 29.0, 15.0, 17.0, 21.0, 7.0, 6.0, 6.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.325927734375, -0.316162109375, -0.306396484375, -0.296630859375, -0.286865234375, -0.277099609375, -0.267333984375, -0.257568359375, -0.247802734375, -0.238037109375, -0.228271484375, -0.218505859375, -0.208740234375, -0.198974609375, -0.189208984375, -0.179443359375, -0.169677734375, -0.159912109375, -0.150146484375, -0.140380859375, -0.130615234375, -0.120849609375, -0.111083984375, -0.101318359375, -0.091552734375, -0.081787109375, -0.072021484375, -0.062255859375, -0.052490234375, -0.042724609375, -0.032958984375, -0.023193359375, -0.013427734375, -0.003662109375, 0.006103515625, 0.015869140625, 0.025634765625, 0.035400390625, 0.045166015625, 0.054931640625, 0.064697265625, 0.074462890625, 0.084228515625, 0.093994140625, 0.103759765625, 0.113525390625, 0.123291015625, 0.133056640625, 0.142822265625, 0.152587890625, 0.162353515625, 0.172119140625, 0.181884765625, 0.191650390625, 0.201416015625, 0.211181640625, 0.220947265625, 0.230712890625, 0.240478515625, 0.250244140625, 0.260009765625, 0.269775390625, 0.279541015625, 0.289306640625, 0.299072265625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 5.0, 2.0, 4.0, 6.0, 6.0, 11.0, 16.0, 13.0, 14.0, 19.0, 21.0, 32.0, 42.0, 47.0, 50.0, 49.0, 65.0, 60.0, 53.0, 60.0, 55.0, 51.0, 49.0, 41.0, 37.0, 39.0, 37.0, 26.0, 16.0, 16.0, 19.0, 9.0, 8.0, 3.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.313720703125, -0.30498313903808594, -0.2962455749511719, -0.2875080108642578, -0.27877044677734375, -0.2700328826904297, -0.2612953186035156, -0.25255775451660156, -0.2438201904296875, -0.23508262634277344, -0.22634506225585938, -0.2176074981689453, -0.20886993408203125, -0.2001323699951172, -0.19139480590820312, -0.18265724182128906, -0.173919677734375, -0.16518211364746094, -0.15644454956054688, -0.1477069854736328, -0.13896942138671875, -0.1302318572998047, -0.12149429321289062, -0.11275672912597656, -0.1040191650390625, -0.09528160095214844, -0.08654403686523438, -0.07780647277832031, -0.06906890869140625, -0.06033134460449219, -0.051593780517578125, -0.04285621643066406, -0.03411865234375, -0.025381088256835938, -0.016643524169921875, -0.007905960083007812, 0.00083160400390625, 0.009569168090820312, 0.018306732177734375, 0.027044296264648438, 0.0357818603515625, 0.04451942443847656, 0.053256988525390625, 0.06199455261230469, 0.07073211669921875, 0.07946968078613281, 0.08820724487304688, 0.09694480895996094, 0.105682373046875, 0.11441993713378906, 0.12315750122070312, 0.1318950653076172, 0.14063262939453125, 0.1493701934814453, 0.15810775756835938, 0.16684532165527344, 0.1755828857421875, 0.18432044982910156, 0.19305801391601562, 0.2017955780029297, 0.21053314208984375, 0.2192707061767578, 0.22800827026367188, 0.23674583435058594, 0.2454833984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 7.0, 9.0, 13.0, 15.0, 28.0, 46.0, 76.0, 131.0, 238.0, 443.0, 1008.0, 3023.0, 13599.0, 221874.0, 774423.0, 26238.0, 4696.0, 1431.0, 613.0, 246.0, 150.0, 81.0, 48.0, 30.0, 14.0, 17.0, 19.0, 7.0, 9.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1492919921875, -0.14434242248535156, -0.13939285278320312, -0.1344432830810547, -0.12949371337890625, -0.12454414367675781, -0.11959457397460938, -0.11464500427246094, -0.1096954345703125, -0.10474586486816406, -0.09979629516601562, -0.09484672546386719, -0.08989715576171875, -0.08494758605957031, -0.07999801635742188, -0.07504844665527344, -0.070098876953125, -0.06514930725097656, -0.060199737548828125, -0.05525016784667969, -0.05030059814453125, -0.04535102844238281, -0.040401458740234375, -0.03545188903808594, -0.0305023193359375, -0.025552749633789062, -0.020603179931640625, -0.015653610229492188, -0.01070404052734375, -0.0057544708251953125, -0.000804901123046875, 0.0041446685791015625, 0.00909423828125, 0.014043807983398438, 0.018993377685546875, 0.023942947387695312, 0.02889251708984375, 0.03384208679199219, 0.038791656494140625, 0.04374122619628906, 0.0486907958984375, 0.05364036560058594, 0.058589935302734375, 0.06353950500488281, 0.06848907470703125, 0.07343864440917969, 0.07838821411132812, 0.08333778381347656, 0.088287353515625, 0.09323692321777344, 0.09818649291992188, 0.10313606262207031, 0.10808563232421875, 0.11303520202636719, 0.11798477172851562, 0.12293434143066406, 0.1278839111328125, 0.13283348083496094, 0.13778305053710938, 0.1427326202392578, 0.14768218994140625, 0.1526317596435547, 0.15758132934570312, 0.16253089904785156, 0.16748046875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 3.0, 11.0, 13.0, 16.0, 23.0, 38.0, 57.0, 95.0, 133.0, 167.0, 151.0, 92.0, 69.0, 47.0, 23.0, 16.0, 13.0, 9.0, 13.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.045797348022461e-05, -2.9462389647960663e-05, -2.8466805815696716e-05, -2.747122198343277e-05, -2.6475638151168823e-05, -2.5480054318904877e-05, -2.448447048664093e-05, -2.3488886654376984e-05, -2.2493302822113037e-05, -2.149771898984909e-05, -2.0502135157585144e-05, -1.9506551325321198e-05, -1.851096749305725e-05, -1.7515383660793304e-05, -1.6519799828529358e-05, -1.552421599626541e-05, -1.4528632164001465e-05, -1.3533048331737518e-05, -1.2537464499473572e-05, -1.1541880667209625e-05, -1.0546296834945679e-05, -9.550713002681732e-06, -8.555129170417786e-06, -7.559545338153839e-06, -6.563961505889893e-06, -5.568377673625946e-06, -4.5727938413619995e-06, -3.577210009098053e-06, -2.5816261768341064e-06, -1.58604234457016e-06, -5.904585123062134e-07, 4.0512531995773315e-07, 1.4007091522216797e-06, 2.3962929844856262e-06, 3.3918768167495728e-06, 4.387460649013519e-06, 5.383044481277466e-06, 6.378628313541412e-06, 7.374212145805359e-06, 8.369795978069305e-06, 9.365379810333252e-06, 1.0360963642597198e-05, 1.1356547474861145e-05, 1.2352131307125092e-05, 1.3347715139389038e-05, 1.4343298971652985e-05, 1.533888280391693e-05, 1.6334466636180878e-05, 1.7330050468444824e-05, 1.832563430070877e-05, 1.9321218132972717e-05, 2.0316801965236664e-05, 2.131238579750061e-05, 2.2307969629764557e-05, 2.3303553462028503e-05, 2.429913729429245e-05, 2.5294721126556396e-05, 2.6290304958820343e-05, 2.728588879108429e-05, 2.8281472623348236e-05, 2.9277056455612183e-05, 3.027264028787613e-05, 3.1268224120140076e-05, 3.226380795240402e-05, 3.325939178466797e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 6.0, 4.0, 10.0, 18.0, 21.0, 26.0, 48.0, 42.0, 72.0, 106.0, 127.0, 203.0, 363.0, 634.0, 1221.0, 2667.0, 7172.0, 29960.0, 350455.0, 600321.0, 40098.0, 8664.0, 3111.0, 1319.0, 724.0, 385.0, 239.0, 164.0, 98.0, 71.0, 58.0, 39.0, 27.0, 13.0, 15.0, 14.0, 14.0, 2.0, 6.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.140625, -0.13637351989746094, -0.13212203979492188, -0.1278705596923828, -0.12361907958984375, -0.11936759948730469, -0.11511611938476562, -0.11086463928222656, -0.1066131591796875, -0.10236167907714844, -0.09811019897460938, -0.09385871887207031, -0.08960723876953125, -0.08535575866699219, -0.08110427856445312, -0.07685279846191406, -0.072601318359375, -0.06834983825683594, -0.06409835815429688, -0.05984687805175781, -0.05559539794921875, -0.05134391784667969, -0.047092437744140625, -0.04284095764160156, -0.0385894775390625, -0.03433799743652344, -0.030086517333984375, -0.025835037231445312, -0.02158355712890625, -0.017332077026367188, -0.013080596923828125, -0.008829116821289062, -0.00457763671875, -0.0003261566162109375, 0.003925323486328125, 0.008176803588867188, 0.01242828369140625, 0.016679763793945312, 0.020931243896484375, 0.025182723999023438, 0.0294342041015625, 0.03368568420410156, 0.037937164306640625, 0.04218864440917969, 0.04644012451171875, 0.05069160461425781, 0.054943084716796875, 0.05919456481933594, 0.063446044921875, 0.06769752502441406, 0.07194900512695312, 0.07620048522949219, 0.08045196533203125, 0.08470344543457031, 0.08895492553710938, 0.09320640563964844, 0.0974578857421875, 0.10170936584472656, 0.10596084594726562, 0.11021232604980469, 0.11446380615234375, 0.11871528625488281, 0.12296676635742188, 0.12721824645996094, 0.1314697265625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 8.0, 11.0, 18.0, 13.0, 34.0, 37.0, 42.0, 54.0, 88.0, 85.0, 99.0, 95.0, 89.0, 71.0, 51.0, 48.0, 27.0, 29.0, 18.0, 12.0, 15.0, 6.0, 6.0, 7.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11285400390625, -0.10929679870605469, -0.10573959350585938, -0.10218238830566406, -0.09862518310546875, -0.09506797790527344, -0.09151077270507812, -0.08795356750488281, -0.0843963623046875, -0.08083915710449219, -0.07728195190429688, -0.07372474670410156, -0.07016754150390625, -0.06661033630371094, -0.06305313110351562, -0.05949592590332031, -0.055938720703125, -0.05238151550292969, -0.048824310302734375, -0.04526710510253906, -0.04170989990234375, -0.03815269470214844, -0.034595489501953125, -0.031038284301757812, -0.0274810791015625, -0.023923873901367188, -0.020366668701171875, -0.016809463500976562, -0.01325225830078125, -0.009695053100585938, -0.006137847900390625, -0.0025806427001953125, 0.0009765625, 0.0045337677001953125, 0.008090972900390625, 0.011648178100585938, 0.01520538330078125, 0.018762588500976562, 0.022319793701171875, 0.025876998901367188, 0.0294342041015625, 0.03299140930175781, 0.036548614501953125, 0.04010581970214844, 0.04366302490234375, 0.04722023010253906, 0.050777435302734375, 0.05433464050292969, 0.057891845703125, 0.06144905090332031, 0.06500625610351562, 0.06856346130371094, 0.07212066650390625, 0.07567787170410156, 0.07923507690429688, 0.08279228210449219, 0.0863494873046875, 0.08990669250488281, 0.09346389770507812, 0.09702110290527344, 0.10057830810546875, 0.10413551330566406, 0.10769271850585938, 0.11124992370605469, 0.11480712890625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 17.0, 47.0, 126.0, 250.0, 284.0, 154.0, 71.0, 21.0, 5.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9098281860351562, -1.8276026248931885, -1.7453771829605103, -1.6631516218185425, -1.5809261798858643, -1.4987006187438965, -1.4164750576019287, -1.334249496459961, -1.2520240545272827, -1.169798493385315, -1.0875730514526367, -1.005347490310669, -0.923121988773346, -0.840896487236023, -0.7586709260940552, -0.6764454245567322, -0.5942199230194092, -0.5119944214820862, -0.4297688901424408, -0.3475433588027954, -0.2653178572654724, -0.18309235572814941, -0.10086682438850403, -0.018641293048858643, 0.06358420848846436, 0.14580972492694855, 0.22803524136543274, 0.3102607727050781, 0.3924862742424011, 0.4747117757797241, 0.5569373369216919, 0.6391628384590149, 0.7213883399963379, 0.8036138415336609, 0.8858393430709839, 0.9680649042129517, 1.0502903461456299, 1.1325159072875977, 1.2147414684295654, 1.2969670295715332, 1.3791924715042114, 1.4614180326461792, 1.5436434745788574, 1.6258690357208252, 1.708094596862793, 1.7903200387954712, 1.872545599937439, 1.9547710418701172, 2.036996603012085, 2.1192221641540527, 2.2014477252960205, 2.283673048019409, 2.365898609161377, 2.4481241703033447, 2.5303497314453125, 2.6125752925872803, 2.694800853729248, 2.777026414871216, 2.8592519760131836, 2.9414772987365723, 3.02370285987854, 3.105928421020508, 3.1881539821624756, 3.2703795433044434, 3.352604866027832]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 9.0, 13.0, 6.0, 14.0, 6.0, 13.0, 15.0, 12.0, 21.0, 21.0, 26.0, 24.0, 36.0, 36.0, 42.0, 55.0, 52.0, 52.0, 50.0, 48.0, 58.0, 51.0, 47.0, 44.0, 26.0, 31.0, 31.0, 26.0, 24.0, 16.0, 17.0, 10.0, 13.0, 16.0, 10.0, 8.0, 4.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-1.1702250242233276, -1.1381992101669312, -1.1061733961105347, -1.0741477012634277, -1.0421218872070312, -1.0100960731506348, -0.9780702590942383, -0.9460444450378418, -0.9140186905860901, -0.8819928765296936, -0.8499671220779419, -0.8179413080215454, -0.7859154939651489, -0.7538897395133972, -0.7218639254570007, -0.689838171005249, -0.6578123569488525, -0.625786542892456, -0.5937607884407043, -0.5617349743843079, -0.5297092199325562, -0.49768340587615967, -0.4656575918197632, -0.4336318075656891, -0.401606023311615, -0.3695802390575409, -0.3375544548034668, -0.3055286407470703, -0.2735028564929962, -0.24147707223892212, -0.20945127308368683, -0.17742547392845154, -0.14539974927902222, -0.11337395757436752, -0.08134816586971283, -0.049322374165058136, -0.017296582460403442, 0.014729201793670654, 0.046755000948905945, 0.07878080010414124, 0.11080658435821533, 0.14283236861228943, 0.17485816776752472, 0.20688396692276, 0.2389097511768341, 0.2709355354309082, 0.3029613494873047, 0.3349871337413788, 0.3670129179954529, 0.399038702249527, 0.4310644865036011, 0.46309030055999756, 0.49511608481407166, 0.5271418690681458, 0.5591676831245422, 0.591193437576294, 0.6232192516326904, 0.6552450656890869, 0.6872708201408386, 0.7192966341972351, 0.7513223886489868, 0.7833482027053833, 0.8153740167617798, 0.8473998308181763, 0.879425585269928]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 3.0, 11.0, 13.0, 12.0, 14.0, 29.0, 26.0, 49.0, 77.0, 293.0, 4191965.0, 1395.0, 172.0, 64.0, 47.0, 31.0, 23.0, 14.0, 12.0, 8.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.6875, -20.015380859375, -19.34326171875, -18.671142578125, -17.9990234375, -17.326904296875, -16.65478515625, -15.982666015625, -15.310546875, -14.638427734375, -13.96630859375, -13.294189453125, -12.6220703125, -11.949951171875, -11.27783203125, -10.605712890625, -9.93359375, -9.261474609375, -8.58935546875, -7.917236328125, -7.2451171875, -6.572998046875, -5.90087890625, -5.228759765625, -4.556640625, -3.884521484375, -3.21240234375, -2.540283203125, -1.8681640625, -1.196044921875, -0.52392578125, 0.148193359375, 0.8203125, 1.492431640625, 2.16455078125, 2.836669921875, 3.5087890625, 4.180908203125, 4.85302734375, 5.525146484375, 6.197265625, 6.869384765625, 7.54150390625, 8.213623046875, 8.8857421875, 9.557861328125, 10.22998046875, 10.902099609375, 11.57421875, 12.246337890625, 12.91845703125, 13.590576171875, 14.2626953125, 14.934814453125, 15.60693359375, 16.279052734375, 16.951171875, 17.623291015625, 18.29541015625, 18.967529296875, 19.6396484375, 20.311767578125, 20.98388671875, 21.656005859375, 22.328125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 10.0, 22.0, 33.0, 57.0, 93.0, 130.0, 170.0, 149.0, 115.0, 91.0, 61.0, 26.0, 13.0, 14.0, 8.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.135009765625, -0.13048362731933594, -0.12595748901367188, -0.12143135070800781, -0.11690521240234375, -0.11237907409667969, -0.10785293579101562, -0.10332679748535156, -0.0988006591796875, -0.09427452087402344, -0.08974838256835938, -0.08522224426269531, -0.08069610595703125, -0.07616996765136719, -0.07164382934570312, -0.06711769104003906, -0.062591552734375, -0.05806541442871094, -0.053539276123046875, -0.04901313781738281, -0.04448699951171875, -0.03996086120605469, -0.035434722900390625, -0.030908584594726562, -0.0263824462890625, -0.021856307983398438, -0.017330169677734375, -0.012804031372070312, -0.00827789306640625, -0.0037517547607421875, 0.000774383544921875, 0.0053005218505859375, 0.00982666015625, 0.014352798461914062, 0.018878936767578125, 0.023405075073242188, 0.02793121337890625, 0.03245735168457031, 0.036983489990234375, 0.04150962829589844, 0.0460357666015625, 0.05056190490722656, 0.055088043212890625, 0.05961418151855469, 0.06414031982421875, 0.06866645812988281, 0.07319259643554688, 0.07771873474121094, 0.082244873046875, 0.08677101135253906, 0.09129714965820312, 0.09582328796386719, 0.10034942626953125, 0.10487556457519531, 0.10940170288085938, 0.11392784118652344, 0.1184539794921875, 0.12298011779785156, 0.12750625610351562, 0.1320323944091797, 0.13655853271484375, 0.1410846710205078, 0.14561080932617188, 0.15013694763183594, 0.1546630859375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 6.0, 7.0, 14.0, 22.0, 27.0, 44.0, 95.0, 178.0, 384.0, 1193.0, 6044.0, 95798.0, 4018222.0, 64836.0, 5482.0, 1183.0, 359.0, 172.0, 78.0, 54.0, 25.0, 15.0, 7.0, 4.0, 11.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.46875, -0.4565582275390625, -0.444366455078125, -0.4321746826171875, -0.41998291015625, -0.4077911376953125, -0.395599365234375, -0.3834075927734375, -0.3712158203125, -0.3590240478515625, -0.346832275390625, -0.3346405029296875, -0.32244873046875, -0.3102569580078125, -0.298065185546875, -0.2858734130859375, -0.273681640625, -0.2614898681640625, -0.249298095703125, -0.2371063232421875, -0.22491455078125, -0.2127227783203125, -0.200531005859375, -0.1883392333984375, -0.1761474609375, -0.1639556884765625, -0.151763916015625, -0.1395721435546875, -0.12738037109375, -0.1151885986328125, -0.102996826171875, -0.0908050537109375, -0.07861328125, -0.0664215087890625, -0.054229736328125, -0.0420379638671875, -0.02984619140625, -0.0176544189453125, -0.005462646484375, 0.0067291259765625, 0.0189208984375, 0.0311126708984375, 0.043304443359375, 0.0554962158203125, 0.06768798828125, 0.0798797607421875, 0.092071533203125, 0.1042633056640625, 0.116455078125, 0.1286468505859375, 0.140838623046875, 0.1530303955078125, 0.16522216796875, 0.1774139404296875, 0.189605712890625, 0.2017974853515625, 0.2139892578125, 0.2261810302734375, 0.238372802734375, 0.2505645751953125, 0.26275634765625, 0.2749481201171875, 0.287139892578125, 0.2993316650390625, 0.3115234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 8.0, 7.0, 12.0, 14.0, 19.0, 29.0, 31.0, 56.0, 94.0, 151.0, 240.0, 495.0, 1039.0, 884.0, 387.0, 218.0, 125.0, 68.0, 48.0, 41.0, 21.0, 22.0, 14.0, 10.0, 6.0, 2.0, 6.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1234130859375, -0.11942100524902344, -0.11542892456054688, -0.11143684387207031, -0.10744476318359375, -0.10345268249511719, -0.09946060180664062, -0.09546852111816406, -0.0914764404296875, -0.08748435974121094, -0.08349227905273438, -0.07950019836425781, -0.07550811767578125, -0.07151603698730469, -0.06752395629882812, -0.06353187561035156, -0.059539794921875, -0.05554771423339844, -0.051555633544921875, -0.04756355285644531, -0.04357147216796875, -0.03957939147949219, -0.035587310791015625, -0.03159523010253906, -0.0276031494140625, -0.023611068725585938, -0.019618988037109375, -0.015626907348632812, -0.01163482666015625, -0.0076427459716796875, -0.003650665283203125, 0.0003414154052734375, 0.00433349609375, 0.008325576782226562, 0.012317657470703125, 0.016309738159179688, 0.02030181884765625, 0.024293899536132812, 0.028285980224609375, 0.03227806091308594, 0.0362701416015625, 0.04026222229003906, 0.044254302978515625, 0.04824638366699219, 0.05223846435546875, 0.05623054504394531, 0.060222625732421875, 0.06421470642089844, 0.068206787109375, 0.07219886779785156, 0.07619094848632812, 0.08018302917480469, 0.08417510986328125, 0.08816719055175781, 0.09215927124023438, 0.09615135192871094, 0.1001434326171875, 0.10413551330566406, 0.10812759399414062, 0.11211967468261719, 0.11611175537109375, 0.12010383605957031, 0.12409591674804688, 0.12808799743652344, 0.132080078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 18.0, 66.0, 481.0, 264.0, 88.0, 37.0, 22.0, 12.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2628905773162842, -1.1309131383895874, -0.9989356994628906, -0.8669582605361938, -0.7349808216094971, -0.6030033826828003, -0.4710259437561035, -0.33904850482940674, -0.20707106590270996, -0.07509362697601318, 0.056883811950683594, 0.18886125087738037, 0.32083868980407715, 0.4528161287307739, 0.5847935676574707, 0.7167710065841675, 0.8487484455108643, 0.980725884437561, 1.1127033233642578, 1.2446807622909546, 1.3766582012176514, 1.5086356401443481, 1.640613079071045, 1.7725905179977417, 1.9045679569244385, 2.0365452766418457, 2.168522834777832, 2.3005003929138184, 2.4324777126312256, 2.564455032348633, 2.696432590484619, 2.8284101486206055, 2.9603872299194336, 3.09236478805542, 3.224342107772827, 3.3563194274902344, 3.4882969856262207, 3.620274543762207, 3.7522518634796143, 3.8842291831970215, 4.016206741333008, 4.148184299468994, 4.2801618576049805, 4.412138938903809, 4.544116497039795, 4.676094055175781, 4.808071136474609, 4.940048694610596, 5.072026252746582, 5.204003810882568, 5.335981369018555, 5.467958450317383, 5.599936008453369, 5.7319135665893555, 5.863890647888184, 5.99586820602417, 6.127845764160156, 6.259823322296143, 6.391800880432129, 6.523777961730957, 6.655755519866943, 6.78773307800293, 6.919710159301758, 7.051687717437744, 7.1836652755737305]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 9.0, 3.0, 13.0, 10.0, 16.0, 17.0, 27.0, 34.0, 26.0, 39.0, 49.0, 43.0, 63.0, 52.0, 76.0, 61.0, 62.0, 69.0, 62.0, 46.0, 42.0, 39.0, 34.0, 20.0, 24.0, 19.0, 8.0, 11.0, 8.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9663889408111572, -0.9363610148429871, -0.9063330888748169, -0.8763052225112915, -0.8462772965431213, -0.8162493705749512, -0.786221444606781, -0.7561935186386108, -0.7261656522750854, -0.6961377263069153, -0.6661098003387451, -0.6360819339752197, -0.6060540080070496, -0.5760260820388794, -0.5459981560707092, -0.5159702301025391, -0.4859423041343689, -0.45591437816619873, -0.42588648200035095, -0.3958585560321808, -0.365830659866333, -0.33580273389816284, -0.3057748079299927, -0.2757468819618225, -0.24571898579597473, -0.21569107472896576, -0.1856631636619568, -0.15563523769378662, -0.12560732662677765, -0.09557941555976868, -0.06555148959159851, -0.03552357852458954, -0.005495667457580566, 0.024532247334718704, 0.054560162127017975, 0.08458808064460754, 0.11461599171161652, 0.1446439027786255, 0.17467182874679565, 0.20469973981380463, 0.2347276508808136, 0.26475557684898376, 0.29478347301483154, 0.3248113989830017, 0.3548393249511719, 0.38486722111701965, 0.4148951470851898, 0.4449230432510376, 0.47495096921920776, 0.5049788951873779, 0.5350068211555481, 0.5650347471237183, 0.5950626134872437, 0.6250905394554138, 0.655118465423584, 0.6851463913917542, 0.7151743173599243, 0.7452022433280945, 0.7752301692962646, 0.80525803565979, 0.8352859616279602, 0.8653138875961304, 0.8953418135643005, 0.9253697395324707, 0.9553976058959961]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 4.0, 7.0, 10.0, 19.0, 44.0, 103.0, 224.0, 776.0, 4722.0, 118943.0, 902001.0, 18985.0, 1974.0, 474.0, 116.0, 64.0, 31.0, 18.0, 15.0, 11.0, 4.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.736328125, -0.7127838134765625, -0.689239501953125, -0.6656951904296875, -0.64215087890625, -0.6186065673828125, -0.595062255859375, -0.5715179443359375, -0.5479736328125, -0.5244293212890625, -0.500885009765625, -0.4773406982421875, -0.45379638671875, -0.4302520751953125, -0.406707763671875, -0.3831634521484375, -0.359619140625, -0.3360748291015625, -0.312530517578125, -0.2889862060546875, -0.26544189453125, -0.2418975830078125, -0.218353271484375, -0.1948089599609375, -0.1712646484375, -0.1477203369140625, -0.124176025390625, -0.1006317138671875, -0.07708740234375, -0.0535430908203125, -0.029998779296875, -0.0064544677734375, 0.01708984375, 0.0406341552734375, 0.064178466796875, 0.0877227783203125, 0.11126708984375, 0.1348114013671875, 0.158355712890625, 0.1819000244140625, 0.2054443359375, 0.2289886474609375, 0.252532958984375, 0.2760772705078125, 0.29962158203125, 0.3231658935546875, 0.346710205078125, 0.3702545166015625, 0.393798828125, 0.4173431396484375, 0.440887451171875, 0.4644317626953125, 0.48797607421875, 0.5115203857421875, 0.535064697265625, 0.5586090087890625, 0.5821533203125, 0.6056976318359375, 0.629241943359375, 0.6527862548828125, 0.67633056640625, 0.6998748779296875, 0.723419189453125, 0.7469635009765625, 0.7705078125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 8.0, 14.0, 23.0, 42.0, 52.0, 111.0, 127.0, 133.0, 159.0, 124.0, 87.0, 55.0, 24.0, 21.0, 9.0, 9.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1397705078125, -0.13522720336914062, -0.13068389892578125, -0.12614059448242188, -0.1215972900390625, -0.11705398559570312, -0.11251068115234375, -0.10796737670898438, -0.103424072265625, -0.09888076782226562, -0.09433746337890625, -0.08979415893554688, -0.0852508544921875, -0.08070755004882812, -0.07616424560546875, -0.07162094116210938, -0.06707763671875, -0.06253433227539062, -0.05799102783203125, -0.053447723388671875, -0.0489044189453125, -0.044361114501953125, -0.03981781005859375, -0.035274505615234375, -0.030731201171875, -0.026187896728515625, -0.02164459228515625, -0.017101287841796875, -0.0125579833984375, -0.008014678955078125, -0.00347137451171875, 0.001071929931640625, 0.005615234375, 0.010158538818359375, 0.01470184326171875, 0.019245147705078125, 0.0237884521484375, 0.028331756591796875, 0.03287506103515625, 0.037418365478515625, 0.041961669921875, 0.046504974365234375, 0.05104827880859375, 0.055591583251953125, 0.0601348876953125, 0.06467819213867188, 0.06922149658203125, 0.07376480102539062, 0.07830810546875, 0.08285140991210938, 0.08739471435546875, 0.09193801879882812, 0.0964813232421875, 0.10102462768554688, 0.10556793212890625, 0.11011123657226562, 0.114654541015625, 0.11919784545898438, 0.12374114990234375, 0.12828445434570312, 0.1328277587890625, 0.13737106323242188, 0.14191436767578125, 0.14645767211914062, 0.1510009765625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 5.0, 11.0, 12.0, 14.0, 13.0, 19.0, 27.0, 43.0, 52.0, 72.0, 93.0, 198.0, 285.0, 476.0, 819.0, 1532.0, 3243.0, 7933.0, 22174.0, 74432.0, 297214.0, 480535.0, 109742.0, 30838.0, 10336.0, 4065.0, 1894.0, 962.0, 551.0, 325.0, 184.0, 141.0, 85.0, 64.0, 39.0, 31.0, 19.0, 20.0, 8.0, 7.0, 6.0, 11.0, 2.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1536865234375, -0.1482257843017578, -0.14276504516601562, -0.13730430603027344, -0.13184356689453125, -0.12638282775878906, -0.12092208862304688, -0.11546134948730469, -0.1100006103515625, -0.10453987121582031, -0.09907913208007812, -0.09361839294433594, -0.08815765380859375, -0.08269691467285156, -0.07723617553710938, -0.07177543640136719, -0.066314697265625, -0.06085395812988281, -0.055393218994140625, -0.04993247985839844, -0.04447174072265625, -0.03901100158691406, -0.033550262451171875, -0.028089523315429688, -0.0226287841796875, -0.017168045043945312, -0.011707305908203125, -0.0062465667724609375, -0.00078582763671875, 0.0046749114990234375, 0.010135650634765625, 0.015596389770507812, 0.02105712890625, 0.026517868041992188, 0.031978607177734375, 0.03743934631347656, 0.04290008544921875, 0.04836082458496094, 0.053821563720703125, 0.05928230285644531, 0.0647430419921875, 0.07020378112792969, 0.07566452026367188, 0.08112525939941406, 0.08658599853515625, 0.09204673767089844, 0.09750747680664062, 0.10296821594238281, 0.108428955078125, 0.11388969421386719, 0.11935043334960938, 0.12481117248535156, 0.13027191162109375, 0.13573265075683594, 0.14119338989257812, 0.1466541290283203, 0.1521148681640625, 0.1575756072998047, 0.16303634643554688, 0.16849708557128906, 0.17395782470703125, 0.17941856384277344, 0.18487930297851562, 0.1903400421142578, 0.19580078125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 1.0, 5.0, 4.0, 4.0, 9.0, 12.0, 17.0, 7.0, 22.0, 16.0, 17.0, 31.0, 28.0, 42.0, 41.0, 28.0, 42.0, 54.0, 41.0, 45.0, 42.0, 50.0, 57.0, 42.0, 42.0, 41.0, 37.0, 34.0, 30.0, 28.0, 15.0, 18.0, 17.0, 10.0, 15.0, 9.0, 15.0, 3.0, 4.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.2392578125, -0.2323169708251953, -0.22537612915039062, -0.21843528747558594, -0.21149444580078125, -0.20455360412597656, -0.19761276245117188, -0.1906719207763672, -0.1837310791015625, -0.1767902374267578, -0.16984939575195312, -0.16290855407714844, -0.15596771240234375, -0.14902687072753906, -0.14208602905273438, -0.1351451873779297, -0.128204345703125, -0.12126350402832031, -0.11432266235351562, -0.10738182067871094, -0.10044097900390625, -0.09350013732910156, -0.08655929565429688, -0.07961845397949219, -0.0726776123046875, -0.06573677062988281, -0.058795928955078125, -0.05185508728027344, -0.04491424560546875, -0.03797340393066406, -0.031032562255859375, -0.024091720581054688, -0.01715087890625, -0.010210037231445312, -0.003269195556640625, 0.0036716461181640625, 0.01061248779296875, 0.017553329467773438, 0.024494171142578125, 0.03143501281738281, 0.0383758544921875, 0.04531669616699219, 0.052257537841796875, 0.05919837951660156, 0.06613922119140625, 0.07308006286621094, 0.08002090454101562, 0.08696174621582031, 0.093902587890625, 0.10084342956542969, 0.10778427124023438, 0.11472511291503906, 0.12166595458984375, 0.12860679626464844, 0.13554763793945312, 0.1424884796142578, 0.1494293212890625, 0.1563701629638672, 0.16331100463867188, 0.17025184631347656, 0.17719268798828125, 0.18413352966308594, 0.19107437133789062, 0.1980152130126953, 0.2049560546875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 1.0, 9.0, 6.0, 10.0, 11.0, 28.0, 31.0, 36.0, 85.0, 90.0, 154.0, 239.0, 462.0, 879.0, 1877.0, 4664.0, 15705.0, 296334.0, 696523.0, 21362.0, 5476.0, 2230.0, 1032.0, 505.0, 307.0, 150.0, 107.0, 66.0, 42.0, 36.0, 23.0, 12.0, 11.0, 9.0, 6.0, 1.0, 6.0, 3.0, 2.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.310791015625, -0.3004608154296875, -0.290130615234375, -0.2798004150390625, -0.26947021484375, -0.2591400146484375, -0.248809814453125, -0.2384796142578125, -0.2281494140625, -0.2178192138671875, -0.207489013671875, -0.1971588134765625, -0.18682861328125, -0.1764984130859375, -0.166168212890625, -0.1558380126953125, -0.1455078125, -0.1351776123046875, -0.124847412109375, -0.1145172119140625, -0.10418701171875, -0.0938568115234375, -0.083526611328125, -0.0731964111328125, -0.0628662109375, -0.0525360107421875, -0.042205810546875, -0.0318756103515625, -0.02154541015625, -0.0112152099609375, -0.000885009765625, 0.0094451904296875, 0.019775390625, 0.0301055908203125, 0.040435791015625, 0.0507659912109375, 0.06109619140625, 0.0714263916015625, 0.081756591796875, 0.0920867919921875, 0.1024169921875, 0.1127471923828125, 0.123077392578125, 0.1334075927734375, 0.14373779296875, 0.1540679931640625, 0.164398193359375, 0.1747283935546875, 0.18505859375, 0.1953887939453125, 0.205718994140625, 0.2160491943359375, 0.22637939453125, 0.2367095947265625, 0.247039794921875, 0.2573699951171875, 0.2677001953125, 0.2780303955078125, 0.288360595703125, 0.2986907958984375, 0.30902099609375, 0.3193511962890625, 0.329681396484375, 0.3400115966796875, 0.350341796875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 7.0, 3.0, 5.0, 8.0, 22.0, 38.0, 90.0, 176.0, 304.0, 190.0, 83.0, 31.0, 20.0, 9.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00010162591934204102, -9.923335164785385e-05, -9.684078395366669e-05, -9.444821625947952e-05, -9.205564856529236e-05, -8.96630808711052e-05, -8.727051317691803e-05, -8.487794548273087e-05, -8.24853777885437e-05, -8.009281009435654e-05, -7.770024240016937e-05, -7.530767470598221e-05, -7.291510701179504e-05, -7.052253931760788e-05, -6.812997162342072e-05, -6.573740392923355e-05, -6.334483623504639e-05, -6.095226854085922e-05, -5.855970084667206e-05, -5.6167133152484894e-05, -5.377456545829773e-05, -5.1381997764110565e-05, -4.89894300699234e-05, -4.6596862375736237e-05, -4.420429468154907e-05, -4.181172698736191e-05, -3.9419159293174744e-05, -3.702659159898758e-05, -3.4634023904800415e-05, -3.224145621061325e-05, -2.9848888516426086e-05, -2.7456320822238922e-05, -2.5063753128051758e-05, -2.2671185433864594e-05, -2.027861773967743e-05, -1.7886050045490265e-05, -1.54934823513031e-05, -1.3100914657115936e-05, -1.0708346962928772e-05, -8.315779268741608e-06, -5.923211574554443e-06, -3.530643880367279e-06, -1.1380761861801147e-06, 1.2544915080070496e-06, 3.647059202194214e-06, 6.039626896381378e-06, 8.432194590568542e-06, 1.0824762284755707e-05, 1.3217329978942871e-05, 1.5609897673130035e-05, 1.80024653673172e-05, 2.0395033061504364e-05, 2.278760075569153e-05, 2.5180168449878693e-05, 2.7572736144065857e-05, 2.996530383825302e-05, 3.2357871532440186e-05, 3.475043922662735e-05, 3.7143006920814514e-05, 3.953557461500168e-05, 4.192814230918884e-05, 4.432071000337601e-05, 4.671327769756317e-05, 4.9105845391750336e-05, 5.14984130859375e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 7.0, 8.0, 15.0, 16.0, 37.0, 49.0, 98.0, 234.0, 460.0, 1355.0, 4883.0, 39235.0, 960827.0, 34340.0, 4786.0, 1334.0, 449.0, 226.0, 80.0, 53.0, 22.0, 13.0, 9.0, 5.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.406982421875, -0.3916130065917969, -0.37624359130859375, -0.3608741760253906, -0.3455047607421875, -0.3301353454589844, -0.31476593017578125, -0.2993965148925781, -0.284027099609375, -0.2686576843261719, -0.25328826904296875, -0.23791885375976562, -0.2225494384765625, -0.20718002319335938, -0.19181060791015625, -0.17644119262695312, -0.16107177734375, -0.14570236206054688, -0.13033294677734375, -0.11496353149414062, -0.0995941162109375, -0.08422470092773438, -0.06885528564453125, -0.053485870361328125, -0.038116455078125, -0.022747039794921875, -0.00737762451171875, 0.007991790771484375, 0.0233612060546875, 0.038730621337890625, 0.05410003662109375, 0.06946945190429688, 0.0848388671875, 0.10020828247070312, 0.11557769775390625, 0.13094711303710938, 0.1463165283203125, 0.16168594360351562, 0.17705535888671875, 0.19242477416992188, 0.207794189453125, 0.22316360473632812, 0.23853302001953125, 0.2539024353027344, 0.2692718505859375, 0.2846412658691406, 0.30001068115234375, 0.3153800964355469, 0.33074951171875, 0.3461189270019531, 0.36148834228515625, 0.3768577575683594, 0.3922271728515625, 0.4075965881347656, 0.42296600341796875, 0.4383354187011719, 0.453704833984375, 0.4690742492675781, 0.48444366455078125, 0.4998130798339844, 0.5151824951171875, 0.5305519104003906, 0.5459213256835938, 0.5612907409667969, 0.57666015625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 4.0, 7.0, 9.0, 7.0, 33.0, 46.0, 71.0, 126.0, 181.0, 187.0, 128.0, 85.0, 38.0, 31.0, 12.0, 10.0, 12.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310791015625, -0.30242347717285156, -0.2940559387207031, -0.2856884002685547, -0.27732086181640625, -0.2689533233642578, -0.2605857849121094, -0.25221824645996094, -0.2438507080078125, -0.23548316955566406, -0.22711563110351562, -0.2187480926513672, -0.21038055419921875, -0.2020130157470703, -0.19364547729492188, -0.18527793884277344, -0.176910400390625, -0.16854286193847656, -0.16017532348632812, -0.1518077850341797, -0.14344024658203125, -0.1350727081298828, -0.12670516967773438, -0.11833763122558594, -0.1099700927734375, -0.10160255432128906, -0.09323501586914062, -0.08486747741699219, -0.07649993896484375, -0.06813240051269531, -0.059764862060546875, -0.05139732360839844, -0.04302978515625, -0.03466224670410156, -0.026294708251953125, -0.017927169799804688, -0.00955963134765625, -0.0011920928955078125, 0.007175445556640625, 0.015542984008789062, 0.0239105224609375, 0.03227806091308594, 0.040645599365234375, 0.04901313781738281, 0.05738067626953125, 0.06574821472167969, 0.07411575317382812, 0.08248329162597656, 0.090850830078125, 0.09921836853027344, 0.10758590698242188, 0.11595344543457031, 0.12432098388671875, 0.1326885223388672, 0.14105606079101562, 0.14942359924316406, 0.1577911376953125, 0.16615867614746094, 0.17452621459960938, 0.1828937530517578, 0.19126129150390625, 0.1996288299560547, 0.20799636840820312, 0.21636390686035156, 0.2247314453125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 7.0, 11.0, 29.0, 43.0, 109.0, 196.0, 285.0, 163.0, 91.0, 36.0, 12.0, 11.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7721872329711914, -3.652040719985962, -3.5318939685821533, -3.411747455596924, -3.2916007041931152, -3.1714541912078857, -3.0513076782226562, -2.9311609268188477, -2.811014413833618, -2.6908679008483887, -2.57072114944458, -2.4505746364593506, -2.330428123474121, -2.2102813720703125, -2.090134859085083, -1.969988226890564, -1.849841594696045, -1.7296949625015259, -1.6095483303070068, -1.4894018173217773, -1.3692551851272583, -1.2491085529327393, -1.1289620399475098, -1.0088154077529907, -0.8886687755584717, -0.7685221433639526, -0.6483755707740784, -0.5282289981842041, -0.40808236598968506, -0.287935733795166, -0.16778916120529175, -0.04764258861541748, 0.07250428199768066, 0.19265088438987732, 0.312797486782074, 0.43294408917427063, 0.5530906915664673, 0.6732373237609863, 0.7933838963508606, 0.9135304689407349, 1.033677101135254, 1.153823733329773, 1.273970365524292, 1.3941168785095215, 1.5142635107040405, 1.6344101428985596, 1.754556655883789, 1.874703288078308, 1.9948499202728271, 2.1149964332580566, 2.2351431846618652, 2.3552896976470947, 2.475436210632324, 2.595582962036133, 2.7157294750213623, 2.835875988006592, 2.9560227394104004, 3.07616925239563, 3.1963160037994385, 3.316462516784668, 3.4366092681884766, 3.556755781173706, 3.6769022941589355, 3.797049045562744, 3.9171955585479736]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 6.0, 7.0, 10.0, 12.0, 10.0, 4.0, 7.0, 18.0, 15.0, 18.0, 24.0, 32.0, 35.0, 38.0, 40.0, 33.0, 43.0, 49.0, 59.0, 48.0, 53.0, 49.0, 39.0, 33.0, 43.0, 28.0, 41.0, 23.0, 31.0, 20.0, 27.0, 16.0, 18.0, 16.0, 16.0, 5.0, 10.0, 7.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-1.0337803363800049, -1.0030534267425537, -0.972326397895813, -0.941599428653717, -0.9108724594116211, -0.8801455497741699, -0.849418580532074, -0.818691611289978, -0.7879646420478821, -0.7572376728057861, -0.7265107035636902, -0.6957837343215942, -0.6650568246841431, -0.6343297958374023, -0.6036028861999512, -0.5728759169578552, -0.5421489477157593, -0.5114219784736633, -0.4806950092315674, -0.4499680697917938, -0.4192411005496979, -0.38851413130760193, -0.35778719186782837, -0.3270602226257324, -0.2963332533836365, -0.2656062841415405, -0.23487932980060577, -0.20415237545967102, -0.17342540621757507, -0.14269843697547913, -0.11197148263454437, -0.08124452829360962, -0.05051761865615845, -0.019790656864643097, 0.010936304926872253, 0.041663266718387604, 0.07239022850990295, 0.1031171977519989, 0.13384415209293365, 0.1645711064338684, 0.19529807567596436, 0.2260250449180603, 0.25675201416015625, 0.2874789535999298, 0.31820592284202576, 0.3489328920841217, 0.37965983152389526, 0.4103868007659912, 0.44111377000808716, 0.4718407392501831, 0.502567708492279, 0.533294677734375, 0.5640215873718262, 0.5947486162185669, 0.6254755258560181, 0.656202495098114, 0.68692946434021, 0.7176564335823059, 0.7483834028244019, 0.7791103720664978, 0.8098373413085938, 0.8405642509460449, 0.8712912201881409, 0.9020181894302368, 0.9327451586723328]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 11.0, 9.0, 7.0, 14.0, 24.0, 36.0, 101.0, 236.0, 2106.0, 4190800.0, 607.0, 183.0, 54.0, 29.0, 17.0, 12.0, 11.0, 8.0, 6.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.51171875, -2.4315185546875, -2.351318359375, -2.2711181640625, -2.19091796875, -2.1107177734375, -2.030517578125, -1.9503173828125, -1.8701171875, -1.7899169921875, -1.709716796875, -1.6295166015625, -1.54931640625, -1.4691162109375, -1.388916015625, -1.3087158203125, -1.228515625, -1.1483154296875, -1.068115234375, -0.9879150390625, -0.90771484375, -0.8275146484375, -0.747314453125, -0.6671142578125, -0.5869140625, -0.5067138671875, -0.426513671875, -0.3463134765625, -0.26611328125, -0.1859130859375, -0.105712890625, -0.0255126953125, 0.0546875, 0.1348876953125, 0.215087890625, 0.2952880859375, 0.37548828125, 0.4556884765625, 0.535888671875, 0.6160888671875, 0.6962890625, 0.7764892578125, 0.856689453125, 0.9368896484375, 1.01708984375, 1.0972900390625, 1.177490234375, 1.2576904296875, 1.337890625, 1.4180908203125, 1.498291015625, 1.5784912109375, 1.65869140625, 1.7388916015625, 1.819091796875, 1.8992919921875, 1.9794921875, 2.0596923828125, 2.139892578125, 2.2200927734375, 2.30029296875, 2.3804931640625, 2.460693359375, 2.5408935546875, 2.62109375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 13.0, 18.0, 28.0, 51.0, 63.0, 119.0, 128.0, 156.0, 139.0, 102.0, 68.0, 47.0, 36.0, 16.0, 7.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1400146484375, -0.1355571746826172, -0.13109970092773438, -0.12664222717285156, -0.12218475341796875, -0.11772727966308594, -0.11326980590820312, -0.10881233215332031, -0.1043548583984375, -0.09989738464355469, -0.09543991088867188, -0.09098243713378906, -0.08652496337890625, -0.08206748962402344, -0.07761001586914062, -0.07315254211425781, -0.068695068359375, -0.06423759460449219, -0.059780120849609375, -0.05532264709472656, -0.05086517333984375, -0.04640769958496094, -0.041950225830078125, -0.03749275207519531, -0.0330352783203125, -0.028577804565429688, -0.024120330810546875, -0.019662857055664062, -0.01520538330078125, -0.010747909545898438, -0.006290435791015625, -0.0018329620361328125, 0.00262451171875, 0.0070819854736328125, 0.011539459228515625, 0.015996932983398438, 0.02045440673828125, 0.024911880493164062, 0.029369354248046875, 0.03382682800292969, 0.0382843017578125, 0.04274177551269531, 0.047199249267578125, 0.05165672302246094, 0.05611419677734375, 0.06057167053222656, 0.06502914428710938, 0.06948661804199219, 0.073944091796875, 0.07840156555175781, 0.08285903930664062, 0.08731651306152344, 0.09177398681640625, 0.09623146057128906, 0.10068893432617188, 0.10514640808105469, 0.1096038818359375, 0.11406135559082031, 0.11851882934570312, 0.12297630310058594, 0.12743377685546875, 0.13189125061035156, 0.13634872436523438, 0.1408061981201172, 0.145263671875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 10.0, 10.0, 18.0, 33.0, 45.0, 55.0, 112.0, 229.0, 689.0, 4017.0, 108100.0, 4031450.0, 45539.0, 2519.0, 647.0, 257.0, 151.0, 86.0, 85.0, 29.0, 52.0, 29.0, 21.0, 15.0, 19.0, 13.0, 14.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.426025390625, -0.41201019287109375, -0.3979949951171875, -0.38397979736328125, -0.369964599609375, -0.35594940185546875, -0.3419342041015625, -0.32791900634765625, -0.31390380859375, -0.29988861083984375, -0.2858734130859375, -0.27185821533203125, -0.257843017578125, -0.24382781982421875, -0.2298126220703125, -0.21579742431640625, -0.2017822265625, -0.18776702880859375, -0.1737518310546875, -0.15973663330078125, -0.145721435546875, -0.13170623779296875, -0.1176910400390625, -0.10367584228515625, -0.08966064453125, -0.07564544677734375, -0.0616302490234375, -0.04761505126953125, -0.033599853515625, -0.01958465576171875, -0.0055694580078125, 0.00844573974609375, 0.0224609375, 0.03647613525390625, 0.0504913330078125, 0.06450653076171875, 0.078521728515625, 0.09253692626953125, 0.1065521240234375, 0.12056732177734375, 0.13458251953125, 0.14859771728515625, 0.1626129150390625, 0.17662811279296875, 0.190643310546875, 0.20465850830078125, 0.2186737060546875, 0.23268890380859375, 0.2467041015625, 0.26071929931640625, 0.2747344970703125, 0.28874969482421875, 0.302764892578125, 0.31678009033203125, 0.3307952880859375, 0.34481048583984375, 0.35882568359375, 0.37284088134765625, 0.3868560791015625, 0.40087127685546875, 0.414886474609375, 0.42890167236328125, 0.4429168701171875, 0.45693206787109375, 0.470947265625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 1.0, 3.0, 4.0, 6.0, 20.0, 26.0, 71.0, 152.0, 390.0, 1481.0, 1281.0, 362.0, 144.0, 77.0, 28.0, 15.0, 15.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1461181640625, -0.1348094940185547, -0.12350082397460938, -0.11219215393066406, -0.10088348388671875, -0.08957481384277344, -0.07826614379882812, -0.06695747375488281, -0.0556488037109375, -0.04434013366699219, -0.033031463623046875, -0.021722793579101562, -0.01041412353515625, 0.0008945465087890625, 0.012203216552734375, 0.023511886596679688, 0.034820556640625, 0.04612922668457031, 0.057437896728515625, 0.06874656677246094, 0.08005523681640625, 0.09136390686035156, 0.10267257690429688, 0.11398124694824219, 0.1252899169921875, 0.1365985870361328, 0.14790725708007812, 0.15921592712402344, 0.17052459716796875, 0.18183326721191406, 0.19314193725585938, 0.2044506072998047, 0.21575927734375, 0.2270679473876953, 0.23837661743164062, 0.24968528747558594, 0.26099395751953125, 0.27230262756347656, 0.2836112976074219, 0.2949199676513672, 0.3062286376953125, 0.3175373077392578, 0.3288459777832031, 0.34015464782714844, 0.35146331787109375, 0.36277198791503906, 0.3740806579589844, 0.3853893280029297, 0.396697998046875, 0.4080066680908203, 0.4193153381347656, 0.43062400817871094, 0.44193267822265625, 0.45324134826660156, 0.4645500183105469, 0.4758586883544922, 0.4871673583984375, 0.4984760284423828, 0.5097846984863281, 0.5210933685302734, 0.5324020385742188, 0.5437107086181641, 0.5550193786621094, 0.5663280487060547, 0.57763671875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 1.0, 5.0, 15.0, 14.0, 20.0, 45.0, 59.0, 104.0, 141.0, 140.0, 127.0, 89.0, 57.0, 44.0, 33.0, 21.0, 18.0, 10.0, 13.0, 4.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.461466908454895, -1.4091870784759521, -1.3569073677062988, -1.304627537727356, -1.252347707748413, -1.2000679969787598, -1.147788166999817, -1.095508337020874, -1.0432285070419312, -0.9909487366676331, -0.9386689066886902, -0.8863891363143921, -0.8341093063354492, -0.7818295359611511, -0.729549765586853, -0.6772699356079102, -0.6249901652336121, -0.572710394859314, -0.5204305648803711, -0.468150794506073, -0.4158709645271301, -0.36359119415283203, -0.31131139397621155, -0.25903159379959106, -0.20675179362297058, -0.1544719934463501, -0.10219220072031021, -0.049912407994270325, 0.0023673921823501587, 0.05464717745780945, 0.10692697763442993, 0.15920677781105042, 0.2114865779876709, 0.2637663781642914, 0.31604617834091187, 0.36832594871520996, 0.42060577869415283, 0.4728855490684509, 0.525165319442749, 0.5774451494216919, 0.6297249794006348, 0.6820047497749329, 0.7342845797538757, 0.7865643501281738, 0.8388441801071167, 0.8911239504814148, 0.9434037208557129, 0.9956835508346558, 1.0479633808135986, 1.1002432107925415, 1.1525229215621948, 1.2048027515411377, 1.2570825815200806, 1.3093624114990234, 1.3616421222686768, 1.4139219522476196, 1.466201663017273, 1.5184814929962158, 1.5707612037658691, 1.623041033744812, 1.6753208637237549, 1.7276005744934082, 1.779880404472351, 1.832160234451294, 1.8844400644302368]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 4.0, 3.0, 6.0, 7.0, 3.0, 6.0, 14.0, 12.0, 13.0, 20.0, 11.0, 25.0, 28.0, 35.0, 22.0, 28.0, 34.0, 40.0, 42.0, 44.0, 50.0, 52.0, 50.0, 51.0, 35.0, 50.0, 52.0, 29.0, 26.0, 36.0, 27.0, 33.0, 21.0, 12.0, 20.0, 13.0, 4.0, 14.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2019305229187012, -1.1654633283615112, -1.1289961338043213, -1.0925289392471313, -1.0560617446899414, -1.0195945501327515, -0.9831272959709167, -0.9466601014137268, -0.9101929068565369, -0.8737257122993469, -0.837258517742157, -0.800791323184967, -0.7643240690231323, -0.7278568744659424, -0.6913896799087524, -0.6549224853515625, -0.6184552907943726, -0.5819880962371826, -0.5455209016799927, -0.5090537071228027, -0.4725864827632904, -0.43611928820610046, -0.39965206384658813, -0.3631848692893982, -0.32671767473220825, -0.2902504801750183, -0.25378328561782837, -0.21731606125831604, -0.1808488667011261, -0.14438167214393616, -0.10791446268558502, -0.07144725322723389, -0.034980177879333496, 0.0014870241284370422, 0.03795422613620758, 0.07442142814397812, 0.11088863015174866, 0.1473558247089386, 0.18382303416728973, 0.22029024362564087, 0.2567574381828308, 0.29322463274002075, 0.3296918272972107, 0.366159051656723, 0.40262624621391296, 0.4390934407711029, 0.47556066513061523, 0.5120278596878052, 0.5484950542449951, 0.5849622488021851, 0.621429443359375, 0.6578966379165649, 0.6943638324737549, 0.7308310270309448, 0.7672982811927795, 0.8037654757499695, 0.8402326703071594, 0.8766998648643494, 0.9131670594215393, 0.9496342539787292, 0.986101508140564, 1.022568702697754, 1.0590358972549438, 1.0955030918121338, 1.1319702863693237]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 9.0, 10.0, 14.0, 16.0, 28.0, 47.0, 46.0, 70.0, 87.0, 107.0, 204.0, 288.0, 513.0, 811.0, 1432.0, 2682.0, 5218.0, 11152.0, 24931.0, 60498.0, 152645.0, 319301.0, 269521.0, 114945.0, 45828.0, 19387.0, 8851.0, 4419.0, 2283.0, 1261.0, 722.0, 416.0, 257.0, 148.0, 113.0, 76.0, 55.0, 41.0, 29.0, 28.0, 12.0, 17.0, 9.0, 3.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1533203125, -0.14850616455078125, -0.1436920166015625, -0.13887786865234375, -0.134063720703125, -0.12924957275390625, -0.1244354248046875, -0.11962127685546875, -0.11480712890625, -0.10999298095703125, -0.1051788330078125, -0.10036468505859375, -0.095550537109375, -0.09073638916015625, -0.0859222412109375, -0.08110809326171875, -0.0762939453125, -0.07147979736328125, -0.0666656494140625, -0.06185150146484375, -0.057037353515625, -0.05222320556640625, -0.0474090576171875, -0.04259490966796875, -0.03778076171875, -0.03296661376953125, -0.0281524658203125, -0.02333831787109375, -0.018524169921875, -0.01371002197265625, -0.0088958740234375, -0.00408172607421875, 0.000732421875, 0.00554656982421875, 0.0103607177734375, 0.01517486572265625, 0.019989013671875, 0.02480316162109375, 0.0296173095703125, 0.03443145751953125, 0.03924560546875, 0.04405975341796875, 0.0488739013671875, 0.05368804931640625, 0.058502197265625, 0.06331634521484375, 0.0681304931640625, 0.07294464111328125, 0.0777587890625, 0.08257293701171875, 0.0873870849609375, 0.09220123291015625, 0.097015380859375, 0.10182952880859375, 0.1066436767578125, 0.11145782470703125, 0.11627197265625, 0.12108612060546875, 0.1259002685546875, 0.13071441650390625, 0.135528564453125, 0.14034271240234375, 0.1451568603515625, 0.14997100830078125, 0.15478515625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 11.0, 20.0, 35.0, 45.0, 53.0, 76.0, 111.0, 140.0, 112.0, 127.0, 96.0, 56.0, 41.0, 31.0, 20.0, 6.0, 8.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13427734375, -0.1300678253173828, -0.12585830688476562, -0.12164878845214844, -0.11743927001953125, -0.11322975158691406, -0.10902023315429688, -0.10481071472167969, -0.1006011962890625, -0.09639167785644531, -0.09218215942382812, -0.08797264099121094, -0.08376312255859375, -0.07955360412597656, -0.07534408569335938, -0.07113456726074219, -0.066925048828125, -0.06271553039550781, -0.058506011962890625, -0.05429649353027344, -0.05008697509765625, -0.04587745666503906, -0.041667938232421875, -0.03745841979980469, -0.0332489013671875, -0.029039382934570312, -0.024829864501953125, -0.020620346069335938, -0.01641082763671875, -0.012201309204101562, -0.007991790771484375, -0.0037822723388671875, 0.00042724609375, 0.0046367645263671875, 0.008846282958984375, 0.013055801391601562, 0.01726531982421875, 0.021474838256835938, 0.025684356689453125, 0.029893875122070312, 0.0341033935546875, 0.03831291198730469, 0.042522430419921875, 0.04673194885253906, 0.05094146728515625, 0.05515098571777344, 0.059360504150390625, 0.06357002258300781, 0.067779541015625, 0.07198905944824219, 0.07619857788085938, 0.08040809631347656, 0.08461761474609375, 0.08882713317871094, 0.09303665161132812, 0.09724617004394531, 0.1014556884765625, 0.10566520690917969, 0.10987472534179688, 0.11408424377441406, 0.11829376220703125, 0.12250328063964844, 0.12671279907226562, 0.1309223175048828, 0.1351318359375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 1.0, 11.0, 2.0, 6.0, 14.0, 19.0, 23.0, 36.0, 56.0, 94.0, 116.0, 178.0, 319.0, 549.0, 1052.0, 2226.0, 5176.0, 15913.0, 66829.0, 515333.0, 358760.0, 58348.0, 14285.0, 4859.0, 2034.0, 1000.0, 514.0, 283.0, 182.0, 118.0, 70.0, 42.0, 27.0, 24.0, 16.0, 16.0, 9.0, 8.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.289306640625, -0.2793159484863281, -0.26932525634765625, -0.2593345642089844, -0.2493438720703125, -0.23935317993164062, -0.22936248779296875, -0.21937179565429688, -0.209381103515625, -0.19939041137695312, -0.18939971923828125, -0.17940902709960938, -0.1694183349609375, -0.15942764282226562, -0.14943695068359375, -0.13944625854492188, -0.12945556640625, -0.11946487426757812, -0.10947418212890625, -0.09948348999023438, -0.0894927978515625, -0.07950210571289062, -0.06951141357421875, -0.059520721435546875, -0.049530029296875, -0.039539337158203125, -0.02954864501953125, -0.019557952880859375, -0.0095672607421875, 0.000423431396484375, 0.01041412353515625, 0.020404815673828125, 0.0303955078125, 0.040386199951171875, 0.05037689208984375, 0.060367584228515625, 0.0703582763671875, 0.08034896850585938, 0.09033966064453125, 0.10033035278320312, 0.110321044921875, 0.12031173706054688, 0.13030242919921875, 0.14029312133789062, 0.1502838134765625, 0.16027450561523438, 0.17026519775390625, 0.18025588989257812, 0.19024658203125, 0.20023727416992188, 0.21022796630859375, 0.22021865844726562, 0.2302093505859375, 0.24020004272460938, 0.25019073486328125, 0.2601814270019531, 0.270172119140625, 0.2801628112792969, 0.29015350341796875, 0.3001441955566406, 0.3101348876953125, 0.3201255798339844, 0.33011627197265625, 0.3401069641113281, 0.35009765625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 2.0, 4.0, 4.0, 8.0, 7.0, 9.0, 17.0, 9.0, 15.0, 20.0, 25.0, 20.0, 32.0, 52.0, 43.0, 43.0, 44.0, 50.0, 70.0, 60.0, 54.0, 53.0, 55.0, 49.0, 40.0, 29.0, 39.0, 24.0, 21.0, 19.0, 20.0, 12.0, 14.0, 10.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3466796875, -0.33489227294921875, -0.3231048583984375, -0.31131744384765625, -0.299530029296875, -0.28774261474609375, -0.2759552001953125, -0.26416778564453125, -0.25238037109375, -0.24059295654296875, -0.2288055419921875, -0.21701812744140625, -0.205230712890625, -0.19344329833984375, -0.1816558837890625, -0.16986846923828125, -0.1580810546875, -0.14629364013671875, -0.1345062255859375, -0.12271881103515625, -0.110931396484375, -0.09914398193359375, -0.0873565673828125, -0.07556915283203125, -0.06378173828125, -0.05199432373046875, -0.0402069091796875, -0.02841949462890625, -0.016632080078125, -0.00484466552734375, 0.0069427490234375, 0.01873016357421875, 0.030517578125, 0.04230499267578125, 0.0540924072265625, 0.06587982177734375, 0.077667236328125, 0.08945465087890625, 0.1012420654296875, 0.11302947998046875, 0.12481689453125, 0.13660430908203125, 0.1483917236328125, 0.16017913818359375, 0.171966552734375, 0.18375396728515625, 0.1955413818359375, 0.20732879638671875, 0.2191162109375, 0.23090362548828125, 0.2426910400390625, 0.25447845458984375, 0.266265869140625, 0.27805328369140625, 0.2898406982421875, 0.30162811279296875, 0.31341552734375, 0.32520294189453125, 0.3369903564453125, 0.34877777099609375, 0.360565185546875, 0.37235260009765625, 0.3841400146484375, 0.39592742919921875, 0.40771484375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 13.0, 13.0, 19.0, 41.0, 67.0, 103.0, 157.0, 303.0, 644.0, 1207.0, 2473.0, 5985.0, 18014.0, 158104.0, 808167.0, 36990.0, 9192.0, 3596.0, 1722.0, 791.0, 398.0, 234.0, 134.0, 66.0, 34.0, 22.0, 20.0, 12.0, 9.0, 10.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.6455078125, -0.6286201477050781, -0.6117324829101562, -0.5948448181152344, -0.5779571533203125, -0.5610694885253906, -0.5441818237304688, -0.5272941589355469, -0.510406494140625, -0.4935188293457031, -0.47663116455078125, -0.4597434997558594, -0.4428558349609375, -0.4259681701660156, -0.40908050537109375, -0.3921928405761719, -0.37530517578125, -0.3584175109863281, -0.34152984619140625, -0.3246421813964844, -0.3077545166015625, -0.2908668518066406, -0.27397918701171875, -0.2570915222167969, -0.240203857421875, -0.22331619262695312, -0.20642852783203125, -0.18954086303710938, -0.1726531982421875, -0.15576553344726562, -0.13887786865234375, -0.12199020385742188, -0.1051025390625, -0.08821487426757812, -0.07132720947265625, -0.054439544677734375, -0.0375518798828125, -0.020664215087890625, -0.00377655029296875, 0.013111114501953125, 0.029998779296875, 0.046886444091796875, 0.06377410888671875, 0.08066177368164062, 0.0975494384765625, 0.11443710327148438, 0.13132476806640625, 0.14821243286132812, 0.16510009765625, 0.18198776245117188, 0.19887542724609375, 0.21576309204101562, 0.2326507568359375, 0.24953842163085938, 0.26642608642578125, 0.2833137512207031, 0.300201416015625, 0.3170890808105469, 0.33397674560546875, 0.3508644104003906, 0.3677520751953125, 0.3846397399902344, 0.40152740478515625, 0.4184150695800781, 0.435302734375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 12.0, 5.0, 8.0, 15.0, 21.0, 27.0, 42.0, 96.0, 155.0, 231.0, 167.0, 76.0, 45.0, 28.0, 17.0, 10.0, 12.0, 5.0, 7.0, 4.0, 3.0, 6.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0001195669174194336, -0.00011619646102190018, -0.00011282600462436676, -0.00010945554822683334, -0.00010608509182929993, -0.00010271463543176651, -9.93441790342331e-05, -9.597372263669968e-05, -9.260326623916626e-05, -8.923280984163284e-05, -8.586235344409943e-05, -8.249189704656601e-05, -7.912144064903259e-05, -7.575098425149918e-05, -7.238052785396576e-05, -6.901007145643234e-05, -6.563961505889893e-05, -6.226915866136551e-05, -5.889870226383209e-05, -5.5528245866298676e-05, -5.215778946876526e-05, -4.878733307123184e-05, -4.5416876673698425e-05, -4.204642027616501e-05, -3.867596387863159e-05, -3.5305507481098175e-05, -3.193505108356476e-05, -2.856459468603134e-05, -2.5194138288497925e-05, -2.1823681890964508e-05, -1.845322549343109e-05, -1.5082769095897675e-05, -1.1712312698364258e-05, -8.341856300830841e-06, -4.971399903297424e-06, -1.6009435057640076e-06, 1.7695128917694092e-06, 5.139969289302826e-06, 8.510425686836243e-06, 1.188088208436966e-05, 1.5251338481903076e-05, 1.8621794879436493e-05, 2.199225127696991e-05, 2.5362707674503326e-05, 2.8733164072036743e-05, 3.210362046957016e-05, 3.547407686710358e-05, 3.8844533264636993e-05, 4.221498966217041e-05, 4.558544605970383e-05, 4.8955902457237244e-05, 5.232635885477066e-05, 5.569681525230408e-05, 5.9067271649837494e-05, 6.243772804737091e-05, 6.580818444490433e-05, 6.917864084243774e-05, 7.254909723997116e-05, 7.591955363750458e-05, 7.9290010035038e-05, 8.266046643257141e-05, 8.603092283010483e-05, 8.940137922763824e-05, 9.277183562517166e-05, 9.614229202270508e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 6.0, 13.0, 7.0, 11.0, 17.0, 16.0, 40.0, 45.0, 59.0, 96.0, 143.0, 190.0, 302.0, 435.0, 765.0, 1168.0, 2007.0, 3988.0, 8768.0, 25213.0, 188917.0, 739306.0, 51052.0, 13401.0, 5701.0, 2776.0, 1487.0, 901.0, 611.0, 328.0, 248.0, 155.0, 119.0, 81.0, 50.0, 40.0, 16.0, 19.0, 9.0, 12.0, 10.0, 6.0, 12.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.34619140625, -0.33510589599609375, -0.3240203857421875, -0.31293487548828125, -0.301849365234375, -0.29076385498046875, -0.2796783447265625, -0.26859283447265625, -0.25750732421875, -0.24642181396484375, -0.2353363037109375, -0.22425079345703125, -0.213165283203125, -0.20207977294921875, -0.1909942626953125, -0.17990875244140625, -0.1688232421875, -0.15773773193359375, -0.1466522216796875, -0.13556671142578125, -0.124481201171875, -0.11339569091796875, -0.1023101806640625, -0.09122467041015625, -0.08013916015625, -0.06905364990234375, -0.0579681396484375, -0.04688262939453125, -0.035797119140625, -0.02471160888671875, -0.0136260986328125, -0.00254058837890625, 0.008544921875, 0.01963043212890625, 0.0307159423828125, 0.04180145263671875, 0.052886962890625, 0.06397247314453125, 0.0750579833984375, 0.08614349365234375, 0.09722900390625, 0.10831451416015625, 0.1194000244140625, 0.13048553466796875, 0.141571044921875, 0.15265655517578125, 0.1637420654296875, 0.17482757568359375, 0.1859130859375, 0.19699859619140625, 0.2080841064453125, 0.21916961669921875, 0.230255126953125, 0.24134063720703125, 0.2524261474609375, 0.26351165771484375, 0.27459716796875, 0.28568267822265625, 0.2967681884765625, 0.30785369873046875, 0.318939208984375, 0.33002471923828125, 0.3411102294921875, 0.35219573974609375, 0.36328125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 10.0, 11.0, 25.0, 69.0, 85.0, 170.0, 191.0, 182.0, 90.0, 50.0, 29.0, 11.0, 12.0, 7.0, 8.0, 8.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.478271484375, -0.4621162414550781, -0.44596099853515625, -0.4298057556152344, -0.4136505126953125, -0.3974952697753906, -0.38134002685546875, -0.3651847839355469, -0.349029541015625, -0.3328742980957031, -0.31671905517578125, -0.3005638122558594, -0.2844085693359375, -0.2682533264160156, -0.25209808349609375, -0.23594284057617188, -0.21978759765625, -0.20363235473632812, -0.18747711181640625, -0.17132186889648438, -0.1551666259765625, -0.13901138305664062, -0.12285614013671875, -0.10670089721679688, -0.090545654296875, -0.07439041137695312, -0.05823516845703125, -0.042079925537109375, -0.0259246826171875, -0.009769439697265625, 0.00638580322265625, 0.022541046142578125, 0.0386962890625, 0.054851531982421875, 0.07100677490234375, 0.08716201782226562, 0.1033172607421875, 0.11947250366210938, 0.13562774658203125, 0.15178298950195312, 0.167938232421875, 0.18409347534179688, 0.20024871826171875, 0.21640396118164062, 0.2325592041015625, 0.24871444702148438, 0.26486968994140625, 0.2810249328613281, 0.29718017578125, 0.3133354187011719, 0.32949066162109375, 0.3456459045410156, 0.3618011474609375, 0.3779563903808594, 0.39411163330078125, 0.4102668762207031, 0.426422119140625, 0.4425773620605469, 0.45873260498046875, 0.4748878479003906, 0.4910430908203125, 0.5071983337402344, 0.5233535766601562, 0.5395088195800781, 0.5556640625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 10.0, 12.0, 18.0, 29.0, 85.0, 197.0, 359.0, 159.0, 73.0, 30.0, 11.0, 3.0, 6.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.622251033782959, -3.3521265983581543, -3.0820019245147705, -2.811877489089966, -2.541752815246582, -2.2716283798217773, -2.0015039443969727, -1.7313793897628784, -1.4612548351287842, -1.19113028049469, -0.9210057854652405, -0.650881290435791, -0.3807567358016968, -0.11063218116760254, 0.15949225425720215, 0.4296168088912964, 0.6997413635253906, 0.9698659181594849, 1.239990472793579, 1.5101149082183838, 1.780239462852478, 2.0503640174865723, 2.320488452911377, 2.5906128883361816, 2.8607375621795654, 3.13086199760437, 3.400986671447754, 3.6711111068725586, 3.9412355422973633, 4.211359977722168, 4.481484413146973, 4.7516093254089355, 5.021734237670898, 5.291858673095703, 5.561983108520508, 5.8321075439453125, 6.102232456207275, 6.37235689163208, 6.642481327056885, 6.9126057624816895, 7.182730674743652, 7.452855110168457, 7.722979545593262, 7.993103981018066, 8.263228416442871, 8.533353805541992, 8.803478240966797, 9.073602676391602, 9.343727111816406, 9.613851547241211, 9.883975982666016, 10.15410041809082, 10.424224853515625, 10.69434928894043, 10.964473724365234, 11.234599113464355, 11.504722595214844, 11.774847030639648, 12.044971466064453, 12.315095901489258, 12.585220336914062, 12.855344772338867, 13.125469207763672, 13.395594596862793, 13.665719032287598]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 3.0, 4.0, 8.0, 5.0, 5.0, 9.0, 9.0, 14.0, 17.0, 17.0, 17.0, 9.0, 22.0, 25.0, 25.0, 35.0, 26.0, 45.0, 49.0, 62.0, 52.0, 57.0, 51.0, 46.0, 35.0, 38.0, 32.0, 27.0, 35.0, 34.0, 25.0, 17.0, 23.0, 23.0, 14.0, 19.0, 14.0, 10.0, 8.0, 7.0, 9.0, 6.0, 7.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0789895057678223, -2.0096607208251953, -1.940332055091858, -1.8710033893585205, -1.8016746044158936, -1.7323458194732666, -1.6630171537399292, -1.5936884880065918, -1.5243597030639648, -1.455030918121338, -1.3857022523880005, -1.316373586654663, -1.2470448017120361, -1.1777160167694092, -1.1083873510360718, -1.0390586853027344, -0.9697299003601074, -0.9004011750221252, -0.8310724496841431, -0.7617437243461609, -0.6924149990081787, -0.6230862736701965, -0.5537575483322144, -0.4844288229942322, -0.41510009765625, -0.3457713723182678, -0.27644264698028564, -0.20711392164230347, -0.1377851963043213, -0.06845647096633911, 0.0008722543716430664, 0.07020097970962524, 0.13952970504760742, 0.2088584303855896, 0.2781871557235718, 0.34751588106155396, 0.41684460639953613, 0.4861733317375183, 0.5555020570755005, 0.6248307824134827, 0.6941595077514648, 0.763488233089447, 0.8328169584274292, 0.9021456837654114, 0.9714744091033936, 1.0408031940460205, 1.110131859779358, 1.1794605255126953, 1.2487893104553223, 1.3181180953979492, 1.3874467611312866, 1.456775426864624, 1.526104211807251, 1.595432996749878, 1.6647616624832153, 1.7340903282165527, 1.8034191131591797, 1.8727478981018066, 1.942076563835144, 2.0114052295684814, 2.0807340145111084, 2.1500627994537354, 2.219391345977783, 2.28872013092041, 2.358048915863037]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 4.0, 8.0, 7.0, 17.0, 37.0, 55.0, 60.0, 64.0, 98.0, 144.0, 274.0, 560.0, 2193.0, 35202.0, 4103272.0, 48507.0, 2442.0, 566.0, 253.0, 143.0, 104.0, 73.0, 61.0, 40.0, 33.0, 18.0, 18.0, 4.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6826171875, -0.6616363525390625, -0.640655517578125, -0.6196746826171875, -0.59869384765625, -0.5777130126953125, -0.556732177734375, -0.5357513427734375, -0.5147705078125, -0.4937896728515625, -0.472808837890625, -0.4518280029296875, -0.43084716796875, -0.4098663330078125, -0.388885498046875, -0.3679046630859375, -0.346923828125, -0.3259429931640625, -0.304962158203125, -0.2839813232421875, -0.26300048828125, -0.2420196533203125, -0.221038818359375, -0.2000579833984375, -0.1790771484375, -0.1580963134765625, -0.137115478515625, -0.1161346435546875, -0.09515380859375, -0.0741729736328125, -0.053192138671875, -0.0322113037109375, -0.01123046875, 0.0097503662109375, 0.030731201171875, 0.0517120361328125, 0.07269287109375, 0.0936737060546875, 0.114654541015625, 0.1356353759765625, 0.1566162109375, 0.1775970458984375, 0.198577880859375, 0.2195587158203125, 0.24053955078125, 0.2615203857421875, 0.282501220703125, 0.3034820556640625, 0.324462890625, 0.3454437255859375, 0.366424560546875, 0.3874053955078125, 0.40838623046875, 0.4293670654296875, 0.450347900390625, 0.4713287353515625, 0.4923095703125, 0.5132904052734375, 0.534271240234375, 0.5552520751953125, 0.57623291015625, 0.5972137451171875, 0.618194580078125, 0.6391754150390625, 0.66015625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 13.0, 14.0, 29.0, 29.0, 50.0, 51.0, 78.0, 92.0, 100.0, 112.0, 90.0, 89.0, 73.0, 45.0, 52.0, 33.0, 21.0, 4.0, 8.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1373291015625, -0.13319969177246094, -0.12907028198242188, -0.12494087219238281, -0.12081146240234375, -0.11668205261230469, -0.11255264282226562, -0.10842323303222656, -0.1042938232421875, -0.10016441345214844, -0.09603500366210938, -0.09190559387207031, -0.08777618408203125, -0.08364677429199219, -0.07951736450195312, -0.07538795471191406, -0.071258544921875, -0.06712913513183594, -0.06299972534179688, -0.05887031555175781, -0.05474090576171875, -0.05061149597167969, -0.046482086181640625, -0.04235267639160156, -0.0382232666015625, -0.03409385681152344, -0.029964447021484375, -0.025835037231445312, -0.02170562744140625, -0.017576217651367188, -0.013446807861328125, -0.009317398071289062, -0.00518798828125, -0.0010585784912109375, 0.003070831298828125, 0.0072002410888671875, 0.01132965087890625, 0.015459060668945312, 0.019588470458984375, 0.023717880249023438, 0.0278472900390625, 0.03197669982910156, 0.036106109619140625, 0.04023551940917969, 0.04436492919921875, 0.04849433898925781, 0.052623748779296875, 0.05675315856933594, 0.060882568359375, 0.06501197814941406, 0.06914138793945312, 0.07327079772949219, 0.07740020751953125, 0.08152961730957031, 0.08565902709960938, 0.08978843688964844, 0.0939178466796875, 0.09804725646972656, 0.10217666625976562, 0.10630607604980469, 0.11043548583984375, 0.11456489562988281, 0.11869430541992188, 0.12282371520996094, 0.126953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 10.0, 11.0, 9.0, 21.0, 28.0, 44.0, 41.0, 67.0, 69.0, 95.0, 124.0, 205.0, 348.0, 540.0, 960.0, 2665.0, 14976.0, 491157.0, 3637708.0, 37362.0, 4519.0, 1363.0, 642.0, 409.0, 252.0, 187.0, 156.0, 118.0, 55.0, 47.0, 31.0, 23.0, 14.0, 10.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48388671875, -0.4678497314453125, -0.451812744140625, -0.4357757568359375, -0.41973876953125, -0.4037017822265625, -0.387664794921875, -0.3716278076171875, -0.3555908203125, -0.3395538330078125, -0.323516845703125, -0.3074798583984375, -0.29144287109375, -0.2754058837890625, -0.259368896484375, -0.2433319091796875, -0.227294921875, -0.2112579345703125, -0.195220947265625, -0.1791839599609375, -0.16314697265625, -0.1471099853515625, -0.131072998046875, -0.1150360107421875, -0.0989990234375, -0.0829620361328125, -0.066925048828125, -0.0508880615234375, -0.03485107421875, -0.0188140869140625, -0.002777099609375, 0.0132598876953125, 0.029296875, 0.0453338623046875, 0.061370849609375, 0.0774078369140625, 0.09344482421875, 0.1094818115234375, 0.125518798828125, 0.1415557861328125, 0.1575927734375, 0.1736297607421875, 0.189666748046875, 0.2057037353515625, 0.22174072265625, 0.2377777099609375, 0.253814697265625, 0.2698516845703125, 0.285888671875, 0.3019256591796875, 0.317962646484375, 0.3339996337890625, 0.35003662109375, 0.3660736083984375, 0.382110595703125, 0.3981475830078125, 0.4141845703125, 0.4302215576171875, 0.446258544921875, 0.4622955322265625, 0.47833251953125, 0.4943695068359375, 0.510406494140625, 0.5264434814453125, 0.54248046875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 19.0, 29.0, 98.0, 320.0, 1901.0, 1340.0, 227.0, 71.0, 39.0, 15.0, 10.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.98193359375, -0.957916259765625, -0.93389892578125, -0.909881591796875, -0.8858642578125, -0.861846923828125, -0.83782958984375, -0.813812255859375, -0.789794921875, -0.765777587890625, -0.74176025390625, -0.717742919921875, -0.6937255859375, -0.669708251953125, -0.64569091796875, -0.621673583984375, -0.59765625, -0.573638916015625, -0.54962158203125, -0.525604248046875, -0.5015869140625, -0.477569580078125, -0.45355224609375, -0.429534912109375, -0.405517578125, -0.381500244140625, -0.35748291015625, -0.333465576171875, -0.3094482421875, -0.285430908203125, -0.26141357421875, -0.237396240234375, -0.21337890625, -0.189361572265625, -0.16534423828125, -0.141326904296875, -0.1173095703125, -0.093292236328125, -0.06927490234375, -0.045257568359375, -0.021240234375, 0.002777099609375, 0.02679443359375, 0.050811767578125, 0.0748291015625, 0.098846435546875, 0.12286376953125, 0.146881103515625, 0.1708984375, 0.194915771484375, 0.21893310546875, 0.242950439453125, 0.2669677734375, 0.290985107421875, 0.31500244140625, 0.339019775390625, 0.363037109375, 0.387054443359375, 0.41107177734375, 0.435089111328125, 0.4591064453125, 0.483123779296875, 0.50714111328125, 0.531158447265625, 0.55517578125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 3.0, 13.0, 25.0, 36.0, 75.0, 152.0, 229.0, 209.0, 121.0, 59.0, 29.0, 13.0, 16.0, 10.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.38411283493042, -5.266946315765381, -5.149779796600342, -5.032613277435303, -4.915446758270264, -4.798280239105225, -4.6811137199401855, -4.5639472007751465, -4.446780681610107, -4.329614162445068, -4.212447643280029, -4.09528112411499, -3.978114604949951, -3.860948085784912, -3.743781566619873, -3.626615047454834, -3.509448289871216, -3.3922817707061768, -3.2751152515411377, -3.1579487323760986, -3.0407822132110596, -2.9236156940460205, -2.8064489364624023, -2.6892824172973633, -2.572115898132324, -2.454949378967285, -2.337782859802246, -2.220616340637207, -2.103449821472168, -1.986283302307129, -1.8691166639328003, -1.7519501447677612, -1.6347835063934326, -1.5176169872283936, -1.4004504680633545, -1.2832839488983154, -1.1661174297332764, -1.0489509105682373, -0.9317842721939087, -0.8146177530288696, -0.6974512338638306, -0.5802847146987915, -0.46311816573143005, -0.3459516167640686, -0.22878509759902954, -0.11161857843399048, 0.005548000335693359, 0.12271451950073242, 0.23988103866577148, 0.35704755783081055, 0.474214106798172, 0.5913806557655334, 0.7085471749305725, 0.8257136940956116, 0.9428802728652954, 1.0600467920303345, 1.1772133111953735, 1.2943798303604126, 1.4115463495254517, 1.5287129878997803, 1.6458795070648193, 1.7630460262298584, 1.8802125453948975, 1.9973790645599365, 2.1145455837249756]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 7.0, 4.0, 4.0, 11.0, 15.0, 17.0, 11.0, 22.0, 25.0, 40.0, 38.0, 32.0, 41.0, 41.0, 54.0, 67.0, 46.0, 40.0, 61.0, 54.0, 56.0, 40.0, 38.0, 41.0, 38.0, 23.0, 30.0, 24.0, 15.0, 14.0, 8.0, 11.0, 5.0, 7.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3683083057403564, -1.3242965936660767, -1.2802847623825073, -1.2362730503082275, -1.1922612190246582, -1.1482495069503784, -1.1042377948760986, -1.0602259635925293, -1.0162142515182495, -0.972202479839325, -0.9281907081604004, -0.8841789960861206, -0.840167224407196, -0.7961554527282715, -0.7521436810493469, -0.7081319093704224, -0.6641201376914978, -0.6201083660125732, -0.5760965943336487, -0.5320848226547241, -0.48807311058044434, -0.4440613389015198, -0.4000495672225952, -0.35603782534599304, -0.3120260536670685, -0.2680142819881439, -0.22400254011154175, -0.1799907684326172, -0.13597901165485382, -0.09196725487709045, -0.047955483198165894, -0.003943741321563721, 0.04006803035736084, 0.0840797871351242, 0.12809154391288757, 0.17210331559181213, 0.2161150723695755, 0.26012682914733887, 0.3041386008262634, 0.3481503427028656, 0.39216211438179016, 0.4361738860607147, 0.4801856279373169, 0.5241973996162415, 0.568209171295166, 0.6122208833694458, 0.6562327146530151, 0.7002444267272949, 0.7442561984062195, 0.788267970085144, 0.8322797417640686, 0.8762915134429932, 0.920303225517273, 0.9643149971961975, 1.008326768875122, 1.0523384809494019, 1.0963503122329712, 1.140362024307251, 1.1843738555908203, 1.2283855676651, 1.2723973989486694, 1.3164091110229492, 1.3604209423065186, 1.4044326543807983, 1.4484443664550781]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 2.0, 5.0, 12.0, 23.0, 29.0, 45.0, 61.0, 71.0, 140.0, 148.0, 257.0, 347.0, 538.0, 865.0, 1417.0, 2291.0, 3890.0, 6966.0, 13288.0, 26551.0, 57655.0, 135696.0, 293776.0, 276013.0, 122665.0, 52665.0, 24582.0, 12399.0, 6576.0, 3680.0, 2112.0, 1315.0, 858.0, 515.0, 319.0, 234.0, 186.0, 110.0, 77.0, 47.0, 35.0, 23.0, 29.0, 17.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1981201171875, -0.1921062469482422, -0.18609237670898438, -0.18007850646972656, -0.17406463623046875, -0.16805076599121094, -0.16203689575195312, -0.1560230255126953, -0.1500091552734375, -0.1439952850341797, -0.13798141479492188, -0.13196754455566406, -0.12595367431640625, -0.11993980407714844, -0.11392593383789062, -0.10791206359863281, -0.101898193359375, -0.09588432312011719, -0.08987045288085938, -0.08385658264160156, -0.07784271240234375, -0.07182884216308594, -0.06581497192382812, -0.05980110168457031, -0.0537872314453125, -0.04777336120605469, -0.041759490966796875, -0.03574562072753906, -0.02973175048828125, -0.023717880249023438, -0.017704010009765625, -0.011690139770507812, -0.00567626953125, 0.0003376007080078125, 0.006351470947265625, 0.012365341186523438, 0.01837921142578125, 0.024393081665039062, 0.030406951904296875, 0.03642082214355469, 0.0424346923828125, 0.04844856262207031, 0.054462432861328125, 0.06047630310058594, 0.06649017333984375, 0.07250404357910156, 0.07851791381835938, 0.08453178405761719, 0.090545654296875, 0.09655952453613281, 0.10257339477539062, 0.10858726501464844, 0.11460113525390625, 0.12061500549316406, 0.12662887573242188, 0.1326427459716797, 0.1386566162109375, 0.1446704864501953, 0.15068435668945312, 0.15669822692871094, 0.16271209716796875, 0.16872596740722656, 0.17473983764648438, 0.1807537078857422, 0.186767578125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 9.0, 11.0, 21.0, 29.0, 31.0, 39.0, 43.0, 76.0, 90.0, 92.0, 83.0, 98.0, 88.0, 68.0, 61.0, 44.0, 34.0, 30.0, 21.0, 16.0, 3.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1436767578125, -0.13951587677001953, -0.13535499572753906, -0.1311941146850586, -0.12703323364257812, -0.12287235260009766, -0.11871147155761719, -0.11455059051513672, -0.11038970947265625, -0.10622882843017578, -0.10206794738769531, -0.09790706634521484, -0.09374618530273438, -0.0895853042602539, -0.08542442321777344, -0.08126354217529297, -0.0771026611328125, -0.07294178009033203, -0.06878089904785156, -0.0646200180053711, -0.060459136962890625, -0.056298255920410156, -0.05213737487792969, -0.04797649383544922, -0.04381561279296875, -0.03965473175048828, -0.03549385070800781, -0.031332969665527344, -0.027172088623046875, -0.023011207580566406, -0.018850326538085938, -0.014689445495605469, -0.010528564453125, -0.006367683410644531, -0.0022068023681640625, 0.0019540786743164062, 0.006114959716796875, 0.010275840759277344, 0.014436721801757812, 0.01859760284423828, 0.02275848388671875, 0.02691936492919922, 0.031080245971679688, 0.035241127014160156, 0.039402008056640625, 0.043562889099121094, 0.04772377014160156, 0.05188465118408203, 0.0560455322265625, 0.06020641326904297, 0.06436729431152344, 0.0685281753540039, 0.07268905639648438, 0.07684993743896484, 0.08101081848144531, 0.08517169952392578, 0.08933258056640625, 0.09349346160888672, 0.09765434265136719, 0.10181522369384766, 0.10597610473632812, 0.1101369857788086, 0.11429786682128906, 0.11845874786376953, 0.12261962890625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 9.0, 6.0, 12.0, 9.0, 14.0, 28.0, 41.0, 56.0, 91.0, 133.0, 198.0, 389.0, 751.0, 1423.0, 3201.0, 8790.0, 30571.0, 152001.0, 673104.0, 135083.0, 28206.0, 8236.0, 3126.0, 1387.0, 696.0, 379.0, 206.0, 134.0, 83.0, 58.0, 37.0, 18.0, 15.0, 13.0, 13.0, 7.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.42041015625, -0.4066123962402344, -0.39281463623046875, -0.3790168762207031, -0.3652191162109375, -0.3514213562011719, -0.33762359619140625, -0.3238258361816406, -0.310028076171875, -0.2962303161621094, -0.28243255615234375, -0.2686347961425781, -0.2548370361328125, -0.24103927612304688, -0.22724151611328125, -0.21344375610351562, -0.19964599609375, -0.18584823608398438, -0.17205047607421875, -0.15825271606445312, -0.1444549560546875, -0.13065719604492188, -0.11685943603515625, -0.10306167602539062, -0.089263916015625, -0.07546615600585938, -0.06166839599609375, -0.047870635986328125, -0.0340728759765625, -0.020275115966796875, -0.00647735595703125, 0.007320404052734375, 0.0211181640625, 0.034915924072265625, 0.04871368408203125, 0.06251144409179688, 0.0763092041015625, 0.09010696411132812, 0.10390472412109375, 0.11770248413085938, 0.131500244140625, 0.14529800415039062, 0.15909576416015625, 0.17289352416992188, 0.1866912841796875, 0.20048904418945312, 0.21428680419921875, 0.22808456420898438, 0.24188232421875, 0.2556800842285156, 0.26947784423828125, 0.2832756042480469, 0.2970733642578125, 0.3108711242675781, 0.32466888427734375, 0.3384666442871094, 0.352264404296875, 0.3660621643066406, 0.37985992431640625, 0.3936576843261719, 0.4074554443359375, 0.4212532043457031, 0.43505096435546875, 0.4488487243652344, 0.462646484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 7.0, 12.0, 8.0, 12.0, 10.0, 10.0, 17.0, 18.0, 29.0, 24.0, 29.0, 25.0, 35.0, 37.0, 51.0, 57.0, 52.0, 55.0, 62.0, 41.0, 48.0, 37.0, 64.0, 36.0, 33.0, 30.0, 28.0, 28.0, 12.0, 15.0, 12.0, 18.0, 8.0, 8.0, 9.0, 5.0, 6.0, 4.0, 5.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.39404296875, -0.382476806640625, -0.37091064453125, -0.359344482421875, -0.3477783203125, -0.336212158203125, -0.32464599609375, -0.313079833984375, -0.301513671875, -0.289947509765625, -0.27838134765625, -0.266815185546875, -0.2552490234375, -0.243682861328125, -0.23211669921875, -0.220550537109375, -0.208984375, -0.197418212890625, -0.18585205078125, -0.174285888671875, -0.1627197265625, -0.151153564453125, -0.13958740234375, -0.128021240234375, -0.116455078125, -0.104888916015625, -0.09332275390625, -0.081756591796875, -0.0701904296875, -0.058624267578125, -0.04705810546875, -0.035491943359375, -0.02392578125, -0.012359619140625, -0.00079345703125, 0.010772705078125, 0.0223388671875, 0.033905029296875, 0.04547119140625, 0.057037353515625, 0.068603515625, 0.080169677734375, 0.09173583984375, 0.103302001953125, 0.1148681640625, 0.126434326171875, 0.13800048828125, 0.149566650390625, 0.1611328125, 0.172698974609375, 0.18426513671875, 0.195831298828125, 0.2073974609375, 0.218963623046875, 0.23052978515625, 0.242095947265625, 0.253662109375, 0.265228271484375, 0.27679443359375, 0.288360595703125, 0.2999267578125, 0.311492919921875, 0.32305908203125, 0.334625244140625, 0.34619140625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 10.0, 21.0, 23.0, 30.0, 39.0, 54.0, 82.0, 132.0, 207.0, 384.0, 654.0, 1356.0, 2937.0, 7512.0, 25578.0, 161696.0, 744984.0, 76639.0, 16384.0, 5393.0, 2107.0, 982.0, 493.0, 303.0, 190.0, 109.0, 68.0, 47.0, 44.0, 26.0, 15.0, 14.0, 8.0, 11.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.41015625, -0.3982086181640625, -0.386260986328125, -0.3743133544921875, -0.36236572265625, -0.3504180908203125, -0.338470458984375, -0.3265228271484375, -0.3145751953125, -0.3026275634765625, -0.290679931640625, -0.2787322998046875, -0.26678466796875, -0.2548370361328125, -0.242889404296875, -0.2309417724609375, -0.218994140625, -0.2070465087890625, -0.195098876953125, -0.1831512451171875, -0.17120361328125, -0.1592559814453125, -0.147308349609375, -0.1353607177734375, -0.1234130859375, -0.1114654541015625, -0.099517822265625, -0.0875701904296875, -0.07562255859375, -0.0636749267578125, -0.051727294921875, -0.0397796630859375, -0.02783203125, -0.0158843994140625, -0.003936767578125, 0.0080108642578125, 0.01995849609375, 0.0319061279296875, 0.043853759765625, 0.0558013916015625, 0.0677490234375, 0.0796966552734375, 0.091644287109375, 0.1035919189453125, 0.11553955078125, 0.1274871826171875, 0.139434814453125, 0.1513824462890625, 0.163330078125, 0.1752777099609375, 0.187225341796875, 0.1991729736328125, 0.21112060546875, 0.2230682373046875, 0.235015869140625, 0.2469635009765625, 0.2589111328125, 0.2708587646484375, 0.282806396484375, 0.2947540283203125, 0.30670166015625, 0.3186492919921875, 0.330596923828125, 0.3425445556640625, 0.3544921875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 8.0, 10.0, 11.0, 20.0, 27.0, 41.0, 60.0, 124.0, 180.0, 193.0, 113.0, 65.0, 39.0, 39.0, 19.0, 12.0, 12.0, 4.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010693073272705078, -0.00010295771062374115, -9.898468852043152e-05, -9.501166641712189e-05, -9.103864431381226e-05, -8.706562221050262e-05, -8.309260010719299e-05, -7.911957800388336e-05, -7.514655590057373e-05, -7.11735337972641e-05, -6.720051169395447e-05, -6.322748959064484e-05, -5.9254467487335205e-05, -5.5281445384025574e-05, -5.130842328071594e-05, -4.733540117740631e-05, -4.336237907409668e-05, -3.938935697078705e-05, -3.541633486747742e-05, -3.1443312764167786e-05, -2.7470290660858154e-05, -2.3497268557548523e-05, -1.952424645423889e-05, -1.555122435092926e-05, -1.1578202247619629e-05, -7.6051801443099976e-06, -3.632158041000366e-06, 3.4086406230926514e-07, 4.3138861656188965e-06, 8.286908268928528e-06, 1.225993037223816e-05, 1.623295247554779e-05, 2.0205974578857422e-05, 2.4178996682167053e-05, 2.8152018785476685e-05, 3.2125040888786316e-05, 3.609806299209595e-05, 4.007108509540558e-05, 4.404410719871521e-05, 4.801712930202484e-05, 5.199015140533447e-05, 5.5963173508644104e-05, 5.9936195611953735e-05, 6.390921771526337e-05, 6.7882239818573e-05, 7.185526192188263e-05, 7.582828402519226e-05, 7.980130612850189e-05, 8.377432823181152e-05, 8.774735033512115e-05, 9.172037243843079e-05, 9.569339454174042e-05, 9.966641664505005e-05, 0.00010363943874835968, 0.00010761246085166931, 0.00011158548295497894, 0.00011555850505828857, 0.0001195315271615982, 0.00012350454926490784, 0.00012747757136821747, 0.0001314505934715271, 0.00013542361557483673, 0.00013939663767814636, 0.000143369659781456, 0.00014734268188476562]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 5.0, 14.0, 18.0, 29.0, 31.0, 43.0, 64.0, 96.0, 148.0, 251.0, 429.0, 835.0, 1632.0, 4195.0, 14173.0, 101850.0, 826971.0, 78483.0, 12363.0, 3716.0, 1476.0, 727.0, 381.0, 237.0, 123.0, 71.0, 57.0, 47.0, 28.0, 17.0, 15.0, 11.0, 2.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.458740234375, -0.44460296630859375, -0.4304656982421875, -0.41632843017578125, -0.402191162109375, -0.38805389404296875, -0.3739166259765625, -0.35977935791015625, -0.34564208984375, -0.33150482177734375, -0.3173675537109375, -0.30323028564453125, -0.289093017578125, -0.27495574951171875, -0.2608184814453125, -0.24668121337890625, -0.2325439453125, -0.21840667724609375, -0.2042694091796875, -0.19013214111328125, -0.175994873046875, -0.16185760498046875, -0.1477203369140625, -0.13358306884765625, -0.11944580078125, -0.10530853271484375, -0.0911712646484375, -0.07703399658203125, -0.062896728515625, -0.04875946044921875, -0.0346221923828125, -0.02048492431640625, -0.00634765625, 0.00778961181640625, 0.0219268798828125, 0.03606414794921875, 0.050201416015625, 0.06433868408203125, 0.0784759521484375, 0.09261322021484375, 0.10675048828125, 0.12088775634765625, 0.1350250244140625, 0.14916229248046875, 0.163299560546875, 0.17743682861328125, 0.1915740966796875, 0.20571136474609375, 0.2198486328125, 0.23398590087890625, 0.2481231689453125, 0.26226043701171875, 0.276397705078125, 0.29053497314453125, 0.3046722412109375, 0.31880950927734375, 0.33294677734375, 0.34708404541015625, 0.3612213134765625, 0.37535858154296875, 0.389495849609375, 0.40363311767578125, 0.4177703857421875, 0.43190765380859375, 0.446044921875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 14.0, 17.0, 17.0, 20.0, 34.0, 37.0, 49.0, 68.0, 83.0, 112.0, 118.0, 99.0, 60.0, 69.0, 53.0, 18.0, 26.0, 19.0, 11.0, 14.0, 4.0, 17.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2578125, -0.25089073181152344, -0.24396896362304688, -0.2370471954345703, -0.23012542724609375, -0.2232036590576172, -0.21628189086914062, -0.20936012268066406, -0.2024383544921875, -0.19551658630371094, -0.18859481811523438, -0.1816730499267578, -0.17475128173828125, -0.1678295135498047, -0.16090774536132812, -0.15398597717285156, -0.147064208984375, -0.14014244079589844, -0.13322067260742188, -0.1262989044189453, -0.11937713623046875, -0.11245536804199219, -0.10553359985351562, -0.09861183166503906, -0.0916900634765625, -0.08476829528808594, -0.07784652709960938, -0.07092475891113281, -0.06400299072265625, -0.05708122253417969, -0.050159454345703125, -0.04323768615722656, -0.03631591796875, -0.029394149780273438, -0.022472381591796875, -0.015550613403320312, -0.00862884521484375, -0.0017070770263671875, 0.005214691162109375, 0.012136459350585938, 0.0190582275390625, 0.025979995727539062, 0.032901763916015625, 0.03982353210449219, 0.04674530029296875, 0.05366706848144531, 0.060588836669921875, 0.06751060485839844, 0.074432373046875, 0.08135414123535156, 0.08827590942382812, 0.09519767761230469, 0.10211944580078125, 0.10904121398925781, 0.11596298217773438, 0.12288475036621094, 0.1298065185546875, 0.13672828674316406, 0.14365005493164062, 0.1505718231201172, 0.15749359130859375, 0.1644153594970703, 0.17133712768554688, 0.17825889587402344, 0.1851806640625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 15.0, 26.0, 31.0, 63.0, 125.0, 280.0, 246.0, 113.0, 48.0, 20.0, 6.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.87274169921875, -9.648122787475586, -9.423504829406738, -9.198885917663574, -8.97426700592041, -8.749649047851562, -8.525030136108398, -8.300411224365234, -8.07579231262207, -7.8511738777160645, -7.6265549659729, -7.4019365310668945, -7.1773176193237305, -6.952699184417725, -6.728080749511719, -6.503461837768555, -6.278843879699707, -6.054225444793701, -5.829606533050537, -5.604988098144531, -5.380369186401367, -5.155750751495361, -4.9311323165893555, -4.706513404846191, -4.4818949699401855, -4.25727653503418, -4.032657623291016, -3.8080391883850098, -3.583420515060425, -3.35880184173584, -3.134183406829834, -2.909564733505249, -2.684946060180664, -2.460327386856079, -2.235708713531494, -2.0110902786254883, -1.7864716053009033, -1.5618529319763184, -1.337234377861023, -1.1126158237457275, -0.8879971504211426, -0.6633785367012024, -0.4387599229812622, -0.21414130926132202, 0.010477304458618164, 0.23509597778320312, 0.45971453189849854, 0.684333086013794, 0.9089517593383789, 1.1335704326629639, 1.3581889867782593, 1.5828075408935547, 1.8074262142181396, 2.0320448875427246, 2.2566633224487305, 2.4812819957733154, 2.7059006690979004, 2.9305193424224854, 3.1551380157470703, 3.379756450653076, 3.604375123977661, 3.828993797302246, 4.053612232208252, 4.278230667114258, 4.502849578857422]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 6.0, 3.0, 12.0, 6.0, 15.0, 10.0, 21.0, 10.0, 14.0, 27.0, 30.0, 30.0, 35.0, 36.0, 41.0, 44.0, 61.0, 60.0, 77.0, 68.0, 55.0, 41.0, 44.0, 35.0, 32.0, 27.0, 23.0, 23.0, 13.0, 13.0, 15.0, 9.0, 14.0, 11.0, 8.0, 8.0, 5.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7776765823364258, -1.7192513942718506, -1.6608262062072754, -1.6024010181427002, -1.543975830078125, -1.4855506420135498, -1.4271254539489746, -1.3687002658843994, -1.3102750778198242, -1.251849889755249, -1.1934247016906738, -1.1349995136260986, -1.0765743255615234, -1.0181491374969482, -0.9597240090370178, -0.9012988209724426, -0.8428736925125122, -0.784448504447937, -0.7260233163833618, -0.6675981283187866, -0.6091729402542114, -0.5507477521896362, -0.4923226237297058, -0.4338974356651306, -0.3754722476005554, -0.3170470595359802, -0.25862187147140503, -0.20019671320915222, -0.14177152514457703, -0.08334633708000183, -0.024921178817749023, 0.03350400924682617, 0.09192931652069092, 0.1503545045852661, 0.20877967774868011, 0.2672048509120941, 0.3256300389766693, 0.3840552270412445, 0.4424803853034973, 0.5009055733680725, 0.5593307614326477, 0.6177559494972229, 0.6761811375617981, 0.7346062660217285, 0.7930314540863037, 0.8514566421508789, 0.9098818302154541, 0.9683070182800293, 1.0267322063446045, 1.0851573944091797, 1.1435825824737549, 1.20200777053833, 1.2604329586029053, 1.3188581466674805, 1.3772833347320557, 1.4357085227966309, 1.494133710861206, 1.5525588989257812, 1.6109840869903564, 1.6694092750549316, 1.7278344631195068, 1.786259651184082, 1.8446848392486572, 1.9031100273132324, 1.961535096168518]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 4.0, 10.0, 20.0, 28.0, 28.0, 84.0, 119.0, 186.0, 302.0, 598.0, 1568.0, 91850.0, 4094116.0, 3713.0, 715.0, 373.0, 227.0, 116.0, 81.0, 57.0, 24.0, 16.0, 19.0, 12.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4453125, -1.398956298828125, -1.35260009765625, -1.306243896484375, -1.2598876953125, -1.213531494140625, -1.16717529296875, -1.120819091796875, -1.074462890625, -1.028106689453125, -0.98175048828125, -0.935394287109375, -0.8890380859375, -0.842681884765625, -0.79632568359375, -0.749969482421875, -0.70361328125, -0.657257080078125, -0.61090087890625, -0.564544677734375, -0.5181884765625, -0.471832275390625, -0.42547607421875, -0.379119873046875, -0.332763671875, -0.286407470703125, -0.24005126953125, -0.193695068359375, -0.1473388671875, -0.100982666015625, -0.05462646484375, -0.008270263671875, 0.0380859375, 0.084442138671875, 0.13079833984375, 0.177154541015625, 0.2235107421875, 0.269866943359375, 0.31622314453125, 0.362579345703125, 0.408935546875, 0.455291748046875, 0.50164794921875, 0.548004150390625, 0.5943603515625, 0.640716552734375, 0.68707275390625, 0.733428955078125, 0.77978515625, 0.826141357421875, 0.87249755859375, 0.918853759765625, 0.9652099609375, 1.011566162109375, 1.05792236328125, 1.104278564453125, 1.150634765625, 1.196990966796875, 1.24334716796875, 1.289703369140625, 1.3360595703125, 1.382415771484375, 1.42877197265625, 1.475128173828125, 1.521484375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 7.0, 12.0, 19.0, 31.0, 32.0, 42.0, 54.0, 62.0, 86.0, 95.0, 102.0, 107.0, 77.0, 60.0, 67.0, 47.0, 29.0, 26.0, 17.0, 10.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1436767578125, -0.1394968032836914, -0.1353168487548828, -0.13113689422607422, -0.12695693969726562, -0.12277698516845703, -0.11859703063964844, -0.11441707611083984, -0.11023712158203125, -0.10605716705322266, -0.10187721252441406, -0.09769725799560547, -0.09351730346679688, -0.08933734893798828, -0.08515739440917969, -0.0809774398803711, -0.0767974853515625, -0.0726175308227539, -0.06843757629394531, -0.06425762176513672, -0.060077667236328125, -0.05589771270751953, -0.05171775817871094, -0.047537803649902344, -0.04335784912109375, -0.039177894592285156, -0.03499794006347656, -0.03081798553466797, -0.026638031005859375, -0.02245807647705078, -0.018278121948242188, -0.014098167419433594, -0.009918212890625, -0.005738258361816406, -0.0015583038330078125, 0.0026216506958007812, 0.006801605224609375, 0.010981559753417969, 0.015161514282226562, 0.019341468811035156, 0.02352142333984375, 0.027701377868652344, 0.03188133239746094, 0.03606128692626953, 0.040241241455078125, 0.04442119598388672, 0.04860115051269531, 0.052781105041503906, 0.0569610595703125, 0.061141014099121094, 0.06532096862792969, 0.06950092315673828, 0.07368087768554688, 0.07786083221435547, 0.08204078674316406, 0.08622074127197266, 0.09040069580078125, 0.09458065032958984, 0.09876060485839844, 0.10294055938720703, 0.10712051391601562, 0.11130046844482422, 0.11548042297363281, 0.1196603775024414, 0.12384033203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 9.0, 16.0, 18.0, 30.0, 41.0, 47.0, 75.0, 121.0, 182.0, 279.0, 417.0, 760.0, 2925.0, 91421.0, 4081777.0, 13243.0, 1374.0, 553.0, 334.0, 232.0, 154.0, 83.0, 66.0, 40.0, 37.0, 16.0, 7.0, 10.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.21875, -1.1797943115234375, -1.140838623046875, -1.1018829345703125, -1.06292724609375, -1.0239715576171875, -0.985015869140625, -0.9460601806640625, -0.9071044921875, -0.8681488037109375, -0.829193115234375, -0.7902374267578125, -0.75128173828125, -0.7123260498046875, -0.673370361328125, -0.6344146728515625, -0.595458984375, -0.5565032958984375, -0.517547607421875, -0.4785919189453125, -0.43963623046875, -0.4006805419921875, -0.361724853515625, -0.3227691650390625, -0.2838134765625, -0.2448577880859375, -0.205902099609375, -0.1669464111328125, -0.12799072265625, -0.0890350341796875, -0.050079345703125, -0.0111236572265625, 0.02783203125, 0.0667877197265625, 0.105743408203125, 0.1446990966796875, 0.18365478515625, 0.2226104736328125, 0.261566162109375, 0.3005218505859375, 0.3394775390625, 0.3784332275390625, 0.417388916015625, 0.4563446044921875, 0.49530029296875, 0.5342559814453125, 0.573211669921875, 0.6121673583984375, 0.651123046875, 0.6900787353515625, 0.729034423828125, 0.7679901123046875, 0.80694580078125, 0.8459014892578125, 0.884857177734375, 0.9238128662109375, 0.9627685546875, 1.0017242431640625, 1.040679931640625, 1.0796356201171875, 1.11859130859375, 1.1575469970703125, 1.196502685546875, 1.2354583740234375, 1.2744140625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 13.0, 12.0, 42.0, 132.0, 594.0, 2662.0, 436.0, 113.0, 41.0, 17.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1513671875, -1.1198043823242188, -1.0882415771484375, -1.0566787719726562, -1.025115966796875, -0.9935531616210938, -0.9619903564453125, -0.9304275512695312, -0.89886474609375, -0.8673019409179688, -0.8357391357421875, -0.8041763305664062, -0.772613525390625, -0.7410507202148438, -0.7094879150390625, -0.6779251098632812, -0.6463623046875, -0.6147994995117188, -0.5832366943359375, -0.5516738891601562, -0.520111083984375, -0.48854827880859375, -0.4569854736328125, -0.42542266845703125, -0.39385986328125, -0.36229705810546875, -0.3307342529296875, -0.29917144775390625, -0.267608642578125, -0.23604583740234375, -0.2044830322265625, -0.17292022705078125, -0.141357421875, -0.10979461669921875, -0.0782318115234375, -0.04666900634765625, -0.015106201171875, 0.01645660400390625, 0.0480194091796875, 0.07958221435546875, 0.11114501953125, 0.14270782470703125, 0.1742706298828125, 0.20583343505859375, 0.237396240234375, 0.26895904541015625, 0.3005218505859375, 0.33208465576171875, 0.3636474609375, 0.39521026611328125, 0.4267730712890625, 0.45833587646484375, 0.489898681640625, 0.5214614868164062, 0.5530242919921875, 0.5845870971679688, 0.61614990234375, 0.6477127075195312, 0.6792755126953125, 0.7108383178710938, 0.742401123046875, 0.7739639282226562, 0.8055267333984375, 0.8370895385742188, 0.86865234375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 11.0, 31.0, 52.0, 152.0, 289.0, 243.0, 115.0, 49.0, 19.0, 11.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.928096771240234, -6.723127365112305, -6.518158435821533, -6.3131890296936035, -6.108219623565674, -5.903250694274902, -5.698281288146973, -5.493311882019043, -5.288342475891113, -5.083373069763184, -4.878404140472412, -4.673434734344482, -4.468465328216553, -4.263496398925781, -4.058526992797852, -3.853557586669922, -3.6485884189605713, -3.4436192512512207, -3.238649845123291, -3.0336806774139404, -2.8287112712860107, -2.62374210357666, -2.4187726974487305, -2.21380352973938, -2.0088343620300293, -1.8038650751113892, -1.598895788192749, -1.3939266204833984, -1.1889572143554688, -0.9839880466461182, -0.779018759727478, -0.5740494728088379, -0.3690800666809082, -0.16411079466342926, 0.04085847735404968, 0.24582773447036743, 0.45079702138900757, 0.6557662487030029, 0.8607355356216431, 1.0657048225402832, 1.2706741094589233, 1.4756433963775635, 1.6806126832962036, 1.8855819702148438, 2.0905511379241943, 2.295520305633545, 2.5004897117614746, 2.7054591178894043, 2.910428285598755, 3.1153974533081055, 3.320366859436035, 3.5253360271453857, 3.7303054332733154, 3.935274600982666, 4.140244007110596, 4.345212936401367, 4.550182342529297, 4.755151748657227, 4.960120677947998, 5.165090084075928, 5.370059490203857, 5.575028419494629, 5.779997825622559, 5.984967231750488, 6.189936637878418]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 11.0, 11.0, 10.0, 17.0, 23.0, 20.0, 36.0, 34.0, 46.0, 48.0, 64.0, 62.0, 51.0, 52.0, 56.0, 62.0, 56.0, 61.0, 55.0, 53.0, 44.0, 28.0, 26.0, 17.0, 20.0, 8.0, 9.0, 8.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1856422424316406, -2.113992929458618, -2.0423436164855957, -1.9706943035125732, -1.8990449905395508, -1.8273956775665283, -1.7557463645935059, -1.6840970516204834, -1.612447738647461, -1.5407984256744385, -1.469149112701416, -1.3974997997283936, -1.325850486755371, -1.2542011737823486, -1.1825518608093262, -1.1109025478363037, -1.0392531156539917, -0.9676038026809692, -0.8959544897079468, -0.8243051767349243, -0.7526558637619019, -0.6810065507888794, -0.6093571782112122, -0.5377078652381897, -0.46605855226516724, -0.3944092392921448, -0.3227599263191223, -0.25111058354377747, -0.179461270570755, -0.10781195759773254, -0.036162614822387695, 0.035486698150634766, 0.10713601112365723, 0.1787853240966797, 0.25043463706970215, 0.322083979845047, 0.39373329281806946, 0.4653826057910919, 0.5370319485664368, 0.6086812615394592, 0.6803305745124817, 0.7519798874855042, 0.8236292004585266, 0.8952785730361938, 0.9669278860092163, 1.0385771989822388, 1.1102265119552612, 1.1818758249282837, 1.2535251379013062, 1.3251744508743286, 1.396823763847351, 1.4684730768203735, 1.540122389793396, 1.6117717027664185, 1.6834211349487305, 1.755070447921753, 1.8267197608947754, 1.8983690738677979, 1.9700183868408203, 2.0416676998138428, 2.1133170127868652, 2.1849663257598877, 2.25661563873291, 2.3282649517059326, 2.399914264678955]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 5.0, 8.0, 17.0, 9.0, 29.0, 41.0, 77.0, 119.0, 221.0, 414.0, 899.0, 2137.0, 6077.0, 22434.0, 124707.0, 574875.0, 260025.0, 41104.0, 9700.0, 3216.0, 1284.0, 538.0, 250.0, 145.0, 84.0, 47.0, 34.0, 17.0, 10.0, 7.0, 9.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.46728515625, -0.454193115234375, -0.44110107421875, -0.428009033203125, -0.4149169921875, -0.401824951171875, -0.38873291015625, -0.375640869140625, -0.362548828125, -0.349456787109375, -0.33636474609375, -0.323272705078125, -0.3101806640625, -0.297088623046875, -0.28399658203125, -0.270904541015625, -0.2578125, -0.244720458984375, -0.23162841796875, -0.218536376953125, -0.2054443359375, -0.192352294921875, -0.17926025390625, -0.166168212890625, -0.153076171875, -0.139984130859375, -0.12689208984375, -0.113800048828125, -0.1007080078125, -0.087615966796875, -0.07452392578125, -0.061431884765625, -0.04833984375, -0.035247802734375, -0.02215576171875, -0.009063720703125, 0.0040283203125, 0.017120361328125, 0.03021240234375, 0.043304443359375, 0.056396484375, 0.069488525390625, 0.08258056640625, 0.095672607421875, 0.1087646484375, 0.121856689453125, 0.13494873046875, 0.148040771484375, 0.1611328125, 0.174224853515625, 0.18731689453125, 0.200408935546875, 0.2135009765625, 0.226593017578125, 0.23968505859375, 0.252777099609375, 0.265869140625, 0.278961181640625, 0.29205322265625, 0.305145263671875, 0.3182373046875, 0.331329345703125, 0.34442138671875, 0.357513427734375, 0.37060546875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 8.0, 10.0, 17.0, 18.0, 28.0, 30.0, 44.0, 59.0, 58.0, 59.0, 59.0, 76.0, 95.0, 65.0, 67.0, 57.0, 55.0, 37.0, 46.0, 25.0, 22.0, 24.0, 15.0, 12.0, 8.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1351318359375, -0.1310720443725586, -0.1270122528076172, -0.12295246124267578, -0.11889266967773438, -0.11483287811279297, -0.11077308654785156, -0.10671329498291016, -0.10265350341796875, -0.09859371185302734, -0.09453392028808594, -0.09047412872314453, -0.08641433715820312, -0.08235454559326172, -0.07829475402832031, -0.0742349624633789, -0.0701751708984375, -0.0661153793334961, -0.06205558776855469, -0.05799579620361328, -0.053936004638671875, -0.04987621307373047, -0.04581642150878906, -0.041756629943847656, -0.03769683837890625, -0.033637046813964844, -0.029577255249023438, -0.02551746368408203, -0.021457672119140625, -0.01739788055419922, -0.013338088989257812, -0.009278297424316406, -0.005218505859375, -0.0011587142944335938, 0.0029010772705078125, 0.006960868835449219, 0.011020660400390625, 0.015080451965332031, 0.019140243530273438, 0.023200035095214844, 0.02725982666015625, 0.031319618225097656, 0.03537940979003906, 0.03943920135498047, 0.043498992919921875, 0.04755878448486328, 0.05161857604980469, 0.055678367614746094, 0.0597381591796875, 0.0637979507446289, 0.06785774230957031, 0.07191753387451172, 0.07597732543945312, 0.08003711700439453, 0.08409690856933594, 0.08815670013427734, 0.09221649169921875, 0.09627628326416016, 0.10033607482910156, 0.10439586639404297, 0.10845565795898438, 0.11251544952392578, 0.11657524108886719, 0.1206350326538086, 0.12469482421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 3.0, 5.0, 1.0, 3.0, 8.0, 10.0, 11.0, 11.0, 14.0, 33.0, 49.0, 70.0, 76.0, 156.0, 284.0, 508.0, 1126.0, 2792.0, 8057.0, 30727.0, 155011.0, 644496.0, 160154.0, 31320.0, 8327.0, 2874.0, 1156.0, 529.0, 301.0, 160.0, 106.0, 56.0, 37.0, 24.0, 22.0, 13.0, 6.0, 10.0, 1.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.283935546875, -0.27185821533203125, -0.2597808837890625, -0.24770355224609375, -0.235626220703125, -0.22354888916015625, -0.2114715576171875, -0.19939422607421875, -0.18731689453125, -0.17523956298828125, -0.1631622314453125, -0.15108489990234375, -0.139007568359375, -0.12693023681640625, -0.1148529052734375, -0.10277557373046875, -0.0906982421875, -0.07862091064453125, -0.0665435791015625, -0.05446624755859375, -0.042388916015625, -0.03031158447265625, -0.0182342529296875, -0.00615692138671875, 0.00592041015625, 0.01799774169921875, 0.0300750732421875, 0.04215240478515625, 0.054229736328125, 0.06630706787109375, 0.0783843994140625, 0.09046173095703125, 0.1025390625, 0.11461639404296875, 0.1266937255859375, 0.13877105712890625, 0.150848388671875, 0.16292572021484375, 0.1750030517578125, 0.18708038330078125, 0.19915771484375, 0.21123504638671875, 0.2233123779296875, 0.23538970947265625, 0.247467041015625, 0.25954437255859375, 0.2716217041015625, 0.28369903564453125, 0.2957763671875, 0.30785369873046875, 0.3199310302734375, 0.33200836181640625, 0.344085693359375, 0.35616302490234375, 0.3682403564453125, 0.38031768798828125, 0.39239501953125, 0.40447235107421875, 0.4165496826171875, 0.42862701416015625, 0.440704345703125, 0.45278167724609375, 0.4648590087890625, 0.47693634033203125, 0.489013671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 6.0, 8.0, 8.0, 4.0, 10.0, 11.0, 18.0, 9.0, 20.0, 29.0, 35.0, 44.0, 41.0, 44.0, 54.0, 54.0, 60.0, 75.0, 64.0, 64.0, 64.0, 48.0, 52.0, 49.0, 29.0, 23.0, 22.0, 15.0, 8.0, 7.0, 6.0, 10.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.51513671875, -0.5008697509765625, -0.486602783203125, -0.4723358154296875, -0.45806884765625, -0.4438018798828125, -0.429534912109375, -0.4152679443359375, -0.4010009765625, -0.3867340087890625, -0.372467041015625, -0.3582000732421875, -0.34393310546875, -0.3296661376953125, -0.315399169921875, -0.3011322021484375, -0.286865234375, -0.2725982666015625, -0.258331298828125, -0.2440643310546875, -0.22979736328125, -0.2155303955078125, -0.201263427734375, -0.1869964599609375, -0.1727294921875, -0.1584625244140625, -0.144195556640625, -0.1299285888671875, -0.11566162109375, -0.1013946533203125, -0.087127685546875, -0.0728607177734375, -0.05859375, -0.0443267822265625, -0.030059814453125, -0.0157928466796875, -0.00152587890625, 0.0127410888671875, 0.027008056640625, 0.0412750244140625, 0.0555419921875, 0.0698089599609375, 0.084075927734375, 0.0983428955078125, 0.11260986328125, 0.1268768310546875, 0.141143798828125, 0.1554107666015625, 0.169677734375, 0.1839447021484375, 0.198211669921875, 0.2124786376953125, 0.22674560546875, 0.2410125732421875, 0.255279541015625, 0.2695465087890625, 0.2838134765625, 0.2980804443359375, 0.312347412109375, 0.3266143798828125, 0.34088134765625, 0.3551483154296875, 0.369415283203125, 0.3836822509765625, 0.39794921875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 8.0, 5.0, 9.0, 9.0, 17.0, 32.0, 40.0, 47.0, 91.0, 172.0, 290.0, 482.0, 911.0, 1633.0, 3646.0, 9403.0, 29105.0, 125267.0, 654529.0, 167032.0, 36105.0, 11210.0, 4246.0, 1996.0, 983.0, 532.0, 312.0, 169.0, 98.0, 57.0, 41.0, 20.0, 23.0, 13.0, 15.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.19677734375, -0.1910877227783203, -0.18539810180664062, -0.17970848083496094, -0.17401885986328125, -0.16832923889160156, -0.16263961791992188, -0.1569499969482422, -0.1512603759765625, -0.1455707550048828, -0.13988113403320312, -0.13419151306152344, -0.12850189208984375, -0.12281227111816406, -0.11712265014648438, -0.11143302917480469, -0.105743408203125, -0.10005378723144531, -0.09436416625976562, -0.08867454528808594, -0.08298492431640625, -0.07729530334472656, -0.07160568237304688, -0.06591606140136719, -0.0602264404296875, -0.05453681945800781, -0.048847198486328125, -0.04315757751464844, -0.03746795654296875, -0.03177833557128906, -0.026088714599609375, -0.020399093627929688, -0.01470947265625, -0.009019851684570312, -0.003330230712890625, 0.0023593902587890625, 0.00804901123046875, 0.013738632202148438, 0.019428253173828125, 0.025117874145507812, 0.0308074951171875, 0.03649711608886719, 0.042186737060546875, 0.04787635803222656, 0.05356597900390625, 0.05925559997558594, 0.06494522094726562, 0.07063484191894531, 0.076324462890625, 0.08201408386230469, 0.08770370483398438, 0.09339332580566406, 0.09908294677734375, 0.10477256774902344, 0.11046218872070312, 0.11615180969238281, 0.1218414306640625, 0.1275310516357422, 0.13322067260742188, 0.13891029357910156, 0.14459991455078125, 0.15028953552246094, 0.15597915649414062, 0.1616687774658203, 0.1673583984375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 10.0, 18.0, 17.0, 36.0, 46.0, 88.0, 121.0, 168.0, 153.0, 104.0, 83.0, 44.0, 38.0, 17.0, 13.0, 13.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.96453857421875e-05, -8.728262037038803e-05, -8.491985499858856e-05, -8.255708962678909e-05, -8.019432425498962e-05, -7.783155888319016e-05, -7.546879351139069e-05, -7.310602813959122e-05, -7.074326276779175e-05, -6.838049739599228e-05, -6.601773202419281e-05, -6.365496665239334e-05, -6.129220128059387e-05, -5.89294359087944e-05, -5.6566670536994934e-05, -5.4203905165195465e-05, -5.1841139793395996e-05, -4.947837442159653e-05, -4.711560904979706e-05, -4.475284367799759e-05, -4.239007830619812e-05, -4.002731293439865e-05, -3.766454756259918e-05, -3.530178219079971e-05, -3.2939016819000244e-05, -3.0576251447200775e-05, -2.8213486075401306e-05, -2.5850720703601837e-05, -2.3487955331802368e-05, -2.11251899600029e-05, -1.876242458820343e-05, -1.639965921640396e-05, -1.4036893844604492e-05, -1.1674128472805023e-05, -9.311363101005554e-06, -6.948597729206085e-06, -4.585832357406616e-06, -2.2230669856071472e-06, 1.3969838619232178e-07, 2.5024637579917908e-06, 4.86522912979126e-06, 7.227994501590729e-06, 9.590759873390198e-06, 1.1953525245189667e-05, 1.4316290616989136e-05, 1.6679055988788605e-05, 1.9041821360588074e-05, 2.1404586732387543e-05, 2.3767352104187012e-05, 2.613011747598648e-05, 2.849288284778595e-05, 3.085564821958542e-05, 3.321841359138489e-05, 3.558117896318436e-05, 3.7943944334983826e-05, 4.0306709706783295e-05, 4.2669475078582764e-05, 4.503224045038223e-05, 4.73950058221817e-05, 4.975777119398117e-05, 5.212053656578064e-05, 5.448330193758011e-05, 5.684606730937958e-05, 5.920883268117905e-05, 6.157159805297852e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 5.0, 13.0, 12.0, 17.0, 26.0, 58.0, 101.0, 187.0, 375.0, 725.0, 1784.0, 4947.0, 15075.0, 63252.0, 536504.0, 348523.0, 55350.0, 13788.0, 4509.0, 1789.0, 733.0, 363.0, 172.0, 92.0, 60.0, 25.0, 21.0, 15.0, 9.0, 9.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1756591796875, -0.16937637329101562, -0.16309356689453125, -0.15681076049804688, -0.1505279541015625, -0.14424514770507812, -0.13796234130859375, -0.13167953491210938, -0.125396728515625, -0.11911392211914062, -0.11283111572265625, -0.10654830932617188, -0.1002655029296875, -0.09398269653320312, -0.08769989013671875, -0.08141708374023438, -0.07513427734375, -0.06885147094726562, -0.06256866455078125, -0.056285858154296875, -0.0500030517578125, -0.043720245361328125, -0.03743743896484375, -0.031154632568359375, -0.024871826171875, -0.018589019775390625, -0.01230621337890625, -0.006023406982421875, 0.0002593994140625, 0.006542205810546875, 0.01282501220703125, 0.019107818603515625, 0.025390625, 0.031673431396484375, 0.03795623779296875, 0.044239044189453125, 0.0505218505859375, 0.056804656982421875, 0.06308746337890625, 0.06937026977539062, 0.075653076171875, 0.08193588256835938, 0.08821868896484375, 0.09450149536132812, 0.1007843017578125, 0.10706710815429688, 0.11334991455078125, 0.11963272094726562, 0.12591552734375, 0.13219833374023438, 0.13848114013671875, 0.14476394653320312, 0.1510467529296875, 0.15732955932617188, 0.16361236572265625, 0.16989517211914062, 0.176177978515625, 0.18246078491210938, 0.18874359130859375, 0.19502639770507812, 0.2013092041015625, 0.20759201049804688, 0.21387481689453125, 0.22015762329101562, 0.2264404296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 0.0, 4.0, 3.0, 9.0, 7.0, 14.0, 12.0, 19.0, 31.0, 27.0, 60.0, 58.0, 81.0, 82.0, 107.0, 110.0, 108.0, 69.0, 54.0, 37.0, 30.0, 18.0, 12.0, 10.0, 11.0, 5.0, 6.0, 8.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.203125, -0.1975860595703125, -0.192047119140625, -0.1865081787109375, -0.18096923828125, -0.1754302978515625, -0.169891357421875, -0.1643524169921875, -0.1588134765625, -0.1532745361328125, -0.147735595703125, -0.1421966552734375, -0.13665771484375, -0.1311187744140625, -0.125579833984375, -0.1200408935546875, -0.114501953125, -0.1089630126953125, -0.103424072265625, -0.0978851318359375, -0.09234619140625, -0.0868072509765625, -0.081268310546875, -0.0757293701171875, -0.0701904296875, -0.0646514892578125, -0.059112548828125, -0.0535736083984375, -0.04803466796875, -0.0424957275390625, -0.036956787109375, -0.0314178466796875, -0.02587890625, -0.0203399658203125, -0.014801025390625, -0.0092620849609375, -0.00372314453125, 0.0018157958984375, 0.007354736328125, 0.0128936767578125, 0.0184326171875, 0.0239715576171875, 0.029510498046875, 0.0350494384765625, 0.04058837890625, 0.0461273193359375, 0.051666259765625, 0.0572052001953125, 0.062744140625, 0.0682830810546875, 0.073822021484375, 0.0793609619140625, 0.08489990234375, 0.0904388427734375, 0.095977783203125, 0.1015167236328125, 0.1070556640625, 0.1125946044921875, 0.118133544921875, 0.1236724853515625, 0.12921142578125, 0.1347503662109375, 0.140289306640625, 0.1458282470703125, 0.1513671875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 4.0, 10.0, 15.0, 28.0, 49.0, 102.0, 198.0, 280.0, 137.0, 74.0, 56.0, 18.0, 10.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.534957408905029, -5.3976263999938965, -5.260295867919922, -5.122964859008789, -4.985633850097656, -4.848302841186523, -4.710972309112549, -4.573641300201416, -4.436310768127441, -4.298979759216309, -4.161649227142334, -4.024318218231201, -3.8869872093200684, -3.7496564388275146, -3.612325668334961, -3.474994659423828, -3.3376636505126953, -3.2003328800201416, -3.063001871109009, -2.925671100616455, -2.7883400917053223, -2.6510093212127686, -2.513678550720215, -2.376347541809082, -2.2390167713165283, -2.1016860008239746, -1.9643549919128418, -1.827024221420288, -1.6896933317184448, -1.5523624420166016, -1.4150316715240479, -1.2777007818222046, -1.1403703689575195, -1.0030394792556763, -0.8657086491584778, -0.7283778190612793, -0.591046929359436, -0.4537160396575928, -0.3163852095603943, -0.1790543794631958, -0.04172348976135254, 0.09560737013816833, 0.2329382300376892, 0.3702690899372101, 0.507599949836731, 0.6449308395385742, 0.7822616696357727, 0.9195924997329712, 1.0569233894348145, 1.1942542791366577, 1.331585168838501, 1.4689159393310547, 1.606246829032898, 1.7435777187347412, 1.880908489227295, 2.0182394981384277, 2.1555702686309814, 2.292901039123535, 2.430232048034668, 2.5675628185272217, 2.7048935890197754, 2.842224597930908, 2.979555368423462, 3.1168861389160156, 3.2542171478271484]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 2.0, 5.0, 4.0, 7.0, 8.0, 7.0, 9.0, 12.0, 13.0, 15.0, 22.0, 19.0, 12.0, 13.0, 23.0, 19.0, 24.0, 35.0, 27.0, 27.0, 30.0, 46.0, 56.0, 47.0, 51.0, 57.0, 47.0, 42.0, 34.0, 34.0, 28.0, 29.0, 29.0, 19.0, 27.0, 20.0, 15.0, 18.0, 11.0, 6.0, 10.0, 12.0, 6.0, 7.0, 5.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5275356769561768, -1.4823319911956787, -1.4371283054351807, -1.3919246196746826, -1.346720814704895, -1.301517128944397, -1.256313443183899, -1.2111097574234009, -1.1659060716629028, -1.1207023859024048, -1.0754987001419067, -1.0302948951721191, -0.9850912690162659, -0.939887523651123, -0.894683837890625, -0.849480152130127, -0.8042764067649841, -0.7590727210044861, -0.7138689756393433, -0.6686652898788452, -0.6234616041183472, -0.5782579183578491, -0.5330541729927063, -0.48785048723220825, -0.4426467716693878, -0.3974430561065674, -0.35223937034606934, -0.3070356547832489, -0.26183193922042847, -0.21662825345993042, -0.17142453789710999, -0.12622085213661194, -0.0810171365737915, -0.035813432186841965, 0.009390272200107574, 0.05459398031234741, 0.09979768097400665, 0.1450013816356659, 0.19020509719848633, 0.23540878295898438, 0.2806124985218048, 0.32581621408462524, 0.3710198998451233, 0.4162236154079437, 0.46142733097076416, 0.5066310167312622, 0.5518347024917603, 0.5970383882522583, 0.6422421336174011, 0.6874458193778992, 0.732649564743042, 0.77785325050354, 0.8230569362640381, 0.8682606220245361, 0.913464367389679, 0.958668053150177, 1.0038717985153198, 1.0490754842758179, 1.094279170036316, 1.1394829750061035, 1.1846866607666016, 1.2298903465270996, 1.2750940322875977, 1.3202977180480957, 1.3655014038085938]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 12.0, 17.0, 21.0, 32.0, 57.0, 84.0, 101.0, 166.0, 446.0, 2981.0, 217765.0, 3963469.0, 7893.0, 676.0, 197.0, 107.0, 62.0, 41.0, 45.0, 28.0, 23.0, 13.0, 14.0, 9.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90576171875, -0.8711318969726562, -0.8365020751953125, -0.8018722534179688, -0.767242431640625, -0.7326126098632812, -0.6979827880859375, -0.6633529663085938, -0.62872314453125, -0.5940933227539062, -0.5594635009765625, -0.5248336791992188, -0.490203857421875, -0.45557403564453125, -0.4209442138671875, -0.38631439208984375, -0.3516845703125, -0.31705474853515625, -0.2824249267578125, -0.24779510498046875, -0.213165283203125, -0.17853546142578125, -0.1439056396484375, -0.10927581787109375, -0.07464599609375, -0.04001617431640625, -0.0053863525390625, 0.02924346923828125, 0.063873291015625, 0.09850311279296875, 0.1331329345703125, 0.16776275634765625, 0.202392578125, 0.23702239990234375, 0.2716522216796875, 0.30628204345703125, 0.340911865234375, 0.37554168701171875, 0.4101715087890625, 0.44480133056640625, 0.47943115234375, 0.5140609741210938, 0.5486907958984375, 0.5833206176757812, 0.617950439453125, 0.6525802612304688, 0.6872100830078125, 0.7218399047851562, 0.7564697265625, 0.7910995483398438, 0.8257293701171875, 0.8603591918945312, 0.894989013671875, 0.9296188354492188, 0.9642486572265625, 0.9988784790039062, 1.03350830078125, 1.0681381225585938, 1.1027679443359375, 1.1373977661132812, 1.172027587890625, 1.2066574096679688, 1.2412872314453125, 1.2759170532226562, 1.310546875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 7.0, 8.0, 10.0, 12.0, 14.0, 27.0, 31.0, 36.0, 63.0, 70.0, 74.0, 58.0, 98.0, 68.0, 79.0, 74.0, 46.0, 53.0, 43.0, 39.0, 26.0, 25.0, 12.0, 18.0, 5.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.135986328125, -0.13185882568359375, -0.1277313232421875, -0.12360382080078125, -0.119476318359375, -0.11534881591796875, -0.1112213134765625, -0.10709381103515625, -0.10296630859375, -0.09883880615234375, -0.0947113037109375, -0.09058380126953125, -0.086456298828125, -0.08232879638671875, -0.0782012939453125, -0.07407379150390625, -0.0699462890625, -0.06581878662109375, -0.0616912841796875, -0.05756378173828125, -0.053436279296875, -0.04930877685546875, -0.0451812744140625, -0.04105377197265625, -0.03692626953125, -0.03279876708984375, -0.0286712646484375, -0.02454376220703125, -0.020416259765625, -0.01628875732421875, -0.0121612548828125, -0.00803375244140625, -0.00390625, 0.00022125244140625, 0.0043487548828125, 0.00847625732421875, 0.012603759765625, 0.01673126220703125, 0.0208587646484375, 0.02498626708984375, 0.02911376953125, 0.03324127197265625, 0.0373687744140625, 0.04149627685546875, 0.045623779296875, 0.04975128173828125, 0.0538787841796875, 0.05800628662109375, 0.0621337890625, 0.06626129150390625, 0.0703887939453125, 0.07451629638671875, 0.078643798828125, 0.08277130126953125, 0.0868988037109375, 0.09102630615234375, 0.09515380859375, 0.09928131103515625, 0.1034088134765625, 0.10753631591796875, 0.111663818359375, 0.11579132080078125, 0.1199188232421875, 0.12404632568359375, 0.128173828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 10.0, 17.0, 18.0, 25.0, 44.0, 63.0, 150.0, 265.0, 653.0, 1794.0, 6242.0, 36591.0, 2873162.0, 1238624.0, 28697.0, 5267.0, 1592.0, 509.0, 226.0, 132.0, 57.0, 44.0, 18.0, 21.0, 11.0, 13.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.60302734375, -0.5847244262695312, -0.5664215087890625, -0.5481185913085938, -0.529815673828125, -0.5115127563476562, -0.4932098388671875, -0.47490692138671875, -0.45660400390625, -0.43830108642578125, -0.4199981689453125, -0.40169525146484375, -0.383392333984375, -0.36508941650390625, -0.3467864990234375, -0.32848358154296875, -0.3101806640625, -0.29187774658203125, -0.2735748291015625, -0.25527191162109375, -0.236968994140625, -0.21866607666015625, -0.2003631591796875, -0.18206024169921875, -0.16375732421875, -0.14545440673828125, -0.1271514892578125, -0.10884857177734375, -0.090545654296875, -0.07224273681640625, -0.0539398193359375, -0.03563690185546875, -0.017333984375, 0.00096893310546875, 0.0192718505859375, 0.03757476806640625, 0.055877685546875, 0.07418060302734375, 0.0924835205078125, 0.11078643798828125, 0.12908935546875, 0.14739227294921875, 0.1656951904296875, 0.18399810791015625, 0.202301025390625, 0.22060394287109375, 0.2389068603515625, 0.25720977783203125, 0.2755126953125, 0.29381561279296875, 0.3121185302734375, 0.33042144775390625, 0.348724365234375, 0.36702728271484375, 0.3853302001953125, 0.40363311767578125, 0.42193603515625, 0.44023895263671875, 0.4585418701171875, 0.47684478759765625, 0.495147705078125, 0.5134506225585938, 0.5317535400390625, 0.5500564575195312, 0.568359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 6.0, 5.0, 2.0, 9.0, 14.0, 14.0, 18.0, 22.0, 35.0, 68.0, 95.0, 149.0, 401.0, 1052.0, 1288.0, 430.0, 206.0, 97.0, 45.0, 40.0, 20.0, 20.0, 12.0, 4.0, 5.0, 4.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.461669921875, -0.4488868713378906, -0.43610382080078125, -0.4233207702636719, -0.4105377197265625, -0.3977546691894531, -0.38497161865234375, -0.3721885681152344, -0.359405517578125, -0.3466224670410156, -0.33383941650390625, -0.3210563659667969, -0.3082733154296875, -0.2954902648925781, -0.28270721435546875, -0.2699241638183594, -0.25714111328125, -0.24435806274414062, -0.23157501220703125, -0.21879196166992188, -0.2060089111328125, -0.19322586059570312, -0.18044281005859375, -0.16765975952148438, -0.154876708984375, -0.14209365844726562, -0.12931060791015625, -0.11652755737304688, -0.1037445068359375, -0.09096145629882812, -0.07817840576171875, -0.06539535522460938, -0.0526123046875, -0.039829254150390625, -0.02704620361328125, -0.014263153076171875, -0.0014801025390625, 0.011302947998046875, 0.02408599853515625, 0.036869049072265625, 0.049652099609375, 0.062435150146484375, 0.07521820068359375, 0.08800125122070312, 0.1007843017578125, 0.11356735229492188, 0.12635040283203125, 0.13913345336914062, 0.15191650390625, 0.16469955444335938, 0.17748260498046875, 0.19026565551757812, 0.2030487060546875, 0.21583175659179688, 0.22861480712890625, 0.24139785766601562, 0.254180908203125, 0.2669639587402344, 0.27974700927734375, 0.2925300598144531, 0.3053131103515625, 0.3180961608886719, 0.33087921142578125, 0.3436622619628906, 0.3564453125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 19.0, 33.0, 64.0, 142.0, 256.0, 266.0, 123.0, 51.0, 23.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.30051326751709, -6.150554656982422, -6.000596523284912, -5.850637912750244, -5.700679779052734, -5.550721168518066, -5.400762557983398, -5.250804424285889, -5.100845813751221, -4.950887203216553, -4.800929069519043, -4.650970458984375, -4.501012325286865, -4.351053714752197, -4.2010955810546875, -4.0511369705200195, -3.9011785984039307, -3.751220226287842, -3.601261854171753, -3.451303482055664, -3.301344871520996, -3.1513864994049072, -3.0014281272888184, -2.8514695167541504, -2.7015113830566406, -2.5515530109405518, -2.401594638824463, -2.251636028289795, -2.101677656173706, -1.9517192840576172, -1.8017609119415283, -1.65180242061615, -1.5018439292907715, -1.3518855571746826, -1.2019270658493042, -1.0519686937332153, -0.9020102620124817, -0.752051830291748, -0.6020934581756592, -0.45213496685028076, -0.3021765947341919, -0.15221817791461945, -0.002259761095046997, 0.14769864082336426, 0.2976570725440979, 0.44761550426483154, 0.5975738763809204, 0.7475323677062988, 0.8974907398223877, 1.0474491119384766, 1.197407603263855, 1.3473659753799438, 1.4973244667053223, 1.6472828388214111, 1.7972412109375, 1.9471997022628784, 2.0971579551696777, 2.2471163272857666, 2.3970746994018555, 2.5470333099365234, 2.6969916820526123, 2.846950054168701, 2.99690842628479, 3.146866798400879, 3.296825408935547]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 4.0, 7.0, 9.0, 9.0, 19.0, 9.0, 26.0, 20.0, 29.0, 26.0, 26.0, 46.0, 45.0, 46.0, 52.0, 45.0, 55.0, 44.0, 48.0, 46.0, 48.0, 50.0, 52.0, 40.0, 36.0, 27.0, 29.0, 21.0, 18.0, 20.0, 8.0, 12.0, 8.0, 4.0, 5.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2660889625549316, -1.2179960012435913, -1.1699029207229614, -1.121809959411621, -1.0737169981002808, -1.0256239175796509, -0.9775309562683105, -0.9294379353523254, -0.8813449144363403, -0.8332518935203552, -0.7851589322090149, -0.7370659112930298, -0.6889728903770447, -0.6408798694610596, -0.5927869081497192, -0.5446938872337341, -0.4966009259223938, -0.4485079348087311, -0.40041491389274597, -0.35232192277908325, -0.30422890186309814, -0.2561359107494354, -0.2080429196357727, -0.1599498987197876, -0.11185690760612488, -0.06376390159130096, -0.015670903027057648, 0.03242209553718567, 0.08051510155200958, 0.1286081075668335, 0.17670109868049622, 0.22479411959648132, 0.27288711071014404, 0.32098010182380676, 0.36907312273979187, 0.4171661138534546, 0.4652591347694397, 0.5133521556854248, 0.5614451169967651, 0.6095381379127502, 0.6576311588287354, 0.7057241797447205, 0.7538171410560608, 0.8019101619720459, 0.850003182888031, 0.8980962038040161, 0.9461891651153564, 0.9942821860313416, 1.042375087738037, 1.0904680490493774, 1.1385611295700073, 1.1866540908813477, 1.234747052192688, 1.2828401327133179, 1.3309330940246582, 1.379026174545288, 1.4271191358566284, 1.4752120971679688, 1.5233051776885986, 1.571398138999939, 1.6194911003112793, 1.6675841808319092, 1.7156771421432495, 1.7637701034545898, 1.8118631839752197]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 24.0, 33.0, 42.0, 86.0, 155.0, 295.0, 500.0, 1122.0, 2892.0, 8076.0, 26420.0, 109310.0, 425304.0, 357406.0, 84147.0, 21561.0, 6562.0, 2477.0, 1041.0, 527.0, 233.0, 136.0, 81.0, 46.0, 24.0, 19.0, 7.0, 4.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.360595703125, -0.350555419921875, -0.34051513671875, -0.330474853515625, -0.3204345703125, -0.310394287109375, -0.30035400390625, -0.290313720703125, -0.2802734375, -0.270233154296875, -0.26019287109375, -0.250152587890625, -0.2401123046875, -0.230072021484375, -0.22003173828125, -0.209991455078125, -0.199951171875, -0.189910888671875, -0.17987060546875, -0.169830322265625, -0.1597900390625, -0.149749755859375, -0.13970947265625, -0.129669189453125, -0.11962890625, -0.109588623046875, -0.09954833984375, -0.089508056640625, -0.0794677734375, -0.069427490234375, -0.05938720703125, -0.049346923828125, -0.039306640625, -0.029266357421875, -0.01922607421875, -0.009185791015625, 0.0008544921875, 0.010894775390625, 0.02093505859375, 0.030975341796875, 0.041015625, 0.051055908203125, 0.06109619140625, 0.071136474609375, 0.0811767578125, 0.091217041015625, 0.10125732421875, 0.111297607421875, 0.121337890625, 0.131378173828125, 0.14141845703125, 0.151458740234375, 0.1614990234375, 0.171539306640625, 0.18157958984375, 0.191619873046875, 0.20166015625, 0.211700439453125, 0.22174072265625, 0.231781005859375, 0.2418212890625, 0.251861572265625, 0.26190185546875, 0.271942138671875, 0.281982421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 9.0, 11.0, 23.0, 31.0, 28.0, 35.0, 47.0, 58.0, 68.0, 63.0, 62.0, 70.0, 51.0, 74.0, 73.0, 53.0, 59.0, 43.0, 33.0, 18.0, 29.0, 12.0, 16.0, 8.0, 8.0, 3.0, 4.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1427001953125, -0.13846397399902344, -0.13422775268554688, -0.1299915313720703, -0.12575531005859375, -0.12151908874511719, -0.11728286743164062, -0.11304664611816406, -0.1088104248046875, -0.10457420349121094, -0.10033798217773438, -0.09610176086425781, -0.09186553955078125, -0.08762931823730469, -0.08339309692382812, -0.07915687561035156, -0.074920654296875, -0.07068443298339844, -0.06644821166992188, -0.06221199035644531, -0.05797576904296875, -0.05373954772949219, -0.049503326416015625, -0.04526710510253906, -0.0410308837890625, -0.03679466247558594, -0.032558441162109375, -0.028322219848632812, -0.02408599853515625, -0.019849777221679688, -0.015613555908203125, -0.011377334594726562, -0.00714111328125, -0.0029048919677734375, 0.001331329345703125, 0.0055675506591796875, 0.00980377197265625, 0.014039993286132812, 0.018276214599609375, 0.022512435913085938, 0.0267486572265625, 0.030984878540039062, 0.035221099853515625, 0.03945732116699219, 0.04369354248046875, 0.04792976379394531, 0.052165985107421875, 0.05640220642089844, 0.060638427734375, 0.06487464904785156, 0.06911087036132812, 0.07334709167480469, 0.07758331298828125, 0.08181953430175781, 0.08605575561523438, 0.09029197692871094, 0.0945281982421875, 0.09876441955566406, 0.10300064086914062, 0.10723686218261719, 0.11147308349609375, 0.11570930480957031, 0.11994552612304688, 0.12418174743652344, 0.12841796875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 9.0, 21.0, 11.0, 23.0, 42.0, 62.0, 77.0, 108.0, 163.0, 277.0, 454.0, 780.0, 1577.0, 3703.0, 10071.0, 34432.0, 151426.0, 651223.0, 144324.0, 32702.0, 9793.0, 3578.0, 1599.0, 799.0, 447.0, 290.0, 192.0, 117.0, 67.0, 57.0, 31.0, 24.0, 19.0, 10.0, 9.0, 8.0, 2.0, 6.0, 1.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3642578125, -0.3536949157714844, -0.34313201904296875, -0.3325691223144531, -0.3220062255859375, -0.3114433288574219, -0.30088043212890625, -0.2903175354003906, -0.279754638671875, -0.2691917419433594, -0.25862884521484375, -0.24806594848632812, -0.2375030517578125, -0.22694015502929688, -0.21637725830078125, -0.20581436157226562, -0.19525146484375, -0.18468856811523438, -0.17412567138671875, -0.16356277465820312, -0.1529998779296875, -0.14243698120117188, -0.13187408447265625, -0.12131118774414062, -0.110748291015625, -0.10018539428710938, -0.08962249755859375, -0.07905960083007812, -0.0684967041015625, -0.057933807373046875, -0.04737091064453125, -0.036808013916015625, -0.0262451171875, -0.015682220458984375, -0.00511932373046875, 0.005443572998046875, 0.0160064697265625, 0.026569366455078125, 0.03713226318359375, 0.047695159912109375, 0.058258056640625, 0.06882095336914062, 0.07938385009765625, 0.08994674682617188, 0.1005096435546875, 0.11107254028320312, 0.12163543701171875, 0.13219833374023438, 0.14276123046875, 0.15332412719726562, 0.16388702392578125, 0.17444992065429688, 0.1850128173828125, 0.19557571411132812, 0.20613861083984375, 0.21670150756835938, 0.227264404296875, 0.23782730102539062, 0.24839019775390625, 0.2589530944824219, 0.2695159912109375, 0.2800788879394531, 0.29064178466796875, 0.3012046813964844, 0.311767578125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 8.0, 13.0, 10.0, 3.0, 16.0, 21.0, 27.0, 27.0, 35.0, 47.0, 57.0, 65.0, 62.0, 75.0, 82.0, 73.0, 72.0, 56.0, 49.0, 44.0, 40.0, 25.0, 26.0, 16.0, 15.0, 12.0, 6.0, 2.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5625, -0.5445785522460938, -0.5266571044921875, -0.5087356567382812, -0.490814208984375, -0.47289276123046875, -0.4549713134765625, -0.43704986572265625, -0.41912841796875, -0.40120697021484375, -0.3832855224609375, -0.36536407470703125, -0.347442626953125, -0.32952117919921875, -0.3115997314453125, -0.29367828369140625, -0.2757568359375, -0.25783538818359375, -0.2399139404296875, -0.22199249267578125, -0.204071044921875, -0.18614959716796875, -0.1682281494140625, -0.15030670166015625, -0.13238525390625, -0.11446380615234375, -0.0965423583984375, -0.07862091064453125, -0.060699462890625, -0.04277801513671875, -0.0248565673828125, -0.00693511962890625, 0.010986328125, 0.02890777587890625, 0.0468292236328125, 0.06475067138671875, 0.082672119140625, 0.10059356689453125, 0.1185150146484375, 0.13643646240234375, 0.15435791015625, 0.17227935791015625, 0.1902008056640625, 0.20812225341796875, 0.226043701171875, 0.24396514892578125, 0.2618865966796875, 0.27980804443359375, 0.2977294921875, 0.31565093994140625, 0.3335723876953125, 0.35149383544921875, 0.369415283203125, 0.38733673095703125, 0.4052581787109375, 0.42317962646484375, 0.44110107421875, 0.45902252197265625, 0.4769439697265625, 0.49486541748046875, 0.512786865234375, 0.5307083129882812, 0.5486297607421875, 0.5665512084960938, 0.58447265625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 10.0, 2.0, 2.0, 3.0, 10.0, 13.0, 20.0, 25.0, 47.0, 63.0, 85.0, 136.0, 216.0, 391.0, 670.0, 1350.0, 2664.0, 6204.0, 16216.0, 48742.0, 207956.0, 631815.0, 88175.0, 26234.0, 9577.0, 3962.0, 1810.0, 871.0, 477.0, 296.0, 175.0, 122.0, 63.0, 48.0, 29.0, 30.0, 18.0, 12.0, 8.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.114013671875, -0.11011314392089844, -0.10621261596679688, -0.10231208801269531, -0.09841156005859375, -0.09451103210449219, -0.09061050415039062, -0.08670997619628906, -0.0828094482421875, -0.07890892028808594, -0.07500839233398438, -0.07110786437988281, -0.06720733642578125, -0.06330680847167969, -0.059406280517578125, -0.05550575256347656, -0.051605224609375, -0.04770469665527344, -0.043804168701171875, -0.03990364074707031, -0.03600311279296875, -0.03210258483886719, -0.028202056884765625, -0.024301528930664062, -0.0204010009765625, -0.016500473022460938, -0.012599945068359375, -0.008699417114257812, -0.00479888916015625, -0.0008983612060546875, 0.003002166748046875, 0.0069026947021484375, 0.01080322265625, 0.014703750610351562, 0.018604278564453125, 0.022504806518554688, 0.02640533447265625, 0.030305862426757812, 0.034206390380859375, 0.03810691833496094, 0.0420074462890625, 0.04590797424316406, 0.049808502197265625, 0.05370903015136719, 0.05760955810546875, 0.06151008605957031, 0.06541061401367188, 0.06931114196777344, 0.073211669921875, 0.07711219787597656, 0.08101272583007812, 0.08491325378417969, 0.08881378173828125, 0.09271430969238281, 0.09661483764648438, 0.10051536560058594, 0.1044158935546875, 0.10831642150878906, 0.11221694946289062, 0.11611747741699219, 0.12001800537109375, 0.12391853332519531, 0.12781906127929688, 0.13171958923339844, 0.1356201171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 5.0, 3.0, 5.0, 9.0, 8.0, 8.0, 22.0, 16.0, 30.0, 35.0, 65.0, 74.0, 84.0, 130.0, 146.0, 110.0, 61.0, 33.0, 47.0, 23.0, 20.0, 15.0, 20.0, 7.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5239925384521484e-05, -4.3684616684913635e-05, -4.2129307985305786e-05, -4.057399928569794e-05, -3.901869058609009e-05, -3.746338188648224e-05, -3.590807318687439e-05, -3.435276448726654e-05, -3.279745578765869e-05, -3.124214708805084e-05, -2.9686838388442993e-05, -2.8131529688835144e-05, -2.6576220989227295e-05, -2.5020912289619446e-05, -2.3465603590011597e-05, -2.1910294890403748e-05, -2.03549861907959e-05, -1.879967749118805e-05, -1.72443687915802e-05, -1.568906009197235e-05, -1.4133751392364502e-05, -1.2578442692756653e-05, -1.1023133993148804e-05, -9.467825293540955e-06, -7.912516593933105e-06, -6.357207894325256e-06, -4.801899194717407e-06, -3.246590495109558e-06, -1.691281795501709e-06, -1.3597309589385986e-07, 1.4193356037139893e-06, 2.9746443033218384e-06, 4.5299530029296875e-06, 6.085261702537537e-06, 7.640570402145386e-06, 9.195879101753235e-06, 1.0751187801361084e-05, 1.2306496500968933e-05, 1.3861805200576782e-05, 1.541711390018463e-05, 1.697242259979248e-05, 1.852773129940033e-05, 2.008303999900818e-05, 2.1638348698616028e-05, 2.3193657398223877e-05, 2.4748966097831726e-05, 2.6304274797439575e-05, 2.7859583497047424e-05, 2.9414892196655273e-05, 3.097020089626312e-05, 3.252550959587097e-05, 3.408081829547882e-05, 3.563612699508667e-05, 3.719143569469452e-05, 3.874674439430237e-05, 4.030205309391022e-05, 4.1857361793518066e-05, 4.3412670493125916e-05, 4.4967979192733765e-05, 4.6523287892341614e-05, 4.807859659194946e-05, 4.963390529155731e-05, 5.118921399116516e-05, 5.274452269077301e-05, 5.429983139038086e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 5.0, 8.0, 10.0, 10.0, 8.0, 17.0, 17.0, 33.0, 55.0, 70.0, 107.0, 152.0, 238.0, 379.0, 629.0, 1054.0, 1975.0, 3905.0, 8366.0, 20293.0, 59538.0, 259834.0, 566791.0, 78895.0, 25862.0, 10285.0, 4619.0, 2270.0, 1278.0, 680.0, 392.0, 264.0, 154.0, 124.0, 64.0, 54.0, 35.0, 20.0, 24.0, 17.0, 7.0, 5.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.12164306640625, -0.11773395538330078, -0.11382484436035156, -0.10991573333740234, -0.10600662231445312, -0.1020975112915039, -0.09818840026855469, -0.09427928924560547, -0.09037017822265625, -0.08646106719970703, -0.08255195617675781, -0.0786428451538086, -0.07473373413085938, -0.07082462310791016, -0.06691551208496094, -0.06300640106201172, -0.0590972900390625, -0.05518817901611328, -0.05127906799316406, -0.047369956970214844, -0.043460845947265625, -0.039551734924316406, -0.03564262390136719, -0.03173351287841797, -0.02782440185546875, -0.02391529083251953, -0.020006179809570312, -0.016097068786621094, -0.012187957763671875, -0.008278846740722656, -0.0043697357177734375, -0.00046062469482421875, 0.003448486328125, 0.007357597351074219, 0.011266708374023438, 0.015175819396972656, 0.019084930419921875, 0.022994041442871094, 0.026903152465820312, 0.03081226348876953, 0.03472137451171875, 0.03863048553466797, 0.04253959655761719, 0.046448707580566406, 0.050357818603515625, 0.054266929626464844, 0.05817604064941406, 0.06208515167236328, 0.0659942626953125, 0.06990337371826172, 0.07381248474121094, 0.07772159576416016, 0.08163070678710938, 0.0855398178100586, 0.08944892883300781, 0.09335803985595703, 0.09726715087890625, 0.10117626190185547, 0.10508537292480469, 0.1089944839477539, 0.11290359497070312, 0.11681270599365234, 0.12072181701660156, 0.12463092803955078, 0.1285400390625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 8.0, 7.0, 8.0, 14.0, 8.0, 22.0, 20.0, 27.0, 46.0, 56.0, 97.0, 117.0, 190.0, 107.0, 79.0, 56.0, 29.0, 30.0, 14.0, 14.0, 12.0, 12.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.231201171875, -0.22546768188476562, -0.21973419189453125, -0.21400070190429688, -0.2082672119140625, -0.20253372192382812, -0.19680023193359375, -0.19106674194335938, -0.185333251953125, -0.17959976196289062, -0.17386627197265625, -0.16813278198242188, -0.1623992919921875, -0.15666580200195312, -0.15093231201171875, -0.14519882202148438, -0.13946533203125, -0.13373184204101562, -0.12799835205078125, -0.12226486206054688, -0.1165313720703125, -0.11079788208007812, -0.10506439208984375, -0.09933090209960938, -0.093597412109375, -0.08786392211914062, -0.08213043212890625, -0.07639694213867188, -0.0706634521484375, -0.06492996215820312, -0.05919647216796875, -0.053462982177734375, -0.0477294921875, -0.041996002197265625, -0.03626251220703125, -0.030529022216796875, -0.0247955322265625, -0.019062042236328125, -0.01332855224609375, -0.007595062255859375, -0.001861572265625, 0.003871917724609375, 0.00960540771484375, 0.015338897705078125, 0.0210723876953125, 0.026805877685546875, 0.03253936767578125, 0.038272857666015625, 0.04400634765625, 0.049739837646484375, 0.05547332763671875, 0.061206817626953125, 0.0669403076171875, 0.07267379760742188, 0.07840728759765625, 0.08414077758789062, 0.089874267578125, 0.09560775756835938, 0.10134124755859375, 0.10707473754882812, 0.1128082275390625, 0.11854171752929688, 0.12427520751953125, 0.13000869750976562, 0.1357421875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 6.0, 13.0, 8.0, 29.0, 38.0, 77.0, 137.0, 218.0, 177.0, 127.0, 62.0, 38.0, 27.0, 21.0, 6.0, 3.0, 2.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8909107446670532, -1.7903063297271729, -1.6897019147872925, -1.589097499847412, -1.4884930849075317, -1.3878886699676514, -1.2872843742370605, -1.1866798400878906, -1.0860755443572998, -0.9854711294174194, -0.8848667144775391, -0.7842622995376587, -0.6836578845977783, -0.5830535292625427, -0.48244911432266235, -0.381844699382782, -0.28124022483825684, -0.18063580989837646, -0.08003140985965729, 0.02057299017906189, 0.12117740511894226, 0.22178179025650024, 0.3223862051963806, 0.422990620136261, 0.5235950350761414, 0.6241994500160217, 0.7248038649559021, 0.8254082202911377, 0.9260126352310181, 1.0266170501708984, 1.1272214651107788, 1.2278258800506592, 1.328430414199829, 1.4290348291397095, 1.5296392440795898, 1.6302436590194702, 1.7308480739593506, 1.8314523696899414, 1.9320569038391113, 2.032661199569702, 2.133265733718872, 2.233870029449463, 2.334474563598633, 2.4350788593292236, 2.5356833934783936, 2.6362876892089844, 2.7368922233581543, 2.837496519088745, 2.938100814819336, 3.0387051105499268, 3.1393096446990967, 3.2399139404296875, 3.3405184745788574, 3.4411227703094482, 3.541727304458618, 3.642331600189209, 3.742936134338379, 3.8435404300689697, 3.9441449642181396, 4.0447492599487305, 4.1453537940979, 4.24595832824707, 4.346562385559082, 4.447166919708252, 4.547771453857422]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 3.0, 2.0, 7.0, 8.0, 6.0, 3.0, 6.0, 12.0, 14.0, 13.0, 20.0, 14.0, 30.0, 17.0, 31.0, 26.0, 34.0, 40.0, 40.0, 55.0, 64.0, 72.0, 71.0, 47.0, 47.0, 33.0, 23.0, 25.0, 32.0, 20.0, 19.0, 30.0, 20.0, 20.0, 14.0, 13.0, 13.0, 8.0, 9.0, 9.0, 7.0, 8.0, 7.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.7454392910003662, -1.6966986656188965, -1.6479579210281372, -1.5992172956466675, -1.5504765510559082, -1.5017359256744385, -1.4529953002929688, -1.4042545557022095, -1.3555139303207397, -1.30677330493927, -1.2580325603485107, -1.209291934967041, -1.1605511903762817, -1.111810564994812, -1.0630698204040527, -1.014329195022583, -0.9655885100364685, -0.916847825050354, -0.8681071400642395, -0.819366455078125, -0.7706258296966553, -0.7218851447105408, -0.6731444597244263, -0.6244038343429565, -0.5756630897521973, -0.5269224047660828, -0.47818174958229065, -0.42944106459617615, -0.38070040941238403, -0.33195972442626953, -0.28321903944015503, -0.23447838425636292, -0.1857377290725708, -0.1369970589876175, -0.08825638145208359, -0.03951570391654968, 0.009224966168403625, 0.057965636253356934, 0.10670632123947144, 0.15544697642326355, 0.20418766140937805, 0.25292834639549255, 0.30166900157928467, 0.35040968656539917, 0.39915037155151367, 0.4478910267353058, 0.4966317117214203, 0.5453723669052124, 0.5941130518913269, 0.6428537368774414, 0.6915944218635559, 0.7403351068496704, 0.7890757322311401, 0.8378164172172546, 0.8865571022033691, 0.9352977275848389, 0.9840384721755981, 1.0327790975570679, 1.0815198421478271, 1.1302604675292969, 1.1790012121200562, 1.2277418375015259, 1.2764825820922852, 1.3252232074737549, 1.3739638328552246]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 13.0, 13.0, 22.0, 38.0, 61.0, 108.0, 177.0, 310.0, 628.0, 1551.0, 4382.0, 16977.0, 129775.0, 3754935.0, 252899.0, 23202.0, 5719.0, 1835.0, 763.0, 363.0, 195.0, 110.0, 62.0, 46.0, 27.0, 22.0, 13.0, 10.0, 9.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.351806640625, -0.3385810852050781, -0.32535552978515625, -0.3121299743652344, -0.2989044189453125, -0.2856788635253906, -0.27245330810546875, -0.2592277526855469, -0.246002197265625, -0.23277664184570312, -0.21955108642578125, -0.20632553100585938, -0.1930999755859375, -0.17987442016601562, -0.16664886474609375, -0.15342330932617188, -0.14019775390625, -0.12697219848632812, -0.11374664306640625, -0.10052108764648438, -0.0872955322265625, -0.07406997680664062, -0.06084442138671875, -0.047618865966796875, -0.034393310546875, -0.021167755126953125, -0.00794219970703125, 0.005283355712890625, 0.0185089111328125, 0.031734466552734375, 0.04496002197265625, 0.058185577392578125, 0.0714111328125, 0.08463668823242188, 0.09786224365234375, 0.11108779907226562, 0.1243133544921875, 0.13753890991210938, 0.15076446533203125, 0.16399002075195312, 0.177215576171875, 0.19044113159179688, 0.20366668701171875, 0.21689224243164062, 0.2301177978515625, 0.24334335327148438, 0.25656890869140625, 0.2697944641113281, 0.28302001953125, 0.2962455749511719, 0.30947113037109375, 0.3226966857910156, 0.3359222412109375, 0.3491477966308594, 0.36237335205078125, 0.3755989074707031, 0.388824462890625, 0.4020500183105469, 0.41527557373046875, 0.4285011291503906, 0.4417266845703125, 0.4549522399902344, 0.46817779541015625, 0.4814033508300781, 0.49462890625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 6.0, 4.0, 2.0, 6.0, 13.0, 13.0, 22.0, 25.0, 33.0, 37.0, 51.0, 67.0, 65.0, 64.0, 68.0, 60.0, 71.0, 77.0, 61.0, 52.0, 65.0, 36.0, 31.0, 21.0, 20.0, 9.0, 7.0, 11.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1429443359375, -0.1386566162109375, -0.134368896484375, -0.1300811767578125, -0.12579345703125, -0.1215057373046875, -0.117218017578125, -0.1129302978515625, -0.108642578125, -0.1043548583984375, -0.100067138671875, -0.0957794189453125, -0.09149169921875, -0.0872039794921875, -0.082916259765625, -0.0786285400390625, -0.0743408203125, -0.0700531005859375, -0.065765380859375, -0.0614776611328125, -0.05718994140625, -0.0529022216796875, -0.048614501953125, -0.0443267822265625, -0.0400390625, -0.0357513427734375, -0.031463623046875, -0.0271759033203125, -0.02288818359375, -0.0186004638671875, -0.014312744140625, -0.0100250244140625, -0.0057373046875, -0.0014495849609375, 0.002838134765625, 0.0071258544921875, 0.01141357421875, 0.0157012939453125, 0.019989013671875, 0.0242767333984375, 0.028564453125, 0.0328521728515625, 0.037139892578125, 0.0414276123046875, 0.04571533203125, 0.0500030517578125, 0.054290771484375, 0.0585784912109375, 0.0628662109375, 0.0671539306640625, 0.071441650390625, 0.0757293701171875, 0.08001708984375, 0.0843048095703125, 0.088592529296875, 0.0928802490234375, 0.09716796875, 0.1014556884765625, 0.105743408203125, 0.1100311279296875, 0.11431884765625, 0.1186065673828125, 0.122894287109375, 0.1271820068359375, 0.1314697265625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 11.0, 12.0, 11.0, 21.0, 34.0, 51.0, 79.0, 178.0, 416.0, 1043.0, 3638.0, 17990.0, 295150.0, 3799945.0, 64187.0, 8076.0, 2098.0, 719.0, 288.0, 139.0, 72.0, 42.0, 17.0, 19.0, 8.0, 8.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6181640625, -0.597747802734375, -0.57733154296875, -0.556915283203125, -0.5364990234375, -0.516082763671875, -0.49566650390625, -0.475250244140625, -0.454833984375, -0.434417724609375, -0.41400146484375, -0.393585205078125, -0.3731689453125, -0.352752685546875, -0.33233642578125, -0.311920166015625, -0.29150390625, -0.271087646484375, -0.25067138671875, -0.230255126953125, -0.2098388671875, -0.189422607421875, -0.16900634765625, -0.148590087890625, -0.128173828125, -0.107757568359375, -0.08734130859375, -0.066925048828125, -0.0465087890625, -0.026092529296875, -0.00567626953125, 0.014739990234375, 0.03515625, 0.055572509765625, 0.07598876953125, 0.096405029296875, 0.1168212890625, 0.137237548828125, 0.15765380859375, 0.178070068359375, 0.198486328125, 0.218902587890625, 0.23931884765625, 0.259735107421875, 0.2801513671875, 0.300567626953125, 0.32098388671875, 0.341400146484375, 0.36181640625, 0.382232666015625, 0.40264892578125, 0.423065185546875, 0.4434814453125, 0.463897705078125, 0.48431396484375, 0.504730224609375, 0.525146484375, 0.545562744140625, 0.56597900390625, 0.586395263671875, 0.6068115234375, 0.627227783203125, 0.64764404296875, 0.668060302734375, 0.6884765625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 3.0, 2.0, 6.0, 1.0, 9.0, 8.0, 17.0, 24.0, 33.0, 34.0, 73.0, 89.0, 182.0, 408.0, 1162.0, 1114.0, 432.0, 198.0, 101.0, 42.0, 37.0, 28.0, 26.0, 9.0, 8.0, 7.0, 12.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.424072265625, -0.4094505310058594, -0.39482879638671875, -0.3802070617675781, -0.3655853271484375, -0.3509635925292969, -0.33634185791015625, -0.3217201232910156, -0.307098388671875, -0.2924766540527344, -0.27785491943359375, -0.2632331848144531, -0.2486114501953125, -0.23398971557617188, -0.21936798095703125, -0.20474624633789062, -0.19012451171875, -0.17550277709960938, -0.16088104248046875, -0.14625930786132812, -0.1316375732421875, -0.11701583862304688, -0.10239410400390625, -0.08777236938476562, -0.073150634765625, -0.058528900146484375, -0.04390716552734375, -0.029285430908203125, -0.0146636962890625, -4.1961669921875e-05, 0.01457977294921875, 0.029201507568359375, 0.0438232421875, 0.058444976806640625, 0.07306671142578125, 0.08768844604492188, 0.1023101806640625, 0.11693191528320312, 0.13155364990234375, 0.14617538452148438, 0.160797119140625, 0.17541885375976562, 0.19004058837890625, 0.20466232299804688, 0.2192840576171875, 0.23390579223632812, 0.24852752685546875, 0.2631492614746094, 0.27777099609375, 0.2923927307128906, 0.30701446533203125, 0.3216361999511719, 0.3362579345703125, 0.3508796691894531, 0.36550140380859375, 0.3801231384277344, 0.394744873046875, 0.4093666076660156, 0.42398834228515625, 0.4386100769042969, 0.4532318115234375, 0.4678535461425781, 0.48247528076171875, 0.4970970153808594, 0.51171875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 6.0, 7.0, 8.0, 18.0, 44.0, 73.0, 143.0, 235.0, 207.0, 130.0, 74.0, 27.0, 11.0, 7.0, 6.0, 7.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.619357585906982, -6.483953952789307, -6.348550796508789, -6.213147163391113, -6.0777435302734375, -5.94234037399292, -5.806936740875244, -5.671533107757568, -5.536129951477051, -5.400726318359375, -5.265323162078857, -5.129919528961182, -4.994515895843506, -4.859112739562988, -4.7237091064453125, -4.588305473327637, -4.452901840209961, -4.317498207092285, -4.182095050811768, -4.046691417694092, -3.911288022994995, -3.7758846282958984, -3.6404809951782227, -3.505077600479126, -3.3696742057800293, -3.2342708110809326, -3.098867177963257, -2.96346378326416, -2.8280603885650635, -2.692656993865967, -2.557253360748291, -2.4218499660491943, -2.2864463329315186, -2.151042938232422, -2.015639305114746, -1.8802359104156494, -1.7448325157165527, -1.6094290018081665, -1.4740254878997803, -1.3386220932006836, -1.2032185792922974, -1.0678150653839111, -0.9324116706848145, -0.7970081567764282, -0.6616047024726868, -0.5262012481689453, -0.3907977342605591, -0.2553942799568176, -0.11999082565307617, 0.015412643551826477, 0.15081611275672913, 0.28621959686279297, 0.4216230511665344, 0.5570265054702759, 0.6924300193786621, 0.8278334736824036, 0.963236927986145, 1.0986404418945312, 1.234043836593628, 1.3694473505020142, 1.5048508644104004, 1.640254259109497, 1.7756577730178833, 1.9110612869262695, 2.046464681625366]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 14.0, 14.0, 8.0, 11.0, 22.0, 18.0, 28.0, 21.0, 23.0, 35.0, 43.0, 42.0, 51.0, 58.0, 59.0, 48.0, 52.0, 45.0, 53.0, 43.0, 36.0, 36.0, 40.0, 27.0, 25.0, 26.0, 24.0, 14.0, 17.0, 10.0, 14.0, 11.0, 10.0, 3.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.8770756721496582, -1.8248622417449951, -1.7726486921310425, -1.7204352617263794, -1.6682217121124268, -1.6160082817077637, -1.5637948513031006, -1.5115814208984375, -1.4593678712844849, -1.4071544408798218, -1.3549408912658691, -1.302727460861206, -1.250514030456543, -1.1983004808425903, -1.1460870504379272, -1.0938735008239746, -1.0416600704193115, -0.9894465804100037, -0.9372330904006958, -0.8850196599960327, -0.8328061699867249, -0.780592679977417, -0.7283792495727539, -0.676165759563446, -0.6239522695541382, -0.5717387795448303, -0.5195252895355225, -0.4673118591308594, -0.4150983691215515, -0.36288487911224365, -0.3106714189052582, -0.2584579586982727, -0.20624446868896484, -0.15403099358081818, -0.10181751847267151, -0.04960404336452484, 0.002609431743621826, 0.05482292175292969, 0.10703638195991516, 0.15924984216690063, 0.2114633321762085, 0.26367682218551636, 0.31589028239250183, 0.3681037425994873, 0.42031723260879517, 0.472530722618103, 0.5247441530227661, 0.576957643032074, 0.6291711330413818, 0.6813846230506897, 0.7335981130599976, 0.7858115434646606, 0.8380250334739685, 0.8902385234832764, 0.9424519538879395, 0.9946654438972473, 1.0468789339065552, 1.0990923643112183, 1.151305913925171, 1.203519344329834, 1.255732774734497, 1.3079463243484497, 1.3601597547531128, 1.4123733043670654, 1.4645867347717285]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 5.0, 6.0, 19.0, 42.0, 34.0, 57.0, 101.0, 164.0, 279.0, 518.0, 1051.0, 2106.0, 4512.0, 10808.0, 28629.0, 86034.0, 278871.0, 408688.0, 149433.0, 47516.0, 16696.0, 6870.0, 3066.0, 1434.0, 681.0, 362.0, 238.0, 119.0, 89.0, 38.0, 34.0, 14.0, 13.0, 9.0, 7.0, 3.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.254638671875, -0.24528884887695312, -0.23593902587890625, -0.22658920288085938, -0.2172393798828125, -0.20788955688476562, -0.19853973388671875, -0.18918991088867188, -0.179840087890625, -0.17049026489257812, -0.16114044189453125, -0.15179061889648438, -0.1424407958984375, -0.13309097290039062, -0.12374114990234375, -0.11439132690429688, -0.10504150390625, -0.09569168090820312, -0.08634185791015625, -0.07699203491210938, -0.0676422119140625, -0.058292388916015625, -0.04894256591796875, -0.039592742919921875, -0.030242919921875, -0.020893096923828125, -0.01154327392578125, -0.002193450927734375, 0.0071563720703125, 0.016506195068359375, 0.02585601806640625, 0.035205841064453125, 0.0445556640625, 0.053905487060546875, 0.06325531005859375, 0.07260513305664062, 0.0819549560546875, 0.09130477905273438, 0.10065460205078125, 0.11000442504882812, 0.119354248046875, 0.12870407104492188, 0.13805389404296875, 0.14740371704101562, 0.1567535400390625, 0.16610336303710938, 0.17545318603515625, 0.18480300903320312, 0.19415283203125, 0.20350265502929688, 0.21285247802734375, 0.22220230102539062, 0.2315521240234375, 0.24090194702148438, 0.25025177001953125, 0.2596015930175781, 0.268951416015625, 0.2783012390136719, 0.28765106201171875, 0.2970008850097656, 0.3063507080078125, 0.3157005310058594, 0.32505035400390625, 0.3344001770019531, 0.34375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 7.0, 6.0, 11.0, 19.0, 22.0, 27.0, 30.0, 45.0, 48.0, 57.0, 70.0, 71.0, 65.0, 71.0, 69.0, 65.0, 49.0, 53.0, 48.0, 40.0, 34.0, 24.0, 30.0, 15.0, 9.0, 8.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1832275390625, -0.1783123016357422, -0.17339706420898438, -0.16848182678222656, -0.16356658935546875, -0.15865135192871094, -0.15373611450195312, -0.1488208770751953, -0.1439056396484375, -0.1389904022216797, -0.13407516479492188, -0.12915992736816406, -0.12424468994140625, -0.11932945251464844, -0.11441421508789062, -0.10949897766113281, -0.104583740234375, -0.09966850280761719, -0.09475326538085938, -0.08983802795410156, -0.08492279052734375, -0.08000755310058594, -0.07509231567382812, -0.07017707824707031, -0.0652618408203125, -0.06034660339355469, -0.055431365966796875, -0.05051612854003906, -0.04560089111328125, -0.04068565368652344, -0.035770416259765625, -0.030855178833007812, -0.02593994140625, -0.021024703979492188, -0.016109466552734375, -0.011194229125976562, -0.00627899169921875, -0.0013637542724609375, 0.003551483154296875, 0.008466720581054688, 0.0133819580078125, 0.018297195434570312, 0.023212432861328125, 0.028127670288085938, 0.03304290771484375, 0.03795814514160156, 0.042873382568359375, 0.04778861999511719, 0.052703857421875, 0.05761909484863281, 0.06253433227539062, 0.06744956970214844, 0.07236480712890625, 0.07728004455566406, 0.08219528198242188, 0.08711051940917969, 0.0920257568359375, 0.09694099426269531, 0.10185623168945312, 0.10677146911621094, 0.11168670654296875, 0.11660194396972656, 0.12151718139648438, 0.1264324188232422, 0.13134765625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 10.0, 10.0, 14.0, 19.0, 25.0, 35.0, 37.0, 56.0, 93.0, 127.0, 218.0, 314.0, 584.0, 1048.0, 2094.0, 4697.0, 14074.0, 58791.0, 597610.0, 300985.0, 47324.0, 11991.0, 4221.0, 1788.0, 939.0, 530.0, 322.0, 203.0, 121.0, 73.0, 61.0, 40.0, 24.0, 26.0, 9.0, 9.0, 13.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.483642578125, -0.4705467224121094, -0.45745086669921875, -0.4443550109863281, -0.4312591552734375, -0.4181632995605469, -0.40506744384765625, -0.3919715881347656, -0.378875732421875, -0.3657798767089844, -0.35268402099609375, -0.3395881652832031, -0.3264923095703125, -0.3133964538574219, -0.30030059814453125, -0.2872047424316406, -0.27410888671875, -0.2610130310058594, -0.24791717529296875, -0.23482131958007812, -0.2217254638671875, -0.20862960815429688, -0.19553375244140625, -0.18243789672851562, -0.169342041015625, -0.15624618530273438, -0.14315032958984375, -0.13005447387695312, -0.1169586181640625, -0.10386276245117188, -0.09076690673828125, -0.07767105102539062, -0.0645751953125, -0.051479339599609375, -0.03838348388671875, -0.025287628173828125, -0.0121917724609375, 0.000904083251953125, 0.01399993896484375, 0.027095794677734375, 0.040191650390625, 0.053287506103515625, 0.06638336181640625, 0.07947921752929688, 0.0925750732421875, 0.10567092895507812, 0.11876678466796875, 0.13186264038085938, 0.14495849609375, 0.15805435180664062, 0.17115020751953125, 0.18424606323242188, 0.1973419189453125, 0.21043777465820312, 0.22353363037109375, 0.23662948608398438, 0.249725341796875, 0.2628211975097656, 0.27591705322265625, 0.2890129089355469, 0.3021087646484375, 0.3152046203613281, 0.32830047607421875, 0.3413963317871094, 0.3544921875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 2.0, 7.0, 14.0, 13.0, 13.0, 19.0, 23.0, 33.0, 35.0, 34.0, 55.0, 61.0, 66.0, 82.0, 85.0, 73.0, 78.0, 54.0, 54.0, 44.0, 25.0, 34.0, 23.0, 9.0, 10.0, 7.0, 4.0, 6.0, 6.0, 7.0, 4.0, 2.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.72998046875, -0.7104415893554688, -0.6909027099609375, -0.6713638305664062, -0.651824951171875, -0.6322860717773438, -0.6127471923828125, -0.5932083129882812, -0.57366943359375, -0.5541305541992188, -0.5345916748046875, -0.5150527954101562, -0.495513916015625, -0.47597503662109375, -0.4564361572265625, -0.43689727783203125, -0.4173583984375, -0.39781951904296875, -0.3782806396484375, -0.35874176025390625, -0.339202880859375, -0.31966400146484375, -0.3001251220703125, -0.28058624267578125, -0.26104736328125, -0.24150848388671875, -0.2219696044921875, -0.20243072509765625, -0.182891845703125, -0.16335296630859375, -0.1438140869140625, -0.12427520751953125, -0.104736328125, -0.08519744873046875, -0.0656585693359375, -0.04611968994140625, -0.026580810546875, -0.00704193115234375, 0.0124969482421875, 0.03203582763671875, 0.05157470703125, 0.07111358642578125, 0.0906524658203125, 0.11019134521484375, 0.129730224609375, 0.14926910400390625, 0.1688079833984375, 0.18834686279296875, 0.2078857421875, 0.22742462158203125, 0.2469635009765625, 0.26650238037109375, 0.286041259765625, 0.30558013916015625, 0.3251190185546875, 0.34465789794921875, 0.36419677734375, 0.38373565673828125, 0.4032745361328125, 0.42281341552734375, 0.442352294921875, 0.46189117431640625, 0.4814300537109375, 0.5009689331054688, 0.5205078125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 3.0, 11.0, 8.0, 9.0, 15.0, 20.0, 33.0, 61.0, 75.0, 121.0, 204.0, 389.0, 955.0, 2742.0, 8920.0, 44488.0, 768922.0, 190086.0, 22854.0, 5514.0, 1692.0, 652.0, 311.0, 158.0, 86.0, 57.0, 43.0, 32.0, 34.0, 22.0, 9.0, 5.0, 5.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.253173828125, -0.24568557739257812, -0.23819732666015625, -0.23070907592773438, -0.2232208251953125, -0.21573257446289062, -0.20824432373046875, -0.20075607299804688, -0.193267822265625, -0.18577957153320312, -0.17829132080078125, -0.17080307006835938, -0.1633148193359375, -0.15582656860351562, -0.14833831787109375, -0.14085006713867188, -0.13336181640625, -0.12587356567382812, -0.11838531494140625, -0.11089706420898438, -0.1034088134765625, -0.09592056274414062, -0.08843231201171875, -0.08094406127929688, -0.073455810546875, -0.06596755981445312, -0.05847930908203125, -0.050991058349609375, -0.0435028076171875, -0.036014556884765625, -0.02852630615234375, -0.021038055419921875, -0.0135498046875, -0.006061553955078125, 0.00142669677734375, 0.008914947509765625, 0.0164031982421875, 0.023891448974609375, 0.03137969970703125, 0.038867950439453125, 0.046356201171875, 0.053844451904296875, 0.06133270263671875, 0.06882095336914062, 0.0763092041015625, 0.08379745483398438, 0.09128570556640625, 0.09877395629882812, 0.10626220703125, 0.11375045776367188, 0.12123870849609375, 0.12872695922851562, 0.1362152099609375, 0.14370346069335938, 0.15119171142578125, 0.15867996215820312, 0.166168212890625, 0.17365646362304688, 0.18114471435546875, 0.18863296508789062, 0.1961212158203125, 0.20360946655273438, 0.21109771728515625, 0.21858596801757812, 0.22607421875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 5.0, 6.0, 14.0, 11.0, 18.0, 18.0, 15.0, 43.0, 39.0, 59.0, 77.0, 124.0, 123.0, 109.0, 73.0, 64.0, 45.0, 31.0, 20.0, 20.0, 15.0, 11.0, 9.0, 8.0, 5.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8770179748535156e-05, -5.7009048759937286e-05, -5.5247917771339417e-05, -5.348678678274155e-05, -5.172565579414368e-05, -4.996452480554581e-05, -4.820339381694794e-05, -4.644226282835007e-05, -4.46811318397522e-05, -4.292000085115433e-05, -4.115886986255646e-05, -3.939773887395859e-05, -3.763660788536072e-05, -3.587547689676285e-05, -3.411434590816498e-05, -3.235321491956711e-05, -3.059208393096924e-05, -2.883095294237137e-05, -2.70698219537735e-05, -2.530869096517563e-05, -2.354755997657776e-05, -2.178642898797989e-05, -2.002529799938202e-05, -1.826416701078415e-05, -1.650303602218628e-05, -1.474190503358841e-05, -1.298077404499054e-05, -1.121964305639267e-05, -9.4585120677948e-06, -7.69738107919693e-06, -5.93625009059906e-06, -4.17511910200119e-06, -2.4139881134033203e-06, -6.528571248054504e-07, 1.1082738637924194e-06, 2.8694048523902893e-06, 4.630535840988159e-06, 6.391666829586029e-06, 8.152797818183899e-06, 9.913928806781769e-06, 1.1675059795379639e-05, 1.3436190783977509e-05, 1.5197321772575378e-05, 1.6958452761173248e-05, 1.8719583749771118e-05, 2.0480714738368988e-05, 2.2241845726966858e-05, 2.4002976715564728e-05, 2.5764107704162598e-05, 2.7525238692760468e-05, 2.9286369681358337e-05, 3.104750066995621e-05, 3.280863165855408e-05, 3.456976264715195e-05, 3.633089363574982e-05, 3.809202462434769e-05, 3.985315561294556e-05, 4.1614286601543427e-05, 4.3375417590141296e-05, 4.5136548578739166e-05, 4.6897679567337036e-05, 4.8658810555934906e-05, 5.0419941544532776e-05, 5.2181072533130646e-05, 5.3942203521728516e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 3.0, 7.0, 10.0, 7.0, 21.0, 28.0, 30.0, 49.0, 71.0, 130.0, 183.0, 315.0, 507.0, 903.0, 1731.0, 3951.0, 10032.0, 33946.0, 358694.0, 582779.0, 36477.0, 10381.0, 4092.0, 1949.0, 973.0, 486.0, 293.0, 176.0, 118.0, 53.0, 50.0, 32.0, 21.0, 16.0, 13.0, 8.0, 5.0, 8.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.28271484375, -0.27486610412597656, -0.2670173645019531, -0.2591686248779297, -0.25131988525390625, -0.2434711456298828, -0.23562240600585938, -0.22777366638183594, -0.2199249267578125, -0.21207618713378906, -0.20422744750976562, -0.1963787078857422, -0.18852996826171875, -0.1806812286376953, -0.17283248901367188, -0.16498374938964844, -0.157135009765625, -0.14928627014160156, -0.14143753051757812, -0.1335887908935547, -0.12574005126953125, -0.11789131164550781, -0.11004257202148438, -0.10219383239746094, -0.0943450927734375, -0.08649635314941406, -0.07864761352539062, -0.07079887390136719, -0.06295013427734375, -0.05510139465332031, -0.047252655029296875, -0.03940391540527344, -0.03155517578125, -0.023706436157226562, -0.015857696533203125, -0.008008956909179688, -0.00016021728515625, 0.0076885223388671875, 0.015537261962890625, 0.023386001586914062, 0.0312347412109375, 0.03908348083496094, 0.046932220458984375, 0.05478096008300781, 0.06262969970703125, 0.07047843933105469, 0.07832717895507812, 0.08617591857910156, 0.094024658203125, 0.10187339782714844, 0.10972213745117188, 0.11757087707519531, 0.12541961669921875, 0.1332683563232422, 0.14111709594726562, 0.14896583557128906, 0.1568145751953125, 0.16466331481933594, 0.17251205444335938, 0.1803607940673828, 0.18820953369140625, 0.1960582733154297, 0.20390701293945312, 0.21175575256347656, 0.2196044921875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 2.0, 7.0, 7.0, 5.0, 8.0, 8.0, 12.0, 20.0, 35.0, 37.0, 40.0, 71.0, 109.0, 134.0, 124.0, 107.0, 86.0, 45.0, 48.0, 24.0, 15.0, 14.0, 13.0, 10.0, 3.0, 7.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.27001953125, -0.2618598937988281, -0.25370025634765625, -0.24554061889648438, -0.2373809814453125, -0.22922134399414062, -0.22106170654296875, -0.21290206909179688, -0.204742431640625, -0.19658279418945312, -0.18842315673828125, -0.18026351928710938, -0.1721038818359375, -0.16394424438476562, -0.15578460693359375, -0.14762496948242188, -0.13946533203125, -0.13130569458007812, -0.12314605712890625, -0.11498641967773438, -0.1068267822265625, -0.09866714477539062, -0.09050750732421875, -0.08234786987304688, -0.074188232421875, -0.06602859497070312, -0.05786895751953125, -0.049709320068359375, -0.0415496826171875, -0.033390045166015625, -0.02523040771484375, -0.017070770263671875, -0.0089111328125, -0.000751495361328125, 0.00740814208984375, 0.015567779541015625, 0.0237274169921875, 0.031887054443359375, 0.04004669189453125, 0.048206329345703125, 0.056365966796875, 0.06452560424804688, 0.07268524169921875, 0.08084487915039062, 0.0890045166015625, 0.09716415405273438, 0.10532379150390625, 0.11348342895507812, 0.12164306640625, 0.12980270385742188, 0.13796234130859375, 0.14612197875976562, 0.1542816162109375, 0.16244125366210938, 0.17060089111328125, 0.17876052856445312, 0.186920166015625, 0.19507980346679688, 0.20323944091796875, 0.21139907836914062, 0.2195587158203125, 0.22771835327148438, 0.23587799072265625, 0.24403762817382812, 0.252197265625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 15.0, 31.0, 42.0, 107.0, 196.0, 309.0, 140.0, 67.0, 38.0, 21.0, 7.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.654610633850098, -5.490706443786621, -5.326802730560303, -5.162898540496826, -4.998994827270508, -4.835090637207031, -4.671186447143555, -4.507282257080078, -4.34337854385376, -4.179474353790283, -4.015570640563965, -3.8516664505004883, -3.687762498855591, -3.5238585472106934, -3.359954357147217, -3.1960504055023193, -3.032146453857422, -2.8682425022125244, -2.704338550567627, -2.5404343605041504, -2.376530408859253, -2.2126264572143555, -2.048722267150879, -1.8848183155059814, -1.720914363861084, -1.5570104122161865, -1.3931063413619995, -1.2292022705078125, -1.065298318862915, -0.9013943076133728, -0.7374902963638306, -0.5735862255096436, -0.4096822738647461, -0.24577826261520386, -0.08187425136566162, 0.08202975988388062, 0.24593377113342285, 0.4098377823829651, 0.5737417936325073, 0.7376458644866943, 0.9015498161315918, 1.0654537677764893, 1.2293578386306763, 1.3932619094848633, 1.5571658611297607, 1.7210698127746582, 1.8849738836288452, 2.0488779544830322, 2.2127819061279297, 2.376685857772827, 2.5405898094177246, 2.704493999481201, 2.8683979511260986, 3.032301902770996, 3.1962060928344727, 3.36011004447937, 3.5240139961242676, 3.687917947769165, 3.8518218994140625, 4.015726089477539, 4.179630279541016, 4.343533992767334, 4.5074381828308105, 4.671341896057129, 4.8352460861206055]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 7.0, 3.0, 5.0, 5.0, 13.0, 15.0, 14.0, 23.0, 15.0, 22.0, 28.0, 31.0, 41.0, 53.0, 52.0, 57.0, 62.0, 90.0, 71.0, 85.0, 55.0, 45.0, 35.0, 23.0, 20.0, 25.0, 16.0, 19.0, 20.0, 14.0, 6.0, 6.0, 7.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7739622592926025, -1.7097135782241821, -1.6454648971557617, -1.5812163352966309, -1.5169676542282104, -1.45271897315979, -1.3884704113006592, -1.3242217302322388, -1.2599730491638184, -1.195724368095398, -1.1314756870269775, -1.0672271251678467, -1.0029784440994263, -0.9387297630310059, -0.8744811415672302, -0.8102325201034546, -0.7459838390350342, -0.6817351579666138, -0.6174865365028381, -0.5532379150390625, -0.4889892339706421, -0.42474058270454407, -0.36049193143844604, -0.296243280172348, -0.23199462890625, -0.16774597764015198, -0.10349732637405396, -0.03924867510795593, 0.02499997615814209, 0.08924862742424011, 0.15349727869033813, 0.21774592995643616, 0.2819948196411133, 0.3462434709072113, 0.4104921221733093, 0.47474077343940735, 0.5389894247055054, 0.6032381057739258, 0.6674867272377014, 0.731735348701477, 0.7959840297698975, 0.8602327108383179, 0.9244813323020935, 0.9887299537658691, 1.0529786348342896, 1.11722731590271, 1.1814758777618408, 1.2457245588302612, 1.3099732398986816, 1.374221920967102, 1.4384706020355225, 1.5027191638946533, 1.5669678449630737, 1.6312165260314941, 1.695465087890625, 1.7597137689590454, 1.8239624500274658, 1.8882111310958862, 1.9524598121643066, 2.0167083740234375, 2.0809569358825684, 2.1452057361602783, 2.209454298019409, 2.273703098297119, 2.33795166015625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 2.0, 3.0, 5.0, 3.0, 12.0, 17.0, 17.0, 24.0, 39.0, 57.0, 88.0, 115.0, 179.0, 325.0, 598.0, 1152.0, 2166.0, 5073.0, 13826.0, 48317.0, 267252.0, 2733127.0, 973616.0, 108212.0, 25137.0, 8251.0, 3326.0, 1528.0, 773.0, 435.0, 212.0, 142.0, 69.0, 52.0, 42.0, 35.0, 24.0, 11.0, 7.0, 3.0, 5.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3984375, -0.38458251953125, -0.3707275390625, -0.35687255859375, -0.343017578125, -0.32916259765625, -0.3153076171875, -0.30145263671875, -0.28759765625, -0.27374267578125, -0.2598876953125, -0.24603271484375, -0.232177734375, -0.21832275390625, -0.2044677734375, -0.19061279296875, -0.1767578125, -0.16290283203125, -0.1490478515625, -0.13519287109375, -0.121337890625, -0.10748291015625, -0.0936279296875, -0.07977294921875, -0.06591796875, -0.05206298828125, -0.0382080078125, -0.02435302734375, -0.010498046875, 0.00335693359375, 0.0172119140625, 0.03106689453125, 0.044921875, 0.05877685546875, 0.0726318359375, 0.08648681640625, 0.100341796875, 0.11419677734375, 0.1280517578125, 0.14190673828125, 0.15576171875, 0.16961669921875, 0.1834716796875, 0.19732666015625, 0.211181640625, 0.22503662109375, 0.2388916015625, 0.25274658203125, 0.2666015625, 0.28045654296875, 0.2943115234375, 0.30816650390625, 0.322021484375, 0.33587646484375, 0.3497314453125, 0.36358642578125, 0.37744140625, 0.39129638671875, 0.4051513671875, 0.41900634765625, 0.432861328125, 0.44671630859375, 0.4605712890625, 0.47442626953125, 0.48828125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 5.0, 20.0, 20.0, 33.0, 53.0, 57.0, 60.0, 72.0, 62.0, 81.0, 72.0, 80.0, 73.0, 69.0, 49.0, 58.0, 34.0, 25.0, 25.0, 13.0, 12.0, 10.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1837158203125, -0.17835235595703125, -0.1729888916015625, -0.16762542724609375, -0.162261962890625, -0.15689849853515625, -0.1515350341796875, -0.14617156982421875, -0.14080810546875, -0.13544464111328125, -0.1300811767578125, -0.12471771240234375, -0.119354248046875, -0.11399078369140625, -0.1086273193359375, -0.10326385498046875, -0.097900390625, -0.09253692626953125, -0.0871734619140625, -0.08180999755859375, -0.076446533203125, -0.07108306884765625, -0.0657196044921875, -0.06035614013671875, -0.05499267578125, -0.04962921142578125, -0.0442657470703125, -0.03890228271484375, -0.033538818359375, -0.02817535400390625, -0.0228118896484375, -0.01744842529296875, -0.0120849609375, -0.00672149658203125, -0.0013580322265625, 0.00400543212890625, 0.009368896484375, 0.01473236083984375, 0.0200958251953125, 0.02545928955078125, 0.03082275390625, 0.03618621826171875, 0.0415496826171875, 0.04691314697265625, 0.052276611328125, 0.05764007568359375, 0.0630035400390625, 0.06836700439453125, 0.07373046875, 0.07909393310546875, 0.0844573974609375, 0.08982086181640625, 0.095184326171875, 0.10054779052734375, 0.1059112548828125, 0.11127471923828125, 0.11663818359375, 0.12200164794921875, 0.1273651123046875, 0.13272857666015625, 0.138092041015625, 0.14345550537109375, 0.1488189697265625, 0.15418243408203125, 0.1595458984375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 10.0, 19.0, 26.0, 40.0, 50.0, 80.0, 110.0, 177.0, 286.0, 574.0, 1170.0, 2822.0, 9073.0, 51527.0, 2193937.0, 1872098.0, 48485.0, 8489.0, 2631.0, 1186.0, 603.0, 338.0, 189.0, 119.0, 76.0, 54.0, 30.0, 20.0, 17.0, 10.0, 9.0, 7.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.025390625, -0.9960861206054688, -0.9667816162109375, -0.9374771118164062, -0.908172607421875, -0.8788681030273438, -0.8495635986328125, -0.8202590942382812, -0.79095458984375, -0.7616500854492188, -0.7323455810546875, -0.7030410766601562, -0.673736572265625, -0.6444320678710938, -0.6151275634765625, -0.5858230590820312, -0.5565185546875, -0.5272140502929688, -0.4979095458984375, -0.46860504150390625, -0.439300537109375, -0.40999603271484375, -0.3806915283203125, -0.35138702392578125, -0.32208251953125, -0.29277801513671875, -0.2634735107421875, -0.23416900634765625, -0.204864501953125, -0.17555999755859375, -0.1462554931640625, -0.11695098876953125, -0.087646484375, -0.05834197998046875, -0.0290374755859375, 0.00026702880859375, 0.029571533203125, 0.05887603759765625, 0.0881805419921875, 0.11748504638671875, 0.14678955078125, 0.17609405517578125, 0.2053985595703125, 0.23470306396484375, 0.264007568359375, 0.29331207275390625, 0.3226165771484375, 0.35192108154296875, 0.3812255859375, 0.41053009033203125, 0.4398345947265625, 0.46913909912109375, 0.498443603515625, 0.5277481079101562, 0.5570526123046875, 0.5863571166992188, 0.61566162109375, 0.6449661254882812, 0.6742706298828125, 0.7035751342773438, 0.732879638671875, 0.7621841430664062, 0.7914886474609375, 0.8207931518554688, 0.85009765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 3.0, 6.0, 7.0, 10.0, 14.0, 28.0, 36.0, 49.0, 67.0, 107.0, 140.0, 225.0, 290.0, 491.0, 771.0, 618.0, 410.0, 250.0, 182.0, 111.0, 74.0, 49.0, 32.0, 32.0, 13.0, 8.0, 10.0, 8.0, 8.0, 7.0, 2.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.75341796875, -0.7317657470703125, -0.710113525390625, -0.6884613037109375, -0.66680908203125, -0.6451568603515625, -0.623504638671875, -0.6018524169921875, -0.5802001953125, -0.5585479736328125, -0.536895751953125, -0.5152435302734375, -0.49359130859375, -0.4719390869140625, -0.450286865234375, -0.4286346435546875, -0.406982421875, -0.3853302001953125, -0.363677978515625, -0.3420257568359375, -0.32037353515625, -0.2987213134765625, -0.277069091796875, -0.2554168701171875, -0.2337646484375, -0.2121124267578125, -0.190460205078125, -0.1688079833984375, -0.14715576171875, -0.1255035400390625, -0.103851318359375, -0.0821990966796875, -0.060546875, -0.0388946533203125, -0.017242431640625, 0.0044097900390625, 0.02606201171875, 0.0477142333984375, 0.069366455078125, 0.0910186767578125, 0.1126708984375, 0.1343231201171875, 0.155975341796875, 0.1776275634765625, 0.19927978515625, 0.2209320068359375, 0.242584228515625, 0.2642364501953125, 0.285888671875, 0.3075408935546875, 0.329193115234375, 0.3508453369140625, 0.37249755859375, 0.3941497802734375, 0.415802001953125, 0.4374542236328125, 0.4591064453125, 0.4807586669921875, 0.502410888671875, 0.5240631103515625, 0.54571533203125, 0.5673675537109375, 0.589019775390625, 0.6106719970703125, 0.63232421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 13.0, 5.0, 15.0, 26.0, 52.0, 62.0, 143.0, 190.0, 196.0, 124.0, 70.0, 37.0, 17.0, 12.0, 4.0, 8.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.430160522460938, -8.1155366897583, -7.8009138107299805, -7.486290454864502, -7.171667098999023, -6.857043266296387, -6.542419910430908, -6.22779655456543, -5.913173198699951, -5.598549842834473, -5.283926486968994, -4.969303131103516, -4.654679298400879, -4.340056419372559, -4.025432586669922, -3.7108092308044434, -3.396185874938965, -3.0815625190734863, -2.766939163208008, -2.45231556892395, -2.1376922130584717, -1.8230688571929932, -1.508445382118225, -1.193821907043457, -0.8791985511779785, -0.5645751357078552, -0.24995172023773193, 0.06467169523239136, 0.37929511070251465, 0.6939184665679932, 1.0085419416427612, 1.3231654167175293, 1.6377887725830078, 1.9524121284484863, 2.267035484313965, 2.5816590785980225, 2.896282434463501, 3.2109057903289795, 3.525529384613037, 3.8401527404785156, 4.154776096343994, 4.469399452209473, 4.784022808074951, 5.09864616394043, 5.413269996643066, 5.727892875671387, 6.042516708374023, 6.357140064239502, 6.6717634201049805, 6.986386775970459, 7.3010101318359375, 7.615633487701416, 7.9302568435668945, 8.244880676269531, 8.559503555297852, 8.874127388000488, 9.188751220703125, 9.503375053405762, 9.817997932434082, 10.132621765136719, 10.447244644165039, 10.761868476867676, 11.076491355895996, 11.391115188598633, 11.705738067626953]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 10.0, 6.0, 12.0, 23.0, 25.0, 18.0, 27.0, 50.0, 37.0, 56.0, 53.0, 68.0, 67.0, 76.0, 83.0, 62.0, 54.0, 47.0, 42.0, 33.0, 26.0, 28.0, 20.0, 19.0, 18.0, 10.0, 16.0, 0.0, 3.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.484915733337402, -5.342550277709961, -5.200184345245361, -5.057818412780762, -4.91545295715332, -4.773087501525879, -4.630721569061279, -4.48835563659668, -4.345990180969238, -4.203624725341797, -4.061258792877197, -3.9188930988311768, -3.7765274047851562, -3.6341617107391357, -3.4917960166931152, -3.3494303226470947, -3.207064628601074, -3.0646989345550537, -2.922333240509033, -2.7799675464630127, -2.637601852416992, -2.4952361583709717, -2.352870464324951, -2.2105047702789307, -2.06813907623291, -1.9257733821868896, -1.7834076881408691, -1.6410419940948486, -1.4986763000488281, -1.3563106060028076, -1.213944911956787, -1.0715792179107666, -0.9292135238647461, -0.7868478298187256, -0.6444821357727051, -0.5021164417266846, -0.35975074768066406, -0.21738505363464355, -0.07501935958862305, 0.06734633445739746, 0.20971202850341797, 0.3520777225494385, 0.494443416595459, 0.6368091106414795, 0.7791748046875, 0.9215404987335205, 1.063906192779541, 1.2062718868255615, 1.348637580871582, 1.4910032749176025, 1.633368968963623, 1.7757346630096436, 1.918100357055664, 2.0604660511016846, 2.202831745147705, 2.3451974391937256, 2.487563133239746, 2.6299288272857666, 2.772294521331787, 2.9146602153778076, 3.057025909423828, 3.1993916034698486, 3.341757297515869, 3.4841229915618896, 3.62648868560791]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 5.0, 9.0, 15.0, 15.0, 24.0, 46.0, 65.0, 126.0, 176.0, 300.0, 573.0, 1111.0, 2337.0, 5476.0, 15703.0, 53462.0, 238637.0, 559859.0, 122011.0, 31153.0, 9942.0, 3893.0, 1719.0, 805.0, 433.0, 252.0, 143.0, 79.0, 59.0, 45.0, 23.0, 17.0, 11.0, 8.0, 4.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.4501953125, -0.43843841552734375, -0.4266815185546875, -0.41492462158203125, -0.403167724609375, -0.39141082763671875, -0.3796539306640625, -0.36789703369140625, -0.35614013671875, -0.34438323974609375, -0.3326263427734375, -0.32086944580078125, -0.309112548828125, -0.29735565185546875, -0.2855987548828125, -0.27384185791015625, -0.2620849609375, -0.25032806396484375, -0.2385711669921875, -0.22681427001953125, -0.215057373046875, -0.20330047607421875, -0.1915435791015625, -0.17978668212890625, -0.16802978515625, -0.15627288818359375, -0.1445159912109375, -0.13275909423828125, -0.121002197265625, -0.10924530029296875, -0.0974884033203125, -0.08573150634765625, -0.073974609375, -0.06221771240234375, -0.0504608154296875, -0.03870391845703125, -0.026947021484375, -0.01519012451171875, -0.0034332275390625, 0.00832366943359375, 0.02008056640625, 0.03183746337890625, 0.0435943603515625, 0.05535125732421875, 0.067108154296875, 0.07886505126953125, 0.0906219482421875, 0.10237884521484375, 0.1141357421875, 0.12589263916015625, 0.1376495361328125, 0.14940643310546875, 0.161163330078125, 0.17292022705078125, 0.1846771240234375, 0.19643402099609375, 0.20819091796875, 0.21994781494140625, 0.2317047119140625, 0.24346160888671875, 0.255218505859375, 0.26697540283203125, 0.2787322998046875, 0.29048919677734375, 0.30224609375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 9.0, 7.0, 16.0, 24.0, 31.0, 35.0, 43.0, 54.0, 72.0, 81.0, 67.0, 92.0, 82.0, 79.0, 57.0, 57.0, 40.0, 42.0, 33.0, 21.0, 15.0, 19.0, 9.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26513671875, -0.256195068359375, -0.24725341796875, -0.238311767578125, -0.2293701171875, -0.220428466796875, -0.21148681640625, -0.202545166015625, -0.193603515625, -0.184661865234375, -0.17572021484375, -0.166778564453125, -0.1578369140625, -0.148895263671875, -0.13995361328125, -0.131011962890625, -0.1220703125, -0.113128662109375, -0.10418701171875, -0.095245361328125, -0.0863037109375, -0.077362060546875, -0.06842041015625, -0.059478759765625, -0.050537109375, -0.041595458984375, -0.03265380859375, -0.023712158203125, -0.0147705078125, -0.005828857421875, 0.00311279296875, 0.012054443359375, 0.02099609375, 0.029937744140625, 0.03887939453125, 0.047821044921875, 0.0567626953125, 0.065704345703125, 0.07464599609375, 0.083587646484375, 0.092529296875, 0.101470947265625, 0.11041259765625, 0.119354248046875, 0.1282958984375, 0.137237548828125, 0.14617919921875, 0.155120849609375, 0.1640625, 0.173004150390625, 0.18194580078125, 0.190887451171875, 0.1998291015625, 0.208770751953125, 0.21771240234375, 0.226654052734375, 0.235595703125, 0.244537353515625, 0.25347900390625, 0.262420654296875, 0.2713623046875, 0.280303955078125, 0.28924560546875, 0.298187255859375, 0.30712890625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 9.0, 13.0, 11.0, 15.0, 57.0, 65.0, 84.0, 144.0, 213.0, 332.0, 684.0, 1521.0, 4759.0, 21110.0, 198469.0, 776765.0, 33427.0, 6738.0, 2039.0, 888.0, 437.0, 273.0, 166.0, 102.0, 59.0, 50.0, 30.0, 29.0, 17.0, 14.0, 9.0, 6.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5478515625, -0.53179931640625, -0.5157470703125, -0.49969482421875, -0.483642578125, -0.46759033203125, -0.4515380859375, -0.43548583984375, -0.41943359375, -0.40338134765625, -0.3873291015625, -0.37127685546875, -0.355224609375, -0.33917236328125, -0.3231201171875, -0.30706787109375, -0.291015625, -0.27496337890625, -0.2589111328125, -0.24285888671875, -0.226806640625, -0.21075439453125, -0.1947021484375, -0.17864990234375, -0.16259765625, -0.14654541015625, -0.1304931640625, -0.11444091796875, -0.098388671875, -0.08233642578125, -0.0662841796875, -0.05023193359375, -0.0341796875, -0.01812744140625, -0.0020751953125, 0.01397705078125, 0.030029296875, 0.04608154296875, 0.0621337890625, 0.07818603515625, 0.09423828125, 0.11029052734375, 0.1263427734375, 0.14239501953125, 0.158447265625, 0.17449951171875, 0.1905517578125, 0.20660400390625, 0.22265625, 0.23870849609375, 0.2547607421875, 0.27081298828125, 0.286865234375, 0.30291748046875, 0.3189697265625, 0.33502197265625, 0.35107421875, 0.36712646484375, 0.3831787109375, 0.39923095703125, 0.415283203125, 0.43133544921875, 0.4473876953125, 0.46343994140625, 0.4794921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 4.0, 3.0, 3.0, 6.0, 4.0, 6.0, 8.0, 11.0, 12.0, 7.0, 20.0, 28.0, 29.0, 43.0, 40.0, 70.0, 70.0, 91.0, 104.0, 97.0, 63.0, 50.0, 43.0, 30.0, 31.0, 20.0, 27.0, 16.0, 16.0, 7.0, 7.0, 8.0, 9.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0068359375, -0.975341796875, -0.94384765625, -0.912353515625, -0.880859375, -0.849365234375, -0.81787109375, -0.786376953125, -0.7548828125, -0.723388671875, -0.69189453125, -0.660400390625, -0.62890625, -0.597412109375, -0.56591796875, -0.534423828125, -0.5029296875, -0.471435546875, -0.43994140625, -0.408447265625, -0.376953125, -0.345458984375, -0.31396484375, -0.282470703125, -0.2509765625, -0.219482421875, -0.18798828125, -0.156494140625, -0.125, -0.093505859375, -0.06201171875, -0.030517578125, 0.0009765625, 0.032470703125, 0.06396484375, 0.095458984375, 0.126953125, 0.158447265625, 0.18994140625, 0.221435546875, 0.2529296875, 0.284423828125, 0.31591796875, 0.347412109375, 0.37890625, 0.410400390625, 0.44189453125, 0.473388671875, 0.5048828125, 0.536376953125, 0.56787109375, 0.599365234375, 0.630859375, 0.662353515625, 0.69384765625, 0.725341796875, 0.7568359375, 0.788330078125, 0.81982421875, 0.851318359375, 0.8828125, 0.914306640625, 0.94580078125, 0.977294921875, 1.0087890625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 6.0, 5.0, 9.0, 18.0, 15.0, 22.0, 20.0, 50.0, 69.0, 95.0, 174.0, 278.0, 539.0, 1117.0, 2709.0, 8319.0, 37317.0, 816774.0, 151818.0, 20165.0, 5211.0, 1924.0, 861.0, 392.0, 231.0, 146.0, 72.0, 52.0, 36.0, 25.0, 24.0, 22.0, 14.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.100341796875, -0.09685897827148438, -0.09337615966796875, -0.08989334106445312, -0.0864105224609375, -0.08292770385742188, -0.07944488525390625, -0.07596206665039062, -0.072479248046875, -0.06899642944335938, -0.06551361083984375, -0.062030792236328125, -0.0585479736328125, -0.055065155029296875, -0.05158233642578125, -0.048099517822265625, -0.04461669921875, -0.041133880615234375, -0.03765106201171875, -0.034168243408203125, -0.0306854248046875, -0.027202606201171875, -0.02371978759765625, -0.020236968994140625, -0.016754150390625, -0.013271331787109375, -0.00978851318359375, -0.006305694580078125, -0.0028228759765625, 0.000659942626953125, 0.00414276123046875, 0.007625579833984375, 0.0111083984375, 0.014591217041015625, 0.01807403564453125, 0.021556854248046875, 0.0250396728515625, 0.028522491455078125, 0.03200531005859375, 0.035488128662109375, 0.038970947265625, 0.042453765869140625, 0.04593658447265625, 0.049419403076171875, 0.0529022216796875, 0.056385040283203125, 0.05986785888671875, 0.06335067749023438, 0.06683349609375, 0.07031631469726562, 0.07379913330078125, 0.07728195190429688, 0.0807647705078125, 0.08424758911132812, 0.08773040771484375, 0.09121322631835938, 0.094696044921875, 0.09817886352539062, 0.10166168212890625, 0.10514450073242188, 0.1086273193359375, 0.11211013793945312, 0.11559295654296875, 0.11907577514648438, 0.12255859375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 11.0, 10.0, 10.0, 15.0, 22.0, 27.0, 41.0, 61.0, 105.0, 127.0, 127.0, 115.0, 89.0, 66.0, 45.0, 38.0, 25.0, 13.0, 8.0, 15.0, 7.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.93986701965332e-05, -3.8144178688526154e-05, -3.6889687180519104e-05, -3.5635195672512054e-05, -3.4380704164505005e-05, -3.3126212656497955e-05, -3.1871721148490906e-05, -3.0617229640483856e-05, -2.9362738132476807e-05, -2.8108246624469757e-05, -2.6853755116462708e-05, -2.5599263608455658e-05, -2.434477210044861e-05, -2.309028059244156e-05, -2.183578908443451e-05, -2.058129757642746e-05, -1.932680606842041e-05, -1.807231456041336e-05, -1.681782305240631e-05, -1.556333154439926e-05, -1.4308840036392212e-05, -1.3054348528385162e-05, -1.1799857020378113e-05, -1.0545365512371063e-05, -9.290874004364014e-06, -8.036382496356964e-06, -6.7818909883499146e-06, -5.527399480342865e-06, -4.2729079723358154e-06, -3.018416464328766e-06, -1.7639249563217163e-06, -5.094334483146667e-07, 7.450580596923828e-07, 1.9995495676994324e-06, 3.254041075706482e-06, 4.5085325837135315e-06, 5.763024091720581e-06, 7.017515599727631e-06, 8.27200710773468e-06, 9.52649861574173e-06, 1.078099012374878e-05, 1.2035481631755829e-05, 1.3289973139762878e-05, 1.4544464647769928e-05, 1.5798956155776978e-05, 1.7053447663784027e-05, 1.8307939171791077e-05, 1.9562430679798126e-05, 2.0816922187805176e-05, 2.2071413695812225e-05, 2.3325905203819275e-05, 2.4580396711826324e-05, 2.5834888219833374e-05, 2.7089379727840424e-05, 2.8343871235847473e-05, 2.9598362743854523e-05, 3.085285425186157e-05, 3.210734575986862e-05, 3.336183726787567e-05, 3.461632877588272e-05, 3.587082028388977e-05, 3.712531179189682e-05, 3.837980329990387e-05, 3.963429480791092e-05, 4.088878631591797e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 7.0, 6.0, 6.0, 5.0, 12.0, 13.0, 20.0, 23.0, 42.0, 36.0, 54.0, 79.0, 113.0, 217.0, 256.0, 402.0, 720.0, 1253.0, 2024.0, 3918.0, 7694.0, 17140.0, 44826.0, 198080.0, 672239.0, 58899.0, 20797.0, 9144.0, 4401.0, 2407.0, 1389.0, 814.0, 500.0, 303.0, 224.0, 150.0, 94.0, 74.0, 43.0, 36.0, 26.0, 22.0, 14.0, 2.0, 6.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.061614990234375, -0.05956888198852539, -0.05752277374267578, -0.05547666549682617, -0.05343055725097656, -0.05138444900512695, -0.049338340759277344, -0.047292232513427734, -0.045246124267578125, -0.043200016021728516, -0.041153907775878906, -0.0391077995300293, -0.03706169128417969, -0.03501558303833008, -0.03296947479248047, -0.03092336654663086, -0.02887725830078125, -0.02683115005493164, -0.02478504180908203, -0.022738933563232422, -0.020692825317382812, -0.018646717071533203, -0.016600608825683594, -0.014554500579833984, -0.012508392333984375, -0.010462284088134766, -0.008416175842285156, -0.006370067596435547, -0.0043239593505859375, -0.002277851104736328, -0.00023174285888671875, 0.0018143653869628906, 0.0038604736328125, 0.005906581878662109, 0.007952690124511719, 0.009998798370361328, 0.012044906616210938, 0.014091014862060547, 0.016137123107910156, 0.018183231353759766, 0.020229339599609375, 0.022275447845458984, 0.024321556091308594, 0.026367664337158203, 0.028413772583007812, 0.030459880828857422, 0.03250598907470703, 0.03455209732055664, 0.03659820556640625, 0.03864431381225586, 0.04069042205810547, 0.04273653030395508, 0.04478263854980469, 0.0468287467956543, 0.048874855041503906, 0.050920963287353516, 0.052967071533203125, 0.055013179779052734, 0.057059288024902344, 0.05910539627075195, 0.06115150451660156, 0.06319761276245117, 0.06524372100830078, 0.06728982925415039, 0.0693359375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 4.0, 6.0, 11.0, 12.0, 11.0, 17.0, 15.0, 34.0, 23.0, 19.0, 39.0, 59.0, 70.0, 103.0, 112.0, 103.0, 92.0, 60.0, 48.0, 24.0, 21.0, 23.0, 20.0, 12.0, 13.0, 13.0, 4.0, 8.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08319091796875, -0.08018112182617188, -0.07717132568359375, -0.07416152954101562, -0.0711517333984375, -0.06814193725585938, -0.06513214111328125, -0.062122344970703125, -0.059112548828125, -0.056102752685546875, -0.05309295654296875, -0.050083160400390625, -0.0470733642578125, -0.044063568115234375, -0.04105377197265625, -0.038043975830078125, -0.0350341796875, -0.032024383544921875, -0.02901458740234375, -0.026004791259765625, -0.0229949951171875, -0.019985198974609375, -0.01697540283203125, -0.013965606689453125, -0.010955810546875, -0.007946014404296875, -0.00493621826171875, -0.001926422119140625, 0.0010833740234375, 0.004093170166015625, 0.00710296630859375, 0.010112762451171875, 0.01312255859375, 0.016132354736328125, 0.01914215087890625, 0.022151947021484375, 0.0251617431640625, 0.028171539306640625, 0.03118133544921875, 0.034191131591796875, 0.037200927734375, 0.040210723876953125, 0.04322052001953125, 0.046230316162109375, 0.0492401123046875, 0.052249908447265625, 0.05525970458984375, 0.058269500732421875, 0.061279296875, 0.06428909301757812, 0.06729888916015625, 0.07030868530273438, 0.0733184814453125, 0.07632827758789062, 0.07933807373046875, 0.08234786987304688, 0.085357666015625, 0.08836746215820312, 0.09137725830078125, 0.09438705444335938, 0.0973968505859375, 0.10040664672851562, 0.10341644287109375, 0.10642623901367188, 0.10943603515625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 2.0, 7.0, 7.0, 14.0, 27.0, 28.0, 70.0, 200.0, 300.0, 182.0, 67.0, 30.0, 25.0, 16.0, 15.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4611735343933105, -3.3397510051727295, -3.2183284759521484, -3.0969057083129883, -2.9754831790924072, -2.854060649871826, -2.732638120651245, -2.611215591430664, -2.489792823791504, -2.368370294570923, -2.246947765350342, -2.1255249977111816, -2.0041024684906006, -1.8826799392700195, -1.7612574100494385, -1.6398347616195679, -1.5184122323989868, -1.3969897031784058, -1.2755670547485352, -1.154144525527954, -1.0327218770980835, -0.9112993478775024, -0.7898767590522766, -0.6684541702270508, -0.547031581401825, -0.4256089925765991, -0.3041864037513733, -0.18276384472846985, -0.06134125590324402, 0.060081303119659424, 0.18150389194488525, 0.3029264807701111, 0.4243490695953369, 0.5457716584205627, 0.6671942472457886, 0.7886167764663696, 0.9100394248962402, 1.0314619541168213, 1.1528844833374023, 1.274307131767273, 1.3957297801971436, 1.5171523094177246, 1.6385749578475952, 1.7599974870681763, 1.8814201354980469, 2.002842664718628, 2.124265193939209, 2.245687961578369, 2.367110252380371, 2.488532781600952, 2.609955310821533, 2.7313780784606934, 2.8528006076812744, 2.9742231369018555, 3.0956456661224365, 3.2170681953430176, 3.3384909629821777, 3.459913492202759, 3.58133602142334, 3.7027587890625, 3.824181318283081, 3.945603847503662, 4.067026615142822, 4.188448905944824, 4.309871673583984]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 3.0, 8.0, 13.0, 19.0, 18.0, 20.0, 25.0, 34.0, 57.0, 134.0, 124.0, 96.0, 129.0, 105.0, 46.0, 31.0, 29.0, 26.0, 20.0, 14.0, 11.0, 13.0, 8.0, 7.0, 4.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.718404769897461, -4.604491710662842, -4.490578651428223, -4.3766655921936035, -4.262752532958984, -4.148839473724365, -4.034926414489746, -3.921013355255127, -3.807100296020508, -3.6931872367858887, -3.5792741775512695, -3.4653611183166504, -3.3514480590820312, -3.237534999847412, -3.123621940612793, -3.009708881378174, -2.8957958221435547, -2.7818827629089355, -2.6679697036743164, -2.5540566444396973, -2.440143585205078, -2.326230525970459, -2.21231746673584, -2.0984044075012207, -1.9844913482666016, -1.8705782890319824, -1.7566652297973633, -1.6427521705627441, -1.528839111328125, -1.4149260520935059, -1.3010129928588867, -1.1870999336242676, -1.0731868743896484, -0.9592738151550293, -0.8453607559204102, -0.731447696685791, -0.6175346374511719, -0.5036215782165527, -0.3897085189819336, -0.27579545974731445, -0.1618824005126953, -0.04796934127807617, 0.06594371795654297, 0.1798567771911621, 0.29376983642578125, 0.4076828956604004, 0.5215959548950195, 0.6355090141296387, 0.7494220733642578, 0.863335132598877, 0.9772481918334961, 1.0911612510681152, 1.2050743103027344, 1.3189873695373535, 1.4329004287719727, 1.5468134880065918, 1.660726547241211, 1.77463960647583, 1.8885526657104492, 2.0024657249450684, 2.1163787841796875, 2.2302918434143066, 2.344204902648926, 2.458117961883545, 2.572031021118164]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 10.0, 10.0, 7.0, 7.0, 13.0, 13.0, 6.0, 16.0, 18.0, 19.0, 19.0, 23.0, 29.0, 34.0, 48.0, 27.0, 98.0, 238.0, 72.0, 41.0, 26.0, 24.0, 23.0, 24.0, 24.0, 16.0, 12.0, 17.0, 13.0, 14.0, 7.0, 8.0, 7.0, 6.0, 8.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.173828125, -0.16828155517578125, -0.1627349853515625, -0.15718841552734375, -0.151641845703125, -0.14609527587890625, -0.1405487060546875, -0.13500213623046875, -0.12945556640625, -0.12390899658203125, -0.1183624267578125, -0.11281585693359375, -0.107269287109375, -0.10172271728515625, -0.0961761474609375, -0.09062957763671875, -0.0850830078125, -0.07953643798828125, -0.0739898681640625, -0.06844329833984375, -0.062896728515625, -0.05735015869140625, -0.0518035888671875, -0.04625701904296875, -0.04071044921875, -0.03516387939453125, -0.0296173095703125, -0.02407073974609375, -0.018524169921875, -0.01297760009765625, -0.0074310302734375, -0.00188446044921875, 0.003662109375, 0.00920867919921875, 0.0147552490234375, 0.02030181884765625, 0.025848388671875, 0.03139495849609375, 0.0369415283203125, 0.04248809814453125, 0.04803466796875, 0.05358123779296875, 0.0591278076171875, 0.06467437744140625, 0.070220947265625, 0.07576751708984375, 0.0813140869140625, 0.08686065673828125, 0.0924072265625, 0.09795379638671875, 0.1035003662109375, 0.10904693603515625, 0.114593505859375, 0.12014007568359375, 0.1256866455078125, 0.13123321533203125, 0.13677978515625, 0.14232635498046875, 0.1478729248046875, 0.15341949462890625, 0.158966064453125, 0.16451263427734375, 0.1700592041015625, 0.17560577392578125, 0.18115234375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 6.0, 7.0, 14.0, 14.0, 10.0, 26.0, 41.0, 73.0, 210.0, 751.0, 3586.0, 277741.0, 8100601.0, 4185.0, 842.0, 255.0, 113.0, 28.0, 34.0, 22.0, 10.0, 3.0, 4.0, 11.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9718711376190186, -3.855161666870117, -3.738452196121216, -3.6217427253723145, -3.505033493041992, -3.3883237838745117, -3.2716145515441895, -3.154905080795288, -3.0381956100463867, -2.9214861392974854, -2.804776668548584, -2.6880671977996826, -2.5713577270507812, -2.454648494720459, -2.3379390239715576, -2.2212295532226562, -2.104520082473755, -1.9878106117248535, -1.8711011409759521, -1.7543917894363403, -1.637682318687439, -1.5209728479385376, -1.4042634963989258, -1.2875540256500244, -1.170844554901123, -1.0541350841522217, -0.9374256730079651, -0.8207162618637085, -0.7040067911148071, -0.5872973203659058, -0.47058790922164917, -0.3538784980773926, -0.2371690273284912, -0.12045958638191223, -0.003750145435333252, 0.11295929551124573, 0.2296687364578247, 0.3463782072067261, 0.46308761835098267, 0.5797970294952393, 0.6965065002441406, 0.813215970993042, 0.9299253821372986, 1.0466347932815552, 1.1633442640304565, 1.280053734779358, 1.3967630863189697, 1.513472557067871, 1.6301820278167725, 1.7468914985656738, 1.8636009693145752, 1.980310320854187, 2.097019672393799, 2.2137293815612793, 2.3304386138916016, 2.447148084640503, 2.5638575553894043, 2.6805670261383057, 2.797276496887207, 2.9139859676361084, 3.0306954383850098, 3.147404670715332, 3.2641141414642334, 3.3808236122131348, 3.497533082962036]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 6.0, 5.0, 4.0, 10.0, 6.0, 4.0, 5.0, 6.0, 1.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-5.073133945465088, -4.937679767608643, -4.802225589752197, -4.666771411895752, -4.531317234039307, -4.395863056182861, -4.260408878326416, -4.1249542236328125, -3.9895002841949463, -3.854046106338501, -3.7185919284820557, -3.5831377506256104, -3.447683334350586, -3.3122291564941406, -3.1767749786376953, -3.04132080078125, -2.9058666229248047, -2.7704124450683594, -2.634958267211914, -2.4995040893554688, -2.3640499114990234, -2.228595733642578, -2.0931413173675537, -1.9576871395111084, -1.822232961654663, -1.6867787837982178, -1.5513246059417725, -1.4158703088760376, -1.2804161310195923, -1.144961953163147, -1.009507656097412, -0.8740534782409668, -0.7385990619659424, -0.6031448841094971, -0.467690646648407, -0.3322364389896393, -0.19678223133087158, -0.06132805347442627, 0.07412618398666382, 0.2095804214477539, 0.3450345993041992, 0.4804888069629669, 0.6159430146217346, 0.7513972520828247, 0.88685142993927, 1.0223056077957153, 1.1577599048614502, 1.2932140827178955, 1.4286682605743408, 1.5641224384307861, 1.6995766162872314, 1.8350309133529663, 1.9704850912094116, 2.1059393882751465, 2.241393566131592, 2.376847743988037, 2.5123019218444824, 2.6477560997009277, 2.783210277557373, 2.9186644554138184, 3.0541186332702637, 3.189572811126709, 3.3250272274017334, 3.4604814052581787, 3.595935583114624]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 6.0, 8.0, 13.0, 19.0, 29.0, 44.0, 64.0, 125.0, 282.0, 668.0, 1922.0, 6328.0, 26925.0, 148481.0, 264678.0, 57681.0, 11917.0, 3134.0, 1025.0, 410.0, 202.0, 112.0, 65.0, 41.0, 29.0, 18.0, 13.0, 7.0, 10.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.212890625, -3.1190185546875, -3.025146484375, -2.9312744140625, -2.83740234375, -2.7435302734375, -2.649658203125, -2.5557861328125, -2.4619140625, -2.3680419921875, -2.274169921875, -2.1802978515625, -2.08642578125, -1.9925537109375, -1.898681640625, -1.8048095703125, -1.7109375, -1.6170654296875, -1.523193359375, -1.4293212890625, -1.33544921875, -1.2415771484375, -1.147705078125, -1.0538330078125, -0.9599609375, -0.8660888671875, -0.772216796875, -0.6783447265625, -0.58447265625, -0.4906005859375, -0.396728515625, -0.3028564453125, -0.208984375, -0.1151123046875, -0.021240234375, 0.0726318359375, 0.16650390625, 0.2603759765625, 0.354248046875, 0.4481201171875, 0.5419921875, 0.6358642578125, 0.729736328125, 0.8236083984375, 0.91748046875, 1.0113525390625, 1.105224609375, 1.1990966796875, 1.29296875, 1.3868408203125, 1.480712890625, 1.5745849609375, 1.66845703125, 1.7623291015625, 1.856201171875, 1.9500732421875, 2.0439453125, 2.1378173828125, 2.231689453125, 2.3255615234375, 2.41943359375, 2.5133056640625, 2.607177734375, 2.7010498046875, 2.794921875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 5.0, 4.0, 6.0, 8.0, 10.0, 8.0, 10.0, 11.0, 19.0, 25.0, 33.0, 34.0, 27.0, 44.0, 42.0, 56.0, 64.0, 62.0, 72.0, 68.0, 62.0, 63.0, 46.0, 47.0, 36.0, 36.0, 22.0, 17.0, 18.0, 14.0, 8.0, 6.0, 6.0, 5.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.28515625, -0.2776813507080078, -0.2702064514160156, -0.26273155212402344, -0.25525665283203125, -0.24778175354003906, -0.24030685424804688, -0.2328319549560547, -0.2253570556640625, -0.2178821563720703, -0.21040725708007812, -0.20293235778808594, -0.19545745849609375, -0.18798255920410156, -0.18050765991210938, -0.1730327606201172, -0.165557861328125, -0.1580829620361328, -0.15060806274414062, -0.14313316345214844, -0.13565826416015625, -0.12818336486816406, -0.12070846557617188, -0.11323356628417969, -0.1057586669921875, -0.09828376770019531, -0.09080886840820312, -0.08333396911621094, -0.07585906982421875, -0.06838417053222656, -0.060909271240234375, -0.05343437194824219, -0.04595947265625, -0.03848457336425781, -0.031009674072265625, -0.023534774780273438, -0.01605987548828125, -0.008584976196289062, -0.001110076904296875, 0.0063648223876953125, 0.0138397216796875, 0.021314620971679688, 0.028789520263671875, 0.03626441955566406, 0.04373931884765625, 0.05121421813964844, 0.058689117431640625, 0.06616401672363281, 0.073638916015625, 0.08111381530761719, 0.08858871459960938, 0.09606361389160156, 0.10353851318359375, 0.11101341247558594, 0.11848831176757812, 0.1259632110595703, 0.1334381103515625, 0.1409130096435547, 0.14838790893554688, 0.15586280822753906, 0.16333770751953125, 0.17081260681152344, 0.17828750610351562, 0.1857624053955078, 0.1932373046875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 4.0, 4.0, 3.0, 12.0, 42.0, 118.0, 185.0, 77.0, 31.0, 10.0, 4.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.390362739562988, -11.176735877990723, -10.963109016418457, -10.749483108520508, -10.535856246948242, -10.322229385375977, -10.108602523803711, -9.894975662231445, -9.68134880065918, -9.467721939086914, -9.254095077514648, -9.0404691696167, -8.826842308044434, -8.613215446472168, -8.399588584899902, -8.185961723327637, -7.9723358154296875, -7.758708953857422, -7.5450825691223145, -7.331455707550049, -7.117829322814941, -6.904202461242676, -6.69057559967041, -6.4769487380981445, -6.263322353363037, -6.0496954917907715, -5.836069107055664, -5.622442245483398, -5.408815383911133, -5.195188999176025, -4.98156213760376, -4.767935752868652, -4.554309368133545, -4.340682506561279, -4.127056121826172, -3.9134292602539062, -3.6998026371002197, -3.486176013946533, -3.2725491523742676, -3.058922529220581, -2.8452959060668945, -2.631669282913208, -2.4180426597595215, -2.204415798187256, -1.9907891750335693, -1.7771625518798828, -1.5635358095169067, -1.3499090671539307, -1.1362824440002441, -0.9226557612419128, -0.7090290784835815, -0.49540239572525024, -0.28177571296691895, -0.06814908981323242, 0.14547765254974365, 0.3591043949127197, 0.5727310180664062, 0.7863577008247375, 0.9999843835830688, 1.213611125946045, 1.4272377490997314, 1.640864372253418, 1.854491114616394, 2.06811785697937, 2.2817444801330566]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 2.0, 7.0, 2.0, 4.0, 4.0, 4.0, 8.0, 19.0, 36.0, 56.0, 68.0, 64.0, 70.0, 45.0, 34.0, 11.0, 10.0, 3.0, 4.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0], "bins": [-2.398483991622925, -2.340806722640991, -2.2831294536590576, -2.225451946258545, -2.1677746772766113, -2.1100974082946777, -2.052420139312744, -1.9947428703308105, -1.937065601348877, -1.8793883323669434, -1.8217109441757202, -1.7640336751937866, -1.706356406211853, -1.6486790180206299, -1.5910017490386963, -1.5333244800567627, -1.4756470918655396, -1.417969822883606, -1.3602924346923828, -1.3026151657104492, -1.2449378967285156, -1.187260627746582, -1.1295832395553589, -1.0719059705734253, -1.0142285823822021, -0.9565512537956238, -0.8988739848136902, -0.8411966562271118, -0.7835193872451782, -0.7258420586585999, -0.6681647300720215, -0.6104874610900879, -0.5528103113174438, -0.49513301253318787, -0.4374557137489319, -0.3797783851623535, -0.32210108637809753, -0.26442378759384155, -0.20674645900726318, -0.1490691602230072, -0.09139186143875122, -0.03371455520391464, 0.023962751030921936, 0.08164006471633911, 0.1393173635005951, 0.19699466228485107, 0.25467199087142944, 0.3123492896556854, 0.3700265884399414, 0.4277038872241974, 0.48538118600845337, 0.5430585145950317, 0.6007357835769653, 0.6584131121635437, 0.7160904407501221, 0.7737677097320557, 0.831445038318634, 0.8891223669052124, 0.946799635887146, 1.0044770240783691, 1.0621542930603027, 1.1198315620422363, 1.17750883102417, 1.235186219215393, 1.2928634881973267]}, "eval/loss": 5.553798675537109, "eval/wer": 2.01330821102737, "eval/runtime": 947.3214, "eval/samples_per_second": 2.789, "eval/steps_per_second": 0.349} \ No newline at end of file +{"train/loss": 4.2487, "train/learning_rate": 5.102040816326531e-06, "train/epoch": 1.0, "train/global_step": 892, "_runtime": 6325, "_timestamp": 1646285118, "_step": 893, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 51.0, 788.0, 154.0, 11.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-157.27684020996094, -143.8236541748047, -130.37045288085938, -116.91726684570312, -103.46407318115234, -90.01087951660156, -76.55769348144531, -63.10449981689453, -49.65130615234375, -36.19811248779297, -22.744922637939453, -9.291732788085938, 4.161460876464844, 17.614654541015625, 31.067840576171875, 44.521034240722656, 57.97422790527344, 71.42742156982422, 84.880615234375, 98.33380126953125, 111.78699493408203, 125.24018859863281, 138.69337463378906, 152.14657592773438, 165.59976196289062, 179.05294799804688, 192.5061492919922, 205.95933532714844, 219.41253662109375, 232.86572265625, 246.31890869140625, 259.7720947265625, 273.22528076171875, 286.678466796875, 300.13165283203125, 313.5848388671875, 327.0380554199219, 340.4912414550781, 353.9444274902344, 367.3976135253906, 380.850830078125, 394.30401611328125, 407.7572021484375, 421.21038818359375, 434.6636047363281, 448.1167907714844, 461.5699768066406, 475.0231628417969, 488.4763488769531, 501.9295349121094, 515.3827514648438, 528.8359375, 542.2891235351562, 555.7423095703125, 569.1954956054688, 582.648681640625, 596.1018676757812, 609.5550537109375, 623.0082397460938, 636.46142578125, 649.9146118164062, 663.3677978515625, 676.821044921875, 690.2742309570312, 703.7274169921875]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 4.0, 0.0, 3.0, 9.0, 7.0, 7.0, 16.0, 23.0, 39.0, 34.0, 65.0, 107.0, 155.0, 167.0, 125.0, 93.0, 52.0, 31.0, 23.0, 12.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-367.9178161621094, -358.02044677734375, -348.12310791015625, -338.2257385253906, -328.3283996582031, -318.4310302734375, -308.53369140625, -298.6363220214844, -288.73895263671875, -278.8415832519531, -268.9442443847656, -259.046875, -249.14952087402344, -239.25216674804688, -229.3548126220703, -219.45745849609375, -209.5601043701172, -199.66275024414062, -189.76539611816406, -179.8680419921875, -169.97067260742188, -160.0733184814453, -150.17596435546875, -140.27859497070312, -130.38125610351562, -120.48390197753906, -110.58654022216797, -100.6891860961914, -90.79182434082031, -80.89447021484375, -70.99711608886719, -61.099754333496094, -51.202392578125, -41.30503463745117, -31.407678604125977, -21.51032257080078, -11.612964630126953, -1.715606689453125, 8.181747436523438, 18.07910919189453, 27.976463317871094, 37.87382125854492, 47.77117919921875, 57.66853332519531, 67.56588745117188, 77.46324920654297, 87.36060333251953, 97.25796508789062, 107.15531921386719, 117.05267333984375, 126.95003509521484, 136.84738159179688, 146.7447509765625, 156.64210510253906, 166.53945922851562, 176.43682861328125, 186.33416748046875, 196.2315216064453, 206.12887573242188, 216.0262451171875, 225.92359924316406, 235.82095336914062, 245.7183074951172, 255.61566162109375, 265.5130310058594]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 1.0, 4.0, 9.0, 7.0, 11.0, 17.0, 25.0, 38.0, 30.0, 72.0, 96.0, 131.0, 152.0, 130.0, 93.0, 59.0, 45.0, 28.0, 17.0, 8.0, 11.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.4296875, -5.28729248046875, -5.1448974609375, -5.00250244140625, -4.860107421875, -4.71771240234375, -4.5753173828125, -4.43292236328125, -4.29052734375, -4.14813232421875, -4.0057373046875, -3.86334228515625, -3.720947265625, -3.57855224609375, -3.4361572265625, -3.29376220703125, -3.1513671875, -3.00897216796875, -2.8665771484375, -2.72418212890625, -2.581787109375, -2.43939208984375, -2.2969970703125, -2.15460205078125, -2.01220703125, -1.86981201171875, -1.7274169921875, -1.58502197265625, -1.442626953125, -1.30023193359375, -1.1578369140625, -1.01544189453125, -0.873046875, -0.73065185546875, -0.5882568359375, -0.44586181640625, -0.303466796875, -0.16107177734375, -0.0186767578125, 0.12371826171875, 0.26611328125, 0.40850830078125, 0.5509033203125, 0.69329833984375, 0.835693359375, 0.97808837890625, 1.1204833984375, 1.26287841796875, 1.4052734375, 1.54766845703125, 1.6900634765625, 1.83245849609375, 1.974853515625, 2.11724853515625, 2.2596435546875, 2.40203857421875, 2.54443359375, 2.68682861328125, 2.8292236328125, 2.97161865234375, 3.114013671875, 3.25640869140625, 3.3988037109375, 3.54119873046875, 3.68359375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 17.0, 23.0, 17.0, 19.0, 36.0, 71.0, 92.0, 125.0, 210.0, 343.0, 642.0, 1381.0, 3303.0, 14395.0, 4000953.0, 161666.0, 7076.0, 2043.0, 852.0, 372.0, 248.0, 113.0, 84.0, 59.0, 28.0, 23.0, 25.0, 13.0, 6.0, 6.0, 8.0, 8.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-46.40625, -45.1787109375, -43.951171875, -42.7236328125, -41.49609375, -40.2685546875, -39.041015625, -37.8134765625, -36.5859375, -35.3583984375, -34.130859375, -32.9033203125, -31.67578125, -30.4482421875, -29.220703125, -27.9931640625, -26.765625, -25.5380859375, -24.310546875, -23.0830078125, -21.85546875, -20.6279296875, -19.400390625, -18.1728515625, -16.9453125, -15.7177734375, -14.490234375, -13.2626953125, -12.03515625, -10.8076171875, -9.580078125, -8.3525390625, -7.125, -5.8974609375, -4.669921875, -3.4423828125, -2.21484375, -0.9873046875, 0.240234375, 1.4677734375, 2.6953125, 3.9228515625, 5.150390625, 6.3779296875, 7.60546875, 8.8330078125, 10.060546875, 11.2880859375, 12.515625, 13.7431640625, 14.970703125, 16.1982421875, 17.42578125, 18.6533203125, 19.880859375, 21.1083984375, 22.3359375, 23.5634765625, 24.791015625, 26.0185546875, 27.24609375, 28.4736328125, 29.701171875, 30.9287109375, 32.15625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 14.0, 14.0, 16.0, 29.0, 28.0, 35.0, 65.0, 97.0, 169.0, 298.0, 640.0, 1029.0, 687.0, 371.0, 194.0, 111.0, 72.0, 54.0, 38.0, 27.0, 17.0, 12.0, 14.0, 9.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7421875, -9.387939453125, -9.03369140625, -8.679443359375, -8.3251953125, -7.970947265625, -7.61669921875, -7.262451171875, -6.908203125, -6.553955078125, -6.19970703125, -5.845458984375, -5.4912109375, -5.136962890625, -4.78271484375, -4.428466796875, -4.07421875, -3.719970703125, -3.36572265625, -3.011474609375, -2.6572265625, -2.302978515625, -1.94873046875, -1.594482421875, -1.240234375, -0.885986328125, -0.53173828125, -0.177490234375, 0.1767578125, 0.531005859375, 0.88525390625, 1.239501953125, 1.59375, 1.947998046875, 2.30224609375, 2.656494140625, 3.0107421875, 3.364990234375, 3.71923828125, 4.073486328125, 4.427734375, 4.781982421875, 5.13623046875, 5.490478515625, 5.8447265625, 6.198974609375, 6.55322265625, 6.907470703125, 7.26171875, 7.615966796875, 7.97021484375, 8.324462890625, 8.6787109375, 9.032958984375, 9.38720703125, 9.741455078125, 10.095703125, 10.449951171875, 10.80419921875, 11.158447265625, 11.5126953125, 11.866943359375, 12.22119140625, 12.575439453125, 12.9296875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 11.0, 21.0, 19.0, 25.0, 42.0, 61.0, 81.0, 121.0, 177.0, 320.0, 1004.0, 6191.0, 151149.0, 3984397.0, 45848.0, 3317.0, 701.0, 284.0, 157.0, 97.0, 57.0, 66.0, 38.0, 25.0, 20.0, 15.0, 4.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-36.53125, -35.5263671875, -34.521484375, -33.5166015625, -32.51171875, -31.5068359375, -30.501953125, -29.4970703125, -28.4921875, -27.4873046875, -26.482421875, -25.4775390625, -24.47265625, -23.4677734375, -22.462890625, -21.4580078125, -20.453125, -19.4482421875, -18.443359375, -17.4384765625, -16.43359375, -15.4287109375, -14.423828125, -13.4189453125, -12.4140625, -11.4091796875, -10.404296875, -9.3994140625, -8.39453125, -7.3896484375, -6.384765625, -5.3798828125, -4.375, -3.3701171875, -2.365234375, -1.3603515625, -0.35546875, 0.6494140625, 1.654296875, 2.6591796875, 3.6640625, 4.6689453125, 5.673828125, 6.6787109375, 7.68359375, 8.6884765625, 9.693359375, 10.6982421875, 11.703125, 12.7080078125, 13.712890625, 14.7177734375, 15.72265625, 16.7275390625, 17.732421875, 18.7373046875, 19.7421875, 20.7470703125, 21.751953125, 22.7568359375, 23.76171875, 24.7666015625, 25.771484375, 26.7763671875, 27.78125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 52.0, 218.0, 463.0, 201.0, 59.0, 8.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.93682098388672, -117.5113754272461, -115.0859375, -112.66049194335938, -110.23505401611328, -107.80960845947266, -105.38417053222656, -102.95872497558594, -100.53327941894531, -98.10783386230469, -95.6823959350586, -93.25695037841797, -90.83151245117188, -88.40606689453125, -85.98062133789062, -83.55518341064453, -81.12974548339844, -78.70429992675781, -76.27886199951172, -73.8534164428711, -71.427978515625, -69.00253295898438, -66.57708740234375, -64.15164947509766, -61.72620391845703, -59.30076217651367, -56.87532043457031, -54.44987487792969, -52.02443313598633, -49.59899139404297, -47.17354965209961, -44.74810791015625, -42.32265853881836, -39.897216796875, -37.47177505493164, -35.04633331298828, -32.620887756347656, -30.195446014404297, -27.770004272460938, -25.344560623168945, -22.919118881225586, -20.493677139282227, -18.068233489990234, -15.642791748046875, -13.2173490524292, -10.791906356811523, -8.366464614868164, -5.941020965576172, -3.5155792236328125, -1.0901367664337158, 1.3353056907653809, 3.7607479095458984, 6.186190605163574, 8.61163330078125, 11.03707504272461, 13.462518692016602, 15.887960433959961, 18.31340217590332, 20.738845825195312, 23.164287567138672, 25.58972930908203, 28.015172958374023, 30.440614700317383, 32.866058349609375, 35.291500091552734]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 8.0, 12.0, 9.0, 17.0, 13.0, 19.0, 21.0, 30.0, 21.0, 32.0, 32.0, 33.0, 46.0, 40.0, 42.0, 40.0, 49.0, 42.0, 44.0, 41.0, 39.0, 47.0, 38.0, 38.0, 40.0, 26.0, 25.0, 32.0, 23.0, 16.0, 15.0, 12.0, 14.0, 8.0, 5.0, 3.0, 9.0, 9.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.84715270996094, -32.708274841308594, -31.56939697265625, -30.430519104003906, -29.291641235351562, -28.15276336669922, -27.013885498046875, -25.87500762939453, -24.736129760742188, -23.597251892089844, -22.4583740234375, -21.319496154785156, -20.180618286132812, -19.04174041748047, -17.902862548828125, -16.76398468017578, -15.625104904174805, -14.486227035522461, -13.347349166870117, -12.208471298217773, -11.06959342956543, -9.930715560913086, -8.791836738586426, -7.652958869934082, -6.514081001281738, -5.3752031326293945, -4.236325263977051, -3.097446918487549, -1.958569049835205, -0.8196911811828613, 0.3191871643066406, 1.4580650329589844, 2.596942901611328, 3.735820770263672, 4.874698638916016, 6.013576984405518, 7.152454853057861, 8.291332244873047, 9.430211067199707, 10.56908893585205, 11.707966804504395, 12.846844673156738, 13.985722541809082, 15.124601364135742, 16.263479232788086, 17.40235710144043, 18.541234970092773, 19.680112838745117, 20.81899070739746, 21.957868576049805, 23.09674644470215, 24.235624313354492, 25.374502182006836, 26.51338005065918, 27.652259826660156, 28.7911376953125, 29.930015563964844, 31.068893432617188, 32.20777130126953, 33.346649169921875, 34.48552703857422, 35.62440490722656, 36.763282775878906, 37.90216064453125, 39.041038513183594]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 4.0, 2.0, 8.0, 14.0, 10.0, 28.0, 29.0, 42.0, 50.0, 83.0, 106.0, 125.0, 157.0, 104.0, 76.0, 56.0, 36.0, 27.0, 13.0, 10.0, 7.0, 1.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.046875, -4.91290283203125, -4.7789306640625, -4.64495849609375, -4.510986328125, -4.37701416015625, -4.2430419921875, -4.10906982421875, -3.97509765625, -3.84112548828125, -3.7071533203125, -3.57318115234375, -3.439208984375, -3.30523681640625, -3.1712646484375, -3.03729248046875, -2.9033203125, -2.76934814453125, -2.6353759765625, -2.50140380859375, -2.367431640625, -2.23345947265625, -2.0994873046875, -1.96551513671875, -1.83154296875, -1.69757080078125, -1.5635986328125, -1.42962646484375, -1.295654296875, -1.16168212890625, -1.0277099609375, -0.89373779296875, -0.759765625, -0.62579345703125, -0.4918212890625, -0.35784912109375, -0.223876953125, -0.08990478515625, 0.0440673828125, 0.17803955078125, 0.31201171875, 0.44598388671875, 0.5799560546875, 0.71392822265625, 0.847900390625, 0.98187255859375, 1.1158447265625, 1.24981689453125, 1.3837890625, 1.51776123046875, 1.6517333984375, 1.78570556640625, 1.919677734375, 2.05364990234375, 2.1876220703125, 2.32159423828125, 2.45556640625, 2.58953857421875, 2.7235107421875, 2.85748291015625, 2.991455078125, 3.12542724609375, 3.2593994140625, 3.39337158203125, 3.52734375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 11.0, 5.0, 12.0, 10.0, 17.0, 19.0, 30.0, 37.0, 57.0, 77.0, 121.0, 180.0, 262.0, 416.0, 633.0, 993.0, 1474.0, 2513.0, 4484.0, 8982.0, 21978.0, 71196.0, 434702.0, 391400.0, 68229.0, 20756.0, 9021.0, 4418.0, 2397.0, 1447.0, 944.0, 583.0, 373.0, 238.0, 151.0, 125.0, 70.0, 58.0, 36.0, 30.0, 20.0, 11.0, 15.0, 4.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2352294921875, -0.22763633728027344, -0.22004318237304688, -0.2124500274658203, -0.20485687255859375, -0.1972637176513672, -0.18967056274414062, -0.18207740783691406, -0.1744842529296875, -0.16689109802246094, -0.15929794311523438, -0.1517047882080078, -0.14411163330078125, -0.1365184783935547, -0.12892532348632812, -0.12133216857910156, -0.113739013671875, -0.10614585876464844, -0.09855270385742188, -0.09095954895019531, -0.08336639404296875, -0.07577323913574219, -0.06818008422851562, -0.06058692932128906, -0.0529937744140625, -0.04540061950683594, -0.037807464599609375, -0.030214309692382812, -0.02262115478515625, -0.015027999877929688, -0.007434844970703125, 0.0001583099365234375, 0.00775146484375, 0.015344619750976562, 0.022937774658203125, 0.030530929565429688, 0.03812408447265625, 0.04571723937988281, 0.053310394287109375, 0.06090354919433594, 0.0684967041015625, 0.07608985900878906, 0.08368301391601562, 0.09127616882324219, 0.09886932373046875, 0.10646247863769531, 0.11405563354492188, 0.12164878845214844, 0.129241943359375, 0.13683509826660156, 0.14442825317382812, 0.1520214080810547, 0.15961456298828125, 0.1672077178955078, 0.17480087280273438, 0.18239402770996094, 0.1899871826171875, 0.19758033752441406, 0.20517349243164062, 0.2127666473388672, 0.22035980224609375, 0.2279529571533203, 0.23554611206054688, 0.24313926696777344, 0.250732421875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 6.0, 4.0, 8.0, 12.0, 16.0, 24.0, 24.0, 28.0, 25.0, 33.0, 33.0, 27.0, 29.0, 39.0, 50.0, 44.0, 50.0, 1064.0, 62.0, 48.0, 59.0, 36.0, 49.0, 38.0, 34.0, 24.0, 27.0, 23.0, 18.0, 25.0, 16.0, 10.0, 14.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0546875, -2.952239990234375, -2.84979248046875, -2.747344970703125, -2.6448974609375, -2.542449951171875, -2.44000244140625, -2.337554931640625, -2.235107421875, -2.132659912109375, -2.03021240234375, -1.927764892578125, -1.8253173828125, -1.722869873046875, -1.62042236328125, -1.517974853515625, -1.41552734375, -1.313079833984375, -1.21063232421875, -1.108184814453125, -1.0057373046875, -0.903289794921875, -0.80084228515625, -0.698394775390625, -0.595947265625, -0.493499755859375, -0.39105224609375, -0.288604736328125, -0.1861572265625, -0.083709716796875, 0.01873779296875, 0.121185302734375, 0.2236328125, 0.326080322265625, 0.42852783203125, 0.530975341796875, 0.6334228515625, 0.735870361328125, 0.83831787109375, 0.940765380859375, 1.043212890625, 1.145660400390625, 1.24810791015625, 1.350555419921875, 1.4530029296875, 1.555450439453125, 1.65789794921875, 1.760345458984375, 1.86279296875, 1.965240478515625, 2.06768798828125, 2.170135498046875, 2.2725830078125, 2.375030517578125, 2.47747802734375, 2.579925537109375, 2.682373046875, 2.784820556640625, 2.88726806640625, 2.989715576171875, 3.0921630859375, 3.194610595703125, 3.29705810546875, 3.399505615234375, 3.501953125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 10.0, 10.0, 12.0, 31.0, 32.0, 44.0, 77.0, 125.0, 156.0, 244.0, 444.0, 616.0, 1009.0, 1529.0, 2345.0, 3568.0, 5616.0, 8782.0, 14055.0, 22371.0, 36501.0, 61429.0, 111638.0, 1282345.0, 290438.0, 103776.0, 57655.0, 34439.0, 21122.0, 13204.0, 8499.0, 5444.0, 3410.0, 2157.0, 1433.0, 869.0, 593.0, 387.0, 269.0, 149.0, 105.0, 80.0, 39.0, 31.0, 14.0, 13.0, 7.0, 4.0, 7.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.08544921875, -0.082855224609375, -0.08026123046875, -0.077667236328125, -0.0750732421875, -0.072479248046875, -0.06988525390625, -0.067291259765625, -0.064697265625, -0.062103271484375, -0.05950927734375, -0.056915283203125, -0.0543212890625, -0.051727294921875, -0.04913330078125, -0.046539306640625, -0.0439453125, -0.041351318359375, -0.03875732421875, -0.036163330078125, -0.0335693359375, -0.030975341796875, -0.02838134765625, -0.025787353515625, -0.023193359375, -0.020599365234375, -0.01800537109375, -0.015411376953125, -0.0128173828125, -0.010223388671875, -0.00762939453125, -0.005035400390625, -0.00244140625, 0.000152587890625, 0.00274658203125, 0.005340576171875, 0.0079345703125, 0.010528564453125, 0.01312255859375, 0.015716552734375, 0.018310546875, 0.020904541015625, 0.02349853515625, 0.026092529296875, 0.0286865234375, 0.031280517578125, 0.03387451171875, 0.036468505859375, 0.0390625, 0.041656494140625, 0.04425048828125, 0.046844482421875, 0.0494384765625, 0.052032470703125, 0.05462646484375, 0.057220458984375, 0.059814453125, 0.062408447265625, 0.06500244140625, 0.067596435546875, 0.0701904296875, 0.072784423828125, 0.07537841796875, 0.077972412109375, 0.08056640625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 7.0, 4.0, 9.0, 15.0, 14.0, 12.0, 14.0, 30.0, 30.0, 29.0, 47.0, 38.0, 49.0, 65.0, 74.0, 79.0, 85.0, 49.0, 59.0, 35.0, 40.0, 32.0, 31.0, 38.0, 15.0, 25.0, 17.0, 10.0, 11.0, 8.0, 7.0, 6.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006933212280273438, -0.0006714761257171631, -0.0006496310234069824, -0.0006277859210968018, -0.0006059408187866211, -0.0005840957164764404, -0.0005622506141662598, -0.0005404055118560791, -0.0005185604095458984, -0.0004967153072357178, -0.0004748702049255371, -0.00045302510261535645, -0.0004311800003051758, -0.0004093348979949951, -0.00038748979568481445, -0.0003656446933746338, -0.0003437995910644531, -0.00032195448875427246, -0.0003001093864440918, -0.00027826428413391113, -0.00025641918182373047, -0.0002345740795135498, -0.00021272897720336914, -0.00019088387489318848, -0.0001690387725830078, -0.00014719367027282715, -0.00012534856796264648, -0.00010350346565246582, -8.165836334228516e-05, -5.981326103210449e-05, -3.796815872192383e-05, -1.6123056411743164e-05, 5.7220458984375e-06, 2.7567148208618164e-05, 4.941225051879883e-05, 7.125735282897949e-05, 9.310245513916016e-05, 0.00011494755744934082, 0.00013679265975952148, 0.00015863776206970215, 0.0001804828643798828, 0.00020232796669006348, 0.00022417306900024414, 0.0002460181713104248, 0.00026786327362060547, 0.00028970837593078613, 0.0003115534782409668, 0.00033339858055114746, 0.0003552436828613281, 0.0003770887851715088, 0.00039893388748168945, 0.0004207789897918701, 0.0004426240921020508, 0.00046446919441223145, 0.0004863142967224121, 0.0005081593990325928, 0.0005300045013427734, 0.0005518496036529541, 0.0005736947059631348, 0.0005955398082733154, 0.0006173849105834961, 0.0006392300128936768, 0.0006610751152038574, 0.0006829202175140381, 0.0007047653198242188]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 4.0, 8.0, 11.0, 11.0, 15.0, 16.0, 24.0, 34.0, 50.0, 62.0, 72.0, 88.0, 127.0, 133.0, 217.0, 227.0, 366.0, 27533.0, 1017823.0, 448.0, 309.0, 193.0, 151.0, 156.0, 98.0, 94.0, 73.0, 40.0, 37.0, 34.0, 25.0, 15.0, 12.0, 14.0, 5.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0141448974609375, -0.013705253601074219, -0.013265609741210938, -0.012825965881347656, -0.012386322021484375, -0.011946678161621094, -0.011507034301757812, -0.011067390441894531, -0.01062774658203125, -0.010188102722167969, -0.009748458862304688, -0.009308815002441406, -0.008869171142578125, -0.008429527282714844, -0.007989883422851562, -0.007550239562988281, -0.007110595703125, -0.006670951843261719, -0.0062313079833984375, -0.005791664123535156, -0.005352020263671875, -0.004912376403808594, -0.0044727325439453125, -0.004033088684082031, -0.00359344482421875, -0.0031538009643554688, -0.0027141571044921875, -0.0022745132446289062, -0.001834869384765625, -0.0013952255249023438, -0.0009555816650390625, -0.0005159378051757812, -7.62939453125e-05, 0.00036334991455078125, 0.0008029937744140625, 0.0012426376342773438, 0.001682281494140625, 0.0021219253540039062, 0.0025615692138671875, 0.0030012130737304688, 0.00344085693359375, 0.0038805007934570312, 0.0043201446533203125, 0.004759788513183594, 0.005199432373046875, 0.005639076232910156, 0.0060787200927734375, 0.006518363952636719, 0.0069580078125, 0.007397651672363281, 0.007837295532226562, 0.008276939392089844, 0.008716583251953125, 0.009156227111816406, 0.009595870971679688, 0.010035514831542969, 0.01047515869140625, 0.010914802551269531, 0.011354446411132812, 0.011794090270996094, 0.012233734130859375, 0.012673377990722656, 0.013113021850585938, 0.013552665710449219, 0.0139923095703125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1010.0, 4.0], "bins": [-0.01571698673069477, -0.015465534292161465, -0.015214082784950733, -0.014962630346417427, -0.014711177907884121, -0.014459725469350815, -0.014208273962140083, -0.013956821523606777, -0.013705369085073471, -0.013453916646540165, -0.013202465139329433, -0.012951012700796127, -0.012699560262262821, -0.012448107823729515, -0.012196656316518784, -0.011945203877985477, -0.011693752370774746, -0.01144229993224144, -0.011190848425030708, -0.010939395986497402, -0.010687943547964096, -0.010436492040753365, -0.010185039602220058, -0.009933587163686752, -0.00968213565647602, -0.009430683217942715, -0.009179231710731983, -0.008927779272198677, -0.008676326833665371, -0.008424874395132065, -0.008173422887921333, -0.007921970449388027, -0.0076705170795321465, -0.007419065106660128, -0.0071676126681268215, -0.006916160695254803, -0.006664708256721497, -0.006413256283849478, -0.006161804310977459, -0.005910351872444153, -0.005658899899572134, -0.005407447926700115, -0.005155995488166809, -0.00490454351529479, -0.0046530915424227715, -0.004401639103889465, -0.0041501871310174465, -0.003898734925314784, -0.0036472827196121216, -0.003395830513909459, -0.0031443783082067966, -0.002892926335334778, -0.0026414741296321154, -0.002390021923929453, -0.002138569951057434, -0.0018871177453547716, -0.001635665656067431, -0.0013842135667800903, -0.0011327613610774279, -0.0008813092135824263, -0.0006298570660874248, -0.0003784048603847623, -0.00012695277109742165, 0.000124499318189919, 0.0003759515529964119]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 19.0, 17.0, 21.0, 24.0, 33.0, 25.0, 36.0, 58.0, 48.0, 53.0, 68.0, 67.0, 60.0, 60.0, 61.0, 56.0, 43.0, 46.0, 44.0, 29.0, 35.0, 24.0, 14.0, 19.0, 9.0, 8.0, 5.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006846189498901367, -0.0006620734930038452, -0.0006395280361175537, -0.0006169825792312622, -0.0005944371223449707, -0.0005718916654586792, -0.0005493462085723877, -0.0005268007516860962, -0.0005042552947998047, -0.0004817098379135132, -0.0004591643810272217, -0.0004366189241409302, -0.00041407346725463867, -0.00039152801036834717, -0.00036898255348205566, -0.00034643709659576416, -0.00032389163970947266, -0.00030134618282318115, -0.00027880072593688965, -0.00025625526905059814, -0.00023370981216430664, -0.00021116435527801514, -0.00018861889839172363, -0.00016607344150543213, -0.00014352798461914062, -0.00012098252773284912, -9.843707084655762e-05, -7.589161396026611e-05, -5.334615707397461e-05, -3.0800700187683105e-05, -8.255243301391602e-06, 1.4290213584899902e-05, 3.6835670471191406e-05, 5.938112735748291e-05, 8.192658424377441e-05, 0.00010447204113006592, 0.00012701749801635742, 0.00014956295490264893, 0.00017210841178894043, 0.00019465386867523193, 0.00021719932556152344, 0.00023974478244781494, 0.00026229023933410645, 0.00028483569622039795, 0.00030738115310668945, 0.00032992660999298096, 0.00035247206687927246, 0.00037501752376556396, 0.00039756298065185547, 0.00042010843753814697, 0.0004426538944244385, 0.00046519935131073, 0.0004877448081970215, 0.000510290265083313, 0.0005328357219696045, 0.000555381178855896, 0.0005779266357421875, 0.000600472092628479, 0.0006230175495147705, 0.000645563006401062, 0.0006681084632873535, 0.000690653920173645, 0.0007131993770599365, 0.000735744833946228, 0.0007582902908325195]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 4.0, 2.0, 8.0, 14.0, 10.0, 28.0, 29.0, 42.0, 50.0, 83.0, 106.0, 125.0, 157.0, 104.0, 76.0, 56.0, 36.0, 27.0, 13.0, 10.0, 7.0, 1.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.046875, -4.91290283203125, -4.7789306640625, -4.64495849609375, -4.510986328125, -4.37701416015625, -4.2430419921875, -4.10906982421875, -3.97509765625, -3.84112548828125, -3.7071533203125, -3.57318115234375, -3.439208984375, -3.30523681640625, -3.1712646484375, -3.03729248046875, -2.9033203125, -2.76934814453125, -2.6353759765625, -2.50140380859375, -2.367431640625, -2.23345947265625, -2.0994873046875, -1.96551513671875, -1.83154296875, -1.69757080078125, -1.5635986328125, -1.42962646484375, -1.295654296875, -1.16168212890625, -1.0277099609375, -0.89373779296875, -0.759765625, -0.62579345703125, -0.4918212890625, -0.35784912109375, -0.223876953125, -0.08990478515625, 0.0440673828125, 0.17803955078125, 0.31201171875, 0.44598388671875, 0.5799560546875, 0.71392822265625, 0.847900390625, 0.98187255859375, 1.1158447265625, 1.24981689453125, 1.3837890625, 1.51776123046875, 1.6517333984375, 1.78570556640625, 1.919677734375, 2.05364990234375, 2.1876220703125, 2.32159423828125, 2.45556640625, 2.58953857421875, 2.7235107421875, 2.85748291015625, 2.991455078125, 3.12542724609375, 3.2593994140625, 3.39337158203125, 3.52734375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 7.0, 6.0, 11.0, 16.0, 29.0, 32.0, 56.0, 89.0, 94.0, 165.0, 250.0, 486.0, 955.0, 1974.0, 5367.0, 28971.0, 923839.0, 73186.0, 7823.0, 2549.0, 1160.0, 610.0, 312.0, 184.0, 114.0, 79.0, 51.0, 50.0, 28.0, 12.0, 11.0, 9.0, 12.0, 2.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.328125, -26.515869140625, -25.70361328125, -24.891357421875, -24.0791015625, -23.266845703125, -22.45458984375, -21.642333984375, -20.830078125, -20.017822265625, -19.20556640625, -18.393310546875, -17.5810546875, -16.768798828125, -15.95654296875, -15.144287109375, -14.33203125, -13.519775390625, -12.70751953125, -11.895263671875, -11.0830078125, -10.270751953125, -9.45849609375, -8.646240234375, -7.833984375, -7.021728515625, -6.20947265625, -5.397216796875, -4.5849609375, -3.772705078125, -2.96044921875, -2.148193359375, -1.3359375, -0.523681640625, 0.28857421875, 1.100830078125, 1.9130859375, 2.725341796875, 3.53759765625, 4.349853515625, 5.162109375, 5.974365234375, 6.78662109375, 7.598876953125, 8.4111328125, 9.223388671875, 10.03564453125, 10.847900390625, 11.66015625, 12.472412109375, 13.28466796875, 14.096923828125, 14.9091796875, 15.721435546875, 16.53369140625, 17.345947265625, 18.158203125, 18.970458984375, 19.78271484375, 20.594970703125, 21.4072265625, 22.219482421875, 23.03173828125, 23.843994140625, 24.65625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 8.0, 7.0, 12.0, 11.0, 18.0, 19.0, 14.0, 28.0, 26.0, 18.0, 37.0, 33.0, 39.0, 51.0, 55.0, 59.0, 96.0, 192.0, 1520.0, 226.0, 100.0, 87.0, 63.0, 28.0, 43.0, 39.0, 24.0, 25.0, 29.0, 21.0, 18.0, 16.0, 11.0, 11.0, 12.0, 7.0, 12.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.69921875, -6.47332763671875, -6.2474365234375, -6.02154541015625, -5.795654296875, -5.56976318359375, -5.3438720703125, -5.11798095703125, -4.89208984375, -4.66619873046875, -4.4403076171875, -4.21441650390625, -3.988525390625, -3.76263427734375, -3.5367431640625, -3.31085205078125, -3.0849609375, -2.85906982421875, -2.6331787109375, -2.40728759765625, -2.181396484375, -1.95550537109375, -1.7296142578125, -1.50372314453125, -1.27783203125, -1.05194091796875, -0.8260498046875, -0.60015869140625, -0.374267578125, -0.14837646484375, 0.0775146484375, 0.30340576171875, 0.529296875, 0.75518798828125, 0.9810791015625, 1.20697021484375, 1.432861328125, 1.65875244140625, 1.8846435546875, 2.11053466796875, 2.33642578125, 2.56231689453125, 2.7882080078125, 3.01409912109375, 3.239990234375, 3.46588134765625, 3.6917724609375, 3.91766357421875, 4.1435546875, 4.36944580078125, 4.5953369140625, 4.82122802734375, 5.047119140625, 5.27301025390625, 5.4989013671875, 5.72479248046875, 5.95068359375, 6.17657470703125, 6.4024658203125, 6.62835693359375, 6.854248046875, 7.08013916015625, 7.3060302734375, 7.53192138671875, 7.7578125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 11.0, 10.0, 6.0, 12.0, 16.0, 11.0, 22.0, 28.0, 23.0, 32.0, 42.0, 50.0, 81.0, 166.0, 335.0, 1262.0, 24451.0, 3090122.0, 26731.0, 1307.0, 384.0, 164.0, 95.0, 59.0, 45.0, 40.0, 25.0, 27.0, 21.0, 18.0, 23.0, 16.0, 6.0, 11.0, 12.0, 5.0, 10.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.25, -29.319580078125, -28.38916015625, -27.458740234375, -26.5283203125, -25.597900390625, -24.66748046875, -23.737060546875, -22.806640625, -21.876220703125, -20.94580078125, -20.015380859375, -19.0849609375, -18.154541015625, -17.22412109375, -16.293701171875, -15.36328125, -14.432861328125, -13.50244140625, -12.572021484375, -11.6416015625, -10.711181640625, -9.78076171875, -8.850341796875, -7.919921875, -6.989501953125, -6.05908203125, -5.128662109375, -4.1982421875, -3.267822265625, -2.33740234375, -1.406982421875, -0.4765625, 0.453857421875, 1.38427734375, 2.314697265625, 3.2451171875, 4.175537109375, 5.10595703125, 6.036376953125, 6.966796875, 7.897216796875, 8.82763671875, 9.758056640625, 10.6884765625, 11.618896484375, 12.54931640625, 13.479736328125, 14.41015625, 15.340576171875, 16.27099609375, 17.201416015625, 18.1318359375, 19.062255859375, 19.99267578125, 20.923095703125, 21.853515625, 22.783935546875, 23.71435546875, 24.644775390625, 25.5751953125, 26.505615234375, 27.43603515625, 28.366455078125, 29.296875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 15.0, 219.0, 633.0, 135.0, 15.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.684745788574219, -5.3429388999938965, -3.001132011413574, -0.659325122833252, 1.6824817657470703, 4.024288177490234, 6.366095542907715, 8.707902908325195, 11.04970932006836, 13.391515731811523, 15.733323097229004, 18.075130462646484, 20.41693687438965, 22.758743286132812, 25.10055160522461, 27.442358016967773, 29.784164428710938, 32.125972747802734, 34.467777252197266, 36.80958557128906, 39.151390075683594, 41.49319839477539, 43.83500671386719, 46.17681121826172, 48.518619537353516, 50.86042785644531, 53.202232360839844, 55.54404067993164, 57.88584899902344, 60.22765350341797, 62.569461822509766, 64.91127014160156, 67.25308227539062, 69.59488677978516, 71.93669891357422, 74.27850341796875, 76.62030792236328, 78.96211242675781, 81.30392456054688, 83.6457290649414, 85.98753356933594, 88.32933807373047, 90.67115020751953, 93.01295471191406, 95.3547592163086, 97.69656372070312, 100.03837585449219, 102.38018035888672, 104.72199249267578, 107.06379699707031, 109.40560913085938, 111.7474136352539, 114.08921813964844, 116.4310302734375, 118.77283477783203, 121.11463928222656, 123.45645141601562, 125.79825592041016, 128.1400604248047, 130.48187255859375, 132.8236846923828, 135.1654815673828, 137.50729370117188, 139.84910583496094, 142.19090270996094]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 7.0, 5.0, 8.0, 5.0, 14.0, 26.0, 16.0, 16.0, 21.0, 23.0, 30.0, 31.0, 37.0, 44.0, 23.0, 37.0, 48.0, 32.0, 48.0, 37.0, 48.0, 35.0, 38.0, 47.0, 42.0, 29.0, 37.0, 28.0, 28.0, 29.0, 24.0, 22.0, 9.0, 11.0, 14.0, 12.0, 5.0, 4.0, 10.0, 14.0, 6.0, 1.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0], "bins": [-27.12782096862793, -26.352937698364258, -25.578054428100586, -24.80316925048828, -24.02828598022461, -23.253402709960938, -22.478519439697266, -21.703636169433594, -20.928752899169922, -20.15386962890625, -19.378986358642578, -18.604103088378906, -17.8292179107666, -17.05433464050293, -16.279451370239258, -15.504568099975586, -14.729682922363281, -13.95479965209961, -13.179915428161621, -12.40503215789795, -11.630147933959961, -10.855264663696289, -10.080381393432617, -9.305498123168945, -8.530613899230957, -7.755730152130127, -6.980846405029297, -6.205963134765625, -5.431079387664795, -4.656195640563965, -3.881312370300293, -3.106428623199463, -2.3315467834472656, -1.556663155555725, -0.7817795276641846, -0.006896018981933594, 0.7679877281188965, 1.5428714752197266, 2.3177547454833984, 3.0926384925842285, 3.8675222396850586, 4.642405986785889, 5.417289733886719, 6.192173004150391, 6.967056751251221, 7.741940498352051, 8.516823768615723, 9.291707992553711, 10.066591262817383, 10.841474533081055, 11.616358757019043, 12.391242027282715, 13.166126251220703, 13.941009521484375, 14.715892791748047, 15.490776062011719, 16.26565933227539, 17.040542602539062, 17.815425872802734, 18.590309143066406, 19.36519432067871, 20.140077590942383, 20.914960861206055, 21.689844131469727, 22.46472930908203]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 3.0, 2.0, 8.0, 14.0, 11.0, 28.0, 36.0, 40.0, 58.0, 91.0, 113.0, 116.0, 138.0, 102.0, 79.0, 57.0, 34.0, 22.0, 18.0, 10.0, 4.0, 4.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.10546875, -4.969482421875, -4.83349609375, -4.697509765625, -4.5615234375, -4.425537109375, -4.28955078125, -4.153564453125, -4.017578125, -3.881591796875, -3.74560546875, -3.609619140625, -3.4736328125, -3.337646484375, -3.20166015625, -3.065673828125, -2.9296875, -2.793701171875, -2.65771484375, -2.521728515625, -2.3857421875, -2.249755859375, -2.11376953125, -1.977783203125, -1.841796875, -1.705810546875, -1.56982421875, -1.433837890625, -1.2978515625, -1.161865234375, -1.02587890625, -0.889892578125, -0.75390625, -0.617919921875, -0.48193359375, -0.345947265625, -0.2099609375, -0.073974609375, 0.06201171875, 0.197998046875, 0.333984375, 0.469970703125, 0.60595703125, 0.741943359375, 0.8779296875, 1.013916015625, 1.14990234375, 1.285888671875, 1.421875, 1.557861328125, 1.69384765625, 1.829833984375, 1.9658203125, 2.101806640625, 2.23779296875, 2.373779296875, 2.509765625, 2.645751953125, 2.78173828125, 2.917724609375, 3.0537109375, 3.189697265625, 3.32568359375, 3.461669921875, 3.59765625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 8.0, 11.0, 9.0, 12.0, 27.0, 28.0, 59.0, 92.0, 158.0, 212.0, 540.0, 1289.0, 4332.0, 61982.0, 4104052.0, 17378.0, 2580.0, 780.0, 328.0, 160.0, 89.0, 53.0, 37.0, 18.0, 9.0, 14.0, 7.0, 5.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.75, -41.60498046875, -40.4599609375, -39.31494140625, -38.169921875, -37.02490234375, -35.8798828125, -34.73486328125, -33.58984375, -32.44482421875, -31.2998046875, -30.15478515625, -29.009765625, -27.86474609375, -26.7197265625, -25.57470703125, -24.4296875, -23.28466796875, -22.1396484375, -20.99462890625, -19.849609375, -18.70458984375, -17.5595703125, -16.41455078125, -15.26953125, -14.12451171875, -12.9794921875, -11.83447265625, -10.689453125, -9.54443359375, -8.3994140625, -7.25439453125, -6.109375, -4.96435546875, -3.8193359375, -2.67431640625, -1.529296875, -0.38427734375, 0.7607421875, 1.90576171875, 3.05078125, 4.19580078125, 5.3408203125, 6.48583984375, 7.630859375, 8.77587890625, 9.9208984375, 11.06591796875, 12.2109375, 13.35595703125, 14.5009765625, 15.64599609375, 16.791015625, 17.93603515625, 19.0810546875, 20.22607421875, 21.37109375, 22.51611328125, 23.6611328125, 24.80615234375, 25.951171875, 27.09619140625, 28.2412109375, 29.38623046875, 30.53125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 6.0, 6.0, 13.0, 8.0, 15.0, 19.0, 25.0, 32.0, 48.0, 98.0, 107.0, 210.0, 304.0, 550.0, 799.0, 665.0, 399.0, 251.0, 162.0, 105.0, 60.0, 46.0, 30.0, 24.0, 18.0, 7.0, 12.0, 8.0, 7.0, 10.0, 3.0, 8.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.890625, -7.6336669921875, -7.376708984375, -7.1197509765625, -6.86279296875, -6.6058349609375, -6.348876953125, -6.0919189453125, -5.8349609375, -5.5780029296875, -5.321044921875, -5.0640869140625, -4.80712890625, -4.5501708984375, -4.293212890625, -4.0362548828125, -3.779296875, -3.5223388671875, -3.265380859375, -3.0084228515625, -2.75146484375, -2.4945068359375, -2.237548828125, -1.9805908203125, -1.7236328125, -1.4666748046875, -1.209716796875, -0.9527587890625, -0.69580078125, -0.4388427734375, -0.181884765625, 0.0750732421875, 0.33203125, 0.5889892578125, 0.845947265625, 1.1029052734375, 1.35986328125, 1.6168212890625, 1.873779296875, 2.1307373046875, 2.3876953125, 2.6446533203125, 2.901611328125, 3.1585693359375, 3.41552734375, 3.6724853515625, 3.929443359375, 4.1864013671875, 4.443359375, 4.7003173828125, 4.957275390625, 5.2142333984375, 5.47119140625, 5.7281494140625, 5.985107421875, 6.2420654296875, 6.4990234375, 6.7559814453125, 7.012939453125, 7.2698974609375, 7.52685546875, 7.7838134765625, 8.040771484375, 8.2977294921875, 8.5546875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 6.0, 6.0, 15.0, 17.0, 18.0, 56.0, 74.0, 113.0, 178.0, 335.0, 525.0, 942.0, 1678.0, 3245.0, 6484.0, 14236.0, 38563.0, 151931.0, 1371988.0, 2287519.0, 232318.0, 50384.0, 17758.0, 7684.0, 3695.0, 1892.0, 1073.0, 614.0, 354.0, 224.0, 119.0, 92.0, 42.0, 31.0, 22.0, 17.0, 16.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.5859375, -11.236083984375, -10.88623046875, -10.536376953125, -10.1865234375, -9.836669921875, -9.48681640625, -9.136962890625, -8.787109375, -8.437255859375, -8.08740234375, -7.737548828125, -7.3876953125, -7.037841796875, -6.68798828125, -6.338134765625, -5.98828125, -5.638427734375, -5.28857421875, -4.938720703125, -4.5888671875, -4.239013671875, -3.88916015625, -3.539306640625, -3.189453125, -2.839599609375, -2.48974609375, -2.139892578125, -1.7900390625, -1.440185546875, -1.09033203125, -0.740478515625, -0.390625, -0.040771484375, 0.30908203125, 0.658935546875, 1.0087890625, 1.358642578125, 1.70849609375, 2.058349609375, 2.408203125, 2.758056640625, 3.10791015625, 3.457763671875, 3.8076171875, 4.157470703125, 4.50732421875, 4.857177734375, 5.20703125, 5.556884765625, 5.90673828125, 6.256591796875, 6.6064453125, 6.956298828125, 7.30615234375, 7.656005859375, 8.005859375, 8.355712890625, 8.70556640625, 9.055419921875, 9.4052734375, 9.755126953125, 10.10498046875, 10.454833984375, 10.8046875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 22.0, 74.0, 284.0, 400.0, 175.0, 45.0, 10.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.34567642211914, -32.80447769165039, -29.263277053833008, -25.722076416015625, -22.180877685546875, -18.639678955078125, -15.098478317260742, -11.55727767944336, -8.01607894897461, -4.474879264831543, -0.9336795806884766, 2.60752010345459, 6.148719787597656, 9.689918518066406, 13.231119155883789, 16.772319793701172, 20.313518524169922, 23.854717254638672, 27.395917892456055, 30.937118530273438, 34.47831726074219, 38.01951599121094, 41.56071472167969, 45.1019172668457, 48.64311599731445, 52.1843147277832, 55.72551727294922, 59.26671600341797, 62.80791473388672, 66.34911346435547, 69.89031219482422, 73.4315185546875, 76.97271728515625, 80.513916015625, 84.05511474609375, 87.5963134765625, 91.13751220703125, 94.6787109375, 98.21991729736328, 101.76111602783203, 105.30231475830078, 108.84351348876953, 112.38471221923828, 115.92591094970703, 119.46711730957031, 123.00831604003906, 126.54951477050781, 130.09071350097656, 133.6319122314453, 137.17311096191406, 140.7143096923828, 144.25550842285156, 147.7967071533203, 151.33790588378906, 154.8791046142578, 158.42031860351562, 161.96151733398438, 165.50271606445312, 169.04391479492188, 172.58511352539062, 176.12631225585938, 179.66751098632812, 183.20870971679688, 186.74990844726562, 190.29110717773438]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 5.0, 3.0, 6.0, 3.0, 12.0, 13.0, 12.0, 14.0, 18.0, 17.0, 31.0, 26.0, 28.0, 31.0, 24.0, 28.0, 39.0, 27.0, 36.0, 43.0, 30.0, 38.0, 47.0, 35.0, 39.0, 32.0, 35.0, 36.0, 28.0, 28.0, 27.0, 22.0, 23.0, 24.0, 15.0, 22.0, 14.0, 23.0, 13.0, 8.0, 15.0, 8.0, 2.0, 6.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 4.0], "bins": [-26.044818878173828, -25.298988342285156, -24.553159713745117, -23.807329177856445, -23.061498641967773, -22.315670013427734, -21.569839477539062, -20.82400894165039, -20.07818031311035, -19.33234977722168, -18.58652114868164, -17.84069061279297, -17.094860076904297, -16.349031448364258, -15.603200912475586, -14.85737133026123, -14.111540794372559, -13.365711212158203, -12.619880676269531, -11.874051094055176, -11.12822151184082, -10.382390975952148, -9.636561393737793, -8.890731811523438, -8.144901275634766, -7.399071216583252, -6.6532416343688965, -5.907411575317383, -5.161581993103027, -4.415751934051514, -3.669921875, -2.9240922927856445, -2.178262710571289, -1.4324328899383545, -0.6866029500961304, 0.05922698974609375, 0.8050568103790283, 1.550886631011963, 2.2967166900634766, 3.042546272277832, 3.7883763313293457, 4.534206390380859, 5.280035972595215, 6.0258660316467285, 6.771696090698242, 7.517525672912598, 8.263355255126953, 9.009185791015625, 9.75501537322998, 10.500844955444336, 11.246675491333008, 11.992505073547363, 12.738334655761719, 13.48416519165039, 14.229994773864746, 14.975824356079102, 15.721654891967773, 16.467485427856445, 17.213314056396484, 17.959144592285156, 18.704975128173828, 19.450803756713867, 20.19663429260254, 20.942462921142578, 21.68829345703125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 3.0, 5.0, 8.0, 20.0, 22.0, 22.0, 39.0, 62.0, 83.0, 88.0, 123.0, 103.0, 115.0, 90.0, 57.0, 66.0, 29.0, 25.0, 12.0, 10.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8046875, -4.675201416015625, -4.54571533203125, -4.416229248046875, -4.2867431640625, -4.157257080078125, -4.02777099609375, -3.898284912109375, -3.768798828125, -3.639312744140625, -3.50982666015625, -3.380340576171875, -3.2508544921875, -3.121368408203125, -2.99188232421875, -2.862396240234375, -2.73291015625, -2.603424072265625, -2.47393798828125, -2.344451904296875, -2.2149658203125, -2.085479736328125, -1.95599365234375, -1.826507568359375, -1.697021484375, -1.567535400390625, -1.43804931640625, -1.308563232421875, -1.1790771484375, -1.049591064453125, -0.92010498046875, -0.790618896484375, -0.6611328125, -0.531646728515625, -0.40216064453125, -0.272674560546875, -0.1431884765625, -0.013702392578125, 0.11578369140625, 0.245269775390625, 0.374755859375, 0.504241943359375, 0.63372802734375, 0.763214111328125, 0.8927001953125, 1.022186279296875, 1.15167236328125, 1.281158447265625, 1.41064453125, 1.540130615234375, 1.66961669921875, 1.799102783203125, 1.9285888671875, 2.058074951171875, 2.18756103515625, 2.317047119140625, 2.446533203125, 2.576019287109375, 2.70550537109375, 2.834991455078125, 2.9644775390625, 3.093963623046875, 3.22344970703125, 3.352935791015625, 3.482421875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 2.0, 5.0, 5.0, 6.0, 4.0, 8.0, 15.0, 9.0, 32.0, 42.0, 51.0, 52.0, 82.0, 103.0, 151.0, 267.0, 367.0, 525.0, 797.0, 1349.0, 2198.0, 3827.0, 7414.0, 16832.0, 46359.0, 181476.0, 588692.0, 131660.0, 36997.0, 13984.0, 6540.0, 3306.0, 1903.0, 1133.0, 780.0, 534.0, 324.0, 199.0, 143.0, 103.0, 68.0, 62.0, 35.0, 30.0, 24.0, 14.0, 14.0, 13.0, 9.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2049560546875, -0.1982135772705078, -0.19147109985351562, -0.18472862243652344, -0.17798614501953125, -0.17124366760253906, -0.16450119018554688, -0.1577587127685547, -0.1510162353515625, -0.1442737579345703, -0.13753128051757812, -0.13078880310058594, -0.12404632568359375, -0.11730384826660156, -0.11056137084960938, -0.10381889343261719, -0.097076416015625, -0.09033393859863281, -0.08359146118164062, -0.07684898376464844, -0.07010650634765625, -0.06336402893066406, -0.056621551513671875, -0.04987907409667969, -0.0431365966796875, -0.03639411926269531, -0.029651641845703125, -0.022909164428710938, -0.01616668701171875, -0.009424209594726562, -0.002681732177734375, 0.0040607452392578125, 0.01080322265625, 0.017545700073242188, 0.024288177490234375, 0.031030654907226562, 0.03777313232421875, 0.04451560974121094, 0.051258087158203125, 0.05800056457519531, 0.0647430419921875, 0.07148551940917969, 0.07822799682617188, 0.08497047424316406, 0.09171295166015625, 0.09845542907714844, 0.10519790649414062, 0.11194038391113281, 0.118682861328125, 0.1254253387451172, 0.13216781616210938, 0.13891029357910156, 0.14565277099609375, 0.15239524841308594, 0.15913772583007812, 0.1658802032470703, 0.1726226806640625, 0.1793651580810547, 0.18610763549804688, 0.19285011291503906, 0.19959259033203125, 0.20633506774902344, 0.21307754516601562, 0.2198200225830078, 0.2265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 13.0, 12.0, 12.0, 18.0, 20.0, 20.0, 26.0, 22.0, 20.0, 35.0, 31.0, 32.0, 37.0, 37.0, 39.0, 38.0, 32.0, 1060.0, 32.0, 32.0, 35.0, 33.0, 27.0, 38.0, 44.0, 34.0, 37.0, 20.0, 20.0, 27.0, 18.0, 22.0, 18.0, 9.0, 12.0, 9.0, 10.0, 5.0, 7.0, 3.0, 8.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.376953125, -2.306732177734375, -2.23651123046875, -2.166290283203125, -2.0960693359375, -2.025848388671875, -1.95562744140625, -1.885406494140625, -1.815185546875, -1.744964599609375, -1.67474365234375, -1.604522705078125, -1.5343017578125, -1.464080810546875, -1.39385986328125, -1.323638916015625, -1.25341796875, -1.183197021484375, -1.11297607421875, -1.042755126953125, -0.9725341796875, -0.902313232421875, -0.83209228515625, -0.761871337890625, -0.691650390625, -0.621429443359375, -0.55120849609375, -0.480987548828125, -0.4107666015625, -0.340545654296875, -0.27032470703125, -0.200103759765625, -0.1298828125, -0.059661865234375, 0.01055908203125, 0.080780029296875, 0.1510009765625, 0.221221923828125, 0.29144287109375, 0.361663818359375, 0.431884765625, 0.502105712890625, 0.57232666015625, 0.642547607421875, 0.7127685546875, 0.782989501953125, 0.85321044921875, 0.923431396484375, 0.99365234375, 1.063873291015625, 1.13409423828125, 1.204315185546875, 1.2745361328125, 1.344757080078125, 1.41497802734375, 1.485198974609375, 1.555419921875, 1.625640869140625, 1.69586181640625, 1.766082763671875, 1.8363037109375, 1.906524658203125, 1.97674560546875, 2.046966552734375, 2.1171875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 5.0, 13.0, 10.0, 10.0, 21.0, 43.0, 41.0, 62.0, 109.0, 139.0, 199.0, 345.0, 461.0, 657.0, 936.0, 1271.0, 1833.0, 2761.0, 3935.0, 5677.0, 8311.0, 12076.0, 18168.0, 27051.0, 41447.0, 65742.0, 110464.0, 1106326.0, 395159.0, 107412.0, 64158.0, 40583.0, 26325.0, 17551.0, 11885.0, 8118.0, 5376.0, 3782.0, 2649.0, 1794.0, 1311.0, 882.0, 623.0, 402.0, 307.0, 214.0, 156.0, 104.0, 80.0, 52.0, 28.0, 34.0, 20.0, 8.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.057098388671875, -0.05525493621826172, -0.05341148376464844, -0.051568031311035156, -0.049724578857421875, -0.047881126403808594, -0.04603767395019531, -0.04419422149658203, -0.04235076904296875, -0.04050731658935547, -0.03866386413574219, -0.036820411682128906, -0.034976959228515625, -0.033133506774902344, -0.03129005432128906, -0.02944660186767578, -0.0276031494140625, -0.02575969696044922, -0.023916244506835938, -0.022072792053222656, -0.020229339599609375, -0.018385887145996094, -0.016542434692382812, -0.014698982238769531, -0.01285552978515625, -0.011012077331542969, -0.009168624877929688, -0.007325172424316406, -0.005481719970703125, -0.0036382675170898438, -0.0017948150634765625, 4.863739013671875e-05, 0.00189208984375, 0.0037355422973632812, 0.0055789947509765625, 0.007422447204589844, 0.009265899658203125, 0.011109352111816406, 0.012952804565429688, 0.014796257019042969, 0.01663970947265625, 0.01848316192626953, 0.020326614379882812, 0.022170066833496094, 0.024013519287109375, 0.025856971740722656, 0.027700424194335938, 0.02954387664794922, 0.0313873291015625, 0.03323078155517578, 0.03507423400878906, 0.036917686462402344, 0.038761138916015625, 0.040604591369628906, 0.04244804382324219, 0.04429149627685547, 0.04613494873046875, 0.04797840118408203, 0.04982185363769531, 0.051665306091308594, 0.053508758544921875, 0.055352210998535156, 0.05719566345214844, 0.05903911590576172, 0.060882568359375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 9.0, 4.0, 9.0, 13.0, 15.0, 6.0, 18.0, 21.0, 24.0, 28.0, 29.0, 38.0, 42.0, 56.0, 60.0, 57.0, 66.0, 51.0, 59.0, 48.0, 50.0, 53.0, 46.0, 34.0, 29.0, 25.0, 14.0, 20.0, 12.0, 12.0, 8.0, 13.0, 4.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003948211669921875, -0.0003816261887550354, -0.0003684312105178833, -0.0003552362322807312, -0.0003420412540435791, -0.000328846275806427, -0.0003156512975692749, -0.0003024563193321228, -0.0002892613410949707, -0.0002760663628578186, -0.0002628713846206665, -0.0002496764063835144, -0.0002364814281463623, -0.0002232864499092102, -0.0002100914716720581, -0.000196896493434906, -0.0001837015151977539, -0.0001705065369606018, -0.0001573115587234497, -0.0001441165804862976, -0.0001309216022491455, -0.00011772662401199341, -0.00010453164577484131, -9.133666753768921e-05, -7.814168930053711e-05, -6.494671106338501e-05, -5.175173282623291e-05, -3.855675458908081e-05, -2.536177635192871e-05, -1.2166798114776611e-05, 1.0281801223754883e-06, 1.4223158359527588e-05, 2.7418136596679688e-05, 4.061311483383179e-05, 5.380809307098389e-05, 6.700307130813599e-05, 8.019804954528809e-05, 9.339302778244019e-05, 0.00010658800601959229, 0.00011978298425674438, 0.00013297796249389648, 0.00014617294073104858, 0.00015936791896820068, 0.00017256289720535278, 0.00018575787544250488, 0.00019895285367965698, 0.00021214783191680908, 0.00022534281015396118, 0.00023853778839111328, 0.0002517327666282654, 0.0002649277448654175, 0.0002781227231025696, 0.0002913177013397217, 0.0003045126795768738, 0.0003177076578140259, 0.000330902636051178, 0.0003440976142883301, 0.0003572925925254822, 0.0003704875707626343, 0.0003836825489997864, 0.0003968775272369385, 0.0004100725054740906, 0.0004232674837112427, 0.0004364624619483948, 0.0004496574401855469]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 3.0, 3.0, 5.0, 7.0, 13.0, 14.0, 22.0, 22.0, 29.0, 37.0, 44.0, 42.0, 46.0, 80.0, 91.0, 97.0, 120.0, 149.0, 168.0, 417.0, 8932.0, 842230.0, 191900.0, 2847.0, 244.0, 193.0, 144.0, 124.0, 91.0, 82.0, 59.0, 52.0, 47.0, 37.0, 38.0, 27.0, 16.0, 27.0, 13.0, 9.0, 5.0, 6.0, 4.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.006885528564453125, -0.006669342517852783, -0.006453156471252441, -0.0062369704246521, -0.006020784378051758, -0.005804598331451416, -0.005588412284851074, -0.005372226238250732, -0.005156040191650391, -0.004939854145050049, -0.004723668098449707, -0.004507482051849365, -0.0042912960052490234, -0.004075109958648682, -0.00385892391204834, -0.003642737865447998, -0.0034265518188476562, -0.0032103657722473145, -0.0029941797256469727, -0.002777993679046631, -0.002561807632446289, -0.0023456215858459473, -0.0021294355392456055, -0.0019132494926452637, -0.0016970634460449219, -0.00148087739944458, -0.0012646913528442383, -0.0010485053062438965, -0.0008323192596435547, -0.0006161332130432129, -0.0003999471664428711, -0.0001837611198425293, 3.24249267578125e-05, 0.0002486109733581543, 0.0004647970199584961, 0.0006809830665588379, 0.0008971691131591797, 0.0011133551597595215, 0.0013295412063598633, 0.001545727252960205, 0.0017619132995605469, 0.0019780993461608887, 0.0021942853927612305, 0.0024104714393615723, 0.002626657485961914, 0.002842843532562256, 0.0030590295791625977, 0.0032752156257629395, 0.0034914016723632812, 0.003707587718963623, 0.003923773765563965, 0.004139959812164307, 0.0043561458587646484, 0.00457233190536499, 0.004788517951965332, 0.005004703998565674, 0.005220890045166016, 0.005437076091766357, 0.005653262138366699, 0.005869448184967041, 0.006085634231567383, 0.006301820278167725, 0.006518006324768066, 0.006734192371368408, 0.00695037841796875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 96.0, 858.0, 56.0, 2.0, 0.0, 1.0], "bins": [-0.007806016132235527, -0.007674674037843943, -0.007543331943452358, -0.007411989849060774, -0.0072806477546691895, -0.007149305660277605, -0.007017963565886021, -0.006886621471494436, -0.006755279377102852, -0.0066239372827112675, -0.006492595188319683, -0.006361253093928099, -0.006229910999536514, -0.00609856890514493, -0.0059672268107533455, -0.005835884716361761, -0.005704542621970177, -0.005573200527578592, -0.005441858433187008, -0.0053105163387954235, -0.005179174244403839, -0.005047832150012255, -0.00491649005562067, -0.004785147961229086, -0.004653806332498789, -0.0045224642381072044, -0.00439112214371562, -0.004259780049324036, -0.004128437954932451, -0.003997095860540867, -0.0038657537661492825, -0.003734411671757698, -0.0036030698101967573, -0.003471727715805173, -0.0033403856214135885, -0.003209043527022004, -0.0030777014326304197, -0.0029463593382388353, -0.0028150174766778946, -0.00268367538228631, -0.002552333287894726, -0.0024209911935031414, -0.002289649099111557, -0.0021583070047199726, -0.002026964910328388, -0.0018956228159368038, -0.0017642808379605412, -0.0016329387435689569, -0.0015015965327620506, -0.0013702544383704662, -0.0012389123439788818, -0.0011075702495872974, -0.000976228213403374, -0.0008448861190117896, -0.0007135440828278661, -0.0005822019884362817, -0.0004508599522523582, -0.0003195178578607738, -0.00018817579257301986, -5.683372728526592e-05, 7.450836710631847e-05, 0.00020585046149790287, 0.00033719249768182635, 0.00046853459207341075, 0.0005998766864649951]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 9.0, 5.0, 8.0, 16.0, 11.0, 17.0, 22.0, 29.0, 36.0, 29.0, 43.0, 30.0, 45.0, 43.0, 58.0, 41.0, 47.0, 49.0, 56.0, 53.0, 50.0, 38.0, 43.0, 32.0, 32.0, 30.0, 23.0, 20.0, 20.0, 18.0, 12.0, 6.0, 8.0, 6.0, 4.0, 4.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0004892349243164062, -0.0004763184115290642, -0.0004634018987417221, -0.00045048538595438004, -0.00043756887316703796, -0.0004246523603796959, -0.0004117358475923538, -0.00039881933480501175, -0.0003859028220176697, -0.0003729863092303276, -0.00036006979644298553, -0.00034715328365564346, -0.0003342367708683014, -0.0003213202580809593, -0.00030840374529361725, -0.0002954872325062752, -0.0002825707197189331, -0.00026965420693159103, -0.00025673769414424896, -0.0002438211813569069, -0.00023090466856956482, -0.00021798815578222275, -0.00020507164299488068, -0.0001921551302075386, -0.00017923861742019653, -0.00016632210463285446, -0.0001534055918455124, -0.00014048907905817032, -0.00012757256627082825, -0.00011465605348348618, -0.0001017395406961441, -8.882302790880203e-05, -7.590651512145996e-05, -6.299000233411789e-05, -5.007348954677582e-05, -3.7156976759433746e-05, -2.4240463972091675e-05, -1.1323951184749603e-05, 1.5925616025924683e-06, 1.450907438993454e-05, 2.742558717727661e-05, 4.034209996461868e-05, 5.3258612751960754e-05, 6.617512553930283e-05, 7.90916383266449e-05, 9.200815111398697e-05, 0.00010492466390132904, 0.00011784117668867111, 0.00013075768947601318, 0.00014367420226335526, 0.00015659071505069733, 0.0001695072278380394, 0.00018242374062538147, 0.00019534025341272354, 0.0002082567662000656, 0.00022117327898740768, 0.00023408979177474976, 0.00024700630456209183, 0.0002599228173494339, 0.00027283933013677597, 0.00028575584292411804, 0.0002986723557114601, 0.0003115888684988022, 0.00032450538128614426, 0.00033742189407348633]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 3.0, 5.0, 8.0, 20.0, 22.0, 22.0, 39.0, 62.0, 83.0, 88.0, 123.0, 103.0, 115.0, 90.0, 57.0, 66.0, 29.0, 25.0, 12.0, 10.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8046875, -4.675201416015625, -4.54571533203125, -4.416229248046875, -4.2867431640625, -4.157257080078125, -4.02777099609375, -3.898284912109375, -3.768798828125, -3.639312744140625, -3.50982666015625, -3.380340576171875, -3.2508544921875, -3.121368408203125, -2.99188232421875, -2.862396240234375, -2.73291015625, -2.603424072265625, -2.47393798828125, -2.344451904296875, -2.2149658203125, -2.085479736328125, -1.95599365234375, -1.826507568359375, -1.697021484375, -1.567535400390625, -1.43804931640625, -1.308563232421875, -1.1790771484375, -1.049591064453125, -0.92010498046875, -0.790618896484375, -0.6611328125, -0.531646728515625, -0.40216064453125, -0.272674560546875, -0.1431884765625, -0.013702392578125, 0.11578369140625, 0.245269775390625, 0.374755859375, 0.504241943359375, 0.63372802734375, 0.763214111328125, 0.8927001953125, 1.022186279296875, 1.15167236328125, 1.281158447265625, 1.41064453125, 1.540130615234375, 1.66961669921875, 1.799102783203125, 1.9285888671875, 2.058074951171875, 2.18756103515625, 2.317047119140625, 2.446533203125, 2.576019287109375, 2.70550537109375, 2.834991455078125, 2.9644775390625, 3.093963623046875, 3.22344970703125, 3.352935791015625, 3.482421875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 7.0, 8.0, 11.0, 11.0, 11.0, 45.0, 61.0, 61.0, 125.0, 196.0, 331.0, 654.0, 1557.0, 4678.0, 19406.0, 111546.0, 588540.0, 267183.0, 40857.0, 8664.0, 2588.0, 955.0, 444.0, 209.0, 130.0, 79.0, 53.0, 36.0, 25.0, 23.0, 13.0, 8.0, 7.0, 7.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.1328125, -4.9891357421875, -4.845458984375, -4.7017822265625, -4.55810546875, -4.4144287109375, -4.270751953125, -4.1270751953125, -3.9833984375, -3.8397216796875, -3.696044921875, -3.5523681640625, -3.40869140625, -3.2650146484375, -3.121337890625, -2.9776611328125, -2.833984375, -2.6903076171875, -2.546630859375, -2.4029541015625, -2.25927734375, -2.1156005859375, -1.971923828125, -1.8282470703125, -1.6845703125, -1.5408935546875, -1.397216796875, -1.2535400390625, -1.10986328125, -0.9661865234375, -0.822509765625, -0.6788330078125, -0.53515625, -0.3914794921875, -0.247802734375, -0.1041259765625, 0.03955078125, 0.1832275390625, 0.326904296875, 0.4705810546875, 0.6142578125, 0.7579345703125, 0.901611328125, 1.0452880859375, 1.18896484375, 1.3326416015625, 1.476318359375, 1.6199951171875, 1.763671875, 1.9073486328125, 2.051025390625, 2.1947021484375, 2.33837890625, 2.4820556640625, 2.625732421875, 2.7694091796875, 2.9130859375, 3.0567626953125, 3.200439453125, 3.3441162109375, 3.48779296875, 3.6314697265625, 3.775146484375, 3.9188232421875, 4.0625]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 9.0, 12.0, 23.0, 19.0, 20.0, 23.0, 20.0, 29.0, 28.0, 33.0, 30.0, 34.0, 48.0, 48.0, 99.0, 239.0, 1621.0, 217.0, 71.0, 53.0, 46.0, 43.0, 36.0, 25.0, 32.0, 37.0, 22.0, 16.0, 26.0, 16.0, 19.0, 11.0, 8.0, 6.0, 8.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.7109375, -8.4652099609375, -8.219482421875, -7.9737548828125, -7.72802734375, -7.4822998046875, -7.236572265625, -6.9908447265625, -6.7451171875, -6.4993896484375, -6.253662109375, -6.0079345703125, -5.76220703125, -5.5164794921875, -5.270751953125, -5.0250244140625, -4.779296875, -4.5335693359375, -4.287841796875, -4.0421142578125, -3.79638671875, -3.5506591796875, -3.304931640625, -3.0592041015625, -2.8134765625, -2.5677490234375, -2.322021484375, -2.0762939453125, -1.83056640625, -1.5848388671875, -1.339111328125, -1.0933837890625, -0.84765625, -0.6019287109375, -0.356201171875, -0.1104736328125, 0.13525390625, 0.3809814453125, 0.626708984375, 0.8724365234375, 1.1181640625, 1.3638916015625, 1.609619140625, 1.8553466796875, 2.10107421875, 2.3468017578125, 2.592529296875, 2.8382568359375, 3.083984375, 3.3297119140625, 3.575439453125, 3.8211669921875, 4.06689453125, 4.3126220703125, 4.558349609375, 4.8040771484375, 5.0498046875, 5.2955322265625, 5.541259765625, 5.7869873046875, 6.03271484375, 6.2784423828125, 6.524169921875, 6.7698974609375, 7.015625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 7.0, 9.0, 11.0, 18.0, 20.0, 10.0, 25.0, 31.0, 30.0, 46.0, 35.0, 64.0, 92.0, 155.0, 321.0, 925.0, 17596.0, 3073751.0, 50268.0, 1298.0, 371.0, 184.0, 94.0, 79.0, 46.0, 33.0, 27.0, 28.0, 22.0, 21.0, 20.0, 15.0, 15.0, 13.0, 9.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3828125, -13.8797607421875, -13.376708984375, -12.8736572265625, -12.37060546875, -11.8675537109375, -11.364501953125, -10.8614501953125, -10.3583984375, -9.8553466796875, -9.352294921875, -8.8492431640625, -8.34619140625, -7.8431396484375, -7.340087890625, -6.8370361328125, -6.333984375, -5.8309326171875, -5.327880859375, -4.8248291015625, -4.32177734375, -3.8187255859375, -3.315673828125, -2.8126220703125, -2.3095703125, -1.8065185546875, -1.303466796875, -0.8004150390625, -0.29736328125, 0.2056884765625, 0.708740234375, 1.2117919921875, 1.71484375, 2.2178955078125, 2.720947265625, 3.2239990234375, 3.72705078125, 4.2301025390625, 4.733154296875, 5.2362060546875, 5.7392578125, 6.2423095703125, 6.745361328125, 7.2484130859375, 7.75146484375, 8.2545166015625, 8.757568359375, 9.2606201171875, 9.763671875, 10.2667236328125, 10.769775390625, 11.2728271484375, 11.77587890625, 12.2789306640625, 12.781982421875, 13.2850341796875, 13.7880859375, 14.2911376953125, 14.794189453125, 15.2972412109375, 15.80029296875, 16.3033447265625, 16.806396484375, 17.3094482421875, 17.8125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 8.0, 1004.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.908605575561523, -8.04853630065918, -2.1884679794311523, 3.671600341796875, 9.531669616699219, 15.391738891601562, 21.251806259155273, 27.111875534057617, 32.971946716308594, 38.83201599121094, 44.69208526611328, 50.552154541015625, 56.41222381591797, 62.27229309082031, 68.13235473632812, 73.992431640625, 79.85249328613281, 85.71256256103516, 91.5726318359375, 97.43270111083984, 103.29277038574219, 109.15283966064453, 115.01290893554688, 120.87297058105469, 126.73304748535156, 132.59310913085938, 138.45318603515625, 144.31324768066406, 150.17332458496094, 156.03338623046875, 161.89346313476562, 167.75352478027344, 173.6136016845703, 179.47366333007812, 185.333740234375, 191.1938018798828, 197.0538787841797, 202.9139404296875, 208.77401733398438, 214.6340789794922, 220.49415588378906, 226.35421752929688, 232.21429443359375, 238.07435607910156, 243.93443298339844, 249.79449462890625, 255.65457153320312, 261.5146484375, 267.37469482421875, 273.2347717285156, 279.0948181152344, 284.95489501953125, 290.8149719238281, 296.675048828125, 302.53509521484375, 308.3951721191406, 314.2552490234375, 320.1153259277344, 325.9753723144531, 331.83544921875, 337.6955261230469, 343.55560302734375, 349.4156494140625, 355.2757263183594, 361.13580322265625]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 6.0, 8.0, 3.0, 9.0, 16.0, 16.0, 20.0, 22.0, 27.0, 37.0, 36.0, 34.0, 38.0, 27.0, 32.0, 51.0, 35.0, 49.0, 53.0, 45.0, 45.0, 38.0, 39.0, 38.0, 35.0, 46.0, 30.0, 25.0, 19.0, 21.0, 18.0, 19.0, 11.0, 12.0, 6.0, 5.0, 5.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-28.132755279541016, -27.32994842529297, -26.527141571044922, -25.724334716796875, -24.921525955200195, -24.11871910095215, -23.3159122467041, -22.513105392456055, -21.710298538208008, -20.90749168395996, -20.104684829711914, -19.301876068115234, -18.499069213867188, -17.69626235961914, -16.893455505371094, -16.090648651123047, -15.287840843200684, -14.485033988952637, -13.682226181030273, -12.879419326782227, -12.07661247253418, -11.273805618286133, -10.47099781036377, -9.668190956115723, -8.86538314819336, -8.062576293945312, -7.259768962860107, -6.456961631774902, -5.6541547775268555, -4.85134744644165, -4.048540115356445, -3.2457332611083984, -2.4429264068603516, -1.6401193141937256, -0.8373121023178101, -0.03450489044189453, 0.7683022022247314, 1.5711092948913574, 2.3739166259765625, 3.1767234802246094, 3.9795308113098145, 4.7823381423950195, 5.585144996643066, 6.3879523277282715, 7.190759658813477, 7.993566513061523, 8.79637336730957, 9.599180221557617, 10.40198802947998, 11.204794883728027, 12.00760269165039, 12.810409545898438, 13.613216400146484, 14.416023254394531, 15.218831062316895, 16.021636962890625, 16.824445724487305, 17.62725257873535, 18.4300594329834, 19.232868194580078, 20.035675048828125, 20.838481903076172, 21.64128875732422, 22.444095611572266, 23.246902465820312]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 4.0, 4.0, 11.0, 16.0, 25.0, 26.0, 43.0, 63.0, 77.0, 87.0, 123.0, 99.0, 114.0, 94.0, 59.0, 60.0, 34.0, 19.0, 15.0, 11.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8125, -4.682647705078125, -4.55279541015625, -4.422943115234375, -4.2930908203125, -4.163238525390625, -4.03338623046875, -3.903533935546875, -3.773681640625, -3.643829345703125, -3.51397705078125, -3.384124755859375, -3.2542724609375, -3.124420166015625, -2.99456787109375, -2.864715576171875, -2.73486328125, -2.605010986328125, -2.47515869140625, -2.345306396484375, -2.2154541015625, -2.085601806640625, -1.95574951171875, -1.825897216796875, -1.696044921875, -1.566192626953125, -1.43634033203125, -1.306488037109375, -1.1766357421875, -1.046783447265625, -0.91693115234375, -0.787078857421875, -0.6572265625, -0.527374267578125, -0.39752197265625, -0.267669677734375, -0.1378173828125, -0.007965087890625, 0.12188720703125, 0.251739501953125, 0.381591796875, 0.511444091796875, 0.64129638671875, 0.771148681640625, 0.9010009765625, 1.030853271484375, 1.16070556640625, 1.290557861328125, 1.42041015625, 1.550262451171875, 1.68011474609375, 1.809967041015625, 1.9398193359375, 2.069671630859375, 2.19952392578125, 2.329376220703125, 2.459228515625, 2.589080810546875, 2.71893310546875, 2.848785400390625, 2.9786376953125, 3.108489990234375, 3.23834228515625, 3.368194580078125, 3.498046875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 6.0, 10.0, 20.0, 13.0, 29.0, 35.0, 80.0, 107.0, 159.0, 347.0, 645.0, 1277.0, 3636.0, 18283.0, 2704388.0, 1444805.0, 15338.0, 3023.0, 1042.0, 471.0, 221.0, 150.0, 73.0, 35.0, 31.0, 23.0, 13.0, 5.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.875, -24.201904296875, -23.52880859375, -22.855712890625, -22.1826171875, -21.509521484375, -20.83642578125, -20.163330078125, -19.490234375, -18.817138671875, -18.14404296875, -17.470947265625, -16.7978515625, -16.124755859375, -15.45166015625, -14.778564453125, -14.10546875, -13.432373046875, -12.75927734375, -12.086181640625, -11.4130859375, -10.739990234375, -10.06689453125, -9.393798828125, -8.720703125, -8.047607421875, -7.37451171875, -6.701416015625, -6.0283203125, -5.355224609375, -4.68212890625, -4.009033203125, -3.3359375, -2.662841796875, -1.98974609375, -1.316650390625, -0.6435546875, 0.029541015625, 0.70263671875, 1.375732421875, 2.048828125, 2.721923828125, 3.39501953125, 4.068115234375, 4.7412109375, 5.414306640625, 6.08740234375, 6.760498046875, 7.43359375, 8.106689453125, 8.77978515625, 9.452880859375, 10.1259765625, 10.799072265625, 11.47216796875, 12.145263671875, 12.818359375, 13.491455078125, 14.16455078125, 14.837646484375, 15.5107421875, 16.183837890625, 16.85693359375, 17.530029296875, 18.203125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 9.0, 14.0, 2.0, 16.0, 19.0, 11.0, 33.0, 39.0, 70.0, 71.0, 137.0, 223.0, 339.0, 498.0, 715.0, 627.0, 420.0, 288.0, 170.0, 116.0, 68.0, 54.0, 33.0, 26.0, 16.0, 14.0, 9.0, 14.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.1015625, -6.8629150390625, -6.624267578125, -6.3856201171875, -6.14697265625, -5.9083251953125, -5.669677734375, -5.4310302734375, -5.1923828125, -4.9537353515625, -4.715087890625, -4.4764404296875, -4.23779296875, -3.9991455078125, -3.760498046875, -3.5218505859375, -3.283203125, -3.0445556640625, -2.805908203125, -2.5672607421875, -2.32861328125, -2.0899658203125, -1.851318359375, -1.6126708984375, -1.3740234375, -1.1353759765625, -0.896728515625, -0.6580810546875, -0.41943359375, -0.1807861328125, 0.057861328125, 0.2965087890625, 0.53515625, 0.7738037109375, 1.012451171875, 1.2510986328125, 1.48974609375, 1.7283935546875, 1.967041015625, 2.2056884765625, 2.4443359375, 2.6829833984375, 2.921630859375, 3.1602783203125, 3.39892578125, 3.6375732421875, 3.876220703125, 4.1148681640625, 4.353515625, 4.5921630859375, 4.830810546875, 5.0694580078125, 5.30810546875, 5.5467529296875, 5.785400390625, 6.0240478515625, 6.2626953125, 6.5013427734375, 6.739990234375, 6.9786376953125, 7.21728515625, 7.4559326171875, 7.694580078125, 7.9332275390625, 8.171875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 5.0, 12.0, 26.0, 31.0, 41.0, 57.0, 86.0, 153.0, 287.0, 448.0, 851.0, 1699.0, 3508.0, 8250.0, 22829.0, 82200.0, 555135.0, 2847407.0, 550748.0, 82273.0, 22762.0, 8288.0, 3512.0, 1684.0, 832.0, 438.0, 258.0, 161.0, 86.0, 83.0, 43.0, 29.0, 22.0, 9.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-12.3125, -11.9449462890625, -11.577392578125, -11.2098388671875, -10.84228515625, -10.4747314453125, -10.107177734375, -9.7396240234375, -9.3720703125, -9.0045166015625, -8.636962890625, -8.2694091796875, -7.90185546875, -7.5343017578125, -7.166748046875, -6.7991943359375, -6.431640625, -6.0640869140625, -5.696533203125, -5.3289794921875, -4.96142578125, -4.5938720703125, -4.226318359375, -3.8587646484375, -3.4912109375, -3.1236572265625, -2.756103515625, -2.3885498046875, -2.02099609375, -1.6534423828125, -1.285888671875, -0.9183349609375, -0.55078125, -0.1832275390625, 0.184326171875, 0.5518798828125, 0.91943359375, 1.2869873046875, 1.654541015625, 2.0220947265625, 2.3896484375, 2.7572021484375, 3.124755859375, 3.4923095703125, 3.85986328125, 4.2274169921875, 4.594970703125, 4.9625244140625, 5.330078125, 5.6976318359375, 6.065185546875, 6.4327392578125, 6.80029296875, 7.1678466796875, 7.535400390625, 7.9029541015625, 8.2705078125, 8.6380615234375, 9.005615234375, 9.3731689453125, 9.74072265625, 10.1082763671875, 10.475830078125, 10.8433837890625, 11.2109375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 8.0, 25.0, 59.0, 145.0, 269.0, 278.0, 140.0, 67.0, 16.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.68810272216797, -21.9373779296875, -19.18665313720703, -16.43592643737793, -13.685201644897461, -10.934476852416992, -8.18375015258789, -5.433025360107422, -2.682300567626953, 0.06842470169067383, 2.819149971008301, 5.569875717163086, 8.320600509643555, 11.071325302124023, 13.822052001953125, 16.572776794433594, 19.323501586914062, 22.07422637939453, 24.824951171875, 27.5756778717041, 30.32640266418457, 33.077125549316406, 35.82785415649414, 38.57857894897461, 41.32930374145508, 44.08002853393555, 46.830753326416016, 49.58148193359375, 52.33220672607422, 55.08293151855469, 57.833656311035156, 60.584381103515625, 63.33509826660156, 66.08582305908203, 68.8365478515625, 71.58727264404297, 74.33799743652344, 77.0887222290039, 79.83944702148438, 82.59017944335938, 85.34089660644531, 88.09162139892578, 90.84234619140625, 93.59307098388672, 96.34379577636719, 99.09452056884766, 101.84524536132812, 104.59597778320312, 107.3467025756836, 110.09742736816406, 112.84815216064453, 115.598876953125, 118.34960174560547, 121.10032653808594, 123.85105895996094, 126.60177612304688, 129.35250854492188, 132.10324096679688, 134.8539581298828, 137.6046905517578, 140.35540771484375, 143.10614013671875, 145.8568572998047, 148.6075897216797, 151.35830688476562]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 5.0, 4.0, 4.0, 10.0, 5.0, 4.0, 13.0, 15.0, 17.0, 18.0, 23.0, 26.0, 28.0, 34.0, 26.0, 29.0, 39.0, 38.0, 38.0, 40.0, 54.0, 34.0, 53.0, 47.0, 37.0, 43.0, 34.0, 38.0, 34.0, 34.0, 34.0, 19.0, 13.0, 28.0, 18.0, 14.0, 10.0, 14.0, 9.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.430870056152344, -23.666580200195312, -22.90228843688965, -22.137998580932617, -21.373706817626953, -20.609416961669922, -19.84512710571289, -19.080835342407227, -18.316545486450195, -17.552255630493164, -16.7879638671875, -16.02367401123047, -15.259383201599121, -14.495092391967773, -13.730801582336426, -12.966510772705078, -12.20221996307373, -11.437929153442383, -10.673638343811035, -9.909347534179688, -9.145057678222656, -8.380766868591309, -7.616476058959961, -6.8521857261657715, -6.087894916534424, -5.323604106903076, -4.559313774108887, -3.795022964477539, -3.0307323932647705, -2.266441822052002, -1.5021510124206543, -0.7378606796264648, 0.026430130004882812, 0.7907207608222961, 1.5550113916397095, 2.3193020820617676, 3.083592653274536, 3.8478832244873047, 4.612174034118652, 5.376464366912842, 6.1407551765441895, 6.905045986175537, 7.669336318969727, 8.433627128601074, 9.197917938232422, 9.962207794189453, 10.726499557495117, 11.490789413452148, 12.255080223083496, 13.019371032714844, 13.783661842346191, 14.547952651977539, 15.31224250793457, 16.076534271240234, 16.840824127197266, 17.605113983154297, 18.36940574645996, 19.133695602416992, 19.897987365722656, 20.662277221679688, 21.42656898498535, 22.190858840942383, 22.955150604248047, 23.719440460205078, 24.48373031616211]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 1.0, 3.0, 3.0, 5.0, 9.0, 16.0, 27.0, 18.0, 45.0, 58.0, 53.0, 82.0, 88.0, 82.0, 114.0, 94.0, 81.0, 60.0, 55.0, 41.0, 22.0, 15.0, 12.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.59765625, -4.475860595703125, -4.35406494140625, -4.232269287109375, -4.1104736328125, -3.988677978515625, -3.86688232421875, -3.745086669921875, -3.623291015625, -3.501495361328125, -3.37969970703125, -3.257904052734375, -3.1361083984375, -3.014312744140625, -2.89251708984375, -2.770721435546875, -2.64892578125, -2.527130126953125, -2.40533447265625, -2.283538818359375, -2.1617431640625, -2.039947509765625, -1.91815185546875, -1.796356201171875, -1.674560546875, -1.552764892578125, -1.43096923828125, -1.309173583984375, -1.1873779296875, -1.065582275390625, -0.94378662109375, -0.821990966796875, -0.7001953125, -0.578399658203125, -0.45660400390625, -0.334808349609375, -0.2130126953125, -0.091217041015625, 0.03057861328125, 0.152374267578125, 0.274169921875, 0.395965576171875, 0.51776123046875, 0.639556884765625, 0.7613525390625, 0.883148193359375, 1.00494384765625, 1.126739501953125, 1.24853515625, 1.370330810546875, 1.49212646484375, 1.613922119140625, 1.7357177734375, 1.857513427734375, 1.97930908203125, 2.101104736328125, 2.222900390625, 2.344696044921875, 2.46649169921875, 2.588287353515625, 2.7100830078125, 2.831878662109375, 2.95367431640625, 3.075469970703125, 3.197265625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 4.0, 5.0, 4.0, 15.0, 16.0, 27.0, 29.0, 42.0, 39.0, 67.0, 85.0, 149.0, 222.0, 292.0, 477.0, 731.0, 1197.0, 2001.0, 3578.0, 6876.0, 14968.0, 39481.0, 127508.0, 562265.0, 195822.0, 54302.0, 19796.0, 8379.0, 4176.0, 2291.0, 1286.0, 846.0, 498.0, 337.0, 236.0, 149.0, 97.0, 69.0, 55.0, 34.0, 25.0, 21.0, 20.0, 14.0, 5.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.215087890625, -0.20806884765625, -0.2010498046875, -0.19403076171875, -0.18701171875, -0.17999267578125, -0.1729736328125, -0.16595458984375, -0.158935546875, -0.15191650390625, -0.1448974609375, -0.13787841796875, -0.130859375, -0.12384033203125, -0.1168212890625, -0.10980224609375, -0.102783203125, -0.09576416015625, -0.0887451171875, -0.08172607421875, -0.07470703125, -0.06768798828125, -0.0606689453125, -0.05364990234375, -0.046630859375, -0.03961181640625, -0.0325927734375, -0.02557373046875, -0.0185546875, -0.01153564453125, -0.0045166015625, 0.00250244140625, 0.009521484375, 0.01654052734375, 0.0235595703125, 0.03057861328125, 0.03759765625, 0.04461669921875, 0.0516357421875, 0.05865478515625, 0.065673828125, 0.07269287109375, 0.0797119140625, 0.08673095703125, 0.09375, 0.10076904296875, 0.1077880859375, 0.11480712890625, 0.121826171875, 0.12884521484375, 0.1358642578125, 0.14288330078125, 0.14990234375, 0.15692138671875, 0.1639404296875, 0.17095947265625, 0.177978515625, 0.18499755859375, 0.1920166015625, 0.19903564453125, 0.2060546875, 0.21307373046875, 0.2200927734375, 0.22711181640625, 0.234130859375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 2.0, 3.0, 10.0, 8.0, 8.0, 15.0, 16.0, 17.0, 23.0, 25.0, 34.0, 24.0, 23.0, 35.0, 44.0, 36.0, 48.0, 39.0, 59.0, 1070.0, 34.0, 42.0, 26.0, 45.0, 45.0, 36.0, 36.0, 27.0, 32.0, 25.0, 26.0, 20.0, 21.0, 16.0, 17.0, 9.0, 6.0, 8.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.875, -2.797149658203125, -2.71929931640625, -2.641448974609375, -2.5635986328125, -2.485748291015625, -2.40789794921875, -2.330047607421875, -2.252197265625, -2.174346923828125, -2.09649658203125, -2.018646240234375, -1.9407958984375, -1.862945556640625, -1.78509521484375, -1.707244873046875, -1.62939453125, -1.551544189453125, -1.47369384765625, -1.395843505859375, -1.3179931640625, -1.240142822265625, -1.16229248046875, -1.084442138671875, -1.006591796875, -0.928741455078125, -0.85089111328125, -0.773040771484375, -0.6951904296875, -0.617340087890625, -0.53948974609375, -0.461639404296875, -0.3837890625, -0.305938720703125, -0.22808837890625, -0.150238037109375, -0.0723876953125, 0.005462646484375, 0.08331298828125, 0.161163330078125, 0.239013671875, 0.316864013671875, 0.39471435546875, 0.472564697265625, 0.5504150390625, 0.628265380859375, 0.70611572265625, 0.783966064453125, 0.86181640625, 0.939666748046875, 1.01751708984375, 1.095367431640625, 1.1732177734375, 1.251068115234375, 1.32891845703125, 1.406768798828125, 1.484619140625, 1.562469482421875, 1.64031982421875, 1.718170166015625, 1.7960205078125, 1.873870849609375, 1.95172119140625, 2.029571533203125, 2.107421875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 10.0, 11.0, 27.0, 32.0, 53.0, 82.0, 170.0, 213.0, 347.0, 576.0, 900.0, 1385.0, 2148.0, 3448.0, 5425.0, 8555.0, 13523.0, 21553.0, 35825.0, 60720.0, 111932.0, 1036662.0, 530396.0, 109881.0, 60367.0, 34968.0, 21682.0, 13417.0, 8378.0, 5206.0, 3355.0, 2162.0, 1371.0, 843.0, 542.0, 354.0, 220.0, 119.0, 102.0, 70.0, 38.0, 15.0, 25.0, 6.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06719970703125, -0.06503105163574219, -0.06286239624023438, -0.06069374084472656, -0.05852508544921875, -0.05635643005371094, -0.054187774658203125, -0.05201911926269531, -0.0498504638671875, -0.04768180847167969, -0.045513153076171875, -0.04334449768066406, -0.04117584228515625, -0.03900718688964844, -0.036838531494140625, -0.03466987609863281, -0.032501220703125, -0.030332565307617188, -0.028163909912109375, -0.025995254516601562, -0.02382659912109375, -0.021657943725585938, -0.019489288330078125, -0.017320632934570312, -0.0151519775390625, -0.012983322143554688, -0.010814666748046875, -0.008646011352539062, -0.00647735595703125, -0.0043087005615234375, -0.002140045166015625, 2.86102294921875e-05, 0.002197265625, 0.0043659210205078125, 0.006534576416015625, 0.008703231811523438, 0.01087188720703125, 0.013040542602539062, 0.015209197998046875, 0.017377853393554688, 0.0195465087890625, 0.021715164184570312, 0.023883819580078125, 0.026052474975585938, 0.02822113037109375, 0.030389785766601562, 0.032558441162109375, 0.03472709655761719, 0.036895751953125, 0.03906440734863281, 0.041233062744140625, 0.04340171813964844, 0.04557037353515625, 0.04773902893066406, 0.049907684326171875, 0.05207633972167969, 0.0542449951171875, 0.05641365051269531, 0.058582305908203125, 0.06075096130371094, 0.06291961669921875, 0.06508827209472656, 0.06725692749023438, 0.06942558288574219, 0.07159423828125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 4.0, 2.0, 4.0, 7.0, 9.0, 2.0, 11.0, 8.0, 17.0, 14.0, 34.0, 36.0, 34.0, 64.0, 46.0, 79.0, 73.0, 91.0, 81.0, 69.0, 59.0, 69.0, 37.0, 34.0, 21.0, 24.0, 15.0, 22.0, 6.0, 13.0, 9.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007200241088867188, -0.0007008612155914307, -0.0006816983222961426, -0.0006625354290008545, -0.0006433725357055664, -0.0006242096424102783, -0.0006050467491149902, -0.0005858838558197021, -0.0005667209625244141, -0.000547558069229126, -0.0005283951759338379, -0.0005092322826385498, -0.0004900693893432617, -0.00047090649604797363, -0.00045174360275268555, -0.00043258070945739746, -0.0004134178161621094, -0.0003942549228668213, -0.0003750920295715332, -0.0003559291362762451, -0.00033676624298095703, -0.00031760334968566895, -0.00029844045639038086, -0.0002792775630950928, -0.0002601146697998047, -0.0002409517765045166, -0.00022178888320922852, -0.00020262598991394043, -0.00018346309661865234, -0.00016430020332336426, -0.00014513731002807617, -0.00012597441673278809, -0.0001068115234375, -8.764863014221191e-05, -6.848573684692383e-05, -4.932284355163574e-05, -3.0159950256347656e-05, -1.099705696105957e-05, 8.165836334228516e-06, 2.73287296295166e-05, 4.649162292480469e-05, 6.565451622009277e-05, 8.481740951538086e-05, 0.00010398030281066895, 0.00012314319610595703, 0.00014230608940124512, 0.0001614689826965332, 0.0001806318759918213, 0.00019979476928710938, 0.00021895766258239746, 0.00023812055587768555, 0.00025728344917297363, 0.0002764463424682617, 0.0002956092357635498, 0.0003147721290588379, 0.000333935022354126, 0.00035309791564941406, 0.00037226080894470215, 0.00039142370223999023, 0.0004105865955352783, 0.0004297494888305664, 0.0004489123821258545, 0.0004680752754211426, 0.00048723816871643066, 0.0005064010620117188]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 8.0, 11.0, 16.0, 22.0, 19.0, 40.0, 40.0, 48.0, 67.0, 91.0, 131.0, 207.0, 361.0, 2757.0, 116888.0, 910897.0, 15287.0, 811.0, 252.0, 146.0, 112.0, 83.0, 71.0, 48.0, 38.0, 23.0, 20.0, 13.0, 10.0, 11.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00897979736328125, -0.008672833442687988, -0.008365869522094727, -0.008058905601501465, -0.007751941680908203, -0.007444977760314941, -0.00713801383972168, -0.006831049919128418, -0.006524085998535156, -0.0062171220779418945, -0.005910158157348633, -0.005603194236755371, -0.005296230316162109, -0.004989266395568848, -0.004682302474975586, -0.004375338554382324, -0.0040683746337890625, -0.0037614107131958008, -0.003454446792602539, -0.0031474828720092773, -0.0028405189514160156, -0.002533555030822754, -0.002226591110229492, -0.0019196271896362305, -0.0016126632690429688, -0.001305699348449707, -0.0009987354278564453, -0.0006917715072631836, -0.0003848075866699219, -7.784366607666016e-05, 0.00022912025451660156, 0.0005360841751098633, 0.000843048095703125, 0.0011500120162963867, 0.0014569759368896484, 0.0017639398574829102, 0.002070903778076172, 0.0023778676986694336, 0.0026848316192626953, 0.002991795539855957, 0.0032987594604492188, 0.0036057233810424805, 0.003912687301635742, 0.004219651222229004, 0.004526615142822266, 0.004833579063415527, 0.005140542984008789, 0.005447506904602051, 0.0057544708251953125, 0.006061434745788574, 0.006368398666381836, 0.006675362586975098, 0.006982326507568359, 0.007289290428161621, 0.007596254348754883, 0.007903218269348145, 0.008210182189941406, 0.008517146110534668, 0.00882411003112793, 0.009131073951721191, 0.009438037872314453, 0.009745001792907715, 0.010051965713500977, 0.010358929634094238, 0.0106658935546875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 25.0, 124.0, 718.0, 132.0, 17.0, 2.0], "bins": [-0.009489239193499088, -0.00933240819722414, -0.009175577200949192, -0.009018746204674244, -0.008861915208399296, -0.008705084212124348, -0.0085482532158494, -0.008391422219574451, -0.008234591223299503, -0.008077760227024555, -0.007920929230749607, -0.007764098234474659, -0.007607267238199711, -0.007450436241924763, -0.007293605245649815, -0.0071367742493748665, -0.006979943253099918, -0.00682311225682497, -0.006666281260550022, -0.006509450264275074, -0.006352619268000126, -0.006195788271725178, -0.00603895727545023, -0.0058821262791752815, -0.005725294817239046, -0.005568463820964098, -0.00541163282468915, -0.005254801828414202, -0.005097970832139254, -0.0049411398358643055, -0.004784308839589357, -0.004627477843314409, -0.004470646381378174, -0.004313815385103226, -0.004156984388828278, -0.0040001533925533295, -0.0038433223962783813, -0.0036864914000034332, -0.003529660403728485, -0.003372829407453537, -0.003215998411178589, -0.0030591674149036407, -0.0029023364186286926, -0.0027455054223537445, -0.0025886744260787964, -0.0024318434298038483, -0.0022750124335289, -0.002118181437253952, -0.001961350440979004, -0.0018045194447040558, -0.0016476884484291077, -0.0014908574521541595, -0.0013340264558792114, -0.0011771954596042633, -0.0010203643469139934, -0.0008635333506390452, -0.0007067023543640971, -0.000549871358089149, -0.0003930403327103704, -0.00023620930733159184, -7.937831105664372e-05, 7.74526852183044e-05, 0.00023428373970091343, 0.00039111473597586155, 0.0005479457322508097]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 4.0, 9.0, 8.0, 14.0, 13.0, 26.0, 22.0, 32.0, 35.0, 41.0, 47.0, 47.0, 39.0, 44.0, 54.0, 73.0, 45.0, 37.0, 49.0, 49.0, 50.0, 42.0, 39.0, 33.0, 35.0, 20.0, 18.0, 20.0, 11.0, 11.0, 11.0, 10.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0007194876670837402, -0.0007006833329796791, -0.000681878998875618, -0.0006630746647715569, -0.0006442703306674957, -0.0006254659965634346, -0.0006066616624593735, -0.0005878573283553123, -0.0005690529942512512, -0.0005502486601471901, -0.000531444326043129, -0.0005126399919390678, -0.0004938356578350067, -0.0004750313237309456, -0.00045622698962688446, -0.00043742265552282333, -0.0004186183214187622, -0.0003998139873147011, -0.00038100965321063995, -0.0003622053191065788, -0.0003434009850025177, -0.0003245966508984566, -0.00030579231679439545, -0.0002869879826903343, -0.0002681836485862732, -0.00024937931448221207, -0.00023057498037815094, -0.0002117706462740898, -0.0001929663121700287, -0.00017416197806596756, -0.00015535764396190643, -0.0001365533098578453, -0.00011774897575378418, -9.894464164972305e-05, -8.014030754566193e-05, -6.13359734416008e-05, -4.253163933753967e-05, -2.3727305233478546e-05, -4.9229711294174194e-06, 1.3881362974643707e-05, 3.2685697078704834e-05, 5.149003118276596e-05, 7.029436528682709e-05, 8.909869939088821e-05, 0.00010790303349494934, 0.00012670736759901047, 0.0001455117017030716, 0.00016431603580713272, 0.00018312036991119385, 0.00020192470401525497, 0.0002207290381193161, 0.00023953337222337723, 0.00025833770632743835, 0.0002771420404314995, 0.0002959463745355606, 0.00031475070863962173, 0.00033355504274368286, 0.000352359376847744, 0.0003711637109518051, 0.00038996804505586624, 0.00040877237915992737, 0.0004275767132639885, 0.0004463810473680496, 0.00046518538147211075, 0.0004839897155761719]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 1.0, 3.0, 3.0, 5.0, 9.0, 16.0, 27.0, 18.0, 45.0, 58.0, 53.0, 82.0, 88.0, 82.0, 114.0, 93.0, 82.0, 60.0, 55.0, 41.0, 22.0, 15.0, 12.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.59765625, -4.475860595703125, -4.35406494140625, -4.232269287109375, -4.1104736328125, -3.988677978515625, -3.86688232421875, -3.745086669921875, -3.623291015625, -3.501495361328125, -3.37969970703125, -3.257904052734375, -3.1361083984375, -3.014312744140625, -2.89251708984375, -2.770721435546875, -2.64892578125, -2.527130126953125, -2.40533447265625, -2.283538818359375, -2.1617431640625, -2.039947509765625, -1.91815185546875, -1.796356201171875, -1.674560546875, -1.552764892578125, -1.43096923828125, -1.309173583984375, -1.1873779296875, -1.065582275390625, -0.94378662109375, -0.821990966796875, -0.7001953125, -0.578399658203125, -0.45660400390625, -0.334808349609375, -0.2130126953125, -0.091217041015625, 0.03057861328125, 0.152374267578125, 0.274169921875, 0.395965576171875, 0.51776123046875, 0.639556884765625, 0.7613525390625, 0.883148193359375, 1.00494384765625, 1.126739501953125, 1.24853515625, 1.370330810546875, 1.49212646484375, 1.613922119140625, 1.7357177734375, 1.857513427734375, 1.97930908203125, 2.101104736328125, 2.222900390625, 2.344696044921875, 2.46649169921875, 2.588287353515625, 2.7100830078125, 2.831878662109375, 2.95367431640625, 3.075469970703125, 3.197265625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 2.0, 7.0, 10.0, 16.0, 20.0, 29.0, 39.0, 61.0, 67.0, 118.0, 193.0, 337.0, 631.0, 1442.0, 4534.0, 30392.0, 963706.0, 38597.0, 5169.0, 1607.0, 677.0, 311.0, 209.0, 121.0, 74.0, 65.0, 34.0, 21.0, 16.0, 13.0, 15.0, 2.0, 7.0, 2.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.3125, -19.66845703125, -19.0244140625, -18.38037109375, -17.736328125, -17.09228515625, -16.4482421875, -15.80419921875, -15.16015625, -14.51611328125, -13.8720703125, -13.22802734375, -12.583984375, -11.93994140625, -11.2958984375, -10.65185546875, -10.0078125, -9.36376953125, -8.7197265625, -8.07568359375, -7.431640625, -6.78759765625, -6.1435546875, -5.49951171875, -4.85546875, -4.21142578125, -3.5673828125, -2.92333984375, -2.279296875, -1.63525390625, -0.9912109375, -0.34716796875, 0.296875, 0.94091796875, 1.5849609375, 2.22900390625, 2.873046875, 3.51708984375, 4.1611328125, 4.80517578125, 5.44921875, 6.09326171875, 6.7373046875, 7.38134765625, 8.025390625, 8.66943359375, 9.3134765625, 9.95751953125, 10.6015625, 11.24560546875, 11.8896484375, 12.53369140625, 13.177734375, 13.82177734375, 14.4658203125, 15.10986328125, 15.75390625, 16.39794921875, 17.0419921875, 17.68603515625, 18.330078125, 18.97412109375, 19.6181640625, 20.26220703125, 20.90625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 7.0, 7.0, 11.0, 15.0, 19.0, 24.0, 27.0, 32.0, 39.0, 39.0, 40.0, 55.0, 53.0, 68.0, 115.0, 1525.0, 428.0, 94.0, 73.0, 53.0, 43.0, 31.0, 38.0, 32.0, 37.0, 29.0, 31.0, 17.0, 15.0, 6.0, 9.0, 6.0, 4.0, 8.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5703125, -8.263916015625, -7.95751953125, -7.651123046875, -7.3447265625, -7.038330078125, -6.73193359375, -6.425537109375, -6.119140625, -5.812744140625, -5.50634765625, -5.199951171875, -4.8935546875, -4.587158203125, -4.28076171875, -3.974365234375, -3.66796875, -3.361572265625, -3.05517578125, -2.748779296875, -2.4423828125, -2.135986328125, -1.82958984375, -1.523193359375, -1.216796875, -0.910400390625, -0.60400390625, -0.297607421875, 0.0087890625, 0.315185546875, 0.62158203125, 0.927978515625, 1.234375, 1.540771484375, 1.84716796875, 2.153564453125, 2.4599609375, 2.766357421875, 3.07275390625, 3.379150390625, 3.685546875, 3.991943359375, 4.29833984375, 4.604736328125, 4.9111328125, 5.217529296875, 5.52392578125, 5.830322265625, 6.13671875, 6.443115234375, 6.74951171875, 7.055908203125, 7.3623046875, 7.668701171875, 7.97509765625, 8.281494140625, 8.587890625, 8.894287109375, 9.20068359375, 9.507080078125, 9.8134765625, 10.119873046875, 10.42626953125, 10.732666015625, 11.0390625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 8.0, 9.0, 15.0, 29.0, 25.0, 38.0, 51.0, 95.0, 114.0, 152.0, 227.0, 322.0, 481.0, 793.0, 1115.0, 1794.0, 3169.0, 5695.0, 11830.0, 34838.0, 1505155.0, 1519298.0, 34436.0, 12048.0, 5615.0, 3086.0, 1868.0, 1133.0, 743.0, 476.0, 325.0, 214.0, 143.0, 102.0, 86.0, 41.0, 28.0, 27.0, 20.0, 15.0, 17.0, 8.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.7109375, -14.2205810546875, -13.730224609375, -13.2398681640625, -12.74951171875, -12.2591552734375, -11.768798828125, -11.2784423828125, -10.7880859375, -10.2977294921875, -9.807373046875, -9.3170166015625, -8.82666015625, -8.3363037109375, -7.845947265625, -7.3555908203125, -6.865234375, -6.3748779296875, -5.884521484375, -5.3941650390625, -4.90380859375, -4.4134521484375, -3.923095703125, -3.4327392578125, -2.9423828125, -2.4520263671875, -1.961669921875, -1.4713134765625, -0.98095703125, -0.4906005859375, -0.000244140625, 0.4901123046875, 0.98046875, 1.4708251953125, 1.961181640625, 2.4515380859375, 2.94189453125, 3.4322509765625, 3.922607421875, 4.4129638671875, 4.9033203125, 5.3936767578125, 5.884033203125, 6.3743896484375, 6.86474609375, 7.3551025390625, 7.845458984375, 8.3358154296875, 8.826171875, 9.3165283203125, 9.806884765625, 10.2972412109375, 10.78759765625, 11.2779541015625, 11.768310546875, 12.2586669921875, 12.7490234375, 13.2393798828125, 13.729736328125, 14.2200927734375, 14.71044921875, 15.2008056640625, 15.691162109375, 16.1815185546875, 16.671875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 11.0, 19.0, 31.0, 42.0, 80.0, 133.0, 134.0, 154.0, 144.0, 96.0, 64.0, 43.0, 17.0, 11.0, 12.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.64273452758789, -54.412296295166016, -53.18185806274414, -51.951419830322266, -50.72098159790039, -49.490543365478516, -48.26010513305664, -47.0296630859375, -45.799224853515625, -44.56878662109375, -43.338348388671875, -42.10791015625, -40.877471923828125, -39.64703369140625, -38.416595458984375, -37.1861572265625, -35.955718994140625, -34.72528076171875, -33.494842529296875, -32.264404296875, -31.033966064453125, -29.80352783203125, -28.573087692260742, -27.342649459838867, -26.112211227416992, -24.881772994995117, -23.651334762573242, -22.420896530151367, -21.19045639038086, -19.960018157958984, -18.72957992553711, -17.499141693115234, -16.268707275390625, -15.03826904296875, -13.807830810546875, -12.577391624450684, -11.346953392028809, -10.116515159606934, -8.886075973510742, -7.655637741088867, -6.425199508666992, -5.194761276245117, -3.964322566986084, -2.73388409614563, -1.5034456253051758, -0.2730073928833008, 0.9574313163757324, 2.1878700256347656, 3.4183082580566406, 4.648746490478516, 5.879185199737549, 7.109623908996582, 8.340062141418457, 9.570500373840332, 10.800939559936523, 12.031377792358398, 13.261816024780273, 14.492254257202148, 15.722692489624023, 16.9531307220459, 18.183570861816406, 19.41400909423828, 20.644447326660156, 21.87488555908203, 23.105323791503906]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 8.0, 6.0, 8.0, 13.0, 15.0, 13.0, 16.0, 17.0, 26.0, 21.0, 26.0, 33.0, 27.0, 39.0, 41.0, 51.0, 48.0, 43.0, 46.0, 51.0, 41.0, 46.0, 42.0, 41.0, 41.0, 40.0, 31.0, 25.0, 28.0, 26.0, 18.0, 17.0, 13.0, 7.0, 10.0, 5.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-34.903656005859375, -33.89384078979492, -32.88402557373047, -31.874210357666016, -30.864395141601562, -29.85457992553711, -28.844764709472656, -27.834949493408203, -26.82513427734375, -25.815319061279297, -24.805503845214844, -23.79568862915039, -22.785873413085938, -21.776058197021484, -20.76624298095703, -19.756427764892578, -18.746612548828125, -17.736797332763672, -16.72698211669922, -15.717166900634766, -14.707351684570312, -13.69753646850586, -12.687721252441406, -11.677906036376953, -10.6680908203125, -9.658275604248047, -8.648460388183594, -7.638645172119141, -6.6288299560546875, -5.619014739990234, -4.609199523925781, -3.599384307861328, -2.5895729064941406, -1.5797576904296875, -0.5699424743652344, 0.43987274169921875, 1.4496879577636719, 2.459503173828125, 3.469318389892578, 4.479133605957031, 5.488948822021484, 6.4987640380859375, 7.508579254150391, 8.518394470214844, 9.528209686279297, 10.53802490234375, 11.547840118408203, 12.557655334472656, 13.56747055053711, 14.577285766601562, 15.587100982666016, 16.59691619873047, 17.606731414794922, 18.616546630859375, 19.626361846923828, 20.63617706298828, 21.645992279052734, 22.655807495117188, 23.66562271118164, 24.675437927246094, 25.685253143310547, 26.695068359375, 27.704883575439453, 28.714698791503906, 29.72451400756836]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 2.0, 2.0, 4.0, 3.0, 14.0, 15.0, 16.0, 25.0, 39.0, 61.0, 65.0, 66.0, 76.0, 93.0, 95.0, 105.0, 78.0, 57.0, 57.0, 43.0, 32.0, 22.0, 13.0, 4.0, 10.0, 0.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.69921875, -4.575408935546875, -4.45159912109375, -4.327789306640625, -4.2039794921875, -4.080169677734375, -3.95635986328125, -3.832550048828125, -3.708740234375, -3.584930419921875, -3.46112060546875, -3.337310791015625, -3.2135009765625, -3.089691162109375, -2.96588134765625, -2.842071533203125, -2.71826171875, -2.594451904296875, -2.47064208984375, -2.346832275390625, -2.2230224609375, -2.099212646484375, -1.97540283203125, -1.851593017578125, -1.727783203125, -1.603973388671875, -1.48016357421875, -1.356353759765625, -1.2325439453125, -1.108734130859375, -0.98492431640625, -0.861114501953125, -0.7373046875, -0.613494873046875, -0.48968505859375, -0.365875244140625, -0.2420654296875, -0.118255615234375, 0.00555419921875, 0.129364013671875, 0.253173828125, 0.376983642578125, 0.50079345703125, 0.624603271484375, 0.7484130859375, 0.872222900390625, 0.99603271484375, 1.119842529296875, 1.24365234375, 1.367462158203125, 1.49127197265625, 1.615081787109375, 1.7388916015625, 1.862701416015625, 1.98651123046875, 2.110321044921875, 2.234130859375, 2.357940673828125, 2.48175048828125, 2.605560302734375, 2.7293701171875, 2.853179931640625, 2.97698974609375, 3.100799560546875, 3.224609375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 10.0, 7.0, 7.0, 14.0, 13.0, 17.0, 37.0, 61.0, 83.0, 159.0, 299.0, 699.0, 1837.0, 6508.0, 96907.0, 4005432.0, 74292.0, 5363.0, 1507.0, 524.0, 249.0, 117.0, 47.0, 28.0, 24.0, 12.0, 8.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.90625, -24.241455078125, -23.57666015625, -22.911865234375, -22.2470703125, -21.582275390625, -20.91748046875, -20.252685546875, -19.587890625, -18.923095703125, -18.25830078125, -17.593505859375, -16.9287109375, -16.263916015625, -15.59912109375, -14.934326171875, -14.26953125, -13.604736328125, -12.93994140625, -12.275146484375, -11.6103515625, -10.945556640625, -10.28076171875, -9.615966796875, -8.951171875, -8.286376953125, -7.62158203125, -6.956787109375, -6.2919921875, -5.627197265625, -4.96240234375, -4.297607421875, -3.6328125, -2.968017578125, -2.30322265625, -1.638427734375, -0.9736328125, -0.308837890625, 0.35595703125, 1.020751953125, 1.685546875, 2.350341796875, 3.01513671875, 3.679931640625, 4.3447265625, 5.009521484375, 5.67431640625, 6.339111328125, 7.00390625, 7.668701171875, 8.33349609375, 8.998291015625, 9.6630859375, 10.327880859375, 10.99267578125, 11.657470703125, 12.322265625, 12.987060546875, 13.65185546875, 14.316650390625, 14.9814453125, 15.646240234375, 16.31103515625, 16.975830078125, 17.640625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 10.0, 7.0, 14.0, 25.0, 33.0, 55.0, 85.0, 135.0, 247.0, 431.0, 693.0, 856.0, 612.0, 347.0, 170.0, 133.0, 59.0, 42.0, 28.0, 26.0, 12.0, 13.0, 9.0, 4.0, 7.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.8828125, -10.5828857421875, -10.282958984375, -9.9830322265625, -9.68310546875, -9.3831787109375, -9.083251953125, -8.7833251953125, -8.4833984375, -8.1834716796875, -7.883544921875, -7.5836181640625, -7.28369140625, -6.9837646484375, -6.683837890625, -6.3839111328125, -6.083984375, -5.7840576171875, -5.484130859375, -5.1842041015625, -4.88427734375, -4.5843505859375, -4.284423828125, -3.9844970703125, -3.6845703125, -3.3846435546875, -3.084716796875, -2.7847900390625, -2.48486328125, -2.1849365234375, -1.885009765625, -1.5850830078125, -1.28515625, -0.9852294921875, -0.685302734375, -0.3853759765625, -0.08544921875, 0.2144775390625, 0.514404296875, 0.8143310546875, 1.1142578125, 1.4141845703125, 1.714111328125, 2.0140380859375, 2.31396484375, 2.6138916015625, 2.913818359375, 3.2137451171875, 3.513671875, 3.8135986328125, 4.113525390625, 4.4134521484375, 4.71337890625, 5.0133056640625, 5.313232421875, 5.6131591796875, 5.9130859375, 6.2130126953125, 6.512939453125, 6.8128662109375, 7.11279296875, 7.4127197265625, 7.712646484375, 8.0125732421875, 8.3125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 6.0, 18.0, 38.0, 51.0, 107.0, 183.0, 437.0, 1020.0, 3145.0, 13224.0, 94850.0, 3195490.0, 835558.0, 39554.0, 7246.0, 1990.0, 740.0, 286.0, 163.0, 71.0, 44.0, 19.0, 14.0, 9.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.625, -19.88330078125, -19.1416015625, -18.39990234375, -17.658203125, -16.91650390625, -16.1748046875, -15.43310546875, -14.69140625, -13.94970703125, -13.2080078125, -12.46630859375, -11.724609375, -10.98291015625, -10.2412109375, -9.49951171875, -8.7578125, -8.01611328125, -7.2744140625, -6.53271484375, -5.791015625, -5.04931640625, -4.3076171875, -3.56591796875, -2.82421875, -2.08251953125, -1.3408203125, -0.59912109375, 0.142578125, 0.88427734375, 1.6259765625, 2.36767578125, 3.109375, 3.85107421875, 4.5927734375, 5.33447265625, 6.076171875, 6.81787109375, 7.5595703125, 8.30126953125, 9.04296875, 9.78466796875, 10.5263671875, 11.26806640625, 12.009765625, 12.75146484375, 13.4931640625, 14.23486328125, 14.9765625, 15.71826171875, 16.4599609375, 17.20166015625, 17.943359375, 18.68505859375, 19.4267578125, 20.16845703125, 20.91015625, 21.65185546875, 22.3935546875, 23.13525390625, 23.876953125, 24.61865234375, 25.3603515625, 26.10205078125, 26.84375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 13.0, 13.0, 30.0, 58.0, 76.0, 124.0, 184.0, 156.0, 114.0, 94.0, 61.0, 34.0, 23.0, 10.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-84.50379943847656, -82.74308776855469, -80.98237609863281, -79.22166442871094, -77.46095275878906, -75.70024108886719, -73.93952941894531, -72.17881774902344, -70.41810607910156, -68.65739440917969, -66.89668273925781, -65.13597106933594, -63.37525939941406, -61.61454772949219, -59.85383605957031, -58.09312438964844, -56.33241653442383, -54.57170486450195, -52.81099319458008, -51.0502815246582, -49.28956985473633, -47.52885818481445, -45.768150329589844, -44.00743865966797, -42.246726989746094, -40.48601531982422, -38.725303649902344, -36.96459197998047, -35.203880310058594, -33.44316864013672, -31.682458877563477, -29.9217472076416, -28.16103744506836, -26.400325775146484, -24.63961410522461, -22.878902435302734, -21.11819076538086, -19.357479095458984, -17.596769332885742, -15.836057662963867, -14.075345993041992, -12.314634323120117, -10.553922653198242, -8.793211936950684, -7.032500267028809, -5.271788597106934, -3.511077880859375, -1.7503662109375, 0.010345458984375, 1.771056890487671, 3.531768321990967, 5.292479515075684, 7.053191184997559, 8.813902854919434, 10.574613571166992, 12.335325241088867, 14.096036911010742, 15.856748580932617, 17.617460250854492, 19.378170013427734, 21.13888168334961, 22.899593353271484, 24.66030502319336, 26.421016693115234, 28.18172836303711]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 7.0, 7.0, 4.0, 14.0, 7.0, 11.0, 6.0, 18.0, 22.0, 15.0, 20.0, 29.0, 22.0, 26.0, 27.0, 32.0, 37.0, 41.0, 38.0, 27.0, 43.0, 35.0, 40.0, 43.0, 37.0, 34.0, 34.0, 29.0, 31.0, 33.0, 25.0, 27.0, 24.0, 24.0, 26.0, 14.0, 15.0, 13.0, 11.0, 7.0, 7.0, 4.0, 3.0, 5.0, 5.0, 6.0, 5.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-21.42793083190918, -20.758066177368164, -20.08820343017578, -19.418338775634766, -18.74847412109375, -18.078609466552734, -17.40874481201172, -16.738882064819336, -16.06901741027832, -15.399152755737305, -14.729289054870605, -14.059425354003906, -13.38956069946289, -12.719696044921875, -12.049832344055176, -11.379968643188477, -10.710103988647461, -10.040239334106445, -9.370375633239746, -8.700511932373047, -8.030647277832031, -7.360783100128174, -6.690918922424316, -6.021054744720459, -5.351190567016602, -4.681326389312744, -4.011462211608887, -3.3415980339050293, -2.671733856201172, -2.0018696784973145, -1.332005500793457, -0.6621413230895996, 0.007724761962890625, 0.677588939666748, 1.3474531173706055, 2.017317295074463, 2.6871814727783203, 3.3570456504821777, 4.026909828186035, 4.696774005889893, 5.36663818359375, 6.036502361297607, 6.706366539001465, 7.376230716705322, 8.04609489440918, 8.715959548950195, 9.385823249816895, 10.055686950683594, 10.72555160522461, 11.395416259765625, 12.065279960632324, 12.735143661499023, 13.405008316040039, 14.074872970581055, 14.744736671447754, 15.414600372314453, 16.08446502685547, 16.754329681396484, 17.4241943359375, 18.094057083129883, 18.7639217376709, 19.433786392211914, 20.103649139404297, 20.773513793945312, 21.443378448486328]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 1.0, 5.0, 7.0, 15.0, 24.0, 24.0, 32.0, 40.0, 58.0, 72.0, 59.0, 76.0, 90.0, 94.0, 97.0, 83.0, 46.0, 46.0, 40.0, 39.0, 17.0, 18.0, 7.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.53515625, -4.411529541015625, -4.28790283203125, -4.164276123046875, -4.0406494140625, -3.917022705078125, -3.79339599609375, -3.669769287109375, -3.546142578125, -3.422515869140625, -3.29888916015625, -3.175262451171875, -3.0516357421875, -2.928009033203125, -2.80438232421875, -2.680755615234375, -2.55712890625, -2.433502197265625, -2.30987548828125, -2.186248779296875, -2.0626220703125, -1.938995361328125, -1.81536865234375, -1.691741943359375, -1.568115234375, -1.444488525390625, -1.32086181640625, -1.197235107421875, -1.0736083984375, -0.949981689453125, -0.82635498046875, -0.702728271484375, -0.5791015625, -0.455474853515625, -0.33184814453125, -0.208221435546875, -0.0845947265625, 0.039031982421875, 0.16265869140625, 0.286285400390625, 0.409912109375, 0.533538818359375, 0.65716552734375, 0.780792236328125, 0.9044189453125, 1.028045654296875, 1.15167236328125, 1.275299072265625, 1.39892578125, 1.522552490234375, 1.64617919921875, 1.769805908203125, 1.8934326171875, 2.017059326171875, 2.14068603515625, 2.264312744140625, 2.387939453125, 2.511566162109375, 2.63519287109375, 2.758819580078125, 2.8824462890625, 3.006072998046875, 3.12969970703125, 3.253326416015625, 3.376953125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 9.0, 3.0, 10.0, 20.0, 21.0, 25.0, 29.0, 57.0, 53.0, 88.0, 124.0, 179.0, 279.0, 403.0, 671.0, 1225.0, 2010.0, 3796.0, 7847.0, 17281.0, 44677.0, 138797.0, 525159.0, 203253.0, 59786.0, 22540.0, 9532.0, 4663.0, 2418.0, 1393.0, 772.0, 495.0, 290.0, 182.0, 139.0, 89.0, 64.0, 40.0, 36.0, 23.0, 18.0, 13.0, 14.0, 9.0, 4.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.240478515625, -0.23332977294921875, -0.2261810302734375, -0.21903228759765625, -0.211883544921875, -0.20473480224609375, -0.1975860595703125, -0.19043731689453125, -0.18328857421875, -0.17613983154296875, -0.1689910888671875, -0.16184234619140625, -0.154693603515625, -0.14754486083984375, -0.1403961181640625, -0.13324737548828125, -0.1260986328125, -0.11894989013671875, -0.1118011474609375, -0.10465240478515625, -0.097503662109375, -0.09035491943359375, -0.0832061767578125, -0.07605743408203125, -0.06890869140625, -0.06175994873046875, -0.0546112060546875, -0.04746246337890625, -0.040313720703125, -0.03316497802734375, -0.0260162353515625, -0.01886749267578125, -0.01171875, -0.00457000732421875, 0.0025787353515625, 0.00972747802734375, 0.016876220703125, 0.02402496337890625, 0.0311737060546875, 0.03832244873046875, 0.04547119140625, 0.05261993408203125, 0.0597686767578125, 0.06691741943359375, 0.074066162109375, 0.08121490478515625, 0.0883636474609375, 0.09551239013671875, 0.1026611328125, 0.10980987548828125, 0.1169586181640625, 0.12410736083984375, 0.131256103515625, 0.13840484619140625, 0.1455535888671875, 0.15270233154296875, 0.15985107421875, 0.16699981689453125, 0.1741485595703125, 0.18129730224609375, 0.188446044921875, 0.19559478759765625, 0.2027435302734375, 0.20989227294921875, 0.217041015625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 6.0, 7.0, 5.0, 12.0, 12.0, 10.0, 15.0, 20.0, 29.0, 17.0, 21.0, 25.0, 33.0, 31.0, 43.0, 39.0, 30.0, 44.0, 37.0, 37.0, 1065.0, 43.0, 36.0, 27.0, 41.0, 29.0, 33.0, 26.0, 37.0, 30.0, 31.0, 20.0, 14.0, 14.0, 12.0, 16.0, 19.0, 8.0, 11.0, 7.0, 8.0, 5.0, 5.0, 6.0, 2.0, 0.0, 3.0, 3.0], "bins": [-2.37109375, -2.306365966796875, -2.24163818359375, -2.176910400390625, -2.1121826171875, -2.047454833984375, -1.98272705078125, -1.917999267578125, -1.853271484375, -1.788543701171875, -1.72381591796875, -1.659088134765625, -1.5943603515625, -1.529632568359375, -1.46490478515625, -1.400177001953125, -1.33544921875, -1.270721435546875, -1.20599365234375, -1.141265869140625, -1.0765380859375, -1.011810302734375, -0.94708251953125, -0.882354736328125, -0.817626953125, -0.752899169921875, -0.68817138671875, -0.623443603515625, -0.5587158203125, -0.493988037109375, -0.42926025390625, -0.364532470703125, -0.2998046875, -0.235076904296875, -0.17034912109375, -0.105621337890625, -0.0408935546875, 0.023834228515625, 0.08856201171875, 0.153289794921875, 0.218017578125, 0.282745361328125, 0.34747314453125, 0.412200927734375, 0.4769287109375, 0.541656494140625, 0.60638427734375, 0.671112060546875, 0.73583984375, 0.800567626953125, 0.86529541015625, 0.930023193359375, 0.9947509765625, 1.059478759765625, 1.12420654296875, 1.188934326171875, 1.253662109375, 1.318389892578125, 1.38311767578125, 1.447845458984375, 1.5125732421875, 1.577301025390625, 1.64202880859375, 1.706756591796875, 1.771484375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 21.0, 26.0, 46.0, 62.0, 86.0, 154.0, 187.0, 273.0, 386.0, 636.0, 856.0, 1265.0, 1759.0, 2592.0, 3679.0, 5478.0, 7793.0, 11582.0, 17032.0, 25270.0, 38769.0, 61189.0, 106291.0, 500531.0, 1020267.0, 108500.0, 62384.0, 39418.0, 25781.0, 17375.0, 11576.0, 8016.0, 5388.0, 3788.0, 2669.0, 1837.0, 1277.0, 905.0, 613.0, 433.0, 275.0, 220.0, 131.0, 112.0, 69.0, 48.0, 32.0, 17.0, 10.0, 8.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.04815673828125, -0.046604156494140625, -0.04505157470703125, -0.043498992919921875, -0.0419464111328125, -0.040393829345703125, -0.03884124755859375, -0.037288665771484375, -0.035736083984375, -0.034183502197265625, -0.03263092041015625, -0.031078338623046875, -0.0295257568359375, -0.027973175048828125, -0.02642059326171875, -0.024868011474609375, -0.0233154296875, -0.021762847900390625, -0.02021026611328125, -0.018657684326171875, -0.0171051025390625, -0.015552520751953125, -0.01399993896484375, -0.012447357177734375, -0.010894775390625, -0.009342193603515625, -0.00778961181640625, -0.006237030029296875, -0.0046844482421875, -0.003131866455078125, -0.00157928466796875, -2.6702880859375e-05, 0.00152587890625, 0.003078460693359375, 0.00463104248046875, 0.006183624267578125, 0.0077362060546875, 0.009288787841796875, 0.01084136962890625, 0.012393951416015625, 0.013946533203125, 0.015499114990234375, 0.01705169677734375, 0.018604278564453125, 0.0201568603515625, 0.021709442138671875, 0.02326202392578125, 0.024814605712890625, 0.0263671875, 0.027919769287109375, 0.02947235107421875, 0.031024932861328125, 0.0325775146484375, 0.034130096435546875, 0.03568267822265625, 0.037235260009765625, 0.038787841796875, 0.040340423583984375, 0.04189300537109375, 0.043445587158203125, 0.0449981689453125, 0.046550750732421875, 0.04810333251953125, 0.049655914306640625, 0.05120849609375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 5.0, 5.0, 3.0, 6.0, 4.0, 9.0, 10.0, 6.0, 6.0, 14.0, 13.0, 18.0, 14.0, 19.0, 27.0, 42.0, 51.0, 47.0, 64.0, 73.0, 104.0, 91.0, 72.0, 50.0, 40.0, 32.0, 25.0, 19.0, 22.0, 17.0, 12.0, 12.0, 6.0, 8.0, 9.0, 9.0, 3.0, 2.0, 8.0, 4.0, 4.0, 7.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0002772808074951172, -0.00026794523000717163, -0.0002586096525192261, -0.0002492740750312805, -0.00023993849754333496, -0.0002306029200553894, -0.00022126734256744385, -0.0002119317650794983, -0.00020259618759155273, -0.00019326061010360718, -0.00018392503261566162, -0.00017458945512771606, -0.0001652538776397705, -0.00015591830015182495, -0.0001465827226638794, -0.00013724714517593384, -0.00012791156768798828, -0.00011857599020004272, -0.00010924041271209717, -9.990483522415161e-05, -9.056925773620605e-05, -8.12336802482605e-05, -7.189810276031494e-05, -6.256252527236938e-05, -5.322694778442383e-05, -4.389137029647827e-05, -3.4555792808532715e-05, -2.5220215320587158e-05, -1.58846378326416e-05, -6.549060344696045e-06, 2.7865171432495117e-06, 1.2122094631195068e-05, 2.1457672119140625e-05, 3.079324960708618e-05, 4.012882709503174e-05, 4.9464404582977295e-05, 5.879998207092285e-05, 6.813555955886841e-05, 7.747113704681396e-05, 8.680671453475952e-05, 9.614229202270508e-05, 0.00010547786951065063, 0.00011481344699859619, 0.00012414902448654175, 0.0001334846019744873, 0.00014282017946243286, 0.00015215575695037842, 0.00016149133443832397, 0.00017082691192626953, 0.0001801624894142151, 0.00018949806690216064, 0.0001988336443901062, 0.00020816922187805176, 0.00021750479936599731, 0.00022684037685394287, 0.00023617595434188843, 0.000245511531829834, 0.00025484710931777954, 0.0002641826868057251, 0.00027351826429367065, 0.0002828538417816162, 0.00029218941926956177, 0.0003015249967575073, 0.0003108605742454529, 0.00032019615173339844]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 8.0, 4.0, 4.0, 10.0, 3.0, 11.0, 9.0, 13.0, 18.0, 26.0, 23.0, 27.0, 30.0, 59.0, 58.0, 83.0, 139.0, 451.0, 2049.0, 12369.0, 102900.0, 801416.0, 112272.0, 13293.0, 2185.0, 511.0, 163.0, 95.0, 62.0, 42.0, 37.0, 34.0, 31.0, 23.0, 20.0, 14.0, 14.0, 12.0, 6.0, 7.0, 7.0, 2.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.005462646484375, -0.005304396152496338, -0.005146145820617676, -0.004987895488739014, -0.0048296451568603516, -0.0046713948249816895, -0.004513144493103027, -0.004354894161224365, -0.004196643829345703, -0.004038393497467041, -0.003880143165588379, -0.003721892833709717, -0.0035636425018310547, -0.0034053921699523926, -0.0032471418380737305, -0.0030888915061950684, -0.0029306411743164062, -0.002772390842437744, -0.002614140510559082, -0.00245589017868042, -0.002297639846801758, -0.0021393895149230957, -0.0019811391830444336, -0.0018228888511657715, -0.0016646385192871094, -0.0015063881874084473, -0.0013481378555297852, -0.001189887523651123, -0.001031637191772461, -0.0008733868598937988, -0.0007151365280151367, -0.0005568861961364746, -0.0003986358642578125, -0.0002403855323791504, -8.213520050048828e-05, 7.611513137817383e-05, 0.00023436546325683594, 0.00039261579513549805, 0.0005508661270141602, 0.0007091164588928223, 0.0008673667907714844, 0.0010256171226501465, 0.0011838674545288086, 0.0013421177864074707, 0.0015003681182861328, 0.001658618450164795, 0.001816868782043457, 0.001975119113922119, 0.0021333694458007812, 0.0022916197776794434, 0.0024498701095581055, 0.0026081204414367676, 0.0027663707733154297, 0.002924621105194092, 0.003082871437072754, 0.003241121768951416, 0.003399372100830078, 0.0035576224327087402, 0.0037158727645874023, 0.0038741230964660645, 0.0040323734283447266, 0.004190623760223389, 0.004348874092102051, 0.004507124423980713, 0.004665374755859375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 22.0, 95.0, 614.0, 234.0, 36.0, 9.0], "bins": [-0.008506637066602707, -0.008366578258574009, -0.008226520381867886, -0.008086461573839188, -0.00794640276581049, -0.007806344889104366, -0.007666286081075668, -0.007526227738708258, -0.007386169396340847, -0.007246111053973436, -0.007106052245944738, -0.006965993903577328, -0.006825935561209917, -0.006685877218842506, -0.0065458184108138084, -0.006405760068446398, -0.006265701726078987, -0.0061256433837115765, -0.0059855845756828785, -0.005845526233315468, -0.005705467890948057, -0.0055654095485806465, -0.0054253507405519485, -0.005285292398184538, -0.00514523359015584, -0.005005175247788429, -0.004865116439759731, -0.004725058097392321, -0.00458499975502491, -0.004444941412657499, -0.004304882604628801, -0.004164824262261391, -0.004024765454232693, -0.0038847068790346384, -0.0037446485366672277, -0.0036045899614691734, -0.0034645316191017628, -0.0033244730439037085, -0.003184414468705654, -0.0030443561263382435, -0.002904297783970833, -0.0027642392087727785, -0.002624180866405368, -0.0024841222912073135, -0.002344063948839903, -0.0022040053736418486, -0.0020639467984437943, -0.0019238884560763836, -0.001783830113708973, -0.0016437716549262404, -0.001503713196143508, -0.0013636546209454536, -0.001223596278578043, -0.0010835377033799887, -0.0009434792445972562, -0.0008034207858145237, -0.0006633622688241303, -0.0005233038100413978, -0.00038324532215483487, -0.00024318683426827192, -0.00010312837548553944, 3.693008329719305e-05, 0.00017698860028758645, 0.00031704705907031894, 0.0004571055178530514]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 7.0, 11.0, 9.0, 11.0, 17.0, 23.0, 30.0, 31.0, 39.0, 40.0, 53.0, 39.0, 57.0, 60.0, 59.0, 47.0, 60.0, 47.0, 51.0, 51.0, 40.0, 34.0, 38.0, 33.0, 24.0, 17.0, 17.0, 11.0, 11.0, 10.0, 6.0, 4.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042742490768432617, -0.00041339173913002014, -0.0003993585705757141, -0.0003853254020214081, -0.00037129223346710205, -0.000357259064912796, -0.00034322589635849, -0.00032919272780418396, -0.00031515955924987793, -0.0003011263906955719, -0.00028709322214126587, -0.00027306005358695984, -0.0002590268850326538, -0.0002449937164783478, -0.00023096054792404175, -0.00021692737936973572, -0.0002028942108154297, -0.00018886104226112366, -0.00017482787370681763, -0.0001607947051525116, -0.00014676153659820557, -0.00013272836804389954, -0.0001186951994895935, -0.00010466203093528748, -9.062886238098145e-05, -7.659569382667542e-05, -6.256252527236938e-05, -4.8529356718063354e-05, -3.4496188163757324e-05, -2.0463019609451294e-05, -6.429851055145264e-06, 7.603317499160767e-06, 2.1636486053466797e-05, 3.566965460777283e-05, 4.970282316207886e-05, 6.373599171638489e-05, 7.776916027069092e-05, 9.180232882499695e-05, 0.00010583549737930298, 0.00011986866593360901, 0.00013390183448791504, 0.00014793500304222107, 0.0001619681715965271, 0.00017600134015083313, 0.00019003450870513916, 0.0002040676772594452, 0.00021810084581375122, 0.00023213401436805725, 0.0002461671829223633, 0.0002602003514766693, 0.00027423352003097534, 0.00028826668858528137, 0.0003022998571395874, 0.00031633302569389343, 0.00033036619424819946, 0.0003443993628025055, 0.0003584325313568115, 0.00037246569991111755, 0.0003864988684654236, 0.0004005320370197296, 0.00041456520557403564, 0.0004285983741283417, 0.0004426315426826477, 0.00045666471123695374, 0.00047069787979125977]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 1.0, 5.0, 7.0, 15.0, 24.0, 24.0, 32.0, 40.0, 58.0, 72.0, 59.0, 76.0, 90.0, 94.0, 96.0, 84.0, 46.0, 46.0, 40.0, 39.0, 17.0, 18.0, 7.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.53515625, -4.411529541015625, -4.28790283203125, -4.164276123046875, -4.0406494140625, -3.917022705078125, -3.79339599609375, -3.669769287109375, -3.546142578125, -3.422515869140625, -3.29888916015625, -3.175262451171875, -3.0516357421875, -2.928009033203125, -2.80438232421875, -2.680755615234375, -2.55712890625, -2.433502197265625, -2.30987548828125, -2.186248779296875, -2.0626220703125, -1.938995361328125, -1.81536865234375, -1.691741943359375, -1.568115234375, -1.444488525390625, -1.32086181640625, -1.197235107421875, -1.0736083984375, -0.949981689453125, -0.82635498046875, -0.702728271484375, -0.5791015625, -0.455474853515625, -0.33184814453125, -0.208221435546875, -0.0845947265625, 0.039031982421875, 0.16265869140625, 0.286285400390625, 0.409912109375, 0.533538818359375, 0.65716552734375, 0.780792236328125, 0.9044189453125, 1.028045654296875, 1.15167236328125, 1.275299072265625, 1.39892578125, 1.522552490234375, 1.64617919921875, 1.769805908203125, 1.8934326171875, 2.017059326171875, 2.14068603515625, 2.264312744140625, 2.387939453125, 2.511566162109375, 2.63519287109375, 2.758819580078125, 2.8824462890625, 3.006072998046875, 3.12969970703125, 3.253326416015625, 3.376953125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 7.0, 9.0, 7.0, 15.0, 21.0, 32.0, 54.0, 85.0, 179.0, 295.0, 718.0, 1860.0, 5351.0, 17245.0, 62183.0, 316640.0, 513875.0, 93705.0, 24646.0, 7389.0, 2457.0, 916.0, 392.0, 206.0, 105.0, 54.0, 37.0, 24.0, 15.0, 13.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.953125, -3.83734130859375, -3.7215576171875, -3.60577392578125, -3.489990234375, -3.37420654296875, -3.2584228515625, -3.14263916015625, -3.02685546875, -2.91107177734375, -2.7952880859375, -2.67950439453125, -2.563720703125, -2.44793701171875, -2.3321533203125, -2.21636962890625, -2.1005859375, -1.98480224609375, -1.8690185546875, -1.75323486328125, -1.637451171875, -1.52166748046875, -1.4058837890625, -1.29010009765625, -1.17431640625, -1.05853271484375, -0.9427490234375, -0.82696533203125, -0.711181640625, -0.59539794921875, -0.4796142578125, -0.36383056640625, -0.248046875, -0.13226318359375, -0.0164794921875, 0.09930419921875, 0.215087890625, 0.33087158203125, 0.4466552734375, 0.56243896484375, 0.67822265625, 0.79400634765625, 0.9097900390625, 1.02557373046875, 1.141357421875, 1.25714111328125, 1.3729248046875, 1.48870849609375, 1.6044921875, 1.72027587890625, 1.8360595703125, 1.95184326171875, 2.067626953125, 2.18341064453125, 2.2991943359375, 2.41497802734375, 2.53076171875, 2.64654541015625, 2.7623291015625, 2.87811279296875, 2.993896484375, 3.10968017578125, 3.2254638671875, 3.34124755859375, 3.45703125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 9.0, 4.0, 9.0, 15.0, 15.0, 13.0, 18.0, 20.0, 14.0, 29.0, 30.0, 30.0, 33.0, 42.0, 34.0, 51.0, 64.0, 74.0, 183.0, 1624.0, 203.0, 108.0, 60.0, 56.0, 35.0, 32.0, 48.0, 28.0, 25.0, 25.0, 23.0, 20.0, 13.0, 14.0, 17.0, 5.0, 9.0, 3.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.5078125, -8.238525390625, -7.96923828125, -7.699951171875, -7.4306640625, -7.161376953125, -6.89208984375, -6.622802734375, -6.353515625, -6.084228515625, -5.81494140625, -5.545654296875, -5.2763671875, -5.007080078125, -4.73779296875, -4.468505859375, -4.19921875, -3.929931640625, -3.66064453125, -3.391357421875, -3.1220703125, -2.852783203125, -2.58349609375, -2.314208984375, -2.044921875, -1.775634765625, -1.50634765625, -1.237060546875, -0.9677734375, -0.698486328125, -0.42919921875, -0.159912109375, 0.109375, 0.378662109375, 0.64794921875, 0.917236328125, 1.1865234375, 1.455810546875, 1.72509765625, 1.994384765625, 2.263671875, 2.532958984375, 2.80224609375, 3.071533203125, 3.3408203125, 3.610107421875, 3.87939453125, 4.148681640625, 4.41796875, 4.687255859375, 4.95654296875, 5.225830078125, 5.4951171875, 5.764404296875, 6.03369140625, 6.302978515625, 6.572265625, 6.841552734375, 7.11083984375, 7.380126953125, 7.6494140625, 7.918701171875, 8.18798828125, 8.457275390625, 8.7265625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 5.0, 10.0, 12.0, 18.0, 20.0, 30.0, 27.0, 27.0, 41.0, 63.0, 103.0, 236.0, 503.0, 1141.0, 3422.0, 19290.0, 520523.0, 2549225.0, 42533.0, 5497.0, 1652.0, 585.0, 244.0, 146.0, 81.0, 53.0, 43.0, 28.0, 21.0, 19.0, 21.0, 15.0, 16.0, 11.0, 12.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0078125, -11.6343994140625, -11.260986328125, -10.8875732421875, -10.51416015625, -10.1407470703125, -9.767333984375, -9.3939208984375, -9.0205078125, -8.6470947265625, -8.273681640625, -7.9002685546875, -7.52685546875, -7.1534423828125, -6.780029296875, -6.4066162109375, -6.033203125, -5.6597900390625, -5.286376953125, -4.9129638671875, -4.53955078125, -4.1661376953125, -3.792724609375, -3.4193115234375, -3.0458984375, -2.6724853515625, -2.299072265625, -1.9256591796875, -1.55224609375, -1.1788330078125, -0.805419921875, -0.4320068359375, -0.05859375, 0.3148193359375, 0.688232421875, 1.0616455078125, 1.43505859375, 1.8084716796875, 2.181884765625, 2.5552978515625, 2.9287109375, 3.3021240234375, 3.675537109375, 4.0489501953125, 4.42236328125, 4.7957763671875, 5.169189453125, 5.5426025390625, 5.916015625, 6.2894287109375, 6.662841796875, 7.0362548828125, 7.40966796875, 7.7830810546875, 8.156494140625, 8.5299072265625, 8.9033203125, 9.2767333984375, 9.650146484375, 10.0235595703125, 10.39697265625, 10.7703857421875, 11.143798828125, 11.5172119140625, 11.890625]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 16.0, 38.0, 78.0, 155.0, 170.0, 205.0, 147.0, 108.0, 58.0, 20.0, 15.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.738855361938477, -27.924104690551758, -27.10935401916504, -26.29460334777832, -25.4798526763916, -24.665102005004883, -23.85034942626953, -23.035598754882812, -22.220848083496094, -21.406097412109375, -20.591346740722656, -19.776596069335938, -18.96184539794922, -18.1470947265625, -17.33234405517578, -16.517593383789062, -15.702842712402344, -14.888092041015625, -14.073341369628906, -13.258590698242188, -12.443840026855469, -11.62908935546875, -10.814337730407715, -9.999587059020996, -9.184836387634277, -8.370085716247559, -7.55533504486084, -6.740583896636963, -5.925833225250244, -5.111082553863525, -4.296331405639648, -3.4815807342529297, -2.6668319702148438, -1.8520811796188354, -1.0373303890228271, -0.2225794792175293, 0.5921711921691895, 1.4069218635559082, 2.221673011779785, 3.036423683166504, 3.8511743545532227, 4.665925025939941, 5.48067569732666, 6.295426845550537, 7.110177516937256, 7.924928188323975, 8.739679336547852, 9.55443000793457, 10.369180679321289, 11.183931350708008, 11.998682022094727, 12.813432693481445, 13.628183364868164, 14.442934036254883, 15.257685661315918, 16.072437286376953, 16.887187957763672, 17.70193862915039, 18.51668930053711, 19.331439971923828, 20.146190643310547, 20.960941314697266, 21.775691986083984, 22.590442657470703, 23.405193328857422]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 5.0, 8.0, 6.0, 12.0, 8.0, 13.0, 14.0, 18.0, 22.0, 22.0, 19.0, 20.0, 33.0, 29.0, 36.0, 38.0, 44.0, 35.0, 27.0, 35.0, 26.0, 36.0, 27.0, 31.0, 37.0, 42.0, 37.0, 37.0, 39.0, 35.0, 22.0, 22.0, 15.0, 20.0, 21.0, 21.0, 13.0, 9.0, 15.0, 8.0, 13.0, 4.0, 7.0, 7.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-29.035263061523438, -28.222087860107422, -27.408910751342773, -26.595735549926758, -25.78255844116211, -24.969383239746094, -24.156208038330078, -23.34303092956543, -22.52985382080078, -21.716678619384766, -20.903501510620117, -20.0903263092041, -19.277149200439453, -18.463973999023438, -17.650798797607422, -16.837621688842773, -16.024446487426758, -15.211270332336426, -14.398094177246094, -13.584918975830078, -12.77174186706543, -11.958566665649414, -11.145390510559082, -10.33221435546875, -9.519038200378418, -8.705862045288086, -7.892685890197754, -7.07951021194458, -6.266334056854248, -5.453157901763916, -4.639982223510742, -3.82680606842041, -3.013629913330078, -2.200453758239746, -1.3872778415679932, -0.5741019248962402, 0.2390742301940918, 1.0522503852844238, 1.8654260635375977, 2.6786022186279297, 3.4917783737182617, 4.304954528808594, 5.118130683898926, 5.9313063621521, 6.744482517242432, 7.557658672332764, 8.370834350585938, 9.18401050567627, 9.997186660766602, 10.810362815856934, 11.623538970947266, 12.436714172363281, 13.24989128112793, 14.063066482543945, 14.876242637634277, 15.68941879272461, 16.502593994140625, 17.31576919555664, 18.12894630432129, 18.942121505737305, 19.755298614501953, 20.56847381591797, 21.381649017333984, 22.194826126098633, 23.00800323486328]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 4.0, 1.0, 2.0, 3.0, 16.0, 13.0, 30.0, 21.0, 38.0, 53.0, 59.0, 62.0, 65.0, 78.0, 93.0, 100.0, 77.0, 71.0, 48.0, 45.0, 36.0, 41.0, 21.0, 11.0, 7.0, 2.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.4375, -4.3154296875, -4.193359375, -4.0712890625, -3.94921875, -3.8271484375, -3.705078125, -3.5830078125, -3.4609375, -3.3388671875, -3.216796875, -3.0947265625, -2.97265625, -2.8505859375, -2.728515625, -2.6064453125, -2.484375, -2.3623046875, -2.240234375, -2.1181640625, -1.99609375, -1.8740234375, -1.751953125, -1.6298828125, -1.5078125, -1.3857421875, -1.263671875, -1.1416015625, -1.01953125, -0.8974609375, -0.775390625, -0.6533203125, -0.53125, -0.4091796875, -0.287109375, -0.1650390625, -0.04296875, 0.0791015625, 0.201171875, 0.3232421875, 0.4453125, 0.5673828125, 0.689453125, 0.8115234375, 0.93359375, 1.0556640625, 1.177734375, 1.2998046875, 1.421875, 1.5439453125, 1.666015625, 1.7880859375, 1.91015625, 2.0322265625, 2.154296875, 2.2763671875, 2.3984375, 2.5205078125, 2.642578125, 2.7646484375, 2.88671875, 3.0087890625, 3.130859375, 3.2529296875, 3.375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 7.0, 10.0, 18.0, 14.0, 36.0, 35.0, 62.0, 88.0, 163.0, 310.0, 680.0, 1563.0, 5208.0, 39891.0, 3849853.0, 282621.0, 9928.0, 2313.0, 776.0, 351.0, 140.0, 78.0, 38.0, 37.0, 17.0, 10.0, 7.0, 6.0, 9.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.96875, -24.306640625, -23.64453125, -22.982421875, -22.3203125, -21.658203125, -20.99609375, -20.333984375, -19.671875, -19.009765625, -18.34765625, -17.685546875, -17.0234375, -16.361328125, -15.69921875, -15.037109375, -14.375, -13.712890625, -13.05078125, -12.388671875, -11.7265625, -11.064453125, -10.40234375, -9.740234375, -9.078125, -8.416015625, -7.75390625, -7.091796875, -6.4296875, -5.767578125, -5.10546875, -4.443359375, -3.78125, -3.119140625, -2.45703125, -1.794921875, -1.1328125, -0.470703125, 0.19140625, 0.853515625, 1.515625, 2.177734375, 2.83984375, 3.501953125, 4.1640625, 4.826171875, 5.48828125, 6.150390625, 6.8125, 7.474609375, 8.13671875, 8.798828125, 9.4609375, 10.123046875, 10.78515625, 11.447265625, 12.109375, 12.771484375, 13.43359375, 14.095703125, 14.7578125, 15.419921875, 16.08203125, 16.744140625, 17.40625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 5.0, 7.0, 5.0, 5.0, 10.0, 18.0, 15.0, 34.0, 50.0, 46.0, 96.0, 117.0, 237.0, 334.0, 473.0, 627.0, 629.0, 455.0, 342.0, 185.0, 109.0, 63.0, 46.0, 42.0, 26.0, 24.0, 22.0, 11.0, 7.0, 5.0, 3.0, 3.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.51953125, -7.290283203125, -7.06103515625, -6.831787109375, -6.6025390625, -6.373291015625, -6.14404296875, -5.914794921875, -5.685546875, -5.456298828125, -5.22705078125, -4.997802734375, -4.7685546875, -4.539306640625, -4.31005859375, -4.080810546875, -3.8515625, -3.622314453125, -3.39306640625, -3.163818359375, -2.9345703125, -2.705322265625, -2.47607421875, -2.246826171875, -2.017578125, -1.788330078125, -1.55908203125, -1.329833984375, -1.1005859375, -0.871337890625, -0.64208984375, -0.412841796875, -0.18359375, 0.045654296875, 0.27490234375, 0.504150390625, 0.7333984375, 0.962646484375, 1.19189453125, 1.421142578125, 1.650390625, 1.879638671875, 2.10888671875, 2.338134765625, 2.5673828125, 2.796630859375, 3.02587890625, 3.255126953125, 3.484375, 3.713623046875, 3.94287109375, 4.172119140625, 4.4013671875, 4.630615234375, 4.85986328125, 5.089111328125, 5.318359375, 5.547607421875, 5.77685546875, 6.006103515625, 6.2353515625, 6.464599609375, 6.69384765625, 6.923095703125, 7.15234375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 8.0, 13.0, 18.0, 21.0, 42.0, 64.0, 107.0, 198.0, 276.0, 520.0, 995.0, 1585.0, 2913.0, 5787.0, 12732.0, 34248.0, 138317.0, 1094385.0, 2462918.0, 340120.0, 62008.0, 19850.0, 8273.0, 3974.0, 2024.0, 1181.0, 673.0, 421.0, 229.0, 145.0, 99.0, 53.0, 29.0, 22.0, 12.0, 7.0, 10.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.875, -10.52685546875, -10.1787109375, -9.83056640625, -9.482421875, -9.13427734375, -8.7861328125, -8.43798828125, -8.08984375, -7.74169921875, -7.3935546875, -7.04541015625, -6.697265625, -6.34912109375, -6.0009765625, -5.65283203125, -5.3046875, -4.95654296875, -4.6083984375, -4.26025390625, -3.912109375, -3.56396484375, -3.2158203125, -2.86767578125, -2.51953125, -2.17138671875, -1.8232421875, -1.47509765625, -1.126953125, -0.77880859375, -0.4306640625, -0.08251953125, 0.265625, 0.61376953125, 0.9619140625, 1.31005859375, 1.658203125, 2.00634765625, 2.3544921875, 2.70263671875, 3.05078125, 3.39892578125, 3.7470703125, 4.09521484375, 4.443359375, 4.79150390625, 5.1396484375, 5.48779296875, 5.8359375, 6.18408203125, 6.5322265625, 6.88037109375, 7.228515625, 7.57666015625, 7.9248046875, 8.27294921875, 8.62109375, 8.96923828125, 9.3173828125, 9.66552734375, 10.013671875, 10.36181640625, 10.7099609375, 11.05810546875, 11.40625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 10.0, 23.0, 27.0, 60.0, 86.0, 121.0, 162.0, 128.0, 139.0, 91.0, 60.0, 41.0, 27.0, 14.0, 5.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.423763275146484, -59.6796760559082, -57.93558883666992, -56.19150161743164, -54.447410583496094, -52.70332336425781, -50.95923614501953, -49.21514892578125, -47.47106170654297, -45.72697448730469, -43.982887268066406, -42.238800048828125, -40.494712829589844, -38.75062561035156, -37.006534576416016, -35.262447357177734, -33.51836013793945, -31.774272918701172, -30.03018569946289, -28.286096572875977, -26.542009353637695, -24.797922134399414, -23.0538330078125, -21.30974578857422, -19.565658569335938, -17.821571350097656, -16.077484130859375, -14.333395004272461, -12.58930778503418, -10.845220565795898, -9.1011323928833, -7.357044219970703, -5.612953186035156, -3.868865489959717, -2.1247777938842773, -0.3806900978088379, 1.3633975982666016, 3.107484817504883, 4.8515729904174805, 6.595661163330078, 8.33974838256836, 10.08383560180664, 11.827923774719238, 13.572011947631836, 15.316099166870117, 17.0601863861084, 18.804275512695312, 20.548362731933594, 22.292449951171875, 24.036537170410156, 25.780624389648438, 27.52471351623535, 29.268800735473633, 31.012887954711914, 32.75697708129883, 34.50106430053711, 36.24515151977539, 37.98923873901367, 39.73332595825195, 41.477413177490234, 43.22150421142578, 44.96559143066406, 46.709678649902344, 48.453765869140625, 50.197853088378906]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 0.0, 3.0, 2.0, 3.0, 8.0, 0.0, 5.0, 6.0, 5.0, 13.0, 6.0, 13.0, 18.0, 15.0, 24.0, 20.0, 16.0, 19.0, 30.0, 31.0, 20.0, 41.0, 39.0, 39.0, 40.0, 37.0, 30.0, 53.0, 36.0, 37.0, 24.0, 53.0, 35.0, 33.0, 36.0, 31.0, 34.0, 22.0, 17.0, 18.0, 14.0, 13.0, 11.0, 12.0, 7.0, 8.0, 11.0, 10.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-19.55889129638672, -18.92671775817871, -18.294546127319336, -17.662372589111328, -17.03019905090332, -16.398025512695312, -15.765853881835938, -15.13368034362793, -14.501507759094238, -13.869335174560547, -13.237161636352539, -12.604989051818848, -11.972816467285156, -11.340642929077148, -10.708470344543457, -10.076297760009766, -9.444124221801758, -8.811951637268066, -8.179778099060059, -7.547605514526367, -6.915432453155518, -6.283259391784668, -5.651086807250977, -5.018913745880127, -4.386740684509277, -3.7545676231384277, -3.1223948001861572, -2.4902219772338867, -1.858048915863037, -1.2258758544921875, -0.593703031539917, 0.038469791412353516, 0.6706409454345703, 1.3028138875961304, 1.9349868297576904, 2.567159652709961, 3.1993327140808105, 3.83150577545166, 4.463678359985352, 5.095851421356201, 5.728024482727051, 6.3601975440979, 6.99237060546875, 7.624543190002441, 8.256715774536133, 8.88888931274414, 9.521061897277832, 10.153234481811523, 10.785408020019531, 11.417580604553223, 12.04975414276123, 12.681926727294922, 13.31410026550293, 13.946272850036621, 14.578445434570312, 15.21061897277832, 15.842791557312012, 16.474964141845703, 17.10713768005371, 17.73931121826172, 18.371482849121094, 19.0036563873291, 19.63582992553711, 20.268001556396484, 20.900175094604492]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 5.0, 11.0, 9.0, 16.0, 23.0, 31.0, 39.0, 49.0, 51.0, 49.0, 67.0, 73.0, 83.0, 82.0, 77.0, 78.0, 64.0, 47.0, 39.0, 29.0, 23.0, 22.0, 13.0, 10.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.30078125, -4.18353271484375, -4.0662841796875, -3.94903564453125, -3.831787109375, -3.71453857421875, -3.5972900390625, -3.48004150390625, -3.36279296875, -3.24554443359375, -3.1282958984375, -3.01104736328125, -2.893798828125, -2.77655029296875, -2.6593017578125, -2.54205322265625, -2.4248046875, -2.30755615234375, -2.1903076171875, -2.07305908203125, -1.955810546875, -1.83856201171875, -1.7213134765625, -1.60406494140625, -1.48681640625, -1.36956787109375, -1.2523193359375, -1.13507080078125, -1.017822265625, -0.90057373046875, -0.7833251953125, -0.66607666015625, -0.548828125, -0.43157958984375, -0.3143310546875, -0.19708251953125, -0.079833984375, 0.03741455078125, 0.1546630859375, 0.27191162109375, 0.38916015625, 0.50640869140625, 0.6236572265625, 0.74090576171875, 0.858154296875, 0.97540283203125, 1.0926513671875, 1.20989990234375, 1.3271484375, 1.44439697265625, 1.5616455078125, 1.67889404296875, 1.796142578125, 1.91339111328125, 2.0306396484375, 2.14788818359375, 2.26513671875, 2.38238525390625, 2.4996337890625, 2.61688232421875, 2.734130859375, 2.85137939453125, 2.9686279296875, 3.08587646484375, 3.203125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 5.0, 8.0, 15.0, 23.0, 22.0, 53.0, 43.0, 64.0, 111.0, 141.0, 231.0, 354.0, 592.0, 1121.0, 1933.0, 3581.0, 6898.0, 13938.0, 32444.0, 83191.0, 281711.0, 430056.0, 113770.0, 42163.0, 18028.0, 8326.0, 4300.0, 2235.0, 1268.0, 661.0, 397.0, 278.0, 186.0, 118.0, 77.0, 57.0, 46.0, 31.0, 20.0, 19.0, 7.0, 8.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.220703125, -0.21361732482910156, -0.20653152465820312, -0.1994457244873047, -0.19235992431640625, -0.1852741241455078, -0.17818832397460938, -0.17110252380371094, -0.1640167236328125, -0.15693092346191406, -0.14984512329101562, -0.1427593231201172, -0.13567352294921875, -0.1285877227783203, -0.12150192260742188, -0.11441612243652344, -0.107330322265625, -0.10024452209472656, -0.09315872192382812, -0.08607292175292969, -0.07898712158203125, -0.07190132141113281, -0.06481552124023438, -0.05772972106933594, -0.0506439208984375, -0.04355812072753906, -0.036472320556640625, -0.029386520385742188, -0.02230072021484375, -0.015214920043945312, -0.008129119873046875, -0.0010433197021484375, 0.00604248046875, 0.013128280639648438, 0.020214080810546875, 0.027299880981445312, 0.03438568115234375, 0.04147148132324219, 0.048557281494140625, 0.05564308166503906, 0.0627288818359375, 0.06981468200683594, 0.07690048217773438, 0.08398628234863281, 0.09107208251953125, 0.09815788269042969, 0.10524368286132812, 0.11232948303222656, 0.119415283203125, 0.12650108337402344, 0.13358688354492188, 0.1406726837158203, 0.14775848388671875, 0.1548442840576172, 0.16193008422851562, 0.16901588439941406, 0.1761016845703125, 0.18318748474121094, 0.19027328491210938, 0.1973590850830078, 0.20444488525390625, 0.2115306854248047, 0.21861648559570312, 0.22570228576660156, 0.2327880859375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 6.0, 1.0, 5.0, 3.0, 3.0, 12.0, 5.0, 10.0, 13.0, 20.0, 25.0, 18.0, 23.0, 22.0, 23.0, 28.0, 27.0, 33.0, 26.0, 35.0, 32.0, 35.0, 49.0, 46.0, 1064.0, 41.0, 26.0, 40.0, 26.0, 36.0, 45.0, 25.0, 27.0, 30.0, 20.0, 19.0, 15.0, 22.0, 16.0, 12.0, 13.0, 6.0, 8.0, 11.0, 8.0, 8.0, 2.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.75390625, -1.6923828125, -1.630859375, -1.5693359375, -1.5078125, -1.4462890625, -1.384765625, -1.3232421875, -1.26171875, -1.2001953125, -1.138671875, -1.0771484375, -1.015625, -0.9541015625, -0.892578125, -0.8310546875, -0.76953125, -0.7080078125, -0.646484375, -0.5849609375, -0.5234375, -0.4619140625, -0.400390625, -0.3388671875, -0.27734375, -0.2158203125, -0.154296875, -0.0927734375, -0.03125, 0.0302734375, 0.091796875, 0.1533203125, 0.21484375, 0.2763671875, 0.337890625, 0.3994140625, 0.4609375, 0.5224609375, 0.583984375, 0.6455078125, 0.70703125, 0.7685546875, 0.830078125, 0.8916015625, 0.953125, 1.0146484375, 1.076171875, 1.1376953125, 1.19921875, 1.2607421875, 1.322265625, 1.3837890625, 1.4453125, 1.5068359375, 1.568359375, 1.6298828125, 1.69140625, 1.7529296875, 1.814453125, 1.8759765625, 1.9375, 1.9990234375, 2.060546875, 2.1220703125, 2.18359375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 6.0, 5.0, 8.0, 17.0, 20.0, 23.0, 26.0, 62.0, 61.0, 102.0, 148.0, 197.0, 267.0, 378.0, 563.0, 667.0, 927.0, 1296.0, 1818.0, 2533.0, 3623.0, 5171.0, 7089.0, 10240.0, 14920.0, 21567.0, 32635.0, 49898.0, 81573.0, 152216.0, 1317566.0, 154009.0, 81820.0, 50179.0, 32756.0, 21974.0, 15061.0, 10414.0, 7319.0, 5150.0, 3673.0, 2563.0, 1957.0, 1348.0, 968.0, 687.0, 444.0, 368.0, 223.0, 182.0, 115.0, 89.0, 60.0, 50.0, 30.0, 33.0, 18.0, 9.0, 11.0, 7.0, 4.0, 4.0], "bins": [-0.043121337890625, -0.041794776916503906, -0.04046821594238281, -0.03914165496826172, -0.037815093994140625, -0.03648853302001953, -0.03516197204589844, -0.033835411071777344, -0.03250885009765625, -0.031182289123535156, -0.029855728149414062, -0.02852916717529297, -0.027202606201171875, -0.02587604522705078, -0.024549484252929688, -0.023222923278808594, -0.0218963623046875, -0.020569801330566406, -0.019243240356445312, -0.01791667938232422, -0.016590118408203125, -0.015263557434082031, -0.013936996459960938, -0.012610435485839844, -0.01128387451171875, -0.009957313537597656, -0.008630752563476562, -0.007304191589355469, -0.005977630615234375, -0.004651069641113281, -0.0033245086669921875, -0.0019979476928710938, -0.00067138671875, 0.0006551742553710938, 0.0019817352294921875, 0.0033082962036132812, 0.004634857177734375, 0.005961418151855469, 0.0072879791259765625, 0.008614540100097656, 0.00994110107421875, 0.011267662048339844, 0.012594223022460938, 0.013920783996582031, 0.015247344970703125, 0.01657390594482422, 0.017900466918945312, 0.019227027893066406, 0.0205535888671875, 0.021880149841308594, 0.023206710815429688, 0.02453327178955078, 0.025859832763671875, 0.02718639373779297, 0.028512954711914062, 0.029839515686035156, 0.03116607666015625, 0.032492637634277344, 0.03381919860839844, 0.03514575958251953, 0.036472320556640625, 0.03779888153076172, 0.03912544250488281, 0.040452003479003906, 0.041778564453125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 6.0, 8.0, 15.0, 14.0, 17.0, 16.0, 14.0, 17.0, 24.0, 42.0, 32.0, 50.0, 77.0, 103.0, 111.0, 100.0, 88.0, 48.0, 40.0, 31.0, 31.0, 22.0, 15.0, 20.0, 5.0, 12.0, 4.0, 10.0, 4.0, 2.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005235671997070312, -0.0005052238702774048, -0.0004868805408477783, -0.00046853721141815186, -0.0004501938819885254, -0.0004318505525588989, -0.00041350722312927246, -0.000395163893699646, -0.00037682056427001953, -0.00035847723484039307, -0.0003401339054107666, -0.00032179057598114014, -0.00030344724655151367, -0.0002851039171218872, -0.00026676058769226074, -0.0002484172582626343, -0.0002300739288330078, -0.00021173059940338135, -0.00019338726997375488, -0.00017504394054412842, -0.00015670061111450195, -0.0001383572816848755, -0.00012001395225524902, -0.00010167062282562256, -8.33272933959961e-05, -6.498396396636963e-05, -4.6640634536743164e-05, -2.82973051071167e-05, -9.953975677490234e-06, 8.38935375213623e-06, 2.6732683181762695e-05, 4.507601261138916e-05, 6.341934204101562e-05, 8.176267147064209e-05, 0.00010010600090026855, 0.00011844933032989502, 0.00013679265975952148, 0.00015513598918914795, 0.00017347931861877441, 0.00019182264804840088, 0.00021016597747802734, 0.0002285093069076538, 0.0002468526363372803, 0.00026519596576690674, 0.0002835392951965332, 0.00030188262462615967, 0.00032022595405578613, 0.0003385692834854126, 0.00035691261291503906, 0.00037525594234466553, 0.000393599271774292, 0.00041194260120391846, 0.0004302859306335449, 0.0004486292600631714, 0.00046697258949279785, 0.0004853159189224243, 0.0005036592483520508, 0.0005220025777816772, 0.0005403459072113037, 0.0005586892366409302, 0.0005770325660705566, 0.0005953758955001831, 0.0006137192249298096, 0.000632062554359436, 0.0006504058837890625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 5.0, 5.0, 7.0, 9.0, 13.0, 21.0, 21.0, 29.0, 57.0, 67.0, 96.0, 126.0, 210.0, 886.0, 8087.0, 155497.0, 844419.0, 35458.0, 2582.0, 418.0, 177.0, 99.0, 64.0, 35.0, 38.0, 31.0, 24.0, 18.0, 12.0, 9.0, 13.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01025390625, -0.009963154792785645, -0.009672403335571289, -0.009381651878356934, -0.009090900421142578, -0.008800148963928223, -0.008509397506713867, -0.008218646049499512, -0.007927894592285156, -0.007637143135070801, -0.007346391677856445, -0.00705564022064209, -0.006764888763427734, -0.006474137306213379, -0.0061833858489990234, -0.005892634391784668, -0.0056018829345703125, -0.005311131477355957, -0.0050203800201416016, -0.004729628562927246, -0.004438877105712891, -0.004148125648498535, -0.0038573741912841797, -0.0035666227340698242, -0.0032758712768554688, -0.0029851198196411133, -0.002694368362426758, -0.0024036169052124023, -0.002112865447998047, -0.0018221139907836914, -0.001531362533569336, -0.0012406110763549805, -0.000949859619140625, -0.0006591081619262695, -0.00036835670471191406, -7.76052474975586e-05, 0.00021314620971679688, 0.0005038976669311523, 0.0007946491241455078, 0.0010854005813598633, 0.0013761520385742188, 0.0016669034957885742, 0.0019576549530029297, 0.002248406410217285, 0.0025391578674316406, 0.002829909324645996, 0.0031206607818603516, 0.003411412239074707, 0.0037021636962890625, 0.003992915153503418, 0.0042836666107177734, 0.004574418067932129, 0.004865169525146484, 0.00515592098236084, 0.005446672439575195, 0.005737423896789551, 0.006028175354003906, 0.006318926811218262, 0.006609678268432617, 0.006900429725646973, 0.007191181182861328, 0.007481932640075684, 0.007772684097290039, 0.008063435554504395, 0.00835418701171875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 11.0, 51.0, 607.0, 323.0, 24.0], "bins": [-0.013291134499013424, -0.013076398521661758, -0.012861662544310093, -0.012646926566958427, -0.012432190589606762, -0.012217454612255096, -0.012002719566226006, -0.01178798358887434, -0.011573247611522675, -0.011358511634171009, -0.011143775656819344, -0.010929039679467678, -0.010714303702116013, -0.010499568656086922, -0.010284831747412682, -0.01007009670138359, -0.00985535979270935, -0.009640623815357685, -0.00942588783800602, -0.009211151860654354, -0.008996415883302689, -0.008781680837273598, -0.008566943928599358, -0.008352208882570267, -0.008137472905218601, -0.007922736927866936, -0.00770800095051527, -0.007493264973163605, -0.0072785294614732265, -0.007063793484121561, -0.0068490575067698956, -0.00663432152941823, -0.0064195855520665646, -0.006204849574714899, -0.0059901135973632336, -0.005775378085672855, -0.00556064210832119, -0.005345906130969524, -0.005131170153617859, -0.004916434176266193, -0.004701698198914528, -0.004486962221562862, -0.004272226244211197, -0.004057490266859531, -0.003842754755169153, -0.0036280187778174877, -0.0034132828004658222, -0.0031985468231141567, -0.0029838113114237785, -0.002769075334072113, -0.002554339589551091, -0.0023396036121994257, -0.002124867867678404, -0.0019101318903267384, -0.0016953959129750729, -0.0014806600520387292, -0.0012659241911023855, -0.0010511883301660419, -0.0008364524110220373, -0.0006217164918780327, -0.000406980630941689, -0.00019224477000534534, 2.2491207346320152e-05, 0.00023722706828266382, 0.0004519629292190075]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 10.0, 14.0, 15.0, 21.0, 36.0, 26.0, 46.0, 43.0, 48.0, 64.0, 55.0, 64.0, 59.0, 70.0, 61.0, 62.0, 53.0, 52.0, 42.0, 31.0, 26.0, 25.0, 21.0, 19.0, 13.0, 6.0, 12.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005148649215698242, -0.0004944652318954468, -0.00047406554222106934, -0.0004536658525466919, -0.00043326616287231445, -0.000412866473197937, -0.00039246678352355957, -0.00037206709384918213, -0.0003516674041748047, -0.00033126771450042725, -0.0003108680248260498, -0.00029046833515167236, -0.0002700686454772949, -0.0002496689558029175, -0.00022926926612854004, -0.0002088695764541626, -0.00018846988677978516, -0.00016807019710540771, -0.00014767050743103027, -0.00012727081775665283, -0.00010687112808227539, -8.647143840789795e-05, -6.607174873352051e-05, -4.5672059059143066e-05, -2.5272369384765625e-05, -4.872679710388184e-06, 1.5527009963989258e-05, 3.59266996383667e-05, 5.632638931274414e-05, 7.672607898712158e-05, 9.712576866149902e-05, 0.00011752545833587646, 0.0001379251480102539, 0.00015832483768463135, 0.0001787245273590088, 0.00019912421703338623, 0.00021952390670776367, 0.0002399235963821411, 0.00026032328605651855, 0.000280722975730896, 0.00030112266540527344, 0.0003215223550796509, 0.0003419220447540283, 0.00036232173442840576, 0.0003827214241027832, 0.00040312111377716064, 0.0004235208034515381, 0.00044392049312591553, 0.00046432018280029297, 0.0004847198724746704, 0.0005051195621490479, 0.0005255192518234253, 0.0005459189414978027, 0.0005663186311721802, 0.0005867183208465576, 0.0006071180105209351, 0.0006275177001953125, 0.0006479173898696899, 0.0006683170795440674, 0.0006887167692184448, 0.0007091164588928223, 0.0007295161485671997, 0.0007499158382415771, 0.0007703155279159546, 0.000790715217590332]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 5.0, 11.0, 9.0, 16.0, 23.0, 31.0, 39.0, 49.0, 51.0, 49.0, 67.0, 73.0, 83.0, 82.0, 77.0, 78.0, 64.0, 47.0, 39.0, 29.0, 23.0, 22.0, 13.0, 10.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.30078125, -4.18353271484375, -4.0662841796875, -3.94903564453125, -3.831787109375, -3.71453857421875, -3.5972900390625, -3.48004150390625, -3.36279296875, -3.24554443359375, -3.1282958984375, -3.01104736328125, -2.893798828125, -2.77655029296875, -2.6593017578125, -2.54205322265625, -2.4248046875, -2.30755615234375, -2.1903076171875, -2.07305908203125, -1.955810546875, -1.83856201171875, -1.7213134765625, -1.60406494140625, -1.48681640625, -1.36956787109375, -1.2523193359375, -1.13507080078125, -1.017822265625, -0.90057373046875, -0.7833251953125, -0.66607666015625, -0.548828125, -0.43157958984375, -0.3143310546875, -0.19708251953125, -0.079833984375, 0.03741455078125, 0.1546630859375, 0.27191162109375, 0.38916015625, 0.50640869140625, 0.6236572265625, 0.74090576171875, 0.858154296875, 0.97540283203125, 1.0926513671875, 1.20989990234375, 1.3271484375, 1.44439697265625, 1.5616455078125, 1.67889404296875, 1.796142578125, 1.91339111328125, 2.0306396484375, 2.14788818359375, 2.26513671875, 2.38238525390625, 2.4996337890625, 2.61688232421875, 2.734130859375, 2.85137939453125, 2.9686279296875, 3.08587646484375, 3.203125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 8.0, 9.0, 11.0, 21.0, 21.0, 46.0, 73.0, 127.0, 209.0, 501.0, 1128.0, 3242.0, 13089.0, 91205.0, 814384.0, 104808.0, 13904.0, 3544.0, 1207.0, 488.0, 224.0, 120.0, 63.0, 44.0, 32.0, 15.0, 13.0, 12.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2578125, -10.9219970703125, -10.586181640625, -10.2503662109375, -9.91455078125, -9.5787353515625, -9.242919921875, -8.9071044921875, -8.5712890625, -8.2354736328125, -7.899658203125, -7.5638427734375, -7.22802734375, -6.8922119140625, -6.556396484375, -6.2205810546875, -5.884765625, -5.5489501953125, -5.213134765625, -4.8773193359375, -4.54150390625, -4.2056884765625, -3.869873046875, -3.5340576171875, -3.1982421875, -2.8624267578125, -2.526611328125, -2.1907958984375, -1.85498046875, -1.5191650390625, -1.183349609375, -0.8475341796875, -0.51171875, -0.1759033203125, 0.159912109375, 0.4957275390625, 0.83154296875, 1.1673583984375, 1.503173828125, 1.8389892578125, 2.1748046875, 2.5106201171875, 2.846435546875, 3.1822509765625, 3.51806640625, 3.8538818359375, 4.189697265625, 4.5255126953125, 4.861328125, 5.1971435546875, 5.532958984375, 5.8687744140625, 6.20458984375, 6.5404052734375, 6.876220703125, 7.2120361328125, 7.5478515625, 7.8836669921875, 8.219482421875, 8.5552978515625, 8.89111328125, 9.2269287109375, 9.562744140625, 9.8985595703125, 10.234375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 6.0, 10.0, 4.0, 5.0, 5.0, 7.0, 5.0, 7.0, 15.0, 15.0, 25.0, 21.0, 24.0, 25.0, 23.0, 48.0, 33.0, 19.0, 39.0, 46.0, 58.0, 64.0, 110.0, 190.0, 1367.0, 236.0, 120.0, 52.0, 53.0, 43.0, 43.0, 43.0, 32.0, 26.0, 17.0, 34.0, 24.0, 20.0, 28.0, 18.0, 15.0, 13.0, 8.0, 11.0, 9.0, 10.0, 6.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.86328125, -6.6466064453125, -6.429931640625, -6.2132568359375, -5.99658203125, -5.7799072265625, -5.563232421875, -5.3465576171875, -5.1298828125, -4.9132080078125, -4.696533203125, -4.4798583984375, -4.26318359375, -4.0465087890625, -3.829833984375, -3.6131591796875, -3.396484375, -3.1798095703125, -2.963134765625, -2.7464599609375, -2.52978515625, -2.3131103515625, -2.096435546875, -1.8797607421875, -1.6630859375, -1.4464111328125, -1.229736328125, -1.0130615234375, -0.79638671875, -0.5797119140625, -0.363037109375, -0.1463623046875, 0.0703125, 0.2869873046875, 0.503662109375, 0.7203369140625, 0.93701171875, 1.1536865234375, 1.370361328125, 1.5870361328125, 1.8037109375, 2.0203857421875, 2.237060546875, 2.4537353515625, 2.67041015625, 2.8870849609375, 3.103759765625, 3.3204345703125, 3.537109375, 3.7537841796875, 3.970458984375, 4.1871337890625, 4.40380859375, 4.6204833984375, 4.837158203125, 5.0538330078125, 5.2705078125, 5.4871826171875, 5.703857421875, 5.9205322265625, 6.13720703125, 6.3538818359375, 6.570556640625, 6.7872314453125, 7.00390625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 12.0, 21.0, 12.0, 14.0, 17.0, 28.0, 42.0, 53.0, 59.0, 124.0, 173.0, 227.0, 423.0, 740.0, 1421.0, 2856.0, 6097.0, 14951.0, 46549.0, 355342.0, 2486689.0, 174935.0, 33365.0, 11538.0, 4935.0, 2216.0, 1134.0, 636.0, 341.0, 232.0, 136.0, 85.0, 75.0, 47.0, 42.0, 20.0, 24.0, 14.0, 13.0, 8.0, 13.0, 8.0, 4.0, 3.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0], "bins": [-10.9765625, -10.637451171875, -10.29833984375, -9.959228515625, -9.6201171875, -9.281005859375, -8.94189453125, -8.602783203125, -8.263671875, -7.924560546875, -7.58544921875, -7.246337890625, -6.9072265625, -6.568115234375, -6.22900390625, -5.889892578125, -5.55078125, -5.211669921875, -4.87255859375, -4.533447265625, -4.1943359375, -3.855224609375, -3.51611328125, -3.177001953125, -2.837890625, -2.498779296875, -2.15966796875, -1.820556640625, -1.4814453125, -1.142333984375, -0.80322265625, -0.464111328125, -0.125, 0.214111328125, 0.55322265625, 0.892333984375, 1.2314453125, 1.570556640625, 1.90966796875, 2.248779296875, 2.587890625, 2.927001953125, 3.26611328125, 3.605224609375, 3.9443359375, 4.283447265625, 4.62255859375, 4.961669921875, 5.30078125, 5.639892578125, 5.97900390625, 6.318115234375, 6.6572265625, 6.996337890625, 7.33544921875, 7.674560546875, 8.013671875, 8.352783203125, 8.69189453125, 9.031005859375, 9.3701171875, 9.709228515625, 10.04833984375, 10.387451171875, 10.7265625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [4.0, 140.0, 809.0, 65.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.585744857788086, -10.903063774108887, -3.2203826904296875, 4.462297439575195, 12.144979476928711, 19.827661514282227, 27.510339736938477, 35.193023681640625, 42.875701904296875, 50.55838394165039, 58.241065979003906, 65.92374420166016, 73.60643005371094, 81.28910827636719, 88.97178649902344, 96.65446472167969, 104.33715057373047, 112.01982879638672, 119.7025146484375, 127.38519287109375, 135.06787109375, 142.75054931640625, 150.4332275390625, 158.1159210205078, 165.79859924316406, 173.4812774658203, 181.16395568847656, 188.84664916992188, 196.52932739257812, 204.21200561523438, 211.89468383789062, 219.57736206054688, 227.26004028320312, 234.94271850585938, 242.62539672851562, 250.30807495117188, 257.9907531738281, 265.6734619140625, 273.35614013671875, 281.038818359375, 288.72149658203125, 296.4041748046875, 304.08685302734375, 311.76953125, 319.45220947265625, 327.1348876953125, 334.81756591796875, 342.5002746582031, 350.18292236328125, 357.8656005859375, 365.54827880859375, 373.23095703125, 380.91363525390625, 388.5963134765625, 396.27899169921875, 403.9617004394531, 411.6443786621094, 419.3270568847656, 427.0097351074219, 434.6924133300781, 442.3750915527344, 450.05780029296875, 457.740478515625, 465.42315673828125, 473.1058349609375]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 11.0, 5.0, 12.0, 8.0, 15.0, 22.0, 19.0, 20.0, 25.0, 18.0, 34.0, 30.0, 28.0, 27.0, 33.0, 56.0, 37.0, 35.0, 33.0, 36.0, 35.0, 45.0, 49.0, 34.0, 40.0, 38.0, 38.0, 28.0, 17.0, 21.0, 24.0, 16.0, 20.0, 18.0, 17.0, 8.0, 8.0, 4.0, 7.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.87702751159668, -28.988431930541992, -28.099836349487305, -27.211238861083984, -26.322643280029297, -25.43404769897461, -24.545452117919922, -23.656856536865234, -22.768260955810547, -21.87966537475586, -20.991069793701172, -20.102474212646484, -19.213876724243164, -18.325281143188477, -17.43668556213379, -16.5480899810791, -15.659492492675781, -14.770896911621094, -13.88230037689209, -12.993704795837402, -12.105108261108398, -11.216512680053711, -10.327917098999023, -9.439321517944336, -8.550724983215332, -7.662128925323486, -6.773532867431641, -5.884937286376953, -4.996341228485107, -4.107745170593262, -3.219149589538574, -2.3305535316467285, -1.4419574737548828, -0.5533615350723267, 0.3352344036102295, 1.223830223083496, 2.112426280975342, 3.0010223388671875, 3.889617919921875, 4.778213977813721, 5.666810035705566, 6.555406093597412, 7.444002151489258, 8.332597732543945, 9.221193313598633, 10.109789848327637, 10.998385429382324, 11.886981964111328, 12.775577545166016, 13.664173126220703, 14.552769660949707, 15.441365242004395, 16.3299617767334, 17.218557357788086, 18.107152938842773, 18.99574851989746, 19.88434600830078, 20.77294158935547, 21.661537170410156, 22.550132751464844, 23.438730239868164, 24.32732582092285, 25.21592140197754, 26.104516983032227, 26.993112564086914]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 6.0, 14.0, 10.0, 16.0, 37.0, 31.0, 34.0, 46.0, 53.0, 42.0, 59.0, 63.0, 86.0, 83.0, 58.0, 77.0, 67.0, 37.0, 46.0, 35.0, 24.0, 25.0, 19.0, 12.0, 4.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1171875, -4.005035400390625, -3.89288330078125, -3.780731201171875, -3.6685791015625, -3.556427001953125, -3.44427490234375, -3.332122802734375, -3.219970703125, -3.107818603515625, -2.99566650390625, -2.883514404296875, -2.7713623046875, -2.659210205078125, -2.54705810546875, -2.434906005859375, -2.32275390625, -2.210601806640625, -2.09844970703125, -1.986297607421875, -1.8741455078125, -1.761993408203125, -1.64984130859375, -1.537689208984375, -1.425537109375, -1.313385009765625, -1.20123291015625, -1.089080810546875, -0.9769287109375, -0.864776611328125, -0.75262451171875, -0.640472412109375, -0.5283203125, -0.416168212890625, -0.30401611328125, -0.191864013671875, -0.0797119140625, 0.032440185546875, 0.14459228515625, 0.256744384765625, 0.368896484375, 0.481048583984375, 0.59320068359375, 0.705352783203125, 0.8175048828125, 0.929656982421875, 1.04180908203125, 1.153961181640625, 1.26611328125, 1.378265380859375, 1.49041748046875, 1.602569580078125, 1.7147216796875, 1.826873779296875, 1.93902587890625, 2.051177978515625, 2.163330078125, 2.275482177734375, 2.38763427734375, 2.499786376953125, 2.6119384765625, 2.724090576171875, 2.83624267578125, 2.948394775390625, 3.060546875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 12.0, 12.0, 23.0, 23.0, 20.0, 48.0, 45.0, 102.0, 163.0, 273.0, 494.0, 918.0, 1918.0, 5519.0, 21902.0, 458838.0, 3565933.0, 119277.0, 12673.0, 3553.0, 1277.0, 566.0, 284.0, 150.0, 99.0, 66.0, 28.0, 12.0, 13.0, 10.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.828125, -17.374755859375, -16.92138671875, -16.468017578125, -16.0146484375, -15.561279296875, -15.10791015625, -14.654541015625, -14.201171875, -13.747802734375, -13.29443359375, -12.841064453125, -12.3876953125, -11.934326171875, -11.48095703125, -11.027587890625, -10.57421875, -10.120849609375, -9.66748046875, -9.214111328125, -8.7607421875, -8.307373046875, -7.85400390625, -7.400634765625, -6.947265625, -6.493896484375, -6.04052734375, -5.587158203125, -5.1337890625, -4.680419921875, -4.22705078125, -3.773681640625, -3.3203125, -2.866943359375, -2.41357421875, -1.960205078125, -1.5068359375, -1.053466796875, -0.60009765625, -0.146728515625, 0.306640625, 0.760009765625, 1.21337890625, 1.666748046875, 2.1201171875, 2.573486328125, 3.02685546875, 3.480224609375, 3.93359375, 4.386962890625, 4.84033203125, 5.293701171875, 5.7470703125, 6.200439453125, 6.65380859375, 7.107177734375, 7.560546875, 8.013916015625, 8.46728515625, 8.920654296875, 9.3740234375, 9.827392578125, 10.28076171875, 10.734130859375, 11.1875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 10.0, 16.0, 15.0, 19.0, 44.0, 73.0, 93.0, 144.0, 274.0, 439.0, 654.0, 779.0, 582.0, 364.0, 202.0, 111.0, 97.0, 52.0, 25.0, 18.0, 15.0, 8.0, 11.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6328125, -8.3380126953125, -8.043212890625, -7.7484130859375, -7.45361328125, -7.1588134765625, -6.864013671875, -6.5692138671875, -6.2744140625, -5.9796142578125, -5.684814453125, -5.3900146484375, -5.09521484375, -4.8004150390625, -4.505615234375, -4.2108154296875, -3.916015625, -3.6212158203125, -3.326416015625, -3.0316162109375, -2.73681640625, -2.4420166015625, -2.147216796875, -1.8524169921875, -1.5576171875, -1.2628173828125, -0.968017578125, -0.6732177734375, -0.37841796875, -0.0836181640625, 0.211181640625, 0.5059814453125, 0.80078125, 1.0955810546875, 1.390380859375, 1.6851806640625, 1.97998046875, 2.2747802734375, 2.569580078125, 2.8643798828125, 3.1591796875, 3.4539794921875, 3.748779296875, 4.0435791015625, 4.33837890625, 4.6331787109375, 4.927978515625, 5.2227783203125, 5.517578125, 5.8123779296875, 6.107177734375, 6.4019775390625, 6.69677734375, 6.9915771484375, 7.286376953125, 7.5811767578125, 7.8759765625, 8.1707763671875, 8.465576171875, 8.7603759765625, 9.05517578125, 9.3499755859375, 9.644775390625, 9.9395751953125, 10.234375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 14.0, 32.0, 37.0, 65.0, 127.0, 234.0, 454.0, 811.0, 1663.0, 3733.0, 9589.0, 31475.0, 162612.0, 1705515.0, 2030701.0, 193676.0, 35183.0, 10605.0, 4009.0, 1839.0, 881.0, 459.0, 243.0, 152.0, 77.0, 46.0, 19.0, 10.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.9296875, -13.5205078125, -13.111328125, -12.7021484375, -12.29296875, -11.8837890625, -11.474609375, -11.0654296875, -10.65625, -10.2470703125, -9.837890625, -9.4287109375, -9.01953125, -8.6103515625, -8.201171875, -7.7919921875, -7.3828125, -6.9736328125, -6.564453125, -6.1552734375, -5.74609375, -5.3369140625, -4.927734375, -4.5185546875, -4.109375, -3.7001953125, -3.291015625, -2.8818359375, -2.47265625, -2.0634765625, -1.654296875, -1.2451171875, -0.8359375, -0.4267578125, -0.017578125, 0.3916015625, 0.80078125, 1.2099609375, 1.619140625, 2.0283203125, 2.4375, 2.8466796875, 3.255859375, 3.6650390625, 4.07421875, 4.4833984375, 4.892578125, 5.3017578125, 5.7109375, 6.1201171875, 6.529296875, 6.9384765625, 7.34765625, 7.7568359375, 8.166015625, 8.5751953125, 8.984375, 9.3935546875, 9.802734375, 10.2119140625, 10.62109375, 11.0302734375, 11.439453125, 11.8486328125, 12.2578125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 8.0, 39.0, 61.0, 114.0, 191.0, 186.0, 163.0, 99.0, 85.0, 27.0, 20.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-100.6738510131836, -98.3565444946289, -96.03923797607422, -93.72193145751953, -91.40461730957031, -89.08731079101562, -86.77000427246094, -84.45269775390625, -82.13539123535156, -79.81808471679688, -77.50077819824219, -75.1834716796875, -72.86616516113281, -70.5488510131836, -68.2315444946289, -65.91423797607422, -63.59693145751953, -61.279624938964844, -58.962318420410156, -56.6450080871582, -54.327701568603516, -52.01039505004883, -49.693084716796875, -47.37577819824219, -45.0584716796875, -42.74116516113281, -40.423858642578125, -38.10654830932617, -35.789241790771484, -33.4719352722168, -31.154626846313477, -28.837318420410156, -26.520004272460938, -24.20269775390625, -21.88538932800293, -19.56808090209961, -17.250774383544922, -14.933466911315918, -12.616159439086914, -10.298851013183594, -7.981544494628906, -5.664237022399902, -3.3469295501708984, -1.0296220779418945, 1.2876853942871094, 3.6049928665161133, 5.922300338745117, 8.239608764648438, 10.556915283203125, 12.874222755432129, 15.191530227661133, 17.508838653564453, 19.82614517211914, 22.143451690673828, 24.46076011657715, 26.77806854248047, 29.095375061035156, 31.412681579589844, 33.72998809814453, 36.047298431396484, 38.36460494995117, 40.68191146850586, 42.99922180175781, 45.3165283203125, 47.63383483886719]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 4.0, 5.0, 9.0, 12.0, 12.0, 12.0, 17.0, 32.0, 27.0, 35.0, 31.0, 46.0, 30.0, 36.0, 50.0, 46.0, 34.0, 41.0, 43.0, 62.0, 45.0, 42.0, 41.0, 32.0, 47.0, 27.0, 21.0, 27.0, 20.0, 22.0, 19.0, 10.0, 12.0, 8.0, 7.0, 7.0, 5.0, 10.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.952232360839844, -20.172441482543945, -19.392650604248047, -18.61285972595215, -17.83306884765625, -17.053279876708984, -16.273487091064453, -15.493698120117188, -14.713907241821289, -13.93411636352539, -13.154325485229492, -12.374534606933594, -11.594744682312012, -10.814953804016113, -10.035162925720215, -9.255373001098633, -8.475581169128418, -7.6957902908325195, -6.915999889373779, -6.136209011077881, -5.356418609619141, -4.576627731323242, -3.7968368530273438, -3.0170464515686035, -2.237255573272705, -1.4574649333953857, -0.6776741743087769, 0.10211658477783203, 0.8819072246551514, 1.6616978645324707, 2.441488742828369, 3.2212791442871094, 4.001070022583008, 4.780860900878906, 5.5606513023376465, 6.340442180633545, 7.120232582092285, 7.900023460388184, 8.679814338684082, 9.459604263305664, 10.239395141601562, 11.019186019897461, 11.79897689819336, 12.578767776489258, 13.35855770111084, 14.138348579406738, 14.918139457702637, 15.697929382324219, 16.47772216796875, 17.25751304626465, 18.037303924560547, 18.817094802856445, 19.596885681152344, 20.37667465209961, 21.15646743774414, 21.936256408691406, 22.716047286987305, 23.495838165283203, 24.2756290435791, 25.055419921875, 25.8352108001709, 26.615001678466797, 27.394790649414062, 28.17458152770996, 28.95437240600586]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 13.0, 9.0, 18.0, 15.0, 23.0, 32.0, 41.0, 37.0, 32.0, 45.0, 68.0, 67.0, 73.0, 67.0, 67.0, 59.0, 64.0, 49.0, 35.0, 46.0, 30.0, 30.0, 17.0, 19.0, 15.0, 11.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.76171875, -3.657684326171875, -3.55364990234375, -3.449615478515625, -3.3455810546875, -3.241546630859375, -3.13751220703125, -3.033477783203125, -2.929443359375, -2.825408935546875, -2.72137451171875, -2.617340087890625, -2.5133056640625, -2.409271240234375, -2.30523681640625, -2.201202392578125, -2.09716796875, -1.993133544921875, -1.88909912109375, -1.785064697265625, -1.6810302734375, -1.576995849609375, -1.47296142578125, -1.368927001953125, -1.264892578125, -1.160858154296875, -1.05682373046875, -0.952789306640625, -0.8487548828125, -0.744720458984375, -0.64068603515625, -0.536651611328125, -0.4326171875, -0.328582763671875, -0.22454833984375, -0.120513916015625, -0.0164794921875, 0.087554931640625, 0.19158935546875, 0.295623779296875, 0.399658203125, 0.503692626953125, 0.60772705078125, 0.711761474609375, 0.8157958984375, 0.919830322265625, 1.02386474609375, 1.127899169921875, 1.23193359375, 1.335968017578125, 1.44000244140625, 1.544036865234375, 1.6480712890625, 1.752105712890625, 1.85614013671875, 1.960174560546875, 2.064208984375, 2.168243408203125, 2.27227783203125, 2.376312255859375, 2.4803466796875, 2.584381103515625, 2.68841552734375, 2.792449951171875, 2.896484375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 1.0, 5.0, 14.0, 7.0, 23.0, 33.0, 33.0, 46.0, 55.0, 93.0, 130.0, 188.0, 302.0, 452.0, 733.0, 1250.0, 2136.0, 3787.0, 6835.0, 13023.0, 24878.0, 50062.0, 111770.0, 359635.0, 284134.0, 96445.0, 44268.0, 21939.0, 11440.0, 6279.0, 3438.0, 1953.0, 1146.0, 666.0, 450.0, 293.0, 185.0, 110.0, 90.0, 60.0, 53.0, 30.0, 18.0, 13.0, 17.0, 11.0, 13.0, 5.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0], "bins": [-0.1978759765625, -0.19204139709472656, -0.18620681762695312, -0.1803722381591797, -0.17453765869140625, -0.1687030792236328, -0.16286849975585938, -0.15703392028808594, -0.1511993408203125, -0.14536476135253906, -0.13953018188476562, -0.1336956024169922, -0.12786102294921875, -0.12202644348144531, -0.11619186401367188, -0.11035728454589844, -0.104522705078125, -0.09868812561035156, -0.09285354614257812, -0.08701896667480469, -0.08118438720703125, -0.07534980773925781, -0.06951522827148438, -0.06368064880371094, -0.0578460693359375, -0.05201148986816406, -0.046176910400390625, -0.04034233093261719, -0.03450775146484375, -0.028673171997070312, -0.022838592529296875, -0.017004013061523438, -0.01116943359375, -0.0053348541259765625, 0.000499725341796875, 0.0063343048095703125, 0.01216888427734375, 0.018003463745117188, 0.023838043212890625, 0.029672622680664062, 0.0355072021484375, 0.04134178161621094, 0.047176361083984375, 0.05301094055175781, 0.05884552001953125, 0.06468009948730469, 0.07051467895507812, 0.07634925842285156, 0.082183837890625, 0.08801841735839844, 0.09385299682617188, 0.09968757629394531, 0.10552215576171875, 0.11135673522949219, 0.11719131469726562, 0.12302589416503906, 0.1288604736328125, 0.13469505310058594, 0.14052963256835938, 0.1463642120361328, 0.15219879150390625, 0.1580333709716797, 0.16386795043945312, 0.16970252990722656, 0.175537109375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 9.0, 10.0, 7.0, 7.0, 8.0, 14.0, 6.0, 7.0, 20.0, 20.0, 24.0, 22.0, 22.0, 27.0, 24.0, 29.0, 45.0, 38.0, 32.0, 45.0, 48.0, 1059.0, 27.0, 42.0, 45.0, 38.0, 36.0, 36.0, 33.0, 39.0, 34.0, 26.0, 28.0, 20.0, 13.0, 10.0, 21.0, 4.0, 11.0, 13.0, 8.0, 4.0, 7.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.9501953125, -1.8871002197265625, -1.824005126953125, -1.7609100341796875, -1.69781494140625, -1.6347198486328125, -1.571624755859375, -1.5085296630859375, -1.4454345703125, -1.3823394775390625, -1.319244384765625, -1.2561492919921875, -1.19305419921875, -1.1299591064453125, -1.066864013671875, -1.0037689208984375, -0.940673828125, -0.8775787353515625, -0.814483642578125, -0.7513885498046875, -0.68829345703125, -0.6251983642578125, -0.562103271484375, -0.4990081787109375, -0.4359130859375, -0.3728179931640625, -0.309722900390625, -0.2466278076171875, -0.18353271484375, -0.1204376220703125, -0.057342529296875, 0.0057525634765625, 0.06884765625, 0.1319427490234375, 0.195037841796875, 0.2581329345703125, 0.32122802734375, 0.3843231201171875, 0.447418212890625, 0.5105133056640625, 0.5736083984375, 0.6367034912109375, 0.699798583984375, 0.7628936767578125, 0.82598876953125, 0.8890838623046875, 0.952178955078125, 1.0152740478515625, 1.078369140625, 1.1414642333984375, 1.204559326171875, 1.2676544189453125, 1.33074951171875, 1.3938446044921875, 1.456939697265625, 1.5200347900390625, 1.5831298828125, 1.6462249755859375, 1.709320068359375, 1.7724151611328125, 1.83551025390625, 1.8986053466796875, 1.961700439453125, 2.0247955322265625, 2.087890625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 8.0, 7.0, 13.0, 18.0, 31.0, 42.0, 57.0, 85.0, 127.0, 167.0, 223.0, 324.0, 475.0, 649.0, 886.0, 1265.0, 1787.0, 2500.0, 3505.0, 4984.0, 7190.0, 10328.0, 14731.0, 21608.0, 32597.0, 50173.0, 81698.0, 154147.0, 1314405.0, 155298.0, 82748.0, 50588.0, 32942.0, 22042.0, 14770.0, 10280.0, 7088.0, 4970.0, 3580.0, 2469.0, 1886.0, 1295.0, 915.0, 654.0, 475.0, 314.0, 237.0, 157.0, 125.0, 89.0, 62.0, 45.0, 25.0, 15.0, 17.0, 8.0, 10.0, 3.0, 2.0, 3.0], "bins": [-0.044769287109375, -0.043392181396484375, -0.04201507568359375, -0.040637969970703125, -0.0392608642578125, -0.037883758544921875, -0.03650665283203125, -0.035129547119140625, -0.03375244140625, -0.032375335693359375, -0.03099822998046875, -0.029621124267578125, -0.0282440185546875, -0.026866912841796875, -0.02548980712890625, -0.024112701416015625, -0.022735595703125, -0.021358489990234375, -0.01998138427734375, -0.018604278564453125, -0.0172271728515625, -0.015850067138671875, -0.01447296142578125, -0.013095855712890625, -0.01171875, -0.010341644287109375, -0.00896453857421875, -0.007587432861328125, -0.0062103271484375, -0.004833221435546875, -0.00345611572265625, -0.002079010009765625, -0.000701904296875, 0.000675201416015625, 0.00205230712890625, 0.003429412841796875, 0.0048065185546875, 0.006183624267578125, 0.00756072998046875, 0.008937835693359375, 0.01031494140625, 0.011692047119140625, 0.01306915283203125, 0.014446258544921875, 0.0158233642578125, 0.017200469970703125, 0.01857757568359375, 0.019954681396484375, 0.021331787109375, 0.022708892822265625, 0.02408599853515625, 0.025463104248046875, 0.0268402099609375, 0.028217315673828125, 0.02959442138671875, 0.030971527099609375, 0.0323486328125, 0.033725738525390625, 0.03510284423828125, 0.036479949951171875, 0.0378570556640625, 0.039234161376953125, 0.04061126708984375, 0.041988372802734375, 0.043365478515625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 6.0, 7.0, 16.0, 6.0, 12.0, 17.0, 34.0, 39.0, 37.0, 46.0, 53.0, 102.0, 116.0, 113.0, 73.0, 55.0, 52.0, 42.0, 31.0, 24.0, 20.0, 18.0, 11.0, 6.0, 11.0, 10.0, 4.0, 9.0, 2.0, 0.0, 5.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004665851593017578, -0.00045050308108329773, -0.00043442100286483765, -0.00041833892464637756, -0.0004022568464279175, -0.0003861747682094574, -0.0003700926899909973, -0.00035401061177253723, -0.00033792853355407715, -0.00032184645533561707, -0.000305764377117157, -0.0002896822988986969, -0.0002736002206802368, -0.00025751814246177673, -0.00024143606424331665, -0.00022535398602485657, -0.00020927190780639648, -0.0001931898295879364, -0.00017710775136947632, -0.00016102567315101624, -0.00014494359493255615, -0.00012886151671409607, -0.00011277943849563599, -9.66973602771759e-05, -8.061528205871582e-05, -6.453320384025574e-05, -4.8451125621795654e-05, -3.236904740333557e-05, -1.6286969184875488e-05, -2.0489096641540527e-07, 1.5877187252044678e-05, 3.195926547050476e-05, 4.8041343688964844e-05, 6.412342190742493e-05, 8.020550012588501e-05, 9.628757834434509e-05, 0.00011236965656280518, 0.00012845173478126526, 0.00014453381299972534, 0.00016061589121818542, 0.0001766979694366455, 0.0001927800476551056, 0.00020886212587356567, 0.00022494420409202576, 0.00024102628231048584, 0.0002571083605289459, 0.000273190438747406, 0.0002892725169658661, 0.00030535459518432617, 0.00032143667340278625, 0.00033751875162124634, 0.0003536008298397064, 0.0003696829080581665, 0.0003857649862766266, 0.00040184706449508667, 0.00041792914271354675, 0.00043401122093200684, 0.0004500932991504669, 0.000466175377368927, 0.0004822574555873871, 0.0004983395338058472, 0.0005144216120243073, 0.0005305036902427673, 0.0005465857684612274, 0.0005626678466796875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 1.0, 4.0, 7.0, 10.0, 15.0, 12.0, 19.0, 24.0, 25.0, 45.0, 67.0, 104.0, 194.0, 636.0, 3560.0, 31048.0, 657582.0, 330538.0, 20987.0, 2624.0, 524.0, 179.0, 99.0, 70.0, 43.0, 35.0, 23.0, 13.0, 15.0, 6.0, 14.0, 3.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0091552734375, -0.008893072605133057, -0.008630871772766113, -0.00836867094039917, -0.008106470108032227, -0.007844269275665283, -0.00758206844329834, -0.0073198676109313965, -0.007057666778564453, -0.00679546594619751, -0.006533265113830566, -0.006271064281463623, -0.00600886344909668, -0.005746662616729736, -0.005484461784362793, -0.00522226095199585, -0.004960060119628906, -0.004697859287261963, -0.0044356584548950195, -0.004173457622528076, -0.003911256790161133, -0.0036490559577941895, -0.003386855125427246, -0.0031246542930603027, -0.0028624534606933594, -0.002600252628326416, -0.0023380517959594727, -0.0020758509635925293, -0.001813650131225586, -0.0015514492988586426, -0.0012892484664916992, -0.0010270476341247559, -0.0007648468017578125, -0.0005026459693908691, -0.00024044513702392578, 2.1755695343017578e-05, 0.00028395652770996094, 0.0005461573600769043, 0.0008083581924438477, 0.001070559024810791, 0.0013327598571777344, 0.0015949606895446777, 0.001857161521911621, 0.0021193623542785645, 0.002381563186645508, 0.002643764019012451, 0.0029059648513793945, 0.003168165683746338, 0.0034303665161132812, 0.0036925673484802246, 0.003954768180847168, 0.004216969013214111, 0.004479169845581055, 0.004741370677947998, 0.005003571510314941, 0.005265772342681885, 0.005527973175048828, 0.0057901740074157715, 0.006052374839782715, 0.006314575672149658, 0.0065767765045166016, 0.006838977336883545, 0.007101178169250488, 0.007363379001617432, 0.007625579833984375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 33.0, 377.0, 556.0, 37.0, 8.0], "bins": [-0.013181163929402828, -0.012965384870767593, -0.012749604880809784, -0.012533825822174549, -0.012318046763539314, -0.012102266773581505, -0.01188648771494627, -0.011670708656311035, -0.0114549295976758, -0.011239150539040565, -0.011023370549082756, -0.010807591490447521, -0.010591812431812286, -0.010376032441854477, -0.010160253383219242, -0.009944474324584007, -0.009728694334626198, -0.009512915275990963, -0.009297135286033154, -0.009081356227397919, -0.008865577168762684, -0.008649798110127449, -0.00843401812016964, -0.008218239061534405, -0.00800246000289917, -0.007786680478602648, -0.007570901419967413, -0.007355121895670891, -0.007139342837035656, -0.006923563312739134, -0.006707783788442612, -0.006492004729807377, -0.006276224739849567, -0.006060445215553045, -0.0058446661569178104, -0.005628886632621288, -0.0054131075739860535, -0.005197328049689531, -0.004981548525393009, -0.004765769466757774, -0.0045499904081225395, -0.004334210883826017, -0.0041184318251907825, -0.0039026523008942604, -0.003686873009428382, -0.0034710937179625034, -0.003255314426496625, -0.0030395351350307465, -0.0028237556107342243, -0.002607976319268346, -0.0023921970278024673, -0.002176417503505945, -0.0019606382120400667, -0.0017448589205741882, -0.0015290796291083097, -0.0013133002212271094, -0.001097520929761231, -0.0008817415800876915, -0.0006659622304141521, -0.00045018293894827366, -0.00023440358927473426, -1.862423960119486e-05, 0.00019715505186468363, 0.00041293445974588394, 0.0006287137512117624]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 9.0, 12.0, 19.0, 17.0, 23.0, 25.0, 49.0, 46.0, 52.0, 70.0, 53.0, 60.0, 73.0, 73.0, 80.0, 50.0, 48.0, 45.0, 38.0, 47.0, 29.0, 25.0, 19.0, 10.0, 12.0, 12.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004439353942871094, -0.00042630359530448914, -0.0004086717963218689, -0.00039103999733924866, -0.0003734081983566284, -0.0003557763993740082, -0.00033814460039138794, -0.0003205128014087677, -0.00030288100242614746, -0.0002852492034435272, -0.000267617404460907, -0.00024998560547828674, -0.0002323538064956665, -0.00021472200751304626, -0.00019709020853042603, -0.00017945840954780579, -0.00016182661056518555, -0.0001441948115825653, -0.00012656301259994507, -0.00010893121361732483, -9.129941463470459e-05, -7.366761565208435e-05, -5.603581666946411e-05, -3.840401768684387e-05, -2.0772218704223633e-05, -3.1404197216033936e-06, 1.4491379261016846e-05, 3.2123178243637085e-05, 4.9754977226257324e-05, 6.738677620887756e-05, 8.50185751914978e-05, 0.00010265037417411804, 0.00012028217315673828, 0.00013791397213935852, 0.00015554577112197876, 0.000173177570104599, 0.00019080936908721924, 0.00020844116806983948, 0.00022607296705245972, 0.00024370476603507996, 0.0002613365650177002, 0.00027896836400032043, 0.0002966001629829407, 0.0003142319619655609, 0.00033186376094818115, 0.0003494955599308014, 0.00036712735891342163, 0.00038475915789604187, 0.0004023909568786621, 0.00042002275586128235, 0.0004376545548439026, 0.00045528635382652283, 0.00047291815280914307, 0.0004905499517917633, 0.0005081817507743835, 0.0005258135497570038, 0.000543445348739624, 0.0005610771477222443, 0.0005787089467048645, 0.0005963407456874847, 0.000613972544670105, 0.0006316043436527252, 0.0006492361426353455, 0.0006668679416179657, 0.0006844997406005859]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 13.0, 9.0, 18.0, 14.0, 23.0, 33.0, 41.0, 37.0, 32.0, 45.0, 68.0, 66.0, 74.0, 66.0, 68.0, 59.0, 64.0, 49.0, 34.0, 47.0, 29.0, 31.0, 17.0, 19.0, 15.0, 11.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.763671875, -3.65960693359375, -3.5555419921875, -3.45147705078125, -3.347412109375, -3.24334716796875, -3.1392822265625, -3.03521728515625, -2.93115234375, -2.82708740234375, -2.7230224609375, -2.61895751953125, -2.514892578125, -2.41082763671875, -2.3067626953125, -2.20269775390625, -2.0986328125, -1.99456787109375, -1.8905029296875, -1.78643798828125, -1.682373046875, -1.57830810546875, -1.4742431640625, -1.37017822265625, -1.26611328125, -1.16204833984375, -1.0579833984375, -0.95391845703125, -0.849853515625, -0.74578857421875, -0.6417236328125, -0.53765869140625, -0.43359375, -0.32952880859375, -0.2254638671875, -0.12139892578125, -0.017333984375, 0.08673095703125, 0.1907958984375, 0.29486083984375, 0.39892578125, 0.50299072265625, 0.6070556640625, 0.71112060546875, 0.815185546875, 0.91925048828125, 1.0233154296875, 1.12738037109375, 1.2314453125, 1.33551025390625, 1.4395751953125, 1.54364013671875, 1.647705078125, 1.75177001953125, 1.8558349609375, 1.95989990234375, 2.06396484375, 2.16802978515625, 2.2720947265625, 2.37615966796875, 2.480224609375, 2.58428955078125, 2.6883544921875, 2.79241943359375, 2.896484375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 13.0, 23.0, 38.0, 56.0, 105.0, 148.0, 300.0, 714.0, 1873.0, 5846.0, 26141.0, 622019.0, 362127.0, 21150.0, 4979.0, 1660.0, 649.0, 318.0, 163.0, 94.0, 43.0, 27.0, 11.0, 15.0, 8.0, 10.0, 11.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.1639404296875, -11.695068359375, -11.2261962890625, -10.75732421875, -10.2884521484375, -9.819580078125, -9.3507080078125, -8.8818359375, -8.4129638671875, -7.944091796875, -7.4752197265625, -7.00634765625, -6.5374755859375, -6.068603515625, -5.5997314453125, -5.130859375, -4.6619873046875, -4.193115234375, -3.7242431640625, -3.25537109375, -2.7864990234375, -2.317626953125, -1.8487548828125, -1.3798828125, -0.9110107421875, -0.442138671875, 0.0267333984375, 0.49560546875, 0.9644775390625, 1.433349609375, 1.9022216796875, 2.37109375, 2.8399658203125, 3.308837890625, 3.7777099609375, 4.24658203125, 4.7154541015625, 5.184326171875, 5.6531982421875, 6.1220703125, 6.5909423828125, 7.059814453125, 7.5286865234375, 7.99755859375, 8.4664306640625, 8.935302734375, 9.4041748046875, 9.873046875, 10.3419189453125, 10.810791015625, 11.2796630859375, 11.74853515625, 12.2174072265625, 12.686279296875, 13.1551513671875, 13.6240234375, 14.0928955078125, 14.561767578125, 15.0306396484375, 15.49951171875, 15.9683837890625, 16.437255859375, 16.9061279296875, 17.375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 12.0, 11.0, 7.0, 8.0, 15.0, 16.0, 12.0, 10.0, 21.0, 27.0, 26.0, 26.0, 29.0, 28.0, 39.0, 41.0, 43.0, 67.0, 86.0, 126.0, 244.0, 1408.0, 158.0, 94.0, 87.0, 58.0, 50.0, 43.0, 30.0, 31.0, 24.0, 25.0, 19.0, 20.0, 16.0, 15.0, 15.0, 17.0, 7.0, 8.0, 5.0, 8.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-7.125, -6.90362548828125, -6.6822509765625, -6.46087646484375, -6.239501953125, -6.01812744140625, -5.7967529296875, -5.57537841796875, -5.35400390625, -5.13262939453125, -4.9112548828125, -4.68988037109375, -4.468505859375, -4.24713134765625, -4.0257568359375, -3.80438232421875, -3.5830078125, -3.36163330078125, -3.1402587890625, -2.91888427734375, -2.697509765625, -2.47613525390625, -2.2547607421875, -2.03338623046875, -1.81201171875, -1.59063720703125, -1.3692626953125, -1.14788818359375, -0.926513671875, -0.70513916015625, -0.4837646484375, -0.26239013671875, -0.041015625, 0.18035888671875, 0.4017333984375, 0.62310791015625, 0.844482421875, 1.06585693359375, 1.2872314453125, 1.50860595703125, 1.72998046875, 1.95135498046875, 2.1727294921875, 2.39410400390625, 2.615478515625, 2.83685302734375, 3.0582275390625, 3.27960205078125, 3.5009765625, 3.72235107421875, 3.9437255859375, 4.16510009765625, 4.386474609375, 4.60784912109375, 4.8292236328125, 5.05059814453125, 5.27197265625, 5.49334716796875, 5.7147216796875, 5.93609619140625, 6.157470703125, 6.37884521484375, 6.6002197265625, 6.82159423828125, 7.04296875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 3.0, 7.0, 11.0, 10.0, 23.0, 23.0, 23.0, 28.0, 44.0, 59.0, 64.0, 153.0, 245.0, 479.0, 840.0, 2035.0, 5015.0, 15814.0, 105030.0, 2362323.0, 597527.0, 40466.0, 9261.0, 3223.0, 1389.0, 655.0, 323.0, 187.0, 115.0, 65.0, 69.0, 48.0, 17.0, 19.0, 17.0, 22.0, 14.0, 14.0, 8.0, 5.0, 10.0, 8.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.0859375, -10.7371826171875, -10.388427734375, -10.0396728515625, -9.69091796875, -9.3421630859375, -8.993408203125, -8.6446533203125, -8.2958984375, -7.9471435546875, -7.598388671875, -7.2496337890625, -6.90087890625, -6.5521240234375, -6.203369140625, -5.8546142578125, -5.505859375, -5.1571044921875, -4.808349609375, -4.4595947265625, -4.11083984375, -3.7620849609375, -3.413330078125, -3.0645751953125, -2.7158203125, -2.3670654296875, -2.018310546875, -1.6695556640625, -1.32080078125, -0.9720458984375, -0.623291015625, -0.2745361328125, 0.07421875, 0.4229736328125, 0.771728515625, 1.1204833984375, 1.46923828125, 1.8179931640625, 2.166748046875, 2.5155029296875, 2.8642578125, 3.2130126953125, 3.561767578125, 3.9105224609375, 4.25927734375, 4.6080322265625, 4.956787109375, 5.3055419921875, 5.654296875, 6.0030517578125, 6.351806640625, 6.7005615234375, 7.04931640625, 7.3980712890625, 7.746826171875, 8.0955810546875, 8.4443359375, 8.7930908203125, 9.141845703125, 9.4906005859375, 9.83935546875, 10.1881103515625, 10.536865234375, 10.8856201171875, 11.234375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 123.0, 610.0, 265.0, 17.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.53078842163086, -25.123645782470703, -20.716503143310547, -16.309358596801758, -11.902215957641602, -7.495073318481445, -3.0879287719726562, 1.3192138671875, 5.726356506347656, 10.133499145507812, 14.540642738342285, 18.947786331176758, 23.354928970336914, 27.76207160949707, 32.16921615600586, 36.576358795166016, 40.98350143432617, 45.39064407348633, 49.797786712646484, 54.204933166503906, 58.61207580566406, 63.01921844482422, 67.42636108398438, 71.83350372314453, 76.24064636230469, 80.64778900146484, 85.054931640625, 89.46207427978516, 93.86921691894531, 98.27635955810547, 102.68350219726562, 107.09065246582031, 111.497802734375, 115.90494537353516, 120.31208801269531, 124.71923065185547, 129.12637329101562, 133.5335235595703, 137.94065856933594, 142.34780883789062, 146.75494384765625, 151.16209411621094, 155.56922912597656, 159.97637939453125, 164.38351440429688, 168.79066467285156, 173.1977996826172, 177.60494995117188, 182.0120849609375, 186.4192352294922, 190.8263702392578, 195.2335205078125, 199.64065551757812, 204.0478057861328, 208.45494079589844, 212.86209106445312, 217.2692413330078, 221.6763916015625, 226.08352661132812, 230.4906768798828, 234.89781188964844, 239.30496215820312, 243.71209716796875, 248.11924743652344, 252.52638244628906]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 5.0, 13.0, 4.0, 8.0, 16.0, 18.0, 18.0, 15.0, 25.0, 25.0, 32.0, 24.0, 32.0, 34.0, 26.0, 32.0, 39.0, 40.0, 47.0, 43.0, 41.0, 42.0, 38.0, 44.0, 41.0, 36.0, 34.0, 31.0, 40.0, 27.0, 26.0, 23.0, 20.0, 12.0, 9.0, 8.0, 10.0, 3.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-28.002681732177734, -27.202951431274414, -26.403223037719727, -25.603492736816406, -24.803762435913086, -24.004032135009766, -23.204303741455078, -22.404573440551758, -21.604843139648438, -20.805112838745117, -20.00538444519043, -19.20565414428711, -18.40592384338379, -17.60619354248047, -16.80646514892578, -16.00673484802246, -15.207006454467773, -14.40727710723877, -13.60754680633545, -12.807817459106445, -12.008087158203125, -11.208357810974121, -10.408628463745117, -9.608898162841797, -8.809168815612793, -8.009439468383789, -7.209709167480469, -6.409979820251465, -5.610249996185303, -4.810520172119141, -4.010790824890137, -3.2110610008239746, -2.4113311767578125, -1.61160147190094, -0.8118717670440674, -0.012142181396484375, 0.7875876426696777, 1.5873174667358398, 2.3870468139648438, 3.186776638031006, 3.986506462097168, 4.78623628616333, 5.585966110229492, 6.385695457458496, 7.185425281524658, 7.98515510559082, 8.784884452819824, 9.584613800048828, 10.384344100952148, 11.184073448181152, 11.983803749084473, 12.783533096313477, 13.583263397216797, 14.3829927444458, 15.182722091674805, 15.982452392578125, 16.782180786132812, 17.581911087036133, 18.38163948059082, 19.18136978149414, 19.98110008239746, 20.78083038330078, 21.58055877685547, 22.38028907775879, 23.18001937866211]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 6.0, 11.0, 10.0, 10.0, 23.0, 15.0, 28.0, 38.0, 41.0, 37.0, 44.0, 49.0, 59.0, 69.0, 65.0, 64.0, 59.0, 62.0, 50.0, 55.0, 38.0, 42.0, 33.0, 24.0, 17.0, 21.0, 10.0, 8.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.744140625, -3.639495849609375, -3.53485107421875, -3.430206298828125, -3.3255615234375, -3.220916748046875, -3.11627197265625, -3.011627197265625, -2.906982421875, -2.802337646484375, -2.69769287109375, -2.593048095703125, -2.4884033203125, -2.383758544921875, -2.27911376953125, -2.174468994140625, -2.06982421875, -1.965179443359375, -1.86053466796875, -1.755889892578125, -1.6512451171875, -1.546600341796875, -1.44195556640625, -1.337310791015625, -1.232666015625, -1.128021240234375, -1.02337646484375, -0.918731689453125, -0.8140869140625, -0.709442138671875, -0.60479736328125, -0.500152587890625, -0.3955078125, -0.290863037109375, -0.18621826171875, -0.081573486328125, 0.0230712890625, 0.127716064453125, 0.23236083984375, 0.337005615234375, 0.441650390625, 0.546295166015625, 0.65093994140625, 0.755584716796875, 0.8602294921875, 0.964874267578125, 1.06951904296875, 1.174163818359375, 1.27880859375, 1.383453369140625, 1.48809814453125, 1.592742919921875, 1.6973876953125, 1.802032470703125, 1.90667724609375, 2.011322021484375, 2.115966796875, 2.220611572265625, 2.32525634765625, 2.429901123046875, 2.5345458984375, 2.639190673828125, 2.74383544921875, 2.848480224609375, 2.953125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 7.0, 6.0, 14.0, 13.0, 18.0, 30.0, 23.0, 42.0, 58.0, 91.0, 146.0, 231.0, 337.0, 618.0, 1044.0, 2002.0, 4180.0, 10924.0, 43867.0, 447295.0, 3076650.0, 533544.0, 52369.0, 12286.0, 4413.0, 1958.0, 951.0, 450.0, 269.0, 149.0, 110.0, 57.0, 46.0, 29.0, 15.0, 10.0, 8.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0], "bins": [-10.96875, -10.6981201171875, -10.427490234375, -10.1568603515625, -9.88623046875, -9.6156005859375, -9.344970703125, -9.0743408203125, -8.8037109375, -8.5330810546875, -8.262451171875, -7.9918212890625, -7.72119140625, -7.4505615234375, -7.179931640625, -6.9093017578125, -6.638671875, -6.3680419921875, -6.097412109375, -5.8267822265625, -5.55615234375, -5.2855224609375, -5.014892578125, -4.7442626953125, -4.4736328125, -4.2030029296875, -3.932373046875, -3.6617431640625, -3.39111328125, -3.1204833984375, -2.849853515625, -2.5792236328125, -2.30859375, -2.0379638671875, -1.767333984375, -1.4967041015625, -1.22607421875, -0.9554443359375, -0.684814453125, -0.4141845703125, -0.1435546875, 0.1270751953125, 0.397705078125, 0.6683349609375, 0.93896484375, 1.2095947265625, 1.480224609375, 1.7508544921875, 2.021484375, 2.2921142578125, 2.562744140625, 2.8333740234375, 3.10400390625, 3.3746337890625, 3.645263671875, 3.9158935546875, 4.1865234375, 4.4571533203125, 4.727783203125, 4.9984130859375, 5.26904296875, 5.5396728515625, 5.810302734375, 6.0809326171875, 6.3515625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 0.0, 3.0, 3.0, 6.0, 8.0, 6.0, 8.0, 15.0, 19.0, 23.0, 36.0, 61.0, 74.0, 108.0, 178.0, 284.0, 410.0, 557.0, 610.0, 520.0, 380.0, 249.0, 168.0, 96.0, 67.0, 40.0, 34.0, 29.0, 23.0, 20.0, 10.0, 7.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.84375, -7.6151123046875, -7.386474609375, -7.1578369140625, -6.92919921875, -6.7005615234375, -6.471923828125, -6.2432861328125, -6.0146484375, -5.7860107421875, -5.557373046875, -5.3287353515625, -5.10009765625, -4.8714599609375, -4.642822265625, -4.4141845703125, -4.185546875, -3.9569091796875, -3.728271484375, -3.4996337890625, -3.27099609375, -3.0423583984375, -2.813720703125, -2.5850830078125, -2.3564453125, -2.1278076171875, -1.899169921875, -1.6705322265625, -1.44189453125, -1.2132568359375, -0.984619140625, -0.7559814453125, -0.52734375, -0.2987060546875, -0.070068359375, 0.1585693359375, 0.38720703125, 0.6158447265625, 0.844482421875, 1.0731201171875, 1.3017578125, 1.5303955078125, 1.759033203125, 1.9876708984375, 2.21630859375, 2.4449462890625, 2.673583984375, 2.9022216796875, 3.130859375, 3.3594970703125, 3.588134765625, 3.8167724609375, 4.04541015625, 4.2740478515625, 4.502685546875, 4.7313232421875, 4.9599609375, 5.1885986328125, 5.417236328125, 5.6458740234375, 5.87451171875, 6.1031494140625, 6.331787109375, 6.5604248046875, 6.7890625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 12.0, 6.0, 16.0, 13.0, 22.0, 37.0, 53.0, 88.0, 142.0, 238.0, 350.0, 509.0, 991.0, 1620.0, 2960.0, 5593.0, 11994.0, 30629.0, 107764.0, 563199.0, 2313327.0, 920573.0, 162601.0, 41484.0, 15036.0, 6843.0, 3403.0, 1930.0, 1126.0, 631.0, 367.0, 230.0, 197.0, 103.0, 55.0, 49.0, 22.0, 13.0, 16.0, 12.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.59375, -8.313232421875, -8.03271484375, -7.752197265625, -7.4716796875, -7.191162109375, -6.91064453125, -6.630126953125, -6.349609375, -6.069091796875, -5.78857421875, -5.508056640625, -5.2275390625, -4.947021484375, -4.66650390625, -4.385986328125, -4.10546875, -3.824951171875, -3.54443359375, -3.263916015625, -2.9833984375, -2.702880859375, -2.42236328125, -2.141845703125, -1.861328125, -1.580810546875, -1.30029296875, -1.019775390625, -0.7392578125, -0.458740234375, -0.17822265625, 0.102294921875, 0.3828125, 0.663330078125, 0.94384765625, 1.224365234375, 1.5048828125, 1.785400390625, 2.06591796875, 2.346435546875, 2.626953125, 2.907470703125, 3.18798828125, 3.468505859375, 3.7490234375, 4.029541015625, 4.31005859375, 4.590576171875, 4.87109375, 5.151611328125, 5.43212890625, 5.712646484375, 5.9931640625, 6.273681640625, 6.55419921875, 6.834716796875, 7.115234375, 7.395751953125, 7.67626953125, 7.956787109375, 8.2373046875, 8.517822265625, 8.79833984375, 9.078857421875, 9.359375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 7.0, 17.0, 22.0, 43.0, 62.0, 93.0, 117.0, 119.0, 137.0, 102.0, 105.0, 67.0, 36.0, 29.0, 16.0, 16.0, 5.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.916015625, -45.53499221801758, -44.153968811035156, -42.77294158935547, -41.39191818237305, -40.010894775390625, -38.6298713684082, -37.24884796142578, -35.867820739746094, -34.48679733276367, -33.10577392578125, -31.724748611450195, -30.34372329711914, -28.96269989013672, -27.581676483154297, -26.200653076171875, -24.819629669189453, -23.43860626220703, -22.057580947875977, -20.676557540893555, -19.2955322265625, -17.914508819580078, -16.533485412597656, -15.152461051940918, -13.77143669128418, -12.390412330627441, -11.009387969970703, -9.628364562988281, -8.247340202331543, -6.866315841674805, -5.485292434692383, -4.1042680740356445, -2.723247528076172, -1.3422234058380127, 0.038800716400146484, 1.4198246002197266, 2.800848960876465, 4.181873321533203, 5.562896728515625, 6.943921089172363, 8.324945449829102, 9.70596981048584, 11.086994171142578, 12.468017578125, 13.849041938781738, 15.230066299438477, 16.6110897064209, 17.992115020751953, 19.373138427734375, 20.754161834716797, 22.13518714904785, 23.516210556030273, 24.897235870361328, 26.27825927734375, 27.659282684326172, 29.040306091308594, 30.42133140563965, 31.80235481262207, 33.183380126953125, 34.56440353393555, 35.94542694091797, 37.326454162597656, 38.70747375488281, 40.0885009765625, 41.46952438354492]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 13.0, 5.0, 5.0, 8.0, 14.0, 16.0, 20.0, 15.0, 16.0, 22.0, 25.0, 22.0, 22.0, 25.0, 30.0, 36.0, 36.0, 44.0, 44.0, 33.0, 37.0, 34.0, 39.0, 44.0, 36.0, 40.0, 35.0, 46.0, 49.0, 27.0, 24.0, 25.0, 30.0, 11.0, 11.0, 14.0, 10.0, 10.0, 5.0, 7.0, 3.0, 7.0, 3.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.16278839111328, -19.51471710205078, -18.86664581298828, -18.21857452392578, -17.57050323486328, -16.92243003845215, -16.27435874938965, -15.626287460327148, -14.978216171264648, -14.330144882202148, -13.682073593139648, -13.034001350402832, -12.385930061340332, -11.737858772277832, -11.089786529541016, -10.441715240478516, -9.793643951416016, -9.145572662353516, -8.497501373291016, -7.849429130554199, -7.201357841491699, -6.553286552429199, -5.905214786529541, -5.257143020629883, -4.609071731567383, -3.9610002040863037, -3.3129286766052246, -2.6648571491241455, -2.0167856216430664, -1.3687140941619873, -0.7206425666809082, -0.07257080078125, 0.57550048828125, 1.223572015762329, 1.8716435432434082, 2.5197150707244873, 3.1677865982055664, 3.8158581256866455, 4.463929653167725, 5.112001419067383, 5.760072708129883, 6.408143997192383, 7.056215763092041, 7.704287528991699, 8.3523588180542, 9.0004301071167, 9.648502349853516, 10.296573638916016, 10.944644927978516, 11.592716217041016, 12.240787506103516, 12.888859748840332, 13.536931037902832, 14.185002326965332, 14.833074569702148, 15.481145858764648, 16.12921714782715, 16.77728843688965, 17.42535972595215, 18.07343101501465, 18.72150421142578, 19.36957550048828, 20.01764678955078, 20.66571807861328, 21.31378936767578]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 5.0, 8.0, 11.0, 9.0, 18.0, 23.0, 26.0, 32.0, 42.0, 38.0, 50.0, 44.0, 44.0, 70.0, 77.0, 50.0, 71.0, 54.0, 63.0, 48.0, 37.0, 34.0, 31.0, 29.0, 16.0, 14.0, 20.0, 12.0, 9.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.46875, -3.366546630859375, -3.26434326171875, -3.162139892578125, -3.0599365234375, -2.957733154296875, -2.85552978515625, -2.753326416015625, -2.651123046875, -2.548919677734375, -2.44671630859375, -2.344512939453125, -2.2423095703125, -2.140106201171875, -2.03790283203125, -1.935699462890625, -1.83349609375, -1.731292724609375, -1.62908935546875, -1.526885986328125, -1.4246826171875, -1.322479248046875, -1.22027587890625, -1.118072509765625, -1.015869140625, -0.913665771484375, -0.81146240234375, -0.709259033203125, -0.6070556640625, -0.504852294921875, -0.40264892578125, -0.300445556640625, -0.1982421875, -0.096038818359375, 0.00616455078125, 0.108367919921875, 0.2105712890625, 0.312774658203125, 0.41497802734375, 0.517181396484375, 0.619384765625, 0.721588134765625, 0.82379150390625, 0.925994873046875, 1.0281982421875, 1.130401611328125, 1.23260498046875, 1.334808349609375, 1.43701171875, 1.539215087890625, 1.64141845703125, 1.743621826171875, 1.8458251953125, 1.948028564453125, 2.05023193359375, 2.152435302734375, 2.254638671875, 2.356842041015625, 2.45904541015625, 2.561248779296875, 2.6634521484375, 2.765655517578125, 2.86785888671875, 2.970062255859375, 3.072265625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 1.0, 2.0, 6.0, 8.0, 12.0, 8.0, 26.0, 31.0, 50.0, 64.0, 80.0, 116.0, 191.0, 283.0, 447.0, 752.0, 1123.0, 1870.0, 3150.0, 5411.0, 9506.0, 17487.0, 33640.0, 67951.0, 156767.0, 413716.0, 179595.0, 75082.0, 36941.0, 19340.0, 10426.0, 5838.0, 3354.0, 1949.0, 1209.0, 743.0, 445.0, 300.0, 204.0, 129.0, 98.0, 63.0, 53.0, 20.0, 19.0, 15.0, 15.0, 5.0, 4.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.200439453125, -0.1940898895263672, -0.18774032592773438, -0.18139076232910156, -0.17504119873046875, -0.16869163513183594, -0.16234207153320312, -0.1559925079345703, -0.1496429443359375, -0.1432933807373047, -0.13694381713867188, -0.13059425354003906, -0.12424468994140625, -0.11789512634277344, -0.11154556274414062, -0.10519599914550781, -0.098846435546875, -0.09249687194824219, -0.08614730834960938, -0.07979774475097656, -0.07344818115234375, -0.06709861755371094, -0.060749053955078125, -0.05439949035644531, -0.0480499267578125, -0.04170036315917969, -0.035350799560546875, -0.029001235961914062, -0.02265167236328125, -0.016302108764648438, -0.009952545166015625, -0.0036029815673828125, 0.00274658203125, 0.009096145629882812, 0.015445709228515625, 0.021795272827148438, 0.02814483642578125, 0.03449440002441406, 0.040843963623046875, 0.04719352722167969, 0.0535430908203125, 0.05989265441894531, 0.06624221801757812, 0.07259178161621094, 0.07894134521484375, 0.08529090881347656, 0.09164047241210938, 0.09799003601074219, 0.104339599609375, 0.11068916320800781, 0.11703872680664062, 0.12338829040527344, 0.12973785400390625, 0.13608741760253906, 0.14243698120117188, 0.1487865447998047, 0.1551361083984375, 0.1614856719970703, 0.16783523559570312, 0.17418479919433594, 0.18053436279296875, 0.18688392639160156, 0.19323348999023438, 0.1995830535888672, 0.2059326171875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 5.0, 10.0, 8.0, 12.0, 10.0, 12.0, 15.0, 27.0, 23.0, 23.0, 22.0, 18.0, 37.0, 31.0, 36.0, 37.0, 46.0, 45.0, 37.0, 35.0, 1064.0, 48.0, 46.0, 37.0, 39.0, 29.0, 33.0, 30.0, 19.0, 31.0, 26.0, 21.0, 23.0, 19.0, 16.0, 10.0, 10.0, 14.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.404296875, -2.33380126953125, -2.2633056640625, -2.19281005859375, -2.122314453125, -2.05181884765625, -1.9813232421875, -1.91082763671875, -1.84033203125, -1.76983642578125, -1.6993408203125, -1.62884521484375, -1.558349609375, -1.48785400390625, -1.4173583984375, -1.34686279296875, -1.2763671875, -1.20587158203125, -1.1353759765625, -1.06488037109375, -0.994384765625, -0.92388916015625, -0.8533935546875, -0.78289794921875, -0.71240234375, -0.64190673828125, -0.5714111328125, -0.50091552734375, -0.430419921875, -0.35992431640625, -0.2894287109375, -0.21893310546875, -0.1484375, -0.07794189453125, -0.0074462890625, 0.06304931640625, 0.133544921875, 0.20404052734375, 0.2745361328125, 0.34503173828125, 0.41552734375, 0.48602294921875, 0.5565185546875, 0.62701416015625, 0.697509765625, 0.76800537109375, 0.8385009765625, 0.90899658203125, 0.9794921875, 1.04998779296875, 1.1204833984375, 1.19097900390625, 1.261474609375, 1.33197021484375, 1.4024658203125, 1.47296142578125, 1.54345703125, 1.61395263671875, 1.6844482421875, 1.75494384765625, 1.825439453125, 1.89593505859375, 1.9664306640625, 2.03692626953125, 2.107421875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 10.0, 18.0, 24.0, 32.0, 51.0, 77.0, 110.0, 149.0, 216.0, 324.0, 473.0, 671.0, 1032.0, 1545.0, 2330.0, 3279.0, 4763.0, 7101.0, 10474.0, 16130.0, 24501.0, 38090.0, 60583.0, 101898.0, 293096.0, 1226912.0, 115609.0, 66605.0, 41446.0, 26529.0, 17327.0, 11643.0, 7685.0, 5165.0, 3542.0, 2333.0, 1670.0, 1116.0, 773.0, 594.0, 387.0, 265.0, 176.0, 125.0, 85.0, 53.0, 44.0, 22.0, 15.0, 11.0, 9.0, 5.0, 2.0, 3.0, 3.0, 2.0], "bins": [-0.05377197265625, -0.05214738845825195, -0.050522804260253906, -0.04889822006225586, -0.04727363586425781, -0.045649051666259766, -0.04402446746826172, -0.04239988327026367, -0.040775299072265625, -0.03915071487426758, -0.03752613067626953, -0.035901546478271484, -0.03427696228027344, -0.03265237808227539, -0.031027793884277344, -0.029403209686279297, -0.02777862548828125, -0.026154041290283203, -0.024529457092285156, -0.02290487289428711, -0.021280288696289062, -0.019655704498291016, -0.01803112030029297, -0.016406536102294922, -0.014781951904296875, -0.013157367706298828, -0.011532783508300781, -0.009908199310302734, -0.008283615112304688, -0.006659030914306641, -0.005034446716308594, -0.003409862518310547, -0.0017852783203125, -0.00016069412231445312, 0.0014638900756835938, 0.0030884742736816406, 0.0047130584716796875, 0.006337642669677734, 0.007962226867675781, 0.009586811065673828, 0.011211395263671875, 0.012835979461669922, 0.014460563659667969, 0.016085147857666016, 0.017709732055664062, 0.01933431625366211, 0.020958900451660156, 0.022583484649658203, 0.02420806884765625, 0.025832653045654297, 0.027457237243652344, 0.02908182144165039, 0.030706405639648438, 0.032330989837646484, 0.03395557403564453, 0.03558015823364258, 0.037204742431640625, 0.03882932662963867, 0.04045391082763672, 0.042078495025634766, 0.04370307922363281, 0.04532766342163086, 0.046952247619628906, 0.04857683181762695, 0.050201416015625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 8.0, 7.0, 8.0, 22.0, 23.0, 30.0, 29.0, 33.0, 54.0, 62.0, 79.0, 103.0, 125.0, 96.0, 65.0, 45.0, 39.0, 31.0, 24.0, 18.0, 21.0, 14.0, 14.0, 8.0, 5.0, 3.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004258155822753906, -0.0004117041826248169, -0.00039759278297424316, -0.00038348138332366943, -0.0003693699836730957, -0.00035525858402252197, -0.00034114718437194824, -0.0003270357847213745, -0.0003129243850708008, -0.00029881298542022705, -0.0002847015857696533, -0.0002705901861190796, -0.00025647878646850586, -0.00024236738681793213, -0.0002282559871673584, -0.00021414458751678467, -0.00020003318786621094, -0.0001859217882156372, -0.00017181038856506348, -0.00015769898891448975, -0.00014358758926391602, -0.00012947618961334229, -0.00011536478996276855, -0.00010125339031219482, -8.71419906616211e-05, -7.303059101104736e-05, -5.891919136047363e-05, -4.48077917098999e-05, -3.069639205932617e-05, -1.658499240875244e-05, -2.473592758178711e-06, 1.163780689239502e-05, 2.574920654296875e-05, 3.986060619354248e-05, 5.397200584411621e-05, 6.808340549468994e-05, 8.219480514526367e-05, 9.63062047958374e-05, 0.00011041760444641113, 0.00012452900409698486, 0.0001386404037475586, 0.00015275180339813232, 0.00016686320304870605, 0.00018097460269927979, 0.00019508600234985352, 0.00020919740200042725, 0.00022330880165100098, 0.0002374202013015747, 0.00025153160095214844, 0.00026564300060272217, 0.0002797544002532959, 0.00029386579990386963, 0.00030797719955444336, 0.0003220885992050171, 0.0003361999988555908, 0.00035031139850616455, 0.0003644227981567383, 0.000378534197807312, 0.00039264559745788574, 0.00040675699710845947, 0.0004208683967590332, 0.00043497979640960693, 0.00044909119606018066, 0.0004632025957107544, 0.0004773139953613281]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 2.0, 13.0, 10.0, 22.0, 32.0, 47.0, 68.0, 127.0, 224.0, 502.0, 1012.0, 2730.0, 7495.0, 22073.0, 76060.0, 497217.0, 347652.0, 63470.0, 18871.0, 6555.0, 2432.0, 983.0, 411.0, 162.0, 117.0, 85.0, 56.0, 23.0, 27.0, 21.0, 11.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0084991455078125, -0.008248686790466309, -0.007998228073120117, -0.007747769355773926, -0.007497310638427734, -0.007246851921081543, -0.0069963932037353516, -0.00674593448638916, -0.006495475769042969, -0.006245017051696777, -0.005994558334350586, -0.0057440996170043945, -0.005493640899658203, -0.005243182182312012, -0.00499272346496582, -0.004742264747619629, -0.0044918060302734375, -0.004241347312927246, -0.003990888595581055, -0.0037404298782348633, -0.003489971160888672, -0.0032395124435424805, -0.002989053726196289, -0.0027385950088500977, -0.0024881362915039062, -0.002237677574157715, -0.0019872188568115234, -0.001736760139465332, -0.0014863014221191406, -0.0012358427047729492, -0.0009853839874267578, -0.0007349252700805664, -0.000484466552734375, -0.0002340078353881836, 1.6450881958007812e-05, 0.0002669095993041992, 0.0005173683166503906, 0.000767827033996582, 0.0010182857513427734, 0.0012687444686889648, 0.0015192031860351562, 0.0017696619033813477, 0.002020120620727539, 0.0022705793380737305, 0.002521038055419922, 0.0027714967727661133, 0.0030219554901123047, 0.003272414207458496, 0.0035228729248046875, 0.003773331642150879, 0.00402379035949707, 0.004274249076843262, 0.004524707794189453, 0.0047751665115356445, 0.005025625228881836, 0.005276083946228027, 0.005526542663574219, 0.00577700138092041, 0.0060274600982666016, 0.006277918815612793, 0.006528377532958984, 0.006778836250305176, 0.007029294967651367, 0.007279753684997559, 0.00753021240234375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 22.0, 31.0, 94.0, 480.0, 283.0, 73.0, 19.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011955345049500465, -0.011669577099382877, -0.01138380914926529, -0.011098040267825127, -0.010812272317707539, -0.01052650436758995, -0.010240736417472363, -0.009954968467354774, -0.009669199585914612, -0.009383431635797024, -0.009097663685679436, -0.008811894804239273, -0.008526126854121685, -0.008240358904004097, -0.007954590953886509, -0.007668822538107634, -0.0073830545879900455, -0.0070972866378724575, -0.006811518222093582, -0.006525750271975994, -0.006239981856197119, -0.005954213906079531, -0.005668445490300655, -0.005382677540183067, -0.005096909590065479, -0.004811141639947891, -0.004525373224169016, -0.004239605274051428, -0.0039538368582725525, -0.0036680689081549644, -0.0033823007252067327, -0.003096532542258501, -0.0028107636608183384, -0.0025249954778701067, -0.002239227294921875, -0.001953459344804287, -0.0016676910454407334, -0.0013819228624925017, -0.0010961547959595919, -0.0008103866130113602, -0.0005246184300631285, -0.00023885027621872723, 4.691787762567401e-05, 0.0003326860023662448, 0.0006184541853144765, 0.0009042223682627082, 0.001189990434795618, 0.0014757586177438498, 0.0017615268006920815, 0.002047294983640313, 0.002333063166588545, 0.002618831116706133, 0.0029045995324850082, 0.0031903674826025963, 0.003476135665550828, 0.0037619038484990597, 0.004047672264277935, 0.004333440214395523, 0.004619208630174398, 0.0049049765802919865, 0.005190744996070862, 0.00547651294618845, 0.005762280896306038, 0.006048049312084913, 0.006333817262202501]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 8.0, 5.0, 6.0, 3.0, 19.0, 20.0, 18.0, 25.0, 40.0, 36.0, 50.0, 54.0, 64.0, 49.0, 72.0, 82.0, 59.0, 59.0, 61.0, 62.0, 50.0, 37.0, 24.0, 27.0, 24.0, 14.0, 9.0, 10.0, 5.0, 7.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041168928146362305, -0.00039730407297611237, -0.0003829188644886017, -0.000368533656001091, -0.0003541484475135803, -0.00033976323902606964, -0.00032537803053855896, -0.0003109928220510483, -0.0002966076135635376, -0.0002822224050760269, -0.00026783719658851624, -0.00025345198810100555, -0.00023906677961349487, -0.0002246815711259842, -0.0002102963626384735, -0.00019591115415096283, -0.00018152594566345215, -0.00016714073717594147, -0.00015275552868843079, -0.0001383703202009201, -0.00012398511171340942, -0.00010959990322589874, -9.521469473838806e-05, -8.082948625087738e-05, -6.64442777633667e-05, -5.205906927585602e-05, -3.767386078834534e-05, -2.3288652300834656e-05, -8.903443813323975e-06, 5.4817646741867065e-06, 1.9866973161697388e-05, 3.425218164920807e-05, 4.863739013671875e-05, 6.302259862422943e-05, 7.740780711174011e-05, 9.17930155992508e-05, 0.00010617822408676147, 0.00012056343257427216, 0.00013494864106178284, 0.00014933384954929352, 0.0001637190580368042, 0.00017810426652431488, 0.00019248947501182556, 0.00020687468349933624, 0.00022125989198684692, 0.0002356451004743576, 0.0002500303089618683, 0.00026441551744937897, 0.00027880072593688965, 0.00029318593442440033, 0.000307571142911911, 0.0003219563513994217, 0.0003363415598869324, 0.00035072676837444305, 0.00036511197686195374, 0.0003794971853494644, 0.0003938823938369751, 0.0004082676023244858, 0.00042265281081199646, 0.00043703801929950714, 0.0004514232277870178, 0.0004658084362745285, 0.0004801936447620392, 0.0004945788532495499, 0.0005089640617370605]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 5.0, 8.0, 11.0, 9.0, 18.0, 23.0, 26.0, 32.0, 41.0, 39.0, 50.0, 44.0, 44.0, 70.0, 77.0, 50.0, 71.0, 55.0, 62.0, 48.0, 37.0, 34.0, 31.0, 29.0, 16.0, 14.0, 20.0, 12.0, 9.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.46875, -3.366546630859375, -3.26434326171875, -3.162139892578125, -3.0599365234375, -2.957733154296875, -2.85552978515625, -2.753326416015625, -2.651123046875, -2.548919677734375, -2.44671630859375, -2.344512939453125, -2.2423095703125, -2.140106201171875, -2.03790283203125, -1.935699462890625, -1.83349609375, -1.731292724609375, -1.62908935546875, -1.526885986328125, -1.4246826171875, -1.322479248046875, -1.22027587890625, -1.118072509765625, -1.015869140625, -0.913665771484375, -0.81146240234375, -0.709259033203125, -0.6070556640625, -0.504852294921875, -0.40264892578125, -0.300445556640625, -0.1982421875, -0.096038818359375, 0.00616455078125, 0.108367919921875, 0.2105712890625, 0.312774658203125, 0.41497802734375, 0.517181396484375, 0.619384765625, 0.721588134765625, 0.82379150390625, 0.925994873046875, 1.0281982421875, 1.130401611328125, 1.23260498046875, 1.334808349609375, 1.43701171875, 1.539215087890625, 1.64141845703125, 1.743621826171875, 1.8458251953125, 1.948028564453125, 2.05023193359375, 2.152435302734375, 2.254638671875, 2.356842041015625, 2.45904541015625, 2.561248779296875, 2.6634521484375, 2.765655517578125, 2.86785888671875, 2.970062255859375, 3.072265625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 12.0, 11.0, 17.0, 38.0, 47.0, 56.0, 119.0, 210.0, 359.0, 723.0, 1440.0, 3097.0, 7990.0, 29927.0, 213577.0, 681614.0, 83676.0, 16091.0, 5143.0, 2130.0, 1023.0, 536.0, 312.0, 153.0, 88.0, 56.0, 33.0, 28.0, 18.0, 7.0, 5.0, 3.0, 8.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.60546875, -7.34576416015625, -7.0860595703125, -6.82635498046875, -6.566650390625, -6.30694580078125, -6.0472412109375, -5.78753662109375, -5.52783203125, -5.26812744140625, -5.0084228515625, -4.74871826171875, -4.489013671875, -4.22930908203125, -3.9696044921875, -3.70989990234375, -3.4501953125, -3.19049072265625, -2.9307861328125, -2.67108154296875, -2.411376953125, -2.15167236328125, -1.8919677734375, -1.63226318359375, -1.37255859375, -1.11285400390625, -0.8531494140625, -0.59344482421875, -0.333740234375, -0.07403564453125, 0.1856689453125, 0.44537353515625, 0.705078125, 0.96478271484375, 1.2244873046875, 1.48419189453125, 1.743896484375, 2.00360107421875, 2.2633056640625, 2.52301025390625, 2.78271484375, 3.04241943359375, 3.3021240234375, 3.56182861328125, 3.821533203125, 4.08123779296875, 4.3409423828125, 4.60064697265625, 4.8603515625, 5.12005615234375, 5.3797607421875, 5.63946533203125, 5.899169921875, 6.15887451171875, 6.4185791015625, 6.67828369140625, 6.93798828125, 7.19769287109375, 7.4573974609375, 7.71710205078125, 7.976806640625, 8.23651123046875, 8.4962158203125, 8.75592041015625, 9.015625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 9.0, 3.0, 8.0, 11.0, 11.0, 8.0, 21.0, 17.0, 18.0, 19.0, 20.0, 26.0, 30.0, 34.0, 46.0, 53.0, 57.0, 80.0, 107.0, 215.0, 1438.0, 200.0, 129.0, 72.0, 60.0, 54.0, 53.0, 38.0, 36.0, 32.0, 22.0, 13.0, 26.0, 13.0, 7.0, 13.0, 13.0, 4.0, 9.0, 3.0, 3.0, 7.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9375, -7.68505859375, -7.4326171875, -7.18017578125, -6.927734375, -6.67529296875, -6.4228515625, -6.17041015625, -5.91796875, -5.66552734375, -5.4130859375, -5.16064453125, -4.908203125, -4.65576171875, -4.4033203125, -4.15087890625, -3.8984375, -3.64599609375, -3.3935546875, -3.14111328125, -2.888671875, -2.63623046875, -2.3837890625, -2.13134765625, -1.87890625, -1.62646484375, -1.3740234375, -1.12158203125, -0.869140625, -0.61669921875, -0.3642578125, -0.11181640625, 0.140625, 0.39306640625, 0.6455078125, 0.89794921875, 1.150390625, 1.40283203125, 1.6552734375, 1.90771484375, 2.16015625, 2.41259765625, 2.6650390625, 2.91748046875, 3.169921875, 3.42236328125, 3.6748046875, 3.92724609375, 4.1796875, 4.43212890625, 4.6845703125, 4.93701171875, 5.189453125, 5.44189453125, 5.6943359375, 5.94677734375, 6.19921875, 6.45166015625, 6.7041015625, 6.95654296875, 7.208984375, 7.46142578125, 7.7138671875, 7.96630859375, 8.21875]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 2.0, 6.0, 6.0, 5.0, 8.0, 10.0, 13.0, 9.0, 16.0, 20.0, 30.0, 29.0, 38.0, 50.0, 73.0, 127.0, 212.0, 313.0, 702.0, 2246.0, 9510.0, 92946.0, 2484608.0, 521254.0, 26629.0, 4299.0, 1269.0, 498.0, 233.0, 135.0, 92.0, 78.0, 51.0, 29.0, 25.0, 26.0, 22.0, 10.0, 14.0, 15.0, 13.0, 10.0, 4.0, 3.0, 4.0, 6.0, 0.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.375, -11.97265625, -11.5703125, -11.16796875, -10.765625, -10.36328125, -9.9609375, -9.55859375, -9.15625, -8.75390625, -8.3515625, -7.94921875, -7.546875, -7.14453125, -6.7421875, -6.33984375, -5.9375, -5.53515625, -5.1328125, -4.73046875, -4.328125, -3.92578125, -3.5234375, -3.12109375, -2.71875, -2.31640625, -1.9140625, -1.51171875, -1.109375, -0.70703125, -0.3046875, 0.09765625, 0.5, 0.90234375, 1.3046875, 1.70703125, 2.109375, 2.51171875, 2.9140625, 3.31640625, 3.71875, 4.12109375, 4.5234375, 4.92578125, 5.328125, 5.73046875, 6.1328125, 6.53515625, 6.9375, 7.33984375, 7.7421875, 8.14453125, 8.546875, 8.94921875, 9.3515625, 9.75390625, 10.15625, 10.55859375, 10.9609375, 11.36328125, 11.765625, 12.16796875, 12.5703125, 12.97265625, 13.375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 9.0, 11.0, 41.0, 67.0, 118.0, 157.0, 165.0, 187.0, 124.0, 60.0, 45.0, 15.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.619930267333984, -33.673526763916016, -32.72712707519531, -31.780723571777344, -30.834320068359375, -29.88791847229004, -28.941516876220703, -27.995113372802734, -27.0487117767334, -26.102310180664062, -25.155906677246094, -24.209505081176758, -23.26310157775879, -22.316699981689453, -21.370296478271484, -20.42389488220215, -19.477493286132812, -18.531091690063477, -17.584688186645508, -16.638286590576172, -15.69188404083252, -14.745481491088867, -13.799078941345215, -12.852676391601562, -11.906272888183594, -10.959870338439941, -10.013467788696289, -9.067066192626953, -8.1206636428833, -7.174261093139648, -6.227858543395996, -5.281456470489502, -4.335054397583008, -3.3886520862579346, -2.4422497749328613, -1.495847225189209, -0.5494449138641357, 0.3969573974609375, 1.3433599472045898, 2.289762020111084, 3.2361645698547363, 4.182567119598389, 5.128969192504883, 6.075371742248535, 7.0217742919921875, 7.968176364898682, 8.914579391479492, 9.860980987548828, 10.80738353729248, 11.753786087036133, 12.700188636779785, 13.646591186523438, 14.592992782592773, 15.539395332336426, 16.485797882080078, 17.432199478149414, 18.378602981567383, 19.32500457763672, 20.271408081054688, 21.217809677124023, 22.164213180541992, 23.110614776611328, 24.057018280029297, 25.003419876098633, 25.94982147216797]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 6.0, 12.0, 21.0, 16.0, 13.0, 19.0, 30.0, 26.0, 37.0, 35.0, 31.0, 34.0, 41.0, 48.0, 54.0, 53.0, 45.0, 48.0, 42.0, 44.0, 41.0, 67.0, 34.0, 34.0, 35.0, 18.0, 26.0, 21.0, 15.0, 18.0, 9.0, 5.0, 9.0, 1.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-33.14874267578125, -32.308895111083984, -31.469051361083984, -30.62920379638672, -29.789358139038086, -28.949512481689453, -28.109664916992188, -27.269819259643555, -26.429973602294922, -25.59012794494629, -24.750282287597656, -23.91043472290039, -23.070589065551758, -22.230743408203125, -21.39089584350586, -20.551050186157227, -19.711204528808594, -18.87135887145996, -18.031513214111328, -17.191665649414062, -16.35181999206543, -15.511974334716797, -14.672127723693848, -13.832281112670898, -12.992435455322266, -12.152589797973633, -11.312743186950684, -10.472896575927734, -9.633050918579102, -8.793205261230469, -7.9533586502075195, -7.1135125160217285, -6.27366828918457, -5.433822154998779, -4.593976020812988, -3.7541298866271973, -2.9142837524414062, -2.0744376182556152, -1.2345914840698242, -0.3947453498840332, 0.4451007843017578, 1.2849469184875488, 2.12479305267334, 2.964639186859131, 3.804485321044922, 4.644331455230713, 5.484177589416504, 6.324023723602295, 7.163869857788086, 8.003715515136719, 8.843562126159668, 9.683408737182617, 10.52325439453125, 11.363100051879883, 12.202946662902832, 13.042793273925781, 13.882638931274414, 14.722484588623047, 15.562331199645996, 16.402177810668945, 17.242023468017578, 18.08186912536621, 18.921714782714844, 19.76156234741211, 20.601408004760742]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 8.0, 6.0, 6.0, 11.0, 10.0, 20.0, 23.0, 29.0, 34.0, 37.0, 40.0, 45.0, 50.0, 55.0, 51.0, 77.0, 48.0, 65.0, 59.0, 56.0, 45.0, 42.0, 30.0, 29.0, 38.0, 16.0, 16.0, 17.0, 15.0, 5.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.439453125, -3.338043212890625, -3.23663330078125, -3.135223388671875, -3.0338134765625, -2.932403564453125, -2.83099365234375, -2.729583740234375, -2.628173828125, -2.526763916015625, -2.42535400390625, -2.323944091796875, -2.2225341796875, -2.121124267578125, -2.01971435546875, -1.918304443359375, -1.81689453125, -1.715484619140625, -1.61407470703125, -1.512664794921875, -1.4112548828125, -1.309844970703125, -1.20843505859375, -1.107025146484375, -1.005615234375, -0.904205322265625, -0.80279541015625, -0.701385498046875, -0.5999755859375, -0.498565673828125, -0.39715576171875, -0.295745849609375, -0.1943359375, -0.092926025390625, 0.00848388671875, 0.109893798828125, 0.2113037109375, 0.312713623046875, 0.41412353515625, 0.515533447265625, 0.616943359375, 0.718353271484375, 0.81976318359375, 0.921173095703125, 1.0225830078125, 1.123992919921875, 1.22540283203125, 1.326812744140625, 1.42822265625, 1.529632568359375, 1.63104248046875, 1.732452392578125, 1.8338623046875, 1.935272216796875, 2.03668212890625, 2.138092041015625, 2.239501953125, 2.340911865234375, 2.44232177734375, 2.543731689453125, 2.6451416015625, 2.746551513671875, 2.84796142578125, 2.949371337890625, 3.05078125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 1.0, 7.0, 6.0, 6.0, 7.0, 11.0, 10.0, 29.0, 22.0, 42.0, 76.0, 91.0, 149.0, 238.0, 352.0, 620.0, 1002.0, 1915.0, 3732.0, 9306.0, 33895.0, 306256.0, 2941836.0, 803864.0, 66576.0, 14207.0, 5083.0, 2302.0, 1095.0, 583.0, 365.0, 196.0, 135.0, 89.0, 60.0, 32.0, 29.0, 18.0, 10.0, 10.0, 4.0, 9.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-10.4296875, -10.15283203125, -9.8759765625, -9.59912109375, -9.322265625, -9.04541015625, -8.7685546875, -8.49169921875, -8.21484375, -7.93798828125, -7.6611328125, -7.38427734375, -7.107421875, -6.83056640625, -6.5537109375, -6.27685546875, -6.0, -5.72314453125, -5.4462890625, -5.16943359375, -4.892578125, -4.61572265625, -4.3388671875, -4.06201171875, -3.78515625, -3.50830078125, -3.2314453125, -2.95458984375, -2.677734375, -2.40087890625, -2.1240234375, -1.84716796875, -1.5703125, -1.29345703125, -1.0166015625, -0.73974609375, -0.462890625, -0.18603515625, 0.0908203125, 0.36767578125, 0.64453125, 0.92138671875, 1.1982421875, 1.47509765625, 1.751953125, 2.02880859375, 2.3056640625, 2.58251953125, 2.859375, 3.13623046875, 3.4130859375, 3.68994140625, 3.966796875, 4.24365234375, 4.5205078125, 4.79736328125, 5.07421875, 5.35107421875, 5.6279296875, 5.90478515625, 6.181640625, 6.45849609375, 6.7353515625, 7.01220703125, 7.2890625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 15.0, 12.0, 24.0, 50.0, 48.0, 103.0, 181.0, 265.0, 402.0, 669.0, 741.0, 593.0, 353.0, 215.0, 136.0, 84.0, 53.0, 37.0, 18.0, 18.0, 9.0, 8.0, 5.0, 6.0, 8.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4453125, -9.1614990234375, -8.877685546875, -8.5938720703125, -8.31005859375, -8.0262451171875, -7.742431640625, -7.4586181640625, -7.1748046875, -6.8909912109375, -6.607177734375, -6.3233642578125, -6.03955078125, -5.7557373046875, -5.471923828125, -5.1881103515625, -4.904296875, -4.6204833984375, -4.336669921875, -4.0528564453125, -3.76904296875, -3.4852294921875, -3.201416015625, -2.9176025390625, -2.6337890625, -2.3499755859375, -2.066162109375, -1.7823486328125, -1.49853515625, -1.2147216796875, -0.930908203125, -0.6470947265625, -0.36328125, -0.0794677734375, 0.204345703125, 0.4881591796875, 0.77197265625, 1.0557861328125, 1.339599609375, 1.6234130859375, 1.9072265625, 2.1910400390625, 2.474853515625, 2.7586669921875, 3.04248046875, 3.3262939453125, 3.610107421875, 3.8939208984375, 4.177734375, 4.4615478515625, 4.745361328125, 5.0291748046875, 5.31298828125, 5.5968017578125, 5.880615234375, 6.1644287109375, 6.4482421875, 6.7320556640625, 7.015869140625, 7.2996826171875, 7.58349609375, 7.8673095703125, 8.151123046875, 8.4349365234375, 8.71875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 6.0, 6.0, 3.0, 13.0, 9.0, 16.0, 27.0, 55.0, 84.0, 148.0, 321.0, 792.0, 2448.0, 10601.0, 93374.0, 3260176.0, 788317.0, 30016.0, 5358.0, 1477.0, 550.0, 224.0, 110.0, 73.0, 31.0, 19.0, 12.0, 10.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.84375, -21.134033203125, -20.42431640625, -19.714599609375, -19.0048828125, -18.295166015625, -17.58544921875, -16.875732421875, -16.166015625, -15.456298828125, -14.74658203125, -14.036865234375, -13.3271484375, -12.617431640625, -11.90771484375, -11.197998046875, -10.48828125, -9.778564453125, -9.06884765625, -8.359130859375, -7.6494140625, -6.939697265625, -6.22998046875, -5.520263671875, -4.810546875, -4.100830078125, -3.39111328125, -2.681396484375, -1.9716796875, -1.261962890625, -0.55224609375, 0.157470703125, 0.8671875, 1.576904296875, 2.28662109375, 2.996337890625, 3.7060546875, 4.415771484375, 5.12548828125, 5.835205078125, 6.544921875, 7.254638671875, 7.96435546875, 8.674072265625, 9.3837890625, 10.093505859375, 10.80322265625, 11.512939453125, 12.22265625, 12.932373046875, 13.64208984375, 14.351806640625, 15.0615234375, 15.771240234375, 16.48095703125, 17.190673828125, 17.900390625, 18.610107421875, 19.31982421875, 20.029541015625, 20.7392578125, 21.448974609375, 22.15869140625, 22.868408203125, 23.578125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 12.0, 29.0, 29.0, 50.0, 55.0, 98.0, 109.0, 110.0, 133.0, 108.0, 92.0, 63.0, 34.0, 38.0, 11.0, 15.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.41304016113281, -65.94137573242188, -64.46971130371094, -62.998046875, -61.52638244628906, -60.054718017578125, -58.58305358886719, -57.11138916015625, -55.63972473144531, -54.168060302734375, -52.69639587402344, -51.2247314453125, -49.75306701660156, -48.281402587890625, -46.80973815917969, -45.33807373046875, -43.86641311645508, -42.39474868774414, -40.9230842590332, -39.451419830322266, -37.97975540161133, -36.50809097290039, -35.03643035888672, -33.56476593017578, -32.093101501464844, -30.621437072753906, -29.14977264404297, -27.67810821533203, -26.206443786621094, -24.734779357910156, -23.26311683654785, -21.791452407836914, -20.319787979125977, -18.84812355041504, -17.3764591217041, -15.90479564666748, -14.433131217956543, -12.961466789245605, -11.489803314208984, -10.018138885498047, -8.54647445678711, -7.074810028076172, -5.603146076202393, -4.131482124328613, -2.659817695617676, -1.1881532669067383, 0.2835102081298828, 1.7551746368408203, 3.226839065551758, 4.698503494262695, 6.170167446136475, 7.641831398010254, 9.113495826721191, 10.585160255432129, 12.05682373046875, 13.528488159179688, 15.000152587890625, 16.471817016601562, 17.9434814453125, 19.415145874023438, 20.886810302734375, 22.358474731445312, 23.830137252807617, 25.301801681518555, 26.773466110229492]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 6.0, 4.0, 3.0, 4.0, 6.0, 7.0, 13.0, 3.0, 8.0, 14.0, 17.0, 11.0, 22.0, 19.0, 20.0, 25.0, 29.0, 24.0, 29.0, 40.0, 37.0, 40.0, 38.0, 32.0, 36.0, 31.0, 41.0, 37.0, 36.0, 33.0, 32.0, 30.0, 28.0, 34.0, 35.0, 24.0, 24.0, 19.0, 13.0, 16.0, 20.0, 9.0, 10.0, 14.0, 6.0, 7.0, 6.0, 4.0, 4.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.286697387695312, -19.62721061706543, -18.967721939086914, -18.30823516845703, -17.648746490478516, -16.989259719848633, -16.32977294921875, -15.670284271240234, -15.010797500610352, -14.351309776306152, -13.691822052001953, -13.03233528137207, -12.372847557067871, -11.713359832763672, -11.053872108459473, -10.394384384155273, -9.734896659851074, -9.075408935546875, -8.415921211242676, -7.756433963775635, -7.096946716308594, -6.4374589920043945, -5.777971267700195, -5.118484020233154, -4.458996295928955, -3.799508810043335, -3.140021324157715, -2.4805335998535156, -1.8210461139678955, -1.1615586280822754, -0.5020709037780762, 0.15741634368896484, 0.8169040679931641, 1.4763915538787842, 2.1358790397644043, 2.7953667640686035, 3.4548542499542236, 4.114341735839844, 4.773829460144043, 5.433316707611084, 6.092804431915283, 6.752292156219482, 7.411779403686523, 8.071267127990723, 8.730754852294922, 9.390241622924805, 10.04973030090332, 10.709217071533203, 11.368704795837402, 12.028192520141602, 12.6876802444458, 13.34716796875, 14.006654739379883, 14.666142463684082, 15.325630187988281, 15.985116958618164, 16.64460563659668, 17.304092407226562, 17.963581085205078, 18.62306785583496, 19.282556533813477, 19.94204330444336, 20.601531982421875, 21.261018753051758, 21.92050552368164]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 7.0, 10.0, 13.0, 6.0, 12.0, 20.0, 15.0, 24.0, 28.0, 47.0, 33.0, 32.0, 53.0, 47.0, 59.0, 64.0, 48.0, 52.0, 56.0, 63.0, 49.0, 49.0, 27.0, 44.0, 34.0, 22.0, 19.0, 11.0, 14.0, 10.0, 14.0, 9.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.3046875, -3.20623779296875, -3.1077880859375, -3.00933837890625, -2.910888671875, -2.81243896484375, -2.7139892578125, -2.61553955078125, -2.51708984375, -2.41864013671875, -2.3201904296875, -2.22174072265625, -2.123291015625, -2.02484130859375, -1.9263916015625, -1.82794189453125, -1.7294921875, -1.63104248046875, -1.5325927734375, -1.43414306640625, -1.335693359375, -1.23724365234375, -1.1387939453125, -1.04034423828125, -0.94189453125, -0.84344482421875, -0.7449951171875, -0.64654541015625, -0.548095703125, -0.44964599609375, -0.3511962890625, -0.25274658203125, -0.154296875, -0.05584716796875, 0.0426025390625, 0.14105224609375, 0.239501953125, 0.33795166015625, 0.4364013671875, 0.53485107421875, 0.63330078125, 0.73175048828125, 0.8302001953125, 0.92864990234375, 1.027099609375, 1.12554931640625, 1.2239990234375, 1.32244873046875, 1.4208984375, 1.51934814453125, 1.6177978515625, 1.71624755859375, 1.814697265625, 1.91314697265625, 2.0115966796875, 2.11004638671875, 2.20849609375, 2.30694580078125, 2.4053955078125, 2.50384521484375, 2.602294921875, 2.70074462890625, 2.7991943359375, 2.89764404296875, 2.99609375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 7.0, 7.0, 2.0, 15.0, 8.0, 19.0, 34.0, 33.0, 53.0, 76.0, 119.0, 177.0, 249.0, 379.0, 625.0, 968.0, 1508.0, 2437.0, 4030.0, 6729.0, 11533.0, 20448.0, 37486.0, 73295.0, 155196.0, 373173.0, 181514.0, 82641.0, 41850.0, 22304.0, 12552.0, 7411.0, 4412.0, 2672.0, 1632.0, 1037.0, 648.0, 414.0, 291.0, 165.0, 131.0, 89.0, 62.0, 37.0, 28.0, 19.0, 17.0, 12.0, 8.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1591796875, -0.15379905700683594, -0.14841842651367188, -0.1430377960205078, -0.13765716552734375, -0.1322765350341797, -0.12689590454101562, -0.12151527404785156, -0.1161346435546875, -0.11075401306152344, -0.10537338256835938, -0.09999275207519531, -0.09461212158203125, -0.08923149108886719, -0.08385086059570312, -0.07847023010253906, -0.073089599609375, -0.06770896911621094, -0.062328338623046875, -0.05694770812988281, -0.05156707763671875, -0.04618644714355469, -0.040805816650390625, -0.03542518615722656, -0.0300445556640625, -0.024663925170898438, -0.019283294677734375, -0.013902664184570312, -0.00852203369140625, -0.0031414031982421875, 0.002239227294921875, 0.0076198577880859375, 0.01300048828125, 0.018381118774414062, 0.023761749267578125, 0.029142379760742188, 0.03452301025390625, 0.03990364074707031, 0.045284271240234375, 0.05066490173339844, 0.0560455322265625, 0.06142616271972656, 0.06680679321289062, 0.07218742370605469, 0.07756805419921875, 0.08294868469238281, 0.08832931518554688, 0.09370994567871094, 0.099090576171875, 0.10447120666503906, 0.10985183715820312, 0.11523246765136719, 0.12061309814453125, 0.1259937286376953, 0.13137435913085938, 0.13675498962402344, 0.1421356201171875, 0.14751625061035156, 0.15289688110351562, 0.1582775115966797, 0.16365814208984375, 0.1690387725830078, 0.17441940307617188, 0.17980003356933594, 0.1851806640625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 7.0, 7.0, 7.0, 16.0, 17.0, 10.0, 14.0, 21.0, 24.0, 15.0, 24.0, 30.0, 49.0, 39.0, 29.0, 33.0, 38.0, 36.0, 43.0, 1056.0, 34.0, 53.0, 42.0, 34.0, 43.0, 36.0, 27.0, 34.0, 35.0, 23.0, 29.0, 20.0, 14.0, 18.0, 16.0, 8.0, 11.0, 8.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.37890625, -2.306121826171875, -2.23333740234375, -2.160552978515625, -2.0877685546875, -2.014984130859375, -1.94219970703125, -1.869415283203125, -1.796630859375, -1.723846435546875, -1.65106201171875, -1.578277587890625, -1.5054931640625, -1.432708740234375, -1.35992431640625, -1.287139892578125, -1.21435546875, -1.141571044921875, -1.06878662109375, -0.996002197265625, -0.9232177734375, -0.850433349609375, -0.77764892578125, -0.704864501953125, -0.632080078125, -0.559295654296875, -0.48651123046875, -0.413726806640625, -0.3409423828125, -0.268157958984375, -0.19537353515625, -0.122589111328125, -0.0498046875, 0.022979736328125, 0.09576416015625, 0.168548583984375, 0.2413330078125, 0.314117431640625, 0.38690185546875, 0.459686279296875, 0.532470703125, 0.605255126953125, 0.67803955078125, 0.750823974609375, 0.8236083984375, 0.896392822265625, 0.96917724609375, 1.041961669921875, 1.11474609375, 1.187530517578125, 1.26031494140625, 1.333099365234375, 1.4058837890625, 1.478668212890625, 1.55145263671875, 1.624237060546875, 1.697021484375, 1.769805908203125, 1.84259033203125, 1.915374755859375, 1.9881591796875, 2.060943603515625, 2.13372802734375, 2.206512451171875, 2.279296875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 6.0, 3.0, 11.0, 19.0, 25.0, 37.0, 48.0, 59.0, 107.0, 146.0, 248.0, 372.0, 609.0, 928.0, 1504.0, 2485.0, 4064.0, 6667.0, 11110.0, 19128.0, 33240.0, 59091.0, 112393.0, 463412.0, 1120311.0, 116002.0, 61607.0, 34550.0, 19844.0, 11503.0, 6859.0, 4009.0, 2436.0, 1550.0, 958.0, 630.0, 402.0, 254.0, 182.0, 94.0, 88.0, 54.0, 29.0, 24.0, 13.0, 8.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.06866455078125, -0.06658554077148438, -0.06450653076171875, -0.062427520751953125, -0.0603485107421875, -0.058269500732421875, -0.05619049072265625, -0.054111480712890625, -0.052032470703125, -0.049953460693359375, -0.04787445068359375, -0.045795440673828125, -0.0437164306640625, -0.041637420654296875, -0.03955841064453125, -0.037479400634765625, -0.035400390625, -0.033321380615234375, -0.03124237060546875, -0.029163360595703125, -0.0270843505859375, -0.025005340576171875, -0.02292633056640625, -0.020847320556640625, -0.018768310546875, -0.016689300537109375, -0.01461029052734375, -0.012531280517578125, -0.0104522705078125, -0.008373260498046875, -0.00629425048828125, -0.004215240478515625, -0.00213623046875, -5.7220458984375e-05, 0.00202178955078125, 0.004100799560546875, 0.0061798095703125, 0.008258819580078125, 0.01033782958984375, 0.012416839599609375, 0.014495849609375, 0.016574859619140625, 0.01865386962890625, 0.020732879638671875, 0.0228118896484375, 0.024890899658203125, 0.02696990966796875, 0.029048919677734375, 0.0311279296875, 0.033206939697265625, 0.03528594970703125, 0.037364959716796875, 0.0394439697265625, 0.041522979736328125, 0.04360198974609375, 0.045680999755859375, 0.047760009765625, 0.049839019775390625, 0.05191802978515625, 0.053997039794921875, 0.0560760498046875, 0.058155059814453125, 0.06023406982421875, 0.062313079833984375, 0.06439208984375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 9.0, 13.0, 8.0, 19.0, 27.0, 14.0, 25.0, 27.0, 33.0, 57.0, 98.0, 135.0, 141.0, 106.0, 64.0, 44.0, 33.0, 25.0, 20.0, 17.0, 13.0, 11.0, 12.0, 5.0, 9.0, 6.0, 13.0, 1.0, 2.0, 4.0, 0.0, 0.0, 3.0], "bins": [-0.0008792877197265625, -0.0008589327335357666, -0.0008385777473449707, -0.0008182227611541748, -0.0007978677749633789, -0.000777512788772583, -0.0007571578025817871, -0.0007368028163909912, -0.0007164478302001953, -0.0006960928440093994, -0.0006757378578186035, -0.0006553828716278076, -0.0006350278854370117, -0.0006146728992462158, -0.0005943179130554199, -0.000573962926864624, -0.0005536079406738281, -0.0005332529544830322, -0.0005128979682922363, -0.0004925429821014404, -0.00047218799591064453, -0.00045183300971984863, -0.00043147802352905273, -0.00041112303733825684, -0.00039076805114746094, -0.00037041306495666504, -0.00035005807876586914, -0.00032970309257507324, -0.00030934810638427734, -0.00028899312019348145, -0.00026863813400268555, -0.00024828314781188965, -0.00022792816162109375, -0.00020757317543029785, -0.00018721818923950195, -0.00016686320304870605, -0.00014650821685791016, -0.00012615323066711426, -0.00010579824447631836, -8.544325828552246e-05, -6.508827209472656e-05, -4.4733285903930664e-05, -2.4378299713134766e-05, -4.023313522338867e-06, 1.633167266845703e-05, 3.668665885925293e-05, 5.704164505004883e-05, 7.739663124084473e-05, 9.775161743164062e-05, 0.00011810660362243652, 0.00013846158981323242, 0.00015881657600402832, 0.00017917156219482422, 0.00019952654838562012, 0.00021988153457641602, 0.00024023652076721191, 0.0002605915069580078, 0.0002809464931488037, 0.0003013014793395996, 0.0003216564655303955, 0.0003420114517211914, 0.0003623664379119873, 0.0003827214241027832, 0.0004030764102935791, 0.000423431396484375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 4.0, 7.0, 5.0, 5.0, 8.0, 19.0, 22.0, 39.0, 57.0, 77.0, 147.0, 395.0, 1437.0, 6725.0, 45574.0, 692586.0, 269826.0, 25807.0, 4216.0, 968.0, 294.0, 134.0, 78.0, 39.0, 21.0, 20.0, 16.0, 9.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00806427001953125, -0.007739901542663574, -0.0074155330657958984, -0.007091164588928223, -0.006766796112060547, -0.006442427635192871, -0.006118059158325195, -0.0057936906814575195, -0.005469322204589844, -0.005144953727722168, -0.004820585250854492, -0.004496216773986816, -0.004171848297119141, -0.003847479820251465, -0.003523111343383789, -0.0031987428665161133, -0.0028743743896484375, -0.0025500059127807617, -0.002225637435913086, -0.0019012689590454102, -0.0015769004821777344, -0.0012525320053100586, -0.0009281635284423828, -0.000603795051574707, -0.00027942657470703125, 4.494190216064453e-05, 0.0003693103790283203, 0.0006936788558959961, 0.0010180473327636719, 0.0013424158096313477, 0.0016667842864990234, 0.0019911527633666992, 0.002315521240234375, 0.0026398897171020508, 0.0029642581939697266, 0.0032886266708374023, 0.003612995147705078, 0.003937363624572754, 0.00426173210144043, 0.0045861005783081055, 0.004910469055175781, 0.005234837532043457, 0.005559206008911133, 0.005883574485778809, 0.006207942962646484, 0.00653231143951416, 0.006856679916381836, 0.007181048393249512, 0.0075054168701171875, 0.007829785346984863, 0.008154153823852539, 0.008478522300720215, 0.00880289077758789, 0.009127259254455566, 0.009451627731323242, 0.009775996208190918, 0.010100364685058594, 0.01042473316192627, 0.010749101638793945, 0.011073470115661621, 0.011397838592529297, 0.011722207069396973, 0.012046575546264648, 0.012370944023132324, 0.0126953125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 11.0, 33.0, 86.0, 282.0, 413.0, 106.0, 49.0, 14.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004466247744858265, -0.004313251003623009, -0.0041602542623877525, -0.004007257521152496, -0.0038542605470865965, -0.0037012638058513403, -0.0035482668317854404, -0.0033952700905501842, -0.003242273349314928, -0.003089276608079672, -0.0029362798668444157, -0.002783282892778516, -0.0026302861515432596, -0.0024772894103080034, -0.0023242924362421036, -0.0021712956950068474, -0.002018298953771591, -0.001865302212536335, -0.001712305354885757, -0.001559308497235179, -0.0014063117559999228, -0.0012533150147646666, -0.0011003181571140885, -0.0009473212994635105, -0.0007943245582282543, -0.0006413277587853372, -0.0004883309593424201, -0.000335334159899503, -0.00018233736045658588, -2.9340561013668776e-05, 0.00012365623842924833, 0.00027665309607982635, 0.00042965030297636986, 0.000582647102419287, 0.0007356439018622041, 0.0008886407013051212, 0.0010416375007480383, 0.0011946342419832945, 0.0013476310996338725, 0.0015006279572844505, 0.0016536246985197067, 0.001806621439754963, 0.001959618180990219, 0.002112615155056119, 0.002265611896291375, 0.0024186086375266314, 0.002571605611592531, 0.0027246023528277874, 0.0028775990940630436, 0.0030305958352983, 0.003183592576533556, 0.003336589550599456, 0.003489586291834712, 0.0036425830330699682, 0.003795580007135868, 0.003948576748371124, 0.0041015734896063805, 0.004254570230841637, 0.004407566972076893, 0.004560563713312149, 0.004713560454547405, 0.004866557661443949, 0.005019554402679205, 0.005172551143914461, 0.005325547885149717]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 11.0, 9.0, 21.0, 16.0, 16.0, 38.0, 35.0, 34.0, 39.0, 43.0, 56.0, 54.0, 59.0, 55.0, 59.0, 55.0, 68.0, 59.0, 66.0, 34.0, 25.0, 39.0, 28.0, 20.0, 16.0, 12.0, 9.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005463361740112305, -0.0005301665514707565, -0.0005139969289302826, -0.0004978273063898087, -0.0004816576838493347, -0.0004654880613088608, -0.00044931843876838684, -0.0004331488162279129, -0.00041697919368743896, -0.000400809571146965, -0.0003846399486064911, -0.00036847032606601715, -0.0003523007035255432, -0.0003361310809850693, -0.00031996145844459534, -0.0003037918359041214, -0.00028762221336364746, -0.0002714525908231735, -0.0002552829682826996, -0.00023911334574222565, -0.0002229437232017517, -0.00020677410066127777, -0.00019060447812080383, -0.0001744348555803299, -0.00015826523303985596, -0.00014209561049938202, -0.00012592598795890808, -0.00010975636541843414, -9.35867428779602e-05, -7.741712033748627e-05, -6.124749779701233e-05, -4.507787525653839e-05, -2.8908252716064453e-05, -1.2738630175590515e-05, 3.430992364883423e-06, 1.960061490535736e-05, 3.57702374458313e-05, 5.193985998630524e-05, 6.810948252677917e-05, 8.427910506725311e-05, 0.00010044872760772705, 0.00011661835014820099, 0.00013278797268867493, 0.00014895759522914886, 0.0001651272177696228, 0.00018129684031009674, 0.00019746646285057068, 0.00021363608539104462, 0.00022980570793151855, 0.0002459753304719925, 0.00026214495301246643, 0.00027831457555294037, 0.0002944841980934143, 0.00031065382063388824, 0.0003268234431743622, 0.0003429930657148361, 0.00035916268825531006, 0.000375332310795784, 0.00039150193333625793, 0.00040767155587673187, 0.0004238411784172058, 0.00044001080095767975, 0.0004561804234981537, 0.0004723500460386276, 0.0004885196685791016]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 7.0, 10.0, 13.0, 6.0, 12.0, 20.0, 15.0, 24.0, 28.0, 47.0, 33.0, 33.0, 52.0, 47.0, 59.0, 64.0, 47.0, 53.0, 56.0, 63.0, 49.0, 49.0, 27.0, 44.0, 34.0, 22.0, 19.0, 11.0, 14.0, 10.0, 14.0, 9.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.3046875, -3.20623779296875, -3.1077880859375, -3.00933837890625, -2.910888671875, -2.81243896484375, -2.7139892578125, -2.61553955078125, -2.51708984375, -2.41864013671875, -2.3201904296875, -2.22174072265625, -2.123291015625, -2.02484130859375, -1.9263916015625, -1.82794189453125, -1.7294921875, -1.63104248046875, -1.5325927734375, -1.43414306640625, -1.335693359375, -1.23724365234375, -1.1387939453125, -1.04034423828125, -0.94189453125, -0.84344482421875, -0.7449951171875, -0.64654541015625, -0.548095703125, -0.44964599609375, -0.3511962890625, -0.25274658203125, -0.154296875, -0.05584716796875, 0.0426025390625, 0.14105224609375, 0.239501953125, 0.33795166015625, 0.4364013671875, 0.53485107421875, 0.63330078125, 0.73175048828125, 0.8302001953125, 0.92864990234375, 1.027099609375, 1.12554931640625, 1.2239990234375, 1.32244873046875, 1.4208984375, 1.51934814453125, 1.6177978515625, 1.71624755859375, 1.814697265625, 1.91314697265625, 2.0115966796875, 2.11004638671875, 2.20849609375, 2.30694580078125, 2.4053955078125, 2.50384521484375, 2.602294921875, 2.70074462890625, 2.7991943359375, 2.89764404296875, 2.99609375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 13.0, 35.0, 50.0, 69.0, 113.0, 160.0, 347.0, 595.0, 1296.0, 3053.0, 10474.0, 70561.0, 746907.0, 184006.0, 22405.0, 4790.0, 1797.0, 824.0, 453.0, 212.0, 147.0, 69.0, 53.0, 40.0, 17.0, 14.0, 12.0, 7.0, 4.0, 6.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.671875, -11.279052734375, -10.88623046875, -10.493408203125, -10.1005859375, -9.707763671875, -9.31494140625, -8.922119140625, -8.529296875, -8.136474609375, -7.74365234375, -7.350830078125, -6.9580078125, -6.565185546875, -6.17236328125, -5.779541015625, -5.38671875, -4.993896484375, -4.60107421875, -4.208251953125, -3.8154296875, -3.422607421875, -3.02978515625, -2.636962890625, -2.244140625, -1.851318359375, -1.45849609375, -1.065673828125, -0.6728515625, -0.280029296875, 0.11279296875, 0.505615234375, 0.8984375, 1.291259765625, 1.68408203125, 2.076904296875, 2.4697265625, 2.862548828125, 3.25537109375, 3.648193359375, 4.041015625, 4.433837890625, 4.82666015625, 5.219482421875, 5.6123046875, 6.005126953125, 6.39794921875, 6.790771484375, 7.18359375, 7.576416015625, 7.96923828125, 8.362060546875, 8.7548828125, 9.147705078125, 9.54052734375, 9.933349609375, 10.326171875, 10.718994140625, 11.11181640625, 11.504638671875, 11.8974609375, 12.290283203125, 12.68310546875, 13.075927734375, 13.46875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 5.0, 4.0, 10.0, 12.0, 8.0, 23.0, 26.0, 30.0, 22.0, 25.0, 34.0, 41.0, 35.0, 50.0, 71.0, 112.0, 175.0, 1374.0, 304.0, 136.0, 114.0, 79.0, 50.0, 53.0, 30.0, 34.0, 44.0, 32.0, 24.0, 19.0, 11.0, 7.0, 9.0, 1.0, 10.0, 6.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.265625, -9.97998046875, -9.6943359375, -9.40869140625, -9.123046875, -8.83740234375, -8.5517578125, -8.26611328125, -7.98046875, -7.69482421875, -7.4091796875, -7.12353515625, -6.837890625, -6.55224609375, -6.2666015625, -5.98095703125, -5.6953125, -5.40966796875, -5.1240234375, -4.83837890625, -4.552734375, -4.26708984375, -3.9814453125, -3.69580078125, -3.41015625, -3.12451171875, -2.8388671875, -2.55322265625, -2.267578125, -1.98193359375, -1.6962890625, -1.41064453125, -1.125, -0.83935546875, -0.5537109375, -0.26806640625, 0.017578125, 0.30322265625, 0.5888671875, 0.87451171875, 1.16015625, 1.44580078125, 1.7314453125, 2.01708984375, 2.302734375, 2.58837890625, 2.8740234375, 3.15966796875, 3.4453125, 3.73095703125, 4.0166015625, 4.30224609375, 4.587890625, 4.87353515625, 5.1591796875, 5.44482421875, 5.73046875, 6.01611328125, 6.3017578125, 6.58740234375, 6.873046875, 7.15869140625, 7.4443359375, 7.72998046875, 8.015625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 5.0, 4.0, 5.0, 9.0, 7.0, 8.0, 13.0, 16.0, 18.0, 25.0, 39.0, 49.0, 59.0, 112.0, 149.0, 283.0, 540.0, 1309.0, 3753.0, 15662.0, 153515.0, 2514400.0, 415897.0, 30652.0, 5751.0, 1806.0, 693.0, 333.0, 180.0, 120.0, 76.0, 53.0, 44.0, 33.0, 21.0, 24.0, 10.0, 7.0, 6.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.46875, -12.0338134765625, -11.598876953125, -11.1639404296875, -10.72900390625, -10.2940673828125, -9.859130859375, -9.4241943359375, -8.9892578125, -8.5543212890625, -8.119384765625, -7.6844482421875, -7.24951171875, -6.8145751953125, -6.379638671875, -5.9447021484375, -5.509765625, -5.0748291015625, -4.639892578125, -4.2049560546875, -3.77001953125, -3.3350830078125, -2.900146484375, -2.4652099609375, -2.0302734375, -1.5953369140625, -1.160400390625, -0.7254638671875, -0.29052734375, 0.1444091796875, 0.579345703125, 1.0142822265625, 1.44921875, 1.8841552734375, 2.319091796875, 2.7540283203125, 3.18896484375, 3.6239013671875, 4.058837890625, 4.4937744140625, 4.9287109375, 5.3636474609375, 5.798583984375, 6.2335205078125, 6.66845703125, 7.1033935546875, 7.538330078125, 7.9732666015625, 8.408203125, 8.8431396484375, 9.278076171875, 9.7130126953125, 10.14794921875, 10.5828857421875, 11.017822265625, 11.4527587890625, 11.8876953125, 12.3226318359375, 12.757568359375, 13.1925048828125, 13.62744140625, 14.0623779296875, 14.497314453125, 14.9322509765625, 15.3671875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [4.0, 27.0, 181.0, 427.0, 304.0, 63.0, 9.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.46053695678711, -9.165708541870117, -5.870879173278809, -2.5760498046875, 0.7187786102294922, 4.013607025146484, 7.308437347412109, 10.603265762329102, 13.898094177246094, 17.192922592163086, 20.487751007080078, 23.782581329345703, 27.077409744262695, 30.372238159179688, 33.66706848144531, 36.96189880371094, 40.2567253112793, 43.55155563354492, 46.84638214111328, 50.141212463378906, 53.43604278564453, 56.73086929321289, 60.025699615478516, 63.320526123046875, 66.6153564453125, 69.91018676757812, 73.20501708984375, 76.49984741210938, 79.79467010498047, 83.0895004272461, 86.38433074951172, 89.67916107177734, 92.97398376464844, 96.26881408691406, 99.56364440917969, 102.85847473144531, 106.1532974243164, 109.44812774658203, 112.74295806884766, 116.03778839111328, 119.33261108398438, 122.62744140625, 125.92227172851562, 129.21710205078125, 132.51193237304688, 135.8067626953125, 139.10159301757812, 142.3964080810547, 145.69125366210938, 148.986083984375, 152.28091430664062, 155.57574462890625, 158.87057495117188, 162.1654052734375, 165.46023559570312, 168.7550506591797, 172.0498809814453, 175.34471130371094, 178.63954162597656, 181.9343719482422, 185.2292022705078, 188.52401733398438, 191.81884765625, 195.11367797851562, 198.40850830078125]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 9.0, 6.0, 10.0, 7.0, 16.0, 20.0, 24.0, 22.0, 26.0, 17.0, 29.0, 31.0, 43.0, 50.0, 47.0, 44.0, 47.0, 40.0, 38.0, 46.0, 42.0, 34.0, 36.0, 36.0, 43.0, 30.0, 29.0, 35.0, 24.0, 18.0, 15.0, 17.0, 13.0, 18.0, 12.0, 8.0, 5.0, 11.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.645442962646484, -30.732877731323242, -29.8203125, -28.907747268676758, -27.995182037353516, -27.082618713378906, -26.170053482055664, -25.257488250732422, -24.34492301940918, -23.432357788085938, -22.519792556762695, -21.607227325439453, -20.694664001464844, -19.78209686279297, -18.86953353881836, -17.956968307495117, -17.044403076171875, -16.131837844848633, -15.21927261352539, -14.306708335876465, -13.394143104553223, -12.48157787322998, -11.569013595581055, -10.656448364257812, -9.74388313293457, -8.831317901611328, -7.918753147125244, -7.00618839263916, -6.093623161315918, -5.181057929992676, -4.268493175506592, -3.355928421020508, -2.4433631896972656, -1.5307981967926025, -0.6182332038879395, 0.29433178901672363, 1.2068967819213867, 2.119462013244629, 3.032026767730713, 3.944591522216797, 4.857156753540039, 5.769721984863281, 6.682286739349365, 7.594851493835449, 8.507416725158691, 9.419981956481934, 10.33254623413086, 11.245111465454102, 12.157676696777344, 13.070241928100586, 13.982807159423828, 14.895371437072754, 15.807936668395996, 16.720500946044922, 17.633066177368164, 18.545631408691406, 19.45819664001465, 20.37076187133789, 21.283327102661133, 22.195892333984375, 23.108455657958984, 24.02102279663086, 24.93358612060547, 25.84615135192871, 26.758716583251953]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 8.0, 5.0, 8.0, 5.0, 11.0, 13.0, 18.0, 15.0, 14.0, 23.0, 32.0, 31.0, 39.0, 37.0, 49.0, 54.0, 54.0, 42.0, 44.0, 45.0, 54.0, 54.0, 47.0, 43.0, 44.0, 37.0, 33.0, 30.0, 22.0, 25.0, 12.0, 10.0, 9.0, 10.0, 10.0, 3.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-3.158203125, -3.06463623046875, -2.9710693359375, -2.87750244140625, -2.783935546875, -2.69036865234375, -2.5968017578125, -2.50323486328125, -2.40966796875, -2.31610107421875, -2.2225341796875, -2.12896728515625, -2.035400390625, -1.94183349609375, -1.8482666015625, -1.75469970703125, -1.6611328125, -1.56756591796875, -1.4739990234375, -1.38043212890625, -1.286865234375, -1.19329833984375, -1.0997314453125, -1.00616455078125, -0.91259765625, -0.81903076171875, -0.7254638671875, -0.63189697265625, -0.538330078125, -0.44476318359375, -0.3511962890625, -0.25762939453125, -0.1640625, -0.07049560546875, 0.0230712890625, 0.11663818359375, 0.210205078125, 0.30377197265625, 0.3973388671875, 0.49090576171875, 0.58447265625, 0.67803955078125, 0.7716064453125, 0.86517333984375, 0.958740234375, 1.05230712890625, 1.1458740234375, 1.23944091796875, 1.3330078125, 1.42657470703125, 1.5201416015625, 1.61370849609375, 1.707275390625, 1.80084228515625, 1.8944091796875, 1.98797607421875, 2.08154296875, 2.17510986328125, 2.2686767578125, 2.36224365234375, 2.455810546875, 2.54937744140625, 2.6429443359375, 2.73651123046875, 2.830078125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 10.0, 12.0, 14.0, 17.0, 20.0, 44.0, 52.0, 72.0, 132.0, 202.0, 356.0, 673.0, 1202.0, 2249.0, 4815.0, 13016.0, 59945.0, 760413.0, 2964925.0, 333489.0, 35741.0, 9542.0, 3712.0, 1695.0, 868.0, 429.0, 229.0, 153.0, 68.0, 54.0, 52.0, 25.0, 21.0, 8.0, 8.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.15625, -10.8653564453125, -10.574462890625, -10.2835693359375, -9.99267578125, -9.7017822265625, -9.410888671875, -9.1199951171875, -8.8291015625, -8.5382080078125, -8.247314453125, -7.9564208984375, -7.66552734375, -7.3746337890625, -7.083740234375, -6.7928466796875, -6.501953125, -6.2110595703125, -5.920166015625, -5.6292724609375, -5.33837890625, -5.0474853515625, -4.756591796875, -4.4656982421875, -4.1748046875, -3.8839111328125, -3.593017578125, -3.3021240234375, -3.01123046875, -2.7203369140625, -2.429443359375, -2.1385498046875, -1.84765625, -1.5567626953125, -1.265869140625, -0.9749755859375, -0.68408203125, -0.3931884765625, -0.102294921875, 0.1885986328125, 0.4794921875, 0.7703857421875, 1.061279296875, 1.3521728515625, 1.64306640625, 1.9339599609375, 2.224853515625, 2.5157470703125, 2.806640625, 3.0975341796875, 3.388427734375, 3.6793212890625, 3.97021484375, 4.2611083984375, 4.552001953125, 4.8428955078125, 5.1337890625, 5.4246826171875, 5.715576171875, 6.0064697265625, 6.29736328125, 6.5882568359375, 6.879150390625, 7.1700439453125, 7.4609375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 6.0, 4.0, 6.0, 9.0, 11.0, 11.0, 18.0, 26.0, 26.0, 38.0, 55.0, 78.0, 102.0, 157.0, 283.0, 364.0, 546.0, 593.0, 548.0, 377.0, 258.0, 165.0, 131.0, 74.0, 65.0, 37.0, 23.0, 13.0, 15.0, 14.0, 4.0, 6.0, 4.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.671875, -6.4376220703125, -6.203369140625, -5.9691162109375, -5.73486328125, -5.5006103515625, -5.266357421875, -5.0321044921875, -4.7978515625, -4.5635986328125, -4.329345703125, -4.0950927734375, -3.86083984375, -3.6265869140625, -3.392333984375, -3.1580810546875, -2.923828125, -2.6895751953125, -2.455322265625, -2.2210693359375, -1.98681640625, -1.7525634765625, -1.518310546875, -1.2840576171875, -1.0498046875, -0.8155517578125, -0.581298828125, -0.3470458984375, -0.11279296875, 0.1214599609375, 0.355712890625, 0.5899658203125, 0.82421875, 1.0584716796875, 1.292724609375, 1.5269775390625, 1.76123046875, 1.9954833984375, 2.229736328125, 2.4639892578125, 2.6982421875, 2.9324951171875, 3.166748046875, 3.4010009765625, 3.63525390625, 3.8695068359375, 4.103759765625, 4.3380126953125, 4.572265625, 4.8065185546875, 5.040771484375, 5.2750244140625, 5.50927734375, 5.7435302734375, 5.977783203125, 6.2120361328125, 6.4462890625, 6.6805419921875, 6.914794921875, 7.1490478515625, 7.38330078125, 7.6175537109375, 7.851806640625, 8.0860595703125, 8.3203125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 13.0, 13.0, 20.0, 15.0, 19.0, 34.0, 48.0, 80.0, 166.0, 313.0, 687.0, 1563.0, 3959.0, 11786.0, 57401.0, 721762.0, 3055904.0, 294480.0, 32574.0, 8256.0, 2824.0, 1164.0, 557.0, 244.0, 139.0, 83.0, 47.0, 32.0, 26.0, 18.0, 20.0, 11.0, 7.0, 5.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.703125, -17.241455078125, -16.77978515625, -16.318115234375, -15.8564453125, -15.394775390625, -14.93310546875, -14.471435546875, -14.009765625, -13.548095703125, -13.08642578125, -12.624755859375, -12.1630859375, -11.701416015625, -11.23974609375, -10.778076171875, -10.31640625, -9.854736328125, -9.39306640625, -8.931396484375, -8.4697265625, -8.008056640625, -7.54638671875, -7.084716796875, -6.623046875, -6.161376953125, -5.69970703125, -5.238037109375, -4.7763671875, -4.314697265625, -3.85302734375, -3.391357421875, -2.9296875, -2.468017578125, -2.00634765625, -1.544677734375, -1.0830078125, -0.621337890625, -0.15966796875, 0.302001953125, 0.763671875, 1.225341796875, 1.68701171875, 2.148681640625, 2.6103515625, 3.072021484375, 3.53369140625, 3.995361328125, 4.45703125, 4.918701171875, 5.38037109375, 5.842041015625, 6.3037109375, 6.765380859375, 7.22705078125, 7.688720703125, 8.150390625, 8.612060546875, 9.07373046875, 9.535400390625, 9.9970703125, 10.458740234375, 10.92041015625, 11.382080078125, 11.84375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 7.0, 8.0, 15.0, 11.0, 18.0, 29.0, 20.0, 27.0, 28.0, 37.0, 47.0, 49.0, 53.0, 56.0, 60.0, 65.0, 59.0, 52.0, 61.0, 48.0, 41.0, 47.0, 27.0, 32.0, 17.0, 18.0, 14.0, 9.0, 15.0, 4.0, 7.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.93575096130371, -19.27741050720215, -18.619068145751953, -17.96072769165039, -17.302387237548828, -16.644046783447266, -15.985705375671387, -15.327363967895508, -14.669023513793945, -14.010683059692383, -13.352341651916504, -12.694000244140625, -12.035659790039062, -11.3773193359375, -10.718977928161621, -10.060636520385742, -9.40229606628418, -8.743955612182617, -8.085614204406738, -7.427273273468018, -6.768932342529297, -6.110591411590576, -5.4522504806518555, -4.793909549713135, -4.135568618774414, -3.4772276878356934, -2.8188867568969727, -2.160545825958252, -1.5022048950195312, -0.8438639640808105, -0.18552303314208984, 0.47281789779663086, 1.1311607360839844, 1.789501667022705, 2.447842597961426, 3.1061835289001465, 3.764524459838867, 4.422865390777588, 5.081206321716309, 5.739547252655029, 6.39788818359375, 7.056229114532471, 7.714570045471191, 8.37291145324707, 9.031251907348633, 9.689592361450195, 10.347933769226074, 11.006275177001953, 11.664615631103516, 12.322956085205078, 12.981297492980957, 13.639638900756836, 14.297979354858398, 14.956319808959961, 15.61466121673584, 16.27300262451172, 16.93134307861328, 17.589683532714844, 18.248023986816406, 18.9063663482666, 19.564706802368164, 20.223047256469727, 20.881389617919922, 21.539730072021484, 22.198070526123047]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 1.0, 5.0, 3.0, 9.0, 4.0, 10.0, 16.0, 14.0, 20.0, 21.0, 25.0, 27.0, 24.0, 32.0, 25.0, 27.0, 40.0, 37.0, 39.0, 31.0, 45.0, 41.0, 35.0, 36.0, 35.0, 47.0, 29.0, 44.0, 26.0, 24.0, 38.0, 27.0, 24.0, 22.0, 10.0, 16.0, 14.0, 16.0, 11.0, 9.0, 9.0, 8.0, 4.0, 7.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-21.031719207763672, -20.40998649597168, -19.788253784179688, -19.166521072387695, -18.544788360595703, -17.92305564880371, -17.30132293701172, -16.67959213256836, -16.057857513427734, -15.436124801635742, -14.81439208984375, -14.192659378051758, -13.570926666259766, -12.949193954467773, -12.327462196350098, -11.705729484558105, -11.08399772644043, -10.462265014648438, -9.840532302856445, -9.218799591064453, -8.597066879272461, -7.975334644317627, -7.353602409362793, -6.731869697570801, -6.110136985778809, -5.488404273986816, -4.866671562194824, -4.24493932723999, -3.623206615447998, -3.001473903656006, -2.3797414302825928, -1.7580089569091797, -1.1362743377685547, -0.514541745185852, 0.10719084739685059, 0.7289234399795532, 1.3506560325622559, 1.972388744354248, 2.594121217727661, 3.215853691101074, 3.8375864028930664, 4.459319114685059, 5.081051826477051, 5.702784061431885, 6.324516773223877, 6.946249485015869, 7.567981719970703, 8.189714431762695, 8.811447143554688, 9.43317985534668, 10.054912567138672, 10.676645278930664, 11.298377990722656, 11.920110702514648, 12.541842460632324, 13.163575172424316, 13.785307884216309, 14.4070405960083, 15.028773307800293, 15.650506019592285, 16.27223777770996, 16.893970489501953, 17.515703201293945, 18.137435913085938, 18.75916862487793]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 5.0, 3.0, 6.0, 12.0, 6.0, 9.0, 13.0, 19.0, 19.0, 12.0, 25.0, 35.0, 23.0, 40.0, 49.0, 40.0, 41.0, 41.0, 50.0, 49.0, 53.0, 49.0, 42.0, 49.0, 55.0, 31.0, 47.0, 28.0, 29.0, 20.0, 16.0, 13.0, 20.0, 10.0, 11.0, 6.0, 8.0, 4.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.95703125, -2.86669921875, -2.7763671875, -2.68603515625, -2.595703125, -2.50537109375, -2.4150390625, -2.32470703125, -2.234375, -2.14404296875, -2.0537109375, -1.96337890625, -1.873046875, -1.78271484375, -1.6923828125, -1.60205078125, -1.51171875, -1.42138671875, -1.3310546875, -1.24072265625, -1.150390625, -1.06005859375, -0.9697265625, -0.87939453125, -0.7890625, -0.69873046875, -0.6083984375, -0.51806640625, -0.427734375, -0.33740234375, -0.2470703125, -0.15673828125, -0.06640625, 0.02392578125, 0.1142578125, 0.20458984375, 0.294921875, 0.38525390625, 0.4755859375, 0.56591796875, 0.65625, 0.74658203125, 0.8369140625, 0.92724609375, 1.017578125, 1.10791015625, 1.1982421875, 1.28857421875, 1.37890625, 1.46923828125, 1.5595703125, 1.64990234375, 1.740234375, 1.83056640625, 1.9208984375, 2.01123046875, 2.1015625, 2.19189453125, 2.2822265625, 2.37255859375, 2.462890625, 2.55322265625, 2.6435546875, 2.73388671875, 2.82421875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 12.0, 7.0, 15.0, 17.0, 30.0, 49.0, 65.0, 101.0, 149.0, 229.0, 376.0, 557.0, 866.0, 1365.0, 2314.0, 3994.0, 6857.0, 11509.0, 19493.0, 33936.0, 61561.0, 124931.0, 333465.0, 232021.0, 96360.0, 50166.0, 28173.0, 16219.0, 9584.0, 5660.0, 3263.0, 1896.0, 1250.0, 742.0, 444.0, 313.0, 186.0, 131.0, 75.0, 60.0, 44.0, 19.0, 18.0, 11.0, 11.0, 3.0, 8.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1634521484375, -0.1579723358154297, -0.15249252319335938, -0.14701271057128906, -0.14153289794921875, -0.13605308532714844, -0.13057327270507812, -0.1250934600830078, -0.1196136474609375, -0.11413383483886719, -0.10865402221679688, -0.10317420959472656, -0.09769439697265625, -0.09221458435058594, -0.08673477172851562, -0.08125495910644531, -0.075775146484375, -0.07029533386230469, -0.06481552124023438, -0.05933570861816406, -0.05385589599609375, -0.04837608337402344, -0.042896270751953125, -0.03741645812988281, -0.0319366455078125, -0.026456832885742188, -0.020977020263671875, -0.015497207641601562, -0.01001739501953125, -0.0045375823974609375, 0.000942230224609375, 0.0064220428466796875, 0.01190185546875, 0.017381668090820312, 0.022861480712890625, 0.028341293334960938, 0.03382110595703125, 0.03930091857910156, 0.044780731201171875, 0.05026054382324219, 0.0557403564453125, 0.06122016906738281, 0.06669998168945312, 0.07217979431152344, 0.07765960693359375, 0.08313941955566406, 0.08861923217773438, 0.09409904479980469, 0.099578857421875, 0.10505867004394531, 0.11053848266601562, 0.11601829528808594, 0.12149810791015625, 0.12697792053222656, 0.13245773315429688, 0.1379375457763672, 0.1434173583984375, 0.1488971710205078, 0.15437698364257812, 0.15985679626464844, 0.16533660888671875, 0.17081642150878906, 0.17629623413085938, 0.1817760467529297, 0.187255859375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 8.0, 7.0, 4.0, 7.0, 10.0, 15.0, 15.0, 21.0, 16.0, 18.0, 28.0, 37.0, 29.0, 40.0, 38.0, 34.0, 42.0, 37.0, 42.0, 39.0, 1071.0, 41.0, 26.0, 42.0, 39.0, 41.0, 37.0, 33.0, 32.0, 39.0, 23.0, 20.0, 16.0, 16.0, 11.0, 4.0, 11.0, 7.0, 6.0, 11.0, 4.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.08203125, -2.00799560546875, -1.9339599609375, -1.85992431640625, -1.785888671875, -1.71185302734375, -1.6378173828125, -1.56378173828125, -1.48974609375, -1.41571044921875, -1.3416748046875, -1.26763916015625, -1.193603515625, -1.11956787109375, -1.0455322265625, -0.97149658203125, -0.8974609375, -0.82342529296875, -0.7493896484375, -0.67535400390625, -0.601318359375, -0.52728271484375, -0.4532470703125, -0.37921142578125, -0.30517578125, -0.23114013671875, -0.1571044921875, -0.08306884765625, -0.009033203125, 0.06500244140625, 0.1390380859375, 0.21307373046875, 0.287109375, 0.36114501953125, 0.4351806640625, 0.50921630859375, 0.583251953125, 0.65728759765625, 0.7313232421875, 0.80535888671875, 0.87939453125, 0.95343017578125, 1.0274658203125, 1.10150146484375, 1.175537109375, 1.24957275390625, 1.3236083984375, 1.39764404296875, 1.4716796875, 1.54571533203125, 1.6197509765625, 1.69378662109375, 1.767822265625, 1.84185791015625, 1.9158935546875, 1.98992919921875, 2.06396484375, 2.13800048828125, 2.2120361328125, 2.28607177734375, 2.360107421875, 2.43414306640625, 2.5081787109375, 2.58221435546875, 2.65625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 8.0, 10.0, 14.0, 16.0, 21.0, 56.0, 55.0, 89.0, 95.0, 170.0, 247.0, 325.0, 495.0, 669.0, 992.0, 1345.0, 1897.0, 2919.0, 4197.0, 6206.0, 9213.0, 13656.0, 21210.0, 32872.0, 52543.0, 89270.0, 176638.0, 1325719.0, 145373.0, 77093.0, 46556.0, 29290.0, 18946.0, 12559.0, 8279.0, 5605.0, 3774.0, 2583.0, 1900.0, 1265.0, 891.0, 598.0, 439.0, 291.0, 233.0, 164.0, 98.0, 79.0, 55.0, 39.0, 29.0, 15.0, 14.0, 6.0, 8.0, 3.0, 5.0, 2.0, 0.0, 1.0], "bins": [-0.0496826171875, -0.04809904098510742, -0.046515464782714844, -0.044931888580322266, -0.04334831237792969, -0.04176473617553711, -0.04018115997314453, -0.03859758377075195, -0.037014007568359375, -0.0354304313659668, -0.03384685516357422, -0.03226327896118164, -0.030679702758789062, -0.029096126556396484, -0.027512550354003906, -0.025928974151611328, -0.02434539794921875, -0.022761821746826172, -0.021178245544433594, -0.019594669342041016, -0.018011093139648438, -0.01642751693725586, -0.014843940734863281, -0.013260364532470703, -0.011676788330078125, -0.010093212127685547, -0.008509635925292969, -0.006926059722900391, -0.0053424835205078125, -0.0037589073181152344, -0.0021753311157226562, -0.0005917549133300781, 0.0009918212890625, 0.002575397491455078, 0.004158973693847656, 0.005742549896240234, 0.0073261260986328125, 0.00890970230102539, 0.010493278503417969, 0.012076854705810547, 0.013660430908203125, 0.015244007110595703, 0.01682758331298828, 0.01841115951538086, 0.019994735717773438, 0.021578311920166016, 0.023161888122558594, 0.024745464324951172, 0.02632904052734375, 0.027912616729736328, 0.029496192932128906, 0.031079769134521484, 0.03266334533691406, 0.03424692153930664, 0.03583049774169922, 0.0374140739440918, 0.038997650146484375, 0.04058122634887695, 0.04216480255126953, 0.04374837875366211, 0.04533195495605469, 0.046915531158447266, 0.048499107360839844, 0.05008268356323242, 0.051666259765625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 3.0, 3.0, 5.0, 6.0, 11.0, 8.0, 10.0, 12.0, 16.0, 15.0, 29.0, 23.0, 28.0, 37.0, 45.0, 69.0, 85.0, 114.0, 101.0, 78.0, 54.0, 57.0, 42.0, 25.0, 30.0, 25.0, 17.0, 17.0, 6.0, 6.0, 4.0, 4.0, 10.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.000667572021484375, -0.0006489977240562439, -0.0006304234266281128, -0.0006118491291999817, -0.0005932748317718506, -0.0005747005343437195, -0.0005561262369155884, -0.0005375519394874573, -0.0005189776420593262, -0.0005004033446311951, -0.00048182904720306396, -0.00046325474977493286, -0.00044468045234680176, -0.00042610615491867065, -0.00040753185749053955, -0.00038895756006240845, -0.00037038326263427734, -0.00035180896520614624, -0.00033323466777801514, -0.00031466037034988403, -0.00029608607292175293, -0.0002775117754936218, -0.0002589374780654907, -0.00024036318063735962, -0.00022178888320922852, -0.0002032145857810974, -0.0001846402883529663, -0.0001660659909248352, -0.0001474916934967041, -0.000128917396068573, -0.0001103430986404419, -9.176880121231079e-05, -7.319450378417969e-05, -5.4620206356048584e-05, -3.604590892791748e-05, -1.7471611499786377e-05, 1.1026859283447266e-06, 1.967698335647583e-05, 3.8251280784606934e-05, 5.682557821273804e-05, 7.539987564086914e-05, 9.397417306900024e-05, 0.00011254847049713135, 0.00013112276792526245, 0.00014969706535339355, 0.00016827136278152466, 0.00018684566020965576, 0.00020541995763778687, 0.00022399425506591797, 0.00024256855249404907, 0.0002611428499221802, 0.0002797171473503113, 0.0002982914447784424, 0.0003168657422065735, 0.0003354400396347046, 0.0003540143370628357, 0.0003725886344909668, 0.0003911629319190979, 0.000409737229347229, 0.0004283115267753601, 0.0004468858242034912, 0.0004654601216316223, 0.0004840344190597534, 0.0005026087164878845, 0.0005211830139160156]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 6.0, 8.0, 6.0, 8.0, 22.0, 33.0, 40.0, 94.0, 168.0, 528.0, 2030.0, 9373.0, 55418.0, 637948.0, 300296.0, 34427.0, 6069.0, 1368.0, 364.0, 134.0, 66.0, 42.0, 24.0, 18.0, 15.0, 8.0, 9.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00795745849609375, -0.007681846618652344, -0.0074062347412109375, -0.007130622863769531, -0.006855010986328125, -0.006579399108886719, -0.0063037872314453125, -0.006028175354003906, -0.0057525634765625, -0.005476951599121094, -0.0052013397216796875, -0.004925727844238281, -0.004650115966796875, -0.004374504089355469, -0.0040988922119140625, -0.0038232803344726562, -0.00354766845703125, -0.0032720565795898438, -0.0029964447021484375, -0.0027208328247070312, -0.002445220947265625, -0.0021696090698242188, -0.0018939971923828125, -0.0016183853149414062, -0.0013427734375, -0.0010671615600585938, -0.0007915496826171875, -0.0005159378051757812, -0.000240325927734375, 3.528594970703125e-05, 0.0003108978271484375, 0.0005865097045898438, 0.00086212158203125, 0.0011377334594726562, 0.0014133453369140625, 0.0016889572143554688, 0.001964569091796875, 0.0022401809692382812, 0.0025157928466796875, 0.0027914047241210938, 0.0030670166015625, 0.0033426284790039062, 0.0036182403564453125, 0.0038938522338867188, 0.004169464111328125, 0.004445075988769531, 0.0047206878662109375, 0.004996299743652344, 0.00527191162109375, 0.005547523498535156, 0.0058231353759765625, 0.006098747253417969, 0.006374359130859375, 0.006649971008300781, 0.0069255828857421875, 0.007201194763183594, 0.007476806640625, 0.007752418518066406, 0.008028030395507812, 0.008303642272949219, 0.008579254150390625, 0.008854866027832031, 0.009130477905273438, 0.009406089782714844, 0.00968170166015625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 12.0, 134.0, 750.0, 104.0, 13.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002684985753148794, -0.0023683321196585894, -0.0020516784861683846, -0.0017350249690935016, -0.0014183713356032968, -0.001101717702113092, -0.000785064185038209, -0.00046841055154800415, -0.00015175691805779934, 0.00016489668632857502, 0.00048155029071494937, 0.0007982038659974933, 0.001114857499487698, 0.0014315111329779029, 0.0017481646500527859, 0.0020648182835429907, 0.0023814719170331955, 0.0026981255505234003, 0.003014779184013605, 0.0033314325846731663, 0.0036480864509940147, 0.003964739851653576, 0.004281393252313137, 0.0045980471186339855, 0.004914700984954834, 0.005231354385614395, 0.005548008251935244, 0.005864661652594805, 0.006181315518915653, 0.006497968919575214, 0.0068146223202347755, 0.007131276186555624, 0.007447929121553898, 0.007764582522213459, 0.00808123592287302, 0.008397890254855156, 0.008714543655514717, 0.009031197056174278, 0.00934785045683384, 0.0096645038574934, 0.009981158189475536, 0.010297811590135098, 0.010614464990794659, 0.010931119322776794, 0.011247772723436356, 0.011564426124095917, 0.011881079524755478, 0.012197732925415039, 0.0125143863260746, 0.012831039726734161, 0.013147693127393723, 0.013464347459375858, 0.01378100086003542, 0.01409765426069498, 0.014414307661354542, 0.014730961993336678, 0.015047615393996239, 0.0153642687946558, 0.01568092219531536, 0.015997575595974922, 0.016314228996634483, 0.016630884259939194, 0.016947537660598755, 0.017264191061258316, 0.017580844461917877]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 8.0, 5.0, 24.0, 30.0, 38.0, 67.0, 76.0, 93.0, 99.0, 89.0, 97.0, 86.0, 62.0, 80.0, 49.0, 46.0, 28.0, 12.0, 11.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013107657432556152, -0.0012807315215468407, -0.001250697299838066, -0.0012206630781292915, -0.001190628856420517, -0.0011605946347117424, -0.0011305604130029678, -0.0011005261912941933, -0.0010704919695854187, -0.0010404577478766441, -0.0010104235261678696, -0.000980389304459095, -0.0009503550827503204, -0.0009203208610415459, -0.0008902866393327713, -0.0008602524176239967, -0.0008302181959152222, -0.0008001839742064476, -0.000770149752497673, -0.0007401155307888985, -0.0007100813090801239, -0.0006800470873713493, -0.0006500128656625748, -0.0006199786439538002, -0.0005899444222450256, -0.0005599102005362511, -0.0005298759788274765, -0.0004998417571187019, -0.00046980753540992737, -0.0004397733137011528, -0.00040973909199237823, -0.00037970487028360367, -0.0003496706485748291, -0.00031963642686605453, -0.00028960220515727997, -0.0002595679834485054, -0.00022953376173973083, -0.00019949954003095627, -0.0001694653183221817, -0.00013943109661340714, -0.00010939687490463257, -7.9362653195858e-05, -4.9328431487083435e-05, -1.929420977830887e-05, 1.0740011930465698e-05, 4.0774233639240265e-05, 7.080845534801483e-05, 0.0001008426770567894, 0.00013087689876556396, 0.00016091112047433853, 0.0001909453421831131, 0.00022097956389188766, 0.00025101378560066223, 0.0002810480073094368, 0.00031108222901821136, 0.00034111645072698593, 0.0003711506724357605, 0.00040118489414453506, 0.00043121911585330963, 0.0004612533375620842, 0.0004912875592708588, 0.0005213217809796333, 0.0005513560026884079, 0.0005813902243971825, 0.000611424446105957]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 5.0, 3.0, 6.0, 12.0, 6.0, 9.0, 13.0, 19.0, 19.0, 12.0, 25.0, 35.0, 23.0, 40.0, 49.0, 40.0, 41.0, 41.0, 50.0, 49.0, 53.0, 49.0, 42.0, 49.0, 55.0, 31.0, 47.0, 28.0, 29.0, 20.0, 16.0, 13.0, 20.0, 10.0, 11.0, 6.0, 8.0, 4.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.95703125, -2.86669921875, -2.7763671875, -2.68603515625, -2.595703125, -2.50537109375, -2.4150390625, -2.32470703125, -2.234375, -2.14404296875, -2.0537109375, -1.96337890625, -1.873046875, -1.78271484375, -1.6923828125, -1.60205078125, -1.51171875, -1.42138671875, -1.3310546875, -1.24072265625, -1.150390625, -1.06005859375, -0.9697265625, -0.87939453125, -0.7890625, -0.69873046875, -0.6083984375, -0.51806640625, -0.427734375, -0.33740234375, -0.2470703125, -0.15673828125, -0.06640625, 0.02392578125, 0.1142578125, 0.20458984375, 0.294921875, 0.38525390625, 0.4755859375, 0.56591796875, 0.65625, 0.74658203125, 0.8369140625, 0.92724609375, 1.017578125, 1.10791015625, 1.1982421875, 1.28857421875, 1.37890625, 1.46923828125, 1.5595703125, 1.64990234375, 1.740234375, 1.83056640625, 1.9208984375, 2.01123046875, 2.1015625, 2.19189453125, 2.2822265625, 2.37255859375, 2.462890625, 2.55322265625, 2.6435546875, 2.73388671875, 2.82421875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 9.0, 19.0, 17.0, 28.0, 38.0, 63.0, 162.0, 249.0, 480.0, 899.0, 1973.0, 4716.0, 13274.0, 43096.0, 156933.0, 510335.0, 226207.0, 61059.0, 17963.0, 6265.0, 2467.0, 1052.0, 565.0, 296.0, 142.0, 92.0, 63.0, 23.0, 20.0, 14.0, 8.0, 5.0, 8.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.578125, -7.37127685546875, -7.1644287109375, -6.95758056640625, -6.750732421875, -6.54388427734375, -6.3370361328125, -6.13018798828125, -5.92333984375, -5.71649169921875, -5.5096435546875, -5.30279541015625, -5.095947265625, -4.88909912109375, -4.6822509765625, -4.47540283203125, -4.2685546875, -4.06170654296875, -3.8548583984375, -3.64801025390625, -3.441162109375, -3.23431396484375, -3.0274658203125, -2.82061767578125, -2.61376953125, -2.40692138671875, -2.2000732421875, -1.99322509765625, -1.786376953125, -1.57952880859375, -1.3726806640625, -1.16583251953125, -0.958984375, -0.75213623046875, -0.5452880859375, -0.33843994140625, -0.131591796875, 0.07525634765625, 0.2821044921875, 0.48895263671875, 0.69580078125, 0.90264892578125, 1.1094970703125, 1.31634521484375, 1.523193359375, 1.73004150390625, 1.9368896484375, 2.14373779296875, 2.3505859375, 2.55743408203125, 2.7642822265625, 2.97113037109375, 3.177978515625, 3.38482666015625, 3.5916748046875, 3.79852294921875, 4.00537109375, 4.21221923828125, 4.4190673828125, 4.62591552734375, 4.832763671875, 5.03961181640625, 5.2464599609375, 5.45330810546875, 5.66015625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 7.0, 1.0, 5.0, 6.0, 8.0, 4.0, 12.0, 10.0, 9.0, 27.0, 23.0, 23.0, 39.0, 28.0, 34.0, 43.0, 49.0, 60.0, 85.0, 127.0, 185.0, 1352.0, 230.0, 117.0, 100.0, 66.0, 57.0, 59.0, 31.0, 27.0, 45.0, 30.0, 23.0, 19.0, 22.0, 22.0, 13.0, 14.0, 12.0, 9.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.53125, -8.2431640625, -7.955078125, -7.6669921875, -7.37890625, -7.0908203125, -6.802734375, -6.5146484375, -6.2265625, -5.9384765625, -5.650390625, -5.3623046875, -5.07421875, -4.7861328125, -4.498046875, -4.2099609375, -3.921875, -3.6337890625, -3.345703125, -3.0576171875, -2.76953125, -2.4814453125, -2.193359375, -1.9052734375, -1.6171875, -1.3291015625, -1.041015625, -0.7529296875, -0.46484375, -0.1767578125, 0.111328125, 0.3994140625, 0.6875, 0.9755859375, 1.263671875, 1.5517578125, 1.83984375, 2.1279296875, 2.416015625, 2.7041015625, 2.9921875, 3.2802734375, 3.568359375, 3.8564453125, 4.14453125, 4.4326171875, 4.720703125, 5.0087890625, 5.296875, 5.5849609375, 5.873046875, 6.1611328125, 6.44921875, 6.7373046875, 7.025390625, 7.3134765625, 7.6015625, 7.8896484375, 8.177734375, 8.4658203125, 8.75390625, 9.0419921875, 9.330078125, 9.6181640625, 9.90625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 8.0, 11.0, 10.0, 10.0, 24.0, 28.0, 34.0, 61.0, 68.0, 95.0, 185.0, 258.0, 457.0, 884.0, 2135.0, 6456.0, 33891.0, 471554.0, 2475907.0, 131024.0, 15443.0, 3858.0, 1504.0, 753.0, 380.0, 217.0, 143.0, 98.0, 47.0, 42.0, 29.0, 16.0, 15.0, 17.0, 7.0, 7.0, 7.0, 2.0, 5.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-18.515625, -17.990966796875, -17.46630859375, -16.941650390625, -16.4169921875, -15.892333984375, -15.36767578125, -14.843017578125, -14.318359375, -13.793701171875, -13.26904296875, -12.744384765625, -12.2197265625, -11.695068359375, -11.17041015625, -10.645751953125, -10.12109375, -9.596435546875, -9.07177734375, -8.547119140625, -8.0224609375, -7.497802734375, -6.97314453125, -6.448486328125, -5.923828125, -5.399169921875, -4.87451171875, -4.349853515625, -3.8251953125, -3.300537109375, -2.77587890625, -2.251220703125, -1.7265625, -1.201904296875, -0.67724609375, -0.152587890625, 0.3720703125, 0.896728515625, 1.42138671875, 1.946044921875, 2.470703125, 2.995361328125, 3.52001953125, 4.044677734375, 4.5693359375, 5.093994140625, 5.61865234375, 6.143310546875, 6.66796875, 7.192626953125, 7.71728515625, 8.241943359375, 8.7666015625, 9.291259765625, 9.81591796875, 10.340576171875, 10.865234375, 11.389892578125, 11.91455078125, 12.439208984375, 12.9638671875, 13.488525390625, 14.01318359375, 14.537841796875, 15.0625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 14.0, 45.0, 83.0, 262.0, 267.0, 217.0, 89.0, 19.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.848533630371094, -31.134279251098633, -28.420024871826172, -25.705772399902344, -22.991518020629883, -20.277263641357422, -17.563011169433594, -14.848756790161133, -12.134502410888672, -9.420248031616211, -6.705994606018066, -3.991741180419922, -1.277486801147461, 1.436767578125, 4.151020050048828, 6.865274429321289, 9.57952880859375, 12.293783187866211, 15.008036613464355, 17.7222900390625, 20.43654441833496, 23.150798797607422, 25.86505126953125, 28.57930564880371, 31.293560028076172, 34.0078125, 36.722068786621094, 39.43632125854492, 42.15057373046875, 44.864830017089844, 47.57908248901367, 50.2933349609375, 53.007598876953125, 55.72185134887695, 58.43610763549805, 61.150360107421875, 63.86461639404297, 66.57887268066406, 69.29312133789062, 72.00737762451172, 74.72163391113281, 77.4358901977539, 80.15013885498047, 82.86439514160156, 85.57865142822266, 88.29290771484375, 91.00715637207031, 93.7214126586914, 96.43566131591797, 99.14991760253906, 101.86416625976562, 104.57842254638672, 107.29267883300781, 110.00692749023438, 112.72118377685547, 115.43544006347656, 118.14968872070312, 120.86394500732422, 123.57819366455078, 126.29244995117188, 129.00669860839844, 131.72096252441406, 134.43521118164062, 137.1494598388672, 139.8637237548828]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 6.0, 6.0, 3.0, 6.0, 9.0, 9.0, 8.0, 15.0, 13.0, 19.0, 19.0, 23.0, 23.0, 25.0, 29.0, 32.0, 34.0, 31.0, 23.0, 40.0, 41.0, 48.0, 39.0, 37.0, 36.0, 38.0, 30.0, 36.0, 36.0, 20.0, 32.0, 26.0, 25.0, 19.0, 24.0, 21.0, 16.0, 17.0, 20.0, 7.0, 12.0, 11.0, 6.0, 3.0, 8.0, 7.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-25.35373306274414, -24.54157257080078, -23.72941017150879, -22.91724967956543, -22.105087280273438, -21.292926788330078, -20.48076629638672, -19.668603897094727, -18.856443405151367, -18.044282913208008, -17.232120513916016, -16.419960021972656, -15.60779857635498, -14.795637130737305, -13.983475685119629, -13.171314239501953, -12.359152793884277, -11.546991348266602, -10.734829902648926, -9.92266845703125, -9.11050796508789, -8.298346519470215, -7.486185073852539, -6.6740241050720215, -5.861862659454346, -5.04970121383667, -4.237540245056152, -3.4253787994384766, -2.61321759223938, -1.8010563850402832, -0.9888949394226074, -0.17673397064208984, 0.6354274749755859, 1.4475886821746826, 2.2597498893737793, 3.071911334991455, 3.8840725421905518, 4.696233749389648, 5.508395195007324, 6.320556163787842, 7.132717609405518, 7.944879055023193, 8.757040023803711, 9.569201469421387, 10.381362915039062, 11.193523406982422, 12.005685806274414, 12.817846298217773, 13.63000774383545, 14.442169189453125, 15.2543306350708, 16.066492080688477, 16.878652572631836, 17.690814971923828, 18.502975463867188, 19.315135955810547, 20.12729835510254, 20.9394588470459, 21.75162124633789, 22.56378173828125, 23.375944137573242, 24.1881046295166, 25.000267028808594, 25.812427520751953, 26.624588012695312]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 5.0, 2.0, 3.0, 5.0, 6.0, 10.0, 9.0, 12.0, 12.0, 17.0, 16.0, 19.0, 30.0, 27.0, 27.0, 28.0, 44.0, 38.0, 45.0, 48.0, 49.0, 55.0, 44.0, 54.0, 47.0, 37.0, 41.0, 35.0, 35.0, 36.0, 30.0, 31.0, 20.0, 11.0, 18.0, 12.0, 11.0, 7.0, 11.0, 4.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.138671875, -3.043243408203125, -2.94781494140625, -2.852386474609375, -2.7569580078125, -2.661529541015625, -2.56610107421875, -2.470672607421875, -2.375244140625, -2.279815673828125, -2.18438720703125, -2.088958740234375, -1.9935302734375, -1.898101806640625, -1.80267333984375, -1.707244873046875, -1.61181640625, -1.516387939453125, -1.42095947265625, -1.325531005859375, -1.2301025390625, -1.134674072265625, -1.03924560546875, -0.943817138671875, -0.848388671875, -0.752960205078125, -0.65753173828125, -0.562103271484375, -0.4666748046875, -0.371246337890625, -0.27581787109375, -0.180389404296875, -0.0849609375, 0.010467529296875, 0.10589599609375, 0.201324462890625, 0.2967529296875, 0.392181396484375, 0.48760986328125, 0.583038330078125, 0.678466796875, 0.773895263671875, 0.86932373046875, 0.964752197265625, 1.0601806640625, 1.155609130859375, 1.25103759765625, 1.346466064453125, 1.44189453125, 1.537322998046875, 1.63275146484375, 1.728179931640625, 1.8236083984375, 1.919036865234375, 2.01446533203125, 2.109893798828125, 2.205322265625, 2.300750732421875, 2.39617919921875, 2.491607666015625, 2.5870361328125, 2.682464599609375, 2.77789306640625, 2.873321533203125, 2.96875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 3.0, 7.0, 5.0, 10.0, 10.0, 25.0, 23.0, 26.0, 47.0, 95.0, 107.0, 167.0, 293.0, 417.0, 679.0, 1202.0, 2217.0, 4334.0, 9773.0, 27206.0, 139078.0, 1457781.0, 2247907.0, 241964.0, 38458.0, 12147.0, 5058.0, 2364.0, 1172.0, 674.0, 368.0, 236.0, 151.0, 90.0, 74.0, 31.0, 27.0, 17.0, 11.0, 11.0, 7.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.2890625, -10.00421142578125, -9.7193603515625, -9.43450927734375, -9.149658203125, -8.86480712890625, -8.5799560546875, -8.29510498046875, -8.01025390625, -7.72540283203125, -7.4405517578125, -7.15570068359375, -6.870849609375, -6.58599853515625, -6.3011474609375, -6.01629638671875, -5.7314453125, -5.44659423828125, -5.1617431640625, -4.87689208984375, -4.592041015625, -4.30718994140625, -4.0223388671875, -3.73748779296875, -3.45263671875, -3.16778564453125, -2.8829345703125, -2.59808349609375, -2.313232421875, -2.02838134765625, -1.7435302734375, -1.45867919921875, -1.173828125, -0.88897705078125, -0.6041259765625, -0.31927490234375, -0.034423828125, 0.25042724609375, 0.5352783203125, 0.82012939453125, 1.10498046875, 1.38983154296875, 1.6746826171875, 1.95953369140625, 2.244384765625, 2.52923583984375, 2.8140869140625, 3.09893798828125, 3.3837890625, 3.66864013671875, 3.9534912109375, 4.23834228515625, 4.523193359375, 4.80804443359375, 5.0928955078125, 5.37774658203125, 5.66259765625, 5.94744873046875, 6.2322998046875, 6.51715087890625, 6.802001953125, 7.08685302734375, 7.3717041015625, 7.65655517578125, 7.94140625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 6.0, 9.0, 5.0, 16.0, 13.0, 22.0, 28.0, 35.0, 70.0, 112.0, 169.0, 242.0, 363.0, 493.0, 621.0, 538.0, 409.0, 303.0, 190.0, 135.0, 70.0, 63.0, 44.0, 26.0, 20.0, 14.0, 10.0, 11.0, 10.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.2890625, -7.035400390625, -6.78173828125, -6.528076171875, -6.2744140625, -6.020751953125, -5.76708984375, -5.513427734375, -5.259765625, -5.006103515625, -4.75244140625, -4.498779296875, -4.2451171875, -3.991455078125, -3.73779296875, -3.484130859375, -3.23046875, -2.976806640625, -2.72314453125, -2.469482421875, -2.2158203125, -1.962158203125, -1.70849609375, -1.454833984375, -1.201171875, -0.947509765625, -0.69384765625, -0.440185546875, -0.1865234375, 0.067138671875, 0.32080078125, 0.574462890625, 0.828125, 1.081787109375, 1.33544921875, 1.589111328125, 1.8427734375, 2.096435546875, 2.35009765625, 2.603759765625, 2.857421875, 3.111083984375, 3.36474609375, 3.618408203125, 3.8720703125, 4.125732421875, 4.37939453125, 4.633056640625, 4.88671875, 5.140380859375, 5.39404296875, 5.647705078125, 5.9013671875, 6.155029296875, 6.40869140625, 6.662353515625, 6.916015625, 7.169677734375, 7.42333984375, 7.677001953125, 7.9306640625, 8.184326171875, 8.43798828125, 8.691650390625, 8.9453125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 2.0, 5.0, 5.0, 6.0, 5.0, 13.0, 12.0, 13.0, 35.0, 48.0, 56.0, 95.0, 184.0, 342.0, 626.0, 1453.0, 3699.0, 11632.0, 60272.0, 994363.0, 2912691.0, 176357.0, 22148.0, 6103.0, 2173.0, 931.0, 428.0, 216.0, 131.0, 72.0, 43.0, 34.0, 31.0, 16.0, 14.0, 11.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.421875, -18.8704833984375, -18.319091796875, -17.7677001953125, -17.21630859375, -16.6649169921875, -16.113525390625, -15.5621337890625, -15.0107421875, -14.4593505859375, -13.907958984375, -13.3565673828125, -12.80517578125, -12.2537841796875, -11.702392578125, -11.1510009765625, -10.599609375, -10.0482177734375, -9.496826171875, -8.9454345703125, -8.39404296875, -7.8426513671875, -7.291259765625, -6.7398681640625, -6.1884765625, -5.6370849609375, -5.085693359375, -4.5343017578125, -3.98291015625, -3.4315185546875, -2.880126953125, -2.3287353515625, -1.77734375, -1.2259521484375, -0.674560546875, -0.1231689453125, 0.42822265625, 0.9796142578125, 1.531005859375, 2.0823974609375, 2.6337890625, 3.1851806640625, 3.736572265625, 4.2879638671875, 4.83935546875, 5.3907470703125, 5.942138671875, 6.4935302734375, 7.044921875, 7.5963134765625, 8.147705078125, 8.6990966796875, 9.25048828125, 9.8018798828125, 10.353271484375, 10.9046630859375, 11.4560546875, 12.0074462890625, 12.558837890625, 13.1102294921875, 13.66162109375, 14.2130126953125, 14.764404296875, 15.3157958984375, 15.8671875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 12.0, 15.0, 10.0, 33.0, 43.0, 66.0, 78.0, 100.0, 103.0, 106.0, 114.0, 93.0, 65.0, 51.0, 45.0, 25.0, 17.0, 9.0, 11.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.406036376953125, -48.03774642944336, -46.66946029663086, -45.301170349121094, -43.932884216308594, -42.56459426879883, -41.19630432128906, -39.82801818847656, -38.4597282409668, -37.09143829345703, -35.72315216064453, -34.354862213134766, -32.986572265625, -31.6182861328125, -30.249996185302734, -28.8817081451416, -27.51342010498047, -26.145132064819336, -24.776844024658203, -23.408554077148438, -22.040266036987305, -20.671977996826172, -19.303688049316406, -17.935400009155273, -16.56711196899414, -15.198823928833008, -13.830534934997559, -12.46224594116211, -11.093957901000977, -9.725669860839844, -8.357380867004395, -6.989091873168945, -5.620807647705078, -4.252519130706787, -2.884230613708496, -1.515942096710205, -0.14765357971191406, 1.220634937286377, 2.588923454284668, 3.957212448120117, 5.32550048828125, 6.693789005279541, 8.062077522277832, 9.430366516113281, 10.798654556274414, 12.166942596435547, 13.535231590270996, 14.903520584106445, 16.271808624267578, 17.64009666442871, 19.008384704589844, 20.37667465209961, 21.744962692260742, 23.113250732421875, 24.48154067993164, 25.849828720092773, 27.218116760253906, 28.58640480041504, 29.954692840576172, 31.322982788085938, 32.69126892089844, 34.0595588684082, 35.42784881591797, 36.79613494873047, 38.164424896240234]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 14.0, 10.0, 9.0, 17.0, 15.0, 18.0, 17.0, 15.0, 21.0, 24.0, 24.0, 33.0, 36.0, 29.0, 33.0, 43.0, 40.0, 32.0, 28.0, 35.0, 32.0, 37.0, 40.0, 37.0, 46.0, 32.0, 39.0, 29.0, 24.0, 28.0, 24.0, 20.0, 19.0, 10.0, 14.0, 9.0, 13.0, 16.0, 11.0, 9.0, 8.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-26.156085968017578, -25.404306411743164, -24.652524948120117, -23.900745391845703, -23.14896583557129, -22.397184371948242, -21.645404815673828, -20.89362335205078, -20.141843795776367, -19.390064239501953, -18.638282775878906, -17.886503219604492, -17.134723663330078, -16.38294219970703, -15.631162643432617, -14.879382133483887, -14.127602577209473, -13.375822067260742, -12.624042510986328, -11.872262001037598, -11.120481491088867, -10.368701934814453, -9.616921424865723, -8.865140914916992, -8.113361358642578, -7.361581325531006, -6.609800815582275, -5.858020782470703, -5.106240272521973, -4.3544602394104, -3.602680206298828, -2.8508996963500977, -2.099119186401367, -1.3473389148712158, -0.595558762550354, 0.1562213897705078, 0.9080016613006592, 1.6597819328308105, 2.411561965942383, 3.1633424758911133, 3.9151225090026855, 4.666902542114258, 5.418683052062988, 6.1704630851745605, 6.922243118286133, 7.674023628234863, 8.425804138183594, 9.177583694458008, 9.929364204406738, 10.681144714355469, 11.432924270629883, 12.184704780578613, 12.936485290527344, 13.688264846801758, 14.440045356750488, 15.191825866699219, 15.943605422973633, 16.695384979248047, 17.447166442871094, 18.198945999145508, 18.950725555419922, 19.70250701904297, 20.454286575317383, 21.206066131591797, 21.957847595214844]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 2.0, 2.0, 8.0, 5.0, 1.0, 5.0, 11.0, 14.0, 12.0, 19.0, 22.0, 23.0, 27.0, 31.0, 42.0, 29.0, 40.0, 43.0, 37.0, 60.0, 54.0, 46.0, 35.0, 42.0, 61.0, 36.0, 49.0, 32.0, 49.0, 25.0, 24.0, 20.0, 26.0, 11.0, 19.0, 10.0, 11.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.107421875, -3.0081787109375, -2.908935546875, -2.8096923828125, -2.71044921875, -2.6112060546875, -2.511962890625, -2.4127197265625, -2.3134765625, -2.2142333984375, -2.114990234375, -2.0157470703125, -1.91650390625, -1.8172607421875, -1.718017578125, -1.6187744140625, -1.51953125, -1.4202880859375, -1.321044921875, -1.2218017578125, -1.12255859375, -1.0233154296875, -0.924072265625, -0.8248291015625, -0.7255859375, -0.6263427734375, -0.527099609375, -0.4278564453125, -0.32861328125, -0.2293701171875, -0.130126953125, -0.0308837890625, 0.068359375, 0.1676025390625, 0.266845703125, 0.3660888671875, 0.46533203125, 0.5645751953125, 0.663818359375, 0.7630615234375, 0.8623046875, 0.9615478515625, 1.060791015625, 1.1600341796875, 1.25927734375, 1.3585205078125, 1.457763671875, 1.5570068359375, 1.65625, 1.7554931640625, 1.854736328125, 1.9539794921875, 2.05322265625, 2.1524658203125, 2.251708984375, 2.3509521484375, 2.4501953125, 2.5494384765625, 2.648681640625, 2.7479248046875, 2.84716796875, 2.9464111328125, 3.045654296875, 3.1448974609375, 3.244140625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 8.0, 13.0, 19.0, 20.0, 52.0, 68.0, 93.0, 128.0, 208.0, 307.0, 483.0, 693.0, 1033.0, 1606.0, 2451.0, 3652.0, 5676.0, 8713.0, 13744.0, 21105.0, 33493.0, 56761.0, 101764.0, 241199.0, 279582.0, 113250.0, 61446.0, 36416.0, 22868.0, 14570.0, 9430.0, 6098.0, 3970.0, 2603.0, 1708.0, 1114.0, 718.0, 512.0, 320.0, 230.0, 142.0, 95.0, 71.0, 46.0, 24.0, 19.0, 14.0, 13.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.1541748046875, -0.14965057373046875, -0.1451263427734375, -0.14060211181640625, -0.136077880859375, -0.13155364990234375, -0.1270294189453125, -0.12250518798828125, -0.11798095703125, -0.11345672607421875, -0.1089324951171875, -0.10440826416015625, -0.099884033203125, -0.09535980224609375, -0.0908355712890625, -0.08631134033203125, -0.081787109375, -0.07726287841796875, -0.0727386474609375, -0.06821441650390625, -0.063690185546875, -0.05916595458984375, -0.0546417236328125, -0.05011749267578125, -0.04559326171875, -0.04106903076171875, -0.0365447998046875, -0.03202056884765625, -0.027496337890625, -0.02297210693359375, -0.0184478759765625, -0.01392364501953125, -0.0093994140625, -0.00487518310546875, -0.0003509521484375, 0.00417327880859375, 0.008697509765625, 0.01322174072265625, 0.0177459716796875, 0.02227020263671875, 0.02679443359375, 0.03131866455078125, 0.0358428955078125, 0.04036712646484375, 0.044891357421875, 0.04941558837890625, 0.0539398193359375, 0.05846405029296875, 0.06298828125, 0.06751251220703125, 0.0720367431640625, 0.07656097412109375, 0.081085205078125, 0.08560943603515625, 0.0901336669921875, 0.09465789794921875, 0.09918212890625, 0.10370635986328125, 0.1082305908203125, 0.11275482177734375, 0.117279052734375, 0.12180328369140625, 0.1263275146484375, 0.13085174560546875, 0.1353759765625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 2.0, 8.0, 7.0, 11.0, 16.0, 15.0, 8.0, 16.0, 17.0, 32.0, 19.0, 26.0, 25.0, 40.0, 43.0, 29.0, 36.0, 43.0, 34.0, 37.0, 1066.0, 42.0, 38.0, 50.0, 41.0, 29.0, 40.0, 36.0, 39.0, 24.0, 22.0, 14.0, 21.0, 11.0, 12.0, 11.0, 15.0, 7.0, 7.0, 7.0, 4.0, 7.0, 8.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.298828125, -2.22186279296875, -2.1448974609375, -2.06793212890625, -1.990966796875, -1.91400146484375, -1.8370361328125, -1.76007080078125, -1.68310546875, -1.60614013671875, -1.5291748046875, -1.45220947265625, -1.375244140625, -1.29827880859375, -1.2213134765625, -1.14434814453125, -1.0673828125, -0.99041748046875, -0.9134521484375, -0.83648681640625, -0.759521484375, -0.68255615234375, -0.6055908203125, -0.52862548828125, -0.45166015625, -0.37469482421875, -0.2977294921875, -0.22076416015625, -0.143798828125, -0.06683349609375, 0.0101318359375, 0.08709716796875, 0.1640625, 0.24102783203125, 0.3179931640625, 0.39495849609375, 0.471923828125, 0.54888916015625, 0.6258544921875, 0.70281982421875, 0.77978515625, 0.85675048828125, 0.9337158203125, 1.01068115234375, 1.087646484375, 1.16461181640625, 1.2415771484375, 1.31854248046875, 1.3955078125, 1.47247314453125, 1.5494384765625, 1.62640380859375, 1.703369140625, 1.78033447265625, 1.8572998046875, 1.93426513671875, 2.01123046875, 2.08819580078125, 2.1651611328125, 2.24212646484375, 2.319091796875, 2.39605712890625, 2.4730224609375, 2.54998779296875, 2.626953125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 3.0, 10.0, 22.0, 18.0, 19.0, 25.0, 53.0, 60.0, 103.0, 142.0, 147.0, 235.0, 322.0, 464.0, 619.0, 923.0, 1232.0, 1923.0, 2685.0, 3877.0, 5452.0, 7873.0, 12008.0, 17751.0, 26737.0, 40833.0, 65781.0, 116257.0, 1170532.0, 334786.0, 107504.0, 61664.0, 38815.0, 25357.0, 16509.0, 11107.0, 7859.0, 5189.0, 3595.0, 2455.0, 1743.0, 1256.0, 896.0, 686.0, 469.0, 327.0, 254.0, 149.0, 125.0, 90.0, 55.0, 32.0, 35.0, 26.0, 14.0, 10.0, 9.0, 9.0, 7.0, 4.0], "bins": [-0.05206298828125, -0.05048227310180664, -0.04890155792236328, -0.04732084274291992, -0.04574012756347656, -0.0441594123840332, -0.042578697204589844, -0.040997982025146484, -0.039417266845703125, -0.037836551666259766, -0.036255836486816406, -0.03467512130737305, -0.03309440612792969, -0.03151369094848633, -0.02993297576904297, -0.02835226058959961, -0.02677154541015625, -0.02519083023071289, -0.02361011505126953, -0.022029399871826172, -0.020448684692382812, -0.018867969512939453, -0.017287254333496094, -0.015706539154052734, -0.014125823974609375, -0.012545108795166016, -0.010964393615722656, -0.009383678436279297, -0.0078029632568359375, -0.006222248077392578, -0.004641532897949219, -0.0030608177185058594, -0.0014801025390625, 0.00010061264038085938, 0.0016813278198242188, 0.003262042999267578, 0.0048427581787109375, 0.006423473358154297, 0.008004188537597656, 0.009584903717041016, 0.011165618896484375, 0.012746334075927734, 0.014327049255371094, 0.015907764434814453, 0.017488479614257812, 0.019069194793701172, 0.02064990997314453, 0.02223062515258789, 0.02381134033203125, 0.02539205551147461, 0.02697277069091797, 0.028553485870361328, 0.030134201049804688, 0.03171491622924805, 0.033295631408691406, 0.034876346588134766, 0.036457061767578125, 0.038037776947021484, 0.039618492126464844, 0.0411992073059082, 0.04277992248535156, 0.04436063766479492, 0.04594135284423828, 0.04752206802368164, 0.049102783203125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 13.0, 15.0, 7.0, 9.0, 27.0, 13.0, 27.0, 41.0, 42.0, 39.0, 46.0, 74.0, 118.0, 120.0, 73.0, 51.0, 37.0, 43.0, 35.0, 25.0, 23.0, 27.0, 22.0, 11.0, 12.0, 6.0, 8.0, 7.0, 5.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00070953369140625, -0.000684201717376709, -0.000658869743347168, -0.000633537769317627, -0.0006082057952880859, -0.0005828738212585449, -0.0005575418472290039, -0.0005322098731994629, -0.0005068778991699219, -0.00048154592514038086, -0.00045621395111083984, -0.00043088197708129883, -0.0004055500030517578, -0.0003802180290222168, -0.0003548860549926758, -0.00032955408096313477, -0.00030422210693359375, -0.00027889013290405273, -0.0002535581588745117, -0.0002282261848449707, -0.0002028942108154297, -0.00017756223678588867, -0.00015223026275634766, -0.00012689828872680664, -0.00010156631469726562, -7.623434066772461e-05, -5.0902366638183594e-05, -2.5570392608642578e-05, -2.384185791015625e-07, 2.5093555450439453e-05, 5.042552947998047e-05, 7.575750350952148e-05, 0.0001010894775390625, 0.00012642145156860352, 0.00015175342559814453, 0.00017708539962768555, 0.00020241737365722656, 0.00022774934768676758, 0.0002530813217163086, 0.0002784132957458496, 0.0003037452697753906, 0.00032907724380493164, 0.00035440921783447266, 0.00037974119186401367, 0.0004050731658935547, 0.0004304051399230957, 0.0004557371139526367, 0.00048106908798217773, 0.0005064010620117188, 0.0005317330360412598, 0.0005570650100708008, 0.0005823969841003418, 0.0006077289581298828, 0.0006330609321594238, 0.0006583929061889648, 0.0006837248802185059, 0.0007090568542480469, 0.0007343888282775879, 0.0007597208023071289, 0.0007850527763366699, 0.0008103847503662109, 0.000835716724395752, 0.000861048698425293, 0.000886380672454834, 0.000911712646484375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 6.0, 8.0, 12.0, 5.0, 14.0, 20.0, 26.0, 32.0, 32.0, 57.0, 102.0, 175.0, 671.0, 8313.0, 449726.0, 578541.0, 9465.0, 793.0, 227.0, 100.0, 64.0, 43.0, 20.0, 25.0, 12.0, 12.0, 14.0, 10.0, 9.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0154571533203125, -0.015027999877929688, -0.014598846435546875, -0.014169692993164062, -0.01374053955078125, -0.013311386108398438, -0.012882232666015625, -0.012453079223632812, -0.01202392578125, -0.011594772338867188, -0.011165618896484375, -0.010736465454101562, -0.01030731201171875, -0.009878158569335938, -0.009449005126953125, -0.009019851684570312, -0.0085906982421875, -0.008161544799804688, -0.007732391357421875, -0.0073032379150390625, -0.00687408447265625, -0.0064449310302734375, -0.006015777587890625, -0.0055866241455078125, -0.005157470703125, -0.0047283172607421875, -0.004299163818359375, -0.0038700103759765625, -0.00344085693359375, -0.0030117034912109375, -0.002582550048828125, -0.0021533966064453125, -0.0017242431640625, -0.0012950897216796875, -0.000865936279296875, -0.0004367828369140625, -7.62939453125e-06, 0.0004215240478515625, 0.000850677490234375, 0.0012798309326171875, 0.001708984375, 0.0021381378173828125, 0.002567291259765625, 0.0029964447021484375, 0.00342559814453125, 0.0038547515869140625, 0.004283905029296875, 0.0047130584716796875, 0.0051422119140625, 0.0055713653564453125, 0.006000518798828125, 0.0064296722412109375, 0.00685882568359375, 0.0072879791259765625, 0.007717132568359375, 0.008146286010742188, 0.008575439453125, 0.009004592895507812, 0.009433746337890625, 0.009862899780273438, 0.01029205322265625, 0.010721206665039062, 0.011150360107421875, 0.011579513549804688, 0.0120086669921875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 12.0, 485.0, 503.0, 17.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022504893131554127, -0.001876032561995089, -0.0015015758108347654, -0.00112711894325912, -0.0007526621920987964, -0.00037820544093847275, -3.748573362827301e-06, 0.0003707080613821745, 0.0007451649289578199, 0.0011196216801181436, 0.0014940784312784672, 0.0018685352988541126, 0.002242992166429758, 0.00261744880117476, 0.0029919056687504053, 0.003366362303495407, 0.0037408191710710526, 0.004115276038646698, 0.0044897329062223434, 0.004864189773797989, 0.005238646175712347, 0.0056131030432879925, 0.005987559910863638, 0.006362016312777996, 0.0067364731803536415, 0.007110930047929287, 0.007485386915504932, 0.007859843783080578, 0.008234300650656223, 0.008608756586909294, 0.00898321345448494, 0.009357670322060585, 0.009732128120958805, 0.01010658498853445, 0.010481041856110096, 0.010855498723685741, 0.011229955591261387, 0.011604411527514458, 0.011978868395090103, 0.012353325262665749, 0.012727782130241394, 0.01310223899781704, 0.013476695865392685, 0.01385115273296833, 0.014225609600543976, 0.014600066468119621, 0.014974523335695267, 0.015348979271948338, 0.015723437070846558, 0.016097893938422203, 0.01647235080599785, 0.016846807673573494, 0.01722126454114914, 0.017595721408724785, 0.01797017827630043, 0.018344635143876076, 0.018719090148806572, 0.019093547016382217, 0.019468003883957863, 0.01984246075153351, 0.020216917619109154, 0.0205913744866848, 0.020965831354260445, 0.02134028822183609, 0.021714745089411736]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 5.0, 8.0, 9.0, 18.0, 19.0, 32.0, 38.0, 50.0, 47.0, 65.0, 65.0, 76.0, 59.0, 71.0, 78.0, 89.0, 61.0, 47.0, 42.0, 36.0, 18.0, 19.0, 19.0, 15.0, 6.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.001292884349822998, -0.0012626098468899727, -0.0012323353439569473, -0.001202060841023922, -0.0011717863380908966, -0.0011415118351578712, -0.0011112373322248459, -0.0010809628292918205, -0.0010506883263587952, -0.0010204138234257698, -0.0009901393204927444, -0.0009598648175597191, -0.0009295903146266937, -0.0008993158116936684, -0.000869041308760643, -0.0008387668058276176, -0.0008084923028945923, -0.0007782177999615669, -0.0007479432970285416, -0.0007176687940955162, -0.0006873942911624908, -0.0006571197882294655, -0.0006268452852964401, -0.0005965707823634148, -0.0005662962794303894, -0.000536021776497364, -0.0005057472735643387, -0.0004754727706313133, -0.00044519826769828796, -0.0004149237647652626, -0.00038464926183223724, -0.0003543747588992119, -0.0003241002559661865, -0.00029382575303316116, -0.0002635512501001358, -0.00023327674716711044, -0.00020300224423408508, -0.00017272774130105972, -0.00014245323836803436, -0.000112178735435009, -8.190423250198364e-05, -5.162972956895828e-05, -2.1355226635932922e-05, 8.919276297092438e-06, 3.91937792301178e-05, 6.946828216314316e-05, 9.974278509616852e-05, 0.00013001728802919388, 0.00016029179096221924, 0.0001905662938952446, 0.00022084079682826996, 0.0002511152997612953, 0.0002813898026943207, 0.00031166430562734604, 0.0003419388085603714, 0.00037221331149339676, 0.0004024878144264221, 0.0004327623173594475, 0.00046303682029247284, 0.0004933113232254982, 0.0005235858261585236, 0.0005538603290915489, 0.0005841348320245743, 0.0006144093349575996, 0.000644683837890625]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 2.0, 2.0, 8.0, 5.0, 1.0, 5.0, 11.0, 14.0, 12.0, 19.0, 22.0, 24.0, 26.0, 31.0, 42.0, 29.0, 40.0, 43.0, 37.0, 60.0, 54.0, 46.0, 35.0, 42.0, 61.0, 36.0, 49.0, 32.0, 49.0, 25.0, 24.0, 20.0, 26.0, 11.0, 19.0, 10.0, 11.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.107421875, -3.0081787109375, -2.908935546875, -2.8096923828125, -2.71044921875, -2.6112060546875, -2.511962890625, -2.4127197265625, -2.3134765625, -2.2142333984375, -2.114990234375, -2.0157470703125, -1.91650390625, -1.8172607421875, -1.718017578125, -1.6187744140625, -1.51953125, -1.4202880859375, -1.321044921875, -1.2218017578125, -1.12255859375, -1.0233154296875, -0.924072265625, -0.8248291015625, -0.7255859375, -0.6263427734375, -0.527099609375, -0.4278564453125, -0.32861328125, -0.2293701171875, -0.130126953125, -0.0308837890625, 0.068359375, 0.1676025390625, 0.266845703125, 0.3660888671875, 0.46533203125, 0.5645751953125, 0.663818359375, 0.7630615234375, 0.8623046875, 0.9615478515625, 1.060791015625, 1.1600341796875, 1.25927734375, 1.3585205078125, 1.457763671875, 1.5570068359375, 1.65625, 1.7554931640625, 1.854736328125, 1.9539794921875, 2.05322265625, 2.1524658203125, 2.251708984375, 2.3509521484375, 2.4501953125, 2.5494384765625, 2.648681640625, 2.7479248046875, 2.84716796875, 2.9464111328125, 3.045654296875, 3.1448974609375, 3.244140625]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 9.0, 10.0, 11.0, 17.0, 39.0, 46.0, 81.0, 115.0, 202.0, 367.0, 691.0, 1319.0, 2844.0, 6723.0, 19350.0, 75653.0, 466056.0, 383934.0, 63006.0, 16792.0, 6000.0, 2576.0, 1236.0, 621.0, 321.0, 200.0, 121.0, 86.0, 32.0, 29.0, 19.0, 17.0, 13.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6328125, -11.2568359375, -10.880859375, -10.5048828125, -10.12890625, -9.7529296875, -9.376953125, -9.0009765625, -8.625, -8.2490234375, -7.873046875, -7.4970703125, -7.12109375, -6.7451171875, -6.369140625, -5.9931640625, -5.6171875, -5.2412109375, -4.865234375, -4.4892578125, -4.11328125, -3.7373046875, -3.361328125, -2.9853515625, -2.609375, -2.2333984375, -1.857421875, -1.4814453125, -1.10546875, -0.7294921875, -0.353515625, 0.0224609375, 0.3984375, 0.7744140625, 1.150390625, 1.5263671875, 1.90234375, 2.2783203125, 2.654296875, 3.0302734375, 3.40625, 3.7822265625, 4.158203125, 4.5341796875, 4.91015625, 5.2861328125, 5.662109375, 6.0380859375, 6.4140625, 6.7900390625, 7.166015625, 7.5419921875, 7.91796875, 8.2939453125, 8.669921875, 9.0458984375, 9.421875, 9.7978515625, 10.173828125, 10.5498046875, 10.92578125, 11.3017578125, 11.677734375, 12.0537109375, 12.4296875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 3.0, 6.0, 13.0, 15.0, 13.0, 11.0, 22.0, 12.0, 33.0, 43.0, 32.0, 41.0, 45.0, 60.0, 101.0, 138.0, 208.0, 1313.0, 249.0, 177.0, 98.0, 74.0, 60.0, 40.0, 40.0, 34.0, 32.0, 23.0, 8.0, 19.0, 20.0, 10.0, 11.0, 13.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.515625, -9.20654296875, -8.8974609375, -8.58837890625, -8.279296875, -7.97021484375, -7.6611328125, -7.35205078125, -7.04296875, -6.73388671875, -6.4248046875, -6.11572265625, -5.806640625, -5.49755859375, -5.1884765625, -4.87939453125, -4.5703125, -4.26123046875, -3.9521484375, -3.64306640625, -3.333984375, -3.02490234375, -2.7158203125, -2.40673828125, -2.09765625, -1.78857421875, -1.4794921875, -1.17041015625, -0.861328125, -0.55224609375, -0.2431640625, 0.06591796875, 0.375, 0.68408203125, 0.9931640625, 1.30224609375, 1.611328125, 1.92041015625, 2.2294921875, 2.53857421875, 2.84765625, 3.15673828125, 3.4658203125, 3.77490234375, 4.083984375, 4.39306640625, 4.7021484375, 5.01123046875, 5.3203125, 5.62939453125, 5.9384765625, 6.24755859375, 6.556640625, 6.86572265625, 7.1748046875, 7.48388671875, 7.79296875, 8.10205078125, 8.4111328125, 8.72021484375, 9.029296875, 9.33837890625, 9.6474609375, 9.95654296875, 10.265625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 7.0, 6.0, 9.0, 15.0, 8.0, 14.0, 13.0, 21.0, 29.0, 31.0, 41.0, 61.0, 101.0, 169.0, 293.0, 629.0, 1467.0, 4089.0, 13232.0, 74066.0, 1477895.0, 1478421.0, 74509.0, 13687.0, 4047.0, 1478.0, 605.0, 288.0, 132.0, 97.0, 62.0, 46.0, 33.0, 21.0, 13.0, 17.0, 11.0, 12.0, 9.0, 5.0, 7.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.234375, -15.72705078125, -15.2197265625, -14.71240234375, -14.205078125, -13.69775390625, -13.1904296875, -12.68310546875, -12.17578125, -11.66845703125, -11.1611328125, -10.65380859375, -10.146484375, -9.63916015625, -9.1318359375, -8.62451171875, -8.1171875, -7.60986328125, -7.1025390625, -6.59521484375, -6.087890625, -5.58056640625, -5.0732421875, -4.56591796875, -4.05859375, -3.55126953125, -3.0439453125, -2.53662109375, -2.029296875, -1.52197265625, -1.0146484375, -0.50732421875, 0.0, 0.50732421875, 1.0146484375, 1.52197265625, 2.029296875, 2.53662109375, 3.0439453125, 3.55126953125, 4.05859375, 4.56591796875, 5.0732421875, 5.58056640625, 6.087890625, 6.59521484375, 7.1025390625, 7.60986328125, 8.1171875, 8.62451171875, 9.1318359375, 9.63916015625, 10.146484375, 10.65380859375, 11.1611328125, 11.66845703125, 12.17578125, 12.68310546875, 13.1904296875, 13.69775390625, 14.205078125, 14.71240234375, 15.2197265625, 15.72705078125, 16.234375]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 15.0, 20.0, 40.0, 68.0, 100.0, 125.0, 147.0, 134.0, 132.0, 82.0, 54.0, 45.0, 19.0, 12.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.56389045715332, -15.25368881225586, -13.943486213684082, -12.633284568786621, -11.323081970214844, -10.012880325317383, -8.702678680419922, -7.3924760818481445, -6.082274436950684, -4.7720723152160645, -3.4618704319000244, -2.1516685485839844, -0.8414664268493652, 0.4687356948852539, 1.7789373397827148, 3.089139938354492, 4.399341583251953, 5.709543704986572, 7.019745826721191, 8.329947471618652, 9.64015007019043, 10.95035171508789, 12.260553359985352, 13.570755958557129, 14.88095760345459, 16.191160202026367, 17.501361846923828, 18.81156349182129, 20.12176513671875, 21.431968688964844, 22.742168426513672, 24.052371978759766, 25.36257553100586, 26.67277717590332, 27.98297882080078, 29.293182373046875, 30.603384017944336, 31.913585662841797, 33.223785400390625, 34.53398895263672, 35.84419250488281, 37.154396057128906, 38.464595794677734, 39.77479934692383, 41.084999084472656, 42.39520263671875, 43.705406188964844, 45.01560592651367, 46.3258056640625, 47.636009216308594, 48.94620895385742, 50.256412506103516, 51.566612243652344, 52.87681579589844, 54.18701934814453, 55.49721908569336, 56.80742263793945, 58.11762619018555, 59.427825927734375, 60.73802947998047, 62.0482292175293, 63.35843276977539, 64.66863250732422, 65.97883605957031, 67.2890396118164]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 6.0, 9.0, 11.0, 17.0, 14.0, 14.0, 23.0, 27.0, 27.0, 25.0, 24.0, 26.0, 30.0, 37.0, 47.0, 47.0, 45.0, 46.0, 40.0, 43.0, 48.0, 36.0, 48.0, 30.0, 40.0, 32.0, 20.0, 31.0, 26.0, 18.0, 16.0, 13.0, 11.0, 9.0, 13.0, 8.0, 12.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.860036849975586, -28.899385452270508, -27.93873405456543, -26.97808074951172, -26.01742935180664, -25.056777954101562, -24.096126556396484, -23.135475158691406, -22.174823760986328, -21.21417236328125, -20.253520965576172, -19.292869567871094, -18.332216262817383, -17.371564865112305, -16.410913467407227, -15.450262069702148, -14.489608764648438, -13.52895736694336, -12.568305015563965, -11.607653617858887, -10.647001266479492, -9.686349868774414, -8.725698471069336, -7.7650465965271, -6.804394721984863, -5.843742847442627, -4.883090972900391, -3.9224395751953125, -2.961787700653076, -2.00113582611084, -1.0404844284057617, -0.07983255386352539, 0.8808174133300781, 1.841469168663025, 2.8021209239959717, 3.762772560119629, 4.723424434661865, 5.684076309204102, 6.64472770690918, 7.605379581451416, 8.566031455993652, 9.52668285369873, 10.487335205078125, 11.447986602783203, 12.408638000488281, 13.369290351867676, 14.329941749572754, 15.290594100952148, 16.251245498657227, 17.211896896362305, 18.172548294067383, 19.133201599121094, 20.093852996826172, 21.05450439453125, 22.015155792236328, 22.975807189941406, 23.936458587646484, 24.897109985351562, 25.85776138305664, 26.81841278076172, 27.77906608581543, 28.739717483520508, 29.700368881225586, 30.661020278930664, 31.621673583984375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 6.0, 8.0, 1.0, 6.0, 15.0, 23.0, 17.0, 19.0, 22.0, 22.0, 50.0, 21.0, 35.0, 32.0, 40.0, 38.0, 49.0, 53.0, 49.0, 38.0, 46.0, 37.0, 50.0, 48.0, 36.0, 39.0, 37.0, 30.0, 24.0, 20.0, 19.0, 7.0, 13.0, 9.0, 8.0, 8.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.486328125, -3.382415771484375, -3.27850341796875, -3.174591064453125, -3.0706787109375, -2.966766357421875, -2.86285400390625, -2.758941650390625, -2.655029296875, -2.551116943359375, -2.44720458984375, -2.343292236328125, -2.2393798828125, -2.135467529296875, -2.03155517578125, -1.927642822265625, -1.82373046875, -1.719818115234375, -1.61590576171875, -1.511993408203125, -1.4080810546875, -1.304168701171875, -1.20025634765625, -1.096343994140625, -0.992431640625, -0.888519287109375, -0.78460693359375, -0.680694580078125, -0.5767822265625, -0.472869873046875, -0.36895751953125, -0.265045166015625, -0.1611328125, -0.057220458984375, 0.04669189453125, 0.150604248046875, 0.2545166015625, 0.358428955078125, 0.46234130859375, 0.566253662109375, 0.670166015625, 0.774078369140625, 0.87799072265625, 0.981903076171875, 1.0858154296875, 1.189727783203125, 1.29364013671875, 1.397552490234375, 1.50146484375, 1.605377197265625, 1.70928955078125, 1.813201904296875, 1.9171142578125, 2.021026611328125, 2.12493896484375, 2.228851318359375, 2.332763671875, 2.436676025390625, 2.54058837890625, 2.644500732421875, 2.7484130859375, 2.852325439453125, 2.95623779296875, 3.060150146484375, 3.1640625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 8.0, 4.0, 9.0, 7.0, 25.0, 24.0, 40.0, 49.0, 108.0, 158.0, 272.0, 455.0, 771.0, 1500.0, 3344.0, 8105.0, 26570.0, 199498.0, 2623301.0, 1221508.0, 82779.0, 15952.0, 5244.0, 2146.0, 1069.0, 549.0, 311.0, 172.0, 114.0, 67.0, 42.0, 33.0, 14.0, 11.0, 13.0, 3.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4921875, -11.1419677734375, -10.791748046875, -10.4415283203125, -10.09130859375, -9.7410888671875, -9.390869140625, -9.0406494140625, -8.6904296875, -8.3402099609375, -7.989990234375, -7.6397705078125, -7.28955078125, -6.9393310546875, -6.589111328125, -6.2388916015625, -5.888671875, -5.5384521484375, -5.188232421875, -4.8380126953125, -4.48779296875, -4.1375732421875, -3.787353515625, -3.4371337890625, -3.0869140625, -2.7366943359375, -2.386474609375, -2.0362548828125, -1.68603515625, -1.3358154296875, -0.985595703125, -0.6353759765625, -0.28515625, 0.0650634765625, 0.415283203125, 0.7655029296875, 1.11572265625, 1.4659423828125, 1.816162109375, 2.1663818359375, 2.5166015625, 2.8668212890625, 3.217041015625, 3.5672607421875, 3.91748046875, 4.2677001953125, 4.617919921875, 4.9681396484375, 5.318359375, 5.6685791015625, 6.018798828125, 6.3690185546875, 6.71923828125, 7.0694580078125, 7.419677734375, 7.7698974609375, 8.1201171875, 8.4703369140625, 8.820556640625, 9.1707763671875, 9.52099609375, 9.8712158203125, 10.221435546875, 10.5716552734375, 10.921875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 1.0, 5.0, 2.0, 7.0, 9.0, 11.0, 12.0, 25.0, 25.0, 38.0, 52.0, 69.0, 96.0, 114.0, 155.0, 241.0, 302.0, 389.0, 458.0, 482.0, 428.0, 304.0, 220.0, 182.0, 134.0, 82.0, 47.0, 44.0, 33.0, 13.0, 16.0, 14.0, 15.0, 13.0, 4.0, 8.0, 3.0, 10.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.28125, -6.07208251953125, -5.8629150390625, -5.65374755859375, -5.444580078125, -5.23541259765625, -5.0262451171875, -4.81707763671875, -4.60791015625, -4.39874267578125, -4.1895751953125, -3.98040771484375, -3.771240234375, -3.56207275390625, -3.3529052734375, -3.14373779296875, -2.9345703125, -2.72540283203125, -2.5162353515625, -2.30706787109375, -2.097900390625, -1.88873291015625, -1.6795654296875, -1.47039794921875, -1.26123046875, -1.05206298828125, -0.8428955078125, -0.63372802734375, -0.424560546875, -0.21539306640625, -0.0062255859375, 0.20294189453125, 0.412109375, 0.62127685546875, 0.8304443359375, 1.03961181640625, 1.248779296875, 1.45794677734375, 1.6671142578125, 1.87628173828125, 2.08544921875, 2.29461669921875, 2.5037841796875, 2.71295166015625, 2.922119140625, 3.13128662109375, 3.3404541015625, 3.54962158203125, 3.7587890625, 3.96795654296875, 4.1771240234375, 4.38629150390625, 4.595458984375, 4.80462646484375, 5.0137939453125, 5.22296142578125, 5.43212890625, 5.64129638671875, 5.8504638671875, 6.05963134765625, 6.268798828125, 6.47796630859375, 6.6871337890625, 6.89630126953125, 7.10546875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 6.0, 13.0, 6.0, 18.0, 19.0, 23.0, 24.0, 32.0, 53.0, 88.0, 143.0, 270.0, 711.0, 1902.0, 7106.0, 56316.0, 2241944.0, 1828059.0, 47723.0, 6559.0, 1820.0, 634.0, 307.0, 159.0, 111.0, 66.0, 38.0, 28.0, 26.0, 15.0, 18.0, 4.0, 4.0, 10.0, 2.0, 5.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.375, -22.666015625, -21.95703125, -21.248046875, -20.5390625, -19.830078125, -19.12109375, -18.412109375, -17.703125, -16.994140625, -16.28515625, -15.576171875, -14.8671875, -14.158203125, -13.44921875, -12.740234375, -12.03125, -11.322265625, -10.61328125, -9.904296875, -9.1953125, -8.486328125, -7.77734375, -7.068359375, -6.359375, -5.650390625, -4.94140625, -4.232421875, -3.5234375, -2.814453125, -2.10546875, -1.396484375, -0.6875, 0.021484375, 0.73046875, 1.439453125, 2.1484375, 2.857421875, 3.56640625, 4.275390625, 4.984375, 5.693359375, 6.40234375, 7.111328125, 7.8203125, 8.529296875, 9.23828125, 9.947265625, 10.65625, 11.365234375, 12.07421875, 12.783203125, 13.4921875, 14.201171875, 14.91015625, 15.619140625, 16.328125, 17.037109375, 17.74609375, 18.455078125, 19.1640625, 19.873046875, 20.58203125, 21.291015625, 22.0]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 16.0, 29.0, 86.0, 143.0, 184.0, 229.0, 151.0, 95.0, 46.0, 14.0, 9.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.230268478393555, -17.723499298095703, -15.216730117797852, -12.709961891174316, -10.203192710876465, -7.696423530578613, -5.189655303955078, -2.6828861236572266, -0.176116943359375, 2.3306519985198975, 4.83742094039917, 7.344189643859863, 9.850958824157715, 12.357728004455566, 14.864496231079102, 17.371265411376953, 19.878034591674805, 22.384803771972656, 24.891572952270508, 27.39834213256836, 29.905109405517578, 32.41188049316406, 34.91864776611328, 37.4254150390625, 39.932186126708984, 42.4389533996582, 44.94572448730469, 47.452491760253906, 49.95926284790039, 52.46603012084961, 54.972801208496094, 57.47956848144531, 59.98633575439453, 62.49310302734375, 64.99987030029297, 67.50664520263672, 70.01341247558594, 72.52017974853516, 75.02694702148438, 77.53372192382812, 80.04048919677734, 82.54725646972656, 85.05402374267578, 87.56079864501953, 90.06756591796875, 92.57433319091797, 95.08110046386719, 97.58787536621094, 100.09463500976562, 102.60140228271484, 105.10816955566406, 107.61494445800781, 110.12171173095703, 112.62847900390625, 115.13524627685547, 117.64201354980469, 120.14878845214844, 122.65555572509766, 125.16232299804688, 127.66909790039062, 130.1758575439453, 132.68263244628906, 135.1894073486328, 137.6961669921875, 140.20294189453125]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 7.0, 4.0, 5.0, 10.0, 8.0, 11.0, 14.0, 18.0, 16.0, 21.0, 16.0, 37.0, 30.0, 38.0, 29.0, 33.0, 41.0, 44.0, 50.0, 39.0, 50.0, 49.0, 53.0, 44.0, 45.0, 36.0, 25.0, 21.0, 22.0, 31.0, 26.0, 19.0, 22.0, 18.0, 18.0, 12.0, 8.0, 6.0, 10.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.2144832611084, -24.47092628479004, -23.727367401123047, -22.983810424804688, -22.240253448486328, -21.49669647216797, -20.75313949584961, -20.009580612182617, -19.266023635864258, -18.5224666595459, -17.778907775878906, -17.035350799560547, -16.291793823242188, -15.548236846923828, -14.804678916931152, -14.061120986938477, -13.317564010620117, -12.574007034301758, -11.830449104309082, -11.086891174316406, -10.343334197998047, -9.599777221679688, -8.856219291687012, -8.112661361694336, -7.369104385375977, -6.625546932220459, -5.881989479064941, -5.138432025909424, -4.394874572753906, -3.6513171195983887, -2.907759666442871, -2.1642022132873535, -1.4206466674804688, -0.6770892143249512, 0.0664682388305664, 0.810025691986084, 1.5535831451416016, 2.297140598297119, 3.0406980514526367, 3.7842555046081543, 4.527812957763672, 5.2713704109191895, 6.014927864074707, 6.758485317230225, 7.502042770385742, 8.245599746704102, 8.989157676696777, 9.732715606689453, 10.476272583007812, 11.219829559326172, 11.963387489318848, 12.706945419311523, 13.450502395629883, 14.194059371948242, 14.937617301940918, 15.681175231933594, 16.424732208251953, 17.168289184570312, 17.911846160888672, 18.655405044555664, 19.398962020874023, 20.142518997192383, 20.886077880859375, 21.629634857177734, 22.373191833496094]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 7.0, 4.0, 5.0, 6.0, 11.0, 10.0, 15.0, 14.0, 19.0, 30.0, 29.0, 30.0, 22.0, 28.0, 39.0, 53.0, 35.0, 44.0, 47.0, 42.0, 40.0, 50.0, 39.0, 45.0, 43.0, 37.0, 40.0, 42.0, 32.0, 27.0, 17.0, 18.0, 18.0, 12.0, 19.0, 8.0, 7.0, 6.0, 4.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1171875, -3.013580322265625, -2.90997314453125, -2.806365966796875, -2.7027587890625, -2.599151611328125, -2.49554443359375, -2.391937255859375, -2.288330078125, -2.184722900390625, -2.08111572265625, -1.977508544921875, -1.8739013671875, -1.770294189453125, -1.66668701171875, -1.563079833984375, -1.45947265625, -1.355865478515625, -1.25225830078125, -1.148651123046875, -1.0450439453125, -0.941436767578125, -0.83782958984375, -0.734222412109375, -0.630615234375, -0.527008056640625, -0.42340087890625, -0.319793701171875, -0.2161865234375, -0.112579345703125, -0.00897216796875, 0.094635009765625, 0.1982421875, 0.301849365234375, 0.40545654296875, 0.509063720703125, 0.6126708984375, 0.716278076171875, 0.81988525390625, 0.923492431640625, 1.027099609375, 1.130706787109375, 1.23431396484375, 1.337921142578125, 1.4415283203125, 1.545135498046875, 1.64874267578125, 1.752349853515625, 1.85595703125, 1.959564208984375, 2.06317138671875, 2.166778564453125, 2.2703857421875, 2.373992919921875, 2.47760009765625, 2.581207275390625, 2.684814453125, 2.788421630859375, 2.89202880859375, 2.995635986328125, 3.0992431640625, 3.202850341796875, 3.30645751953125, 3.410064697265625, 3.513671875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 3.0, 18.0, 13.0, 21.0, 43.0, 59.0, 81.0, 149.0, 153.0, 291.0, 399.0, 654.0, 1037.0, 1585.0, 2429.0, 3767.0, 5756.0, 9417.0, 15253.0, 25505.0, 44359.0, 81679.0, 169423.0, 325170.0, 168612.0, 81923.0, 44404.0, 25564.0, 15045.0, 9259.0, 5881.0, 3776.0, 2366.0, 1475.0, 1020.0, 661.0, 433.0, 300.0, 195.0, 122.0, 92.0, 49.0, 37.0, 22.0, 21.0, 17.0, 10.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.166015625, -0.16057205200195312, -0.15512847900390625, -0.14968490600585938, -0.1442413330078125, -0.13879776000976562, -0.13335418701171875, -0.12791061401367188, -0.122467041015625, -0.11702346801757812, -0.11157989501953125, -0.10613632202148438, -0.1006927490234375, -0.09524917602539062, -0.08980560302734375, -0.08436203002929688, -0.07891845703125, -0.07347488403320312, -0.06803131103515625, -0.06258773803710938, -0.0571441650390625, -0.051700592041015625, -0.04625701904296875, -0.040813446044921875, -0.035369873046875, -0.029926300048828125, -0.02448272705078125, -0.019039154052734375, -0.0135955810546875, -0.008152008056640625, -0.00270843505859375, 0.002735137939453125, 0.0081787109375, 0.013622283935546875, 0.01906585693359375, 0.024509429931640625, 0.0299530029296875, 0.035396575927734375, 0.04084014892578125, 0.046283721923828125, 0.051727294921875, 0.057170867919921875, 0.06261444091796875, 0.06805801391601562, 0.0735015869140625, 0.07894515991210938, 0.08438873291015625, 0.08983230590820312, 0.09527587890625, 0.10071945190429688, 0.10616302490234375, 0.11160659790039062, 0.1170501708984375, 0.12249374389648438, 0.12793731689453125, 0.13338088989257812, 0.138824462890625, 0.14426803588867188, 0.14971160888671875, 0.15515518188476562, 0.1605987548828125, 0.16604232788085938, 0.17148590087890625, 0.17692947387695312, 0.182373046875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 7.0, 12.0, 7.0, 12.0, 13.0, 16.0, 16.0, 21.0, 16.0, 17.0, 28.0, 26.0, 26.0, 26.0, 42.0, 35.0, 33.0, 44.0, 36.0, 38.0, 1064.0, 39.0, 36.0, 39.0, 38.0, 26.0, 36.0, 28.0, 31.0, 31.0, 33.0, 22.0, 18.0, 21.0, 12.0, 16.0, 11.0, 13.0, 7.0, 5.0, 6.0, 9.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.615234375, -2.535308837890625, -2.45538330078125, -2.375457763671875, -2.2955322265625, -2.215606689453125, -2.13568115234375, -2.055755615234375, -1.975830078125, -1.895904541015625, -1.81597900390625, -1.736053466796875, -1.6561279296875, -1.576202392578125, -1.49627685546875, -1.416351318359375, -1.33642578125, -1.256500244140625, -1.17657470703125, -1.096649169921875, -1.0167236328125, -0.936798095703125, -0.85687255859375, -0.776947021484375, -0.697021484375, -0.617095947265625, -0.53717041015625, -0.457244873046875, -0.3773193359375, -0.297393798828125, -0.21746826171875, -0.137542724609375, -0.0576171875, 0.022308349609375, 0.10223388671875, 0.182159423828125, 0.2620849609375, 0.342010498046875, 0.42193603515625, 0.501861572265625, 0.581787109375, 0.661712646484375, 0.74163818359375, 0.821563720703125, 0.9014892578125, 0.981414794921875, 1.06134033203125, 1.141265869140625, 1.22119140625, 1.301116943359375, 1.38104248046875, 1.460968017578125, 1.5408935546875, 1.620819091796875, 1.70074462890625, 1.780670166015625, 1.860595703125, 1.940521240234375, 2.02044677734375, 2.100372314453125, 2.1802978515625, 2.260223388671875, 2.34014892578125, 2.420074462890625, 2.5]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 7.0, 10.0, 17.0, 13.0, 31.0, 33.0, 45.0, 72.0, 87.0, 126.0, 181.0, 299.0, 385.0, 518.0, 712.0, 1051.0, 1457.0, 1978.0, 2709.0, 3980.0, 5565.0, 7791.0, 11214.0, 15667.0, 23360.0, 34812.0, 53961.0, 89851.0, 170040.0, 1300163.0, 141790.0, 78705.0, 48532.0, 31463.0, 20914.0, 14568.0, 10081.0, 7094.0, 5098.0, 3584.0, 2611.0, 1898.0, 1280.0, 967.0, 684.0, 477.0, 369.0, 258.0, 203.0, 127.0, 81.0, 70.0, 46.0, 40.0, 19.0, 21.0, 12.0, 11.0, 1.0, 5.0, 2.0, 1.0], "bins": [-0.050750732421875, -0.04913330078125, -0.047515869140625, -0.0458984375, -0.044281005859375, -0.04266357421875, -0.041046142578125, -0.0394287109375, -0.037811279296875, -0.03619384765625, -0.034576416015625, -0.032958984375, -0.031341552734375, -0.02972412109375, -0.028106689453125, -0.0264892578125, -0.024871826171875, -0.02325439453125, -0.021636962890625, -0.02001953125, -0.018402099609375, -0.01678466796875, -0.015167236328125, -0.0135498046875, -0.011932373046875, -0.01031494140625, -0.008697509765625, -0.007080078125, -0.005462646484375, -0.00384521484375, -0.002227783203125, -0.0006103515625, 0.001007080078125, 0.00262451171875, 0.004241943359375, 0.005859375, 0.007476806640625, 0.00909423828125, 0.010711669921875, 0.0123291015625, 0.013946533203125, 0.01556396484375, 0.017181396484375, 0.018798828125, 0.020416259765625, 0.02203369140625, 0.023651123046875, 0.0252685546875, 0.026885986328125, 0.02850341796875, 0.030120849609375, 0.03173828125, 0.033355712890625, 0.03497314453125, 0.036590576171875, 0.0382080078125, 0.039825439453125, 0.04144287109375, 0.043060302734375, 0.044677734375, 0.046295166015625, 0.04791259765625, 0.049530029296875, 0.0511474609375, 0.052764892578125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 5.0, 1.0, 7.0, 7.0, 6.0, 8.0, 8.0, 7.0, 19.0, 24.0, 30.0, 27.0, 36.0, 54.0, 58.0, 73.0, 126.0, 125.0, 83.0, 47.0, 44.0, 31.0, 32.0, 27.0, 18.0, 11.0, 15.0, 5.0, 9.0, 12.0, 6.0, 7.0, 1.0, 5.0, 2.0, 8.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0009245872497558594, -0.0008936896920204163, -0.0008627921342849731, -0.00083189457654953, -0.0008009970188140869, -0.0007700994610786438, -0.0007392019033432007, -0.0007083043456077576, -0.0006774067878723145, -0.0006465092301368713, -0.0006156116724014282, -0.0005847141146659851, -0.000553816556930542, -0.0005229189991950989, -0.0004920214414596558, -0.00046112388372421265, -0.00043022632598876953, -0.0003993287682533264, -0.0003684312105178833, -0.0003375336527824402, -0.00030663609504699707, -0.00027573853731155396, -0.00024484097957611084, -0.00021394342184066772, -0.0001830458641052246, -0.0001521483063697815, -0.00012125074863433838, -9.035319089889526e-05, -5.945563316345215e-05, -2.8558075428009033e-05, 2.339482307434082e-06, 3.32370400428772e-05, 6.413459777832031e-05, 9.503215551376343e-05, 0.00012592971324920654, 0.00015682727098464966, 0.00018772482872009277, 0.0002186223864555359, 0.000249519944190979, 0.0002804175019264221, 0.00031131505966186523, 0.00034221261739730835, 0.00037311017513275146, 0.0004040077328681946, 0.0004349052906036377, 0.0004658028483390808, 0.0004967004060745239, 0.000527597963809967, 0.0005584955215454102, 0.0005893930792808533, 0.0006202906370162964, 0.0006511881947517395, 0.0006820857524871826, 0.0007129833102226257, 0.0007438808679580688, 0.000774778425693512, 0.0008056759834289551, 0.0008365735411643982, 0.0008674710988998413, 0.0008983686566352844, 0.0009292662143707275, 0.0009601637721061707, 0.0009910613298416138, 0.0010219588875770569, 0.0010528564453125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 10.0, 1.0, 3.0, 3.0, 2.0, 8.0, 10.0, 13.0, 5.0, 11.0, 15.0, 17.0, 35.0, 40.0, 72.0, 102.0, 283.0, 1278.0, 31318.0, 979370.0, 33975.0, 1363.0, 251.0, 116.0, 58.0, 51.0, 37.0, 27.0, 16.0, 9.0, 11.0, 7.0, 6.0, 6.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.019622802734375, -0.019054174423217773, -0.018485546112060547, -0.01791691780090332, -0.017348289489746094, -0.016779661178588867, -0.01621103286743164, -0.015642404556274414, -0.015073776245117188, -0.014505147933959961, -0.013936519622802734, -0.013367891311645508, -0.012799263000488281, -0.012230634689331055, -0.011662006378173828, -0.011093378067016602, -0.010524749755859375, -0.009956121444702148, -0.009387493133544922, -0.008818864822387695, -0.008250236511230469, -0.007681608200073242, -0.007112979888916016, -0.006544351577758789, -0.0059757232666015625, -0.005407094955444336, -0.004838466644287109, -0.004269838333129883, -0.0037012100219726562, -0.0031325817108154297, -0.002563953399658203, -0.0019953250885009766, -0.00142669677734375, -0.0008580684661865234, -0.0002894401550292969, 0.0002791881561279297, 0.0008478164672851562, 0.0014164447784423828, 0.0019850730895996094, 0.002553701400756836, 0.0031223297119140625, 0.003690958023071289, 0.004259586334228516, 0.004828214645385742, 0.005396842956542969, 0.005965471267700195, 0.006534099578857422, 0.0071027278900146484, 0.007671356201171875, 0.008239984512329102, 0.008808612823486328, 0.009377241134643555, 0.009945869445800781, 0.010514497756958008, 0.011083126068115234, 0.011651754379272461, 0.012220382690429688, 0.012789011001586914, 0.01335763931274414, 0.013926267623901367, 0.014494895935058594, 0.01506352424621582, 0.015632152557373047, 0.016200780868530273, 0.0167694091796875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 653.0, 359.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018341382965445518, -0.001212620292790234, -0.0005911022890359163, 3.0415714718401432e-05, 0.0006519337184727192, 0.0012734518386423588, 0.0018949697259813547, 0.0025164876133203506, 0.0031380057334899902, 0.00375952385365963, 0.004381041973829269, 0.005002559628337622, 0.005624077748507261, 0.006245595868676901, 0.006867113523185253, 0.007488631643354893, 0.008110149763524532, 0.008731667883694172, 0.009353186003863811, 0.009974704124033451, 0.010596221312880516, 0.011217739433050156, 0.011839257553219795, 0.012460775673389435, 0.013082293793559074, 0.013703811913728714, 0.014325330033898354, 0.014946848154067993, 0.015568366274237633, 0.016189884394407272, 0.016811402514576912, 0.01743292063474655, 0.018054436892271042, 0.01867595501244068, 0.01929747313261032, 0.01991899125277996, 0.0205405093729496, 0.02116202749311924, 0.02178354561328888, 0.02240506187081337, 0.02302658185362816, 0.023648099973797798, 0.024269618093967438, 0.024891136214137077, 0.025512654334306717, 0.026134172454476357, 0.026755690574645996, 0.027377206832170486, 0.027998724952340126, 0.028620243072509766, 0.029241761192679405, 0.029863279312849045, 0.030484797433018684, 0.031106315553188324, 0.031727831810712814, 0.0323493517935276, 0.032970868051052094, 0.033592384308576584, 0.03421390429139137, 0.03483542054891586, 0.03545694053173065, 0.03607845678925514, 0.03669997677206993, 0.03732149302959442, 0.03794301301240921]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 7.0, 9.0, 7.0, 13.0, 29.0, 30.0, 30.0, 46.0, 55.0, 50.0, 84.0, 73.0, 79.0, 108.0, 66.0, 85.0, 63.0, 53.0, 42.0, 35.0, 24.0, 10.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.002049744129180908, -0.002006715163588524, -0.0019636861979961395, -0.0019206572324037552, -0.0018776282668113708, -0.0018345993012189865, -0.0017915703356266022, -0.0017485413700342178, -0.0017055124044418335, -0.0016624834388494492, -0.0016194544732570648, -0.0015764255076646805, -0.0015333965420722961, -0.0014903675764799118, -0.0014473386108875275, -0.0014043096452951431, -0.0013612806797027588, -0.0013182517141103745, -0.0012752227485179901, -0.0012321937829256058, -0.0011891648173332214, -0.001146135851740837, -0.0011031068861484528, -0.0010600779205560684, -0.001017048954963684, -0.0009740199893712997, -0.0009309910237789154, -0.0008879620581865311, -0.0008449330925941467, -0.0008019041270017624, -0.000758875161409378, -0.0007158461958169937, -0.0006728172302246094, -0.000629788264632225, -0.0005867592990398407, -0.0005437303334474564, -0.000500701367855072, -0.0004576724022626877, -0.00041464343667030334, -0.000371614471077919, -0.00032858550548553467, -0.00028555653989315033, -0.000242527574300766, -0.00019949860870838165, -0.00015646964311599731, -0.00011344067752361298, -7.041171193122864e-05, -2.73827463388443e-05, 1.564621925354004e-05, 5.867518484592438e-05, 0.00010170415043830872, 0.00014473311603069305, 0.0001877620816230774, 0.00023079104721546173, 0.00027382001280784607, 0.0003168489784002304, 0.00035987794399261475, 0.0004029069095849991, 0.0004459358751773834, 0.0004889648407697678, 0.0005319938063621521, 0.0005750227719545364, 0.0006180517375469208, 0.0006610807031393051, 0.0007041096687316895]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 7.0, 4.0, 5.0, 6.0, 11.0, 10.0, 15.0, 14.0, 19.0, 30.0, 29.0, 30.0, 22.0, 28.0, 39.0, 53.0, 35.0, 44.0, 47.0, 42.0, 40.0, 50.0, 39.0, 45.0, 43.0, 37.0, 40.0, 42.0, 32.0, 27.0, 17.0, 18.0, 18.0, 12.0, 19.0, 8.0, 7.0, 6.0, 4.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1171875, -3.013580322265625, -2.90997314453125, -2.806365966796875, -2.7027587890625, -2.599151611328125, -2.49554443359375, -2.391937255859375, -2.288330078125, -2.184722900390625, -2.08111572265625, -1.977508544921875, -1.8739013671875, -1.770294189453125, -1.66668701171875, -1.563079833984375, -1.45947265625, -1.355865478515625, -1.25225830078125, -1.148651123046875, -1.0450439453125, -0.941436767578125, -0.83782958984375, -0.734222412109375, -0.630615234375, -0.527008056640625, -0.42340087890625, -0.319793701171875, -0.2161865234375, -0.112579345703125, -0.00897216796875, 0.094635009765625, 0.1982421875, 0.301849365234375, 0.40545654296875, 0.509063720703125, 0.6126708984375, 0.716278076171875, 0.81988525390625, 0.923492431640625, 1.027099609375, 1.130706787109375, 1.23431396484375, 1.337921142578125, 1.4415283203125, 1.545135498046875, 1.64874267578125, 1.752349853515625, 1.85595703125, 1.959564208984375, 2.06317138671875, 2.166778564453125, 2.2703857421875, 2.373992919921875, 2.47760009765625, 2.581207275390625, 2.684814453125, 2.788421630859375, 2.89202880859375, 2.995635986328125, 3.0992431640625, 3.202850341796875, 3.30645751953125, 3.410064697265625, 3.513671875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 12.0, 8.0, 19.0, 21.0, 43.0, 61.0, 118.0, 154.0, 265.0, 454.0, 751.0, 1355.0, 2515.0, 4702.0, 9846.0, 22616.0, 57395.0, 176433.0, 428822.0, 223002.0, 69928.0, 26697.0, 11492.0, 5494.0, 2769.0, 1478.0, 782.0, 526.0, 282.0, 178.0, 116.0, 62.0, 56.0, 32.0, 22.0, 18.0, 9.0, 9.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09765625, -5.91058349609375, -5.7235107421875, -5.53643798828125, -5.349365234375, -5.16229248046875, -4.9752197265625, -4.78814697265625, -4.60107421875, -4.41400146484375, -4.2269287109375, -4.03985595703125, -3.852783203125, -3.66571044921875, -3.4786376953125, -3.29156494140625, -3.1044921875, -2.91741943359375, -2.7303466796875, -2.54327392578125, -2.356201171875, -2.16912841796875, -1.9820556640625, -1.79498291015625, -1.60791015625, -1.42083740234375, -1.2337646484375, -1.04669189453125, -0.859619140625, -0.67254638671875, -0.4854736328125, -0.29840087890625, -0.111328125, 0.07574462890625, 0.2628173828125, 0.44989013671875, 0.636962890625, 0.82403564453125, 1.0111083984375, 1.19818115234375, 1.38525390625, 1.57232666015625, 1.7593994140625, 1.94647216796875, 2.133544921875, 2.32061767578125, 2.5076904296875, 2.69476318359375, 2.8818359375, 3.06890869140625, 3.2559814453125, 3.44305419921875, 3.630126953125, 3.81719970703125, 4.0042724609375, 4.19134521484375, 4.37841796875, 4.56549072265625, 4.7525634765625, 4.93963623046875, 5.126708984375, 5.31378173828125, 5.5008544921875, 5.68792724609375, 5.875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 3.0, 8.0, 9.0, 15.0, 12.0, 13.0, 16.0, 24.0, 28.0, 23.0, 34.0, 43.0, 51.0, 52.0, 73.0, 119.0, 171.0, 1339.0, 330.0, 175.0, 111.0, 70.0, 61.0, 42.0, 41.0, 20.0, 32.0, 28.0, 18.0, 12.0, 20.0, 13.0, 7.0, 8.0, 8.0, 2.0, 6.0, 0.0, 2.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2890625, -10.9466552734375, -10.604248046875, -10.2618408203125, -9.91943359375, -9.5770263671875, -9.234619140625, -8.8922119140625, -8.5498046875, -8.2073974609375, -7.864990234375, -7.5225830078125, -7.18017578125, -6.8377685546875, -6.495361328125, -6.1529541015625, -5.810546875, -5.4681396484375, -5.125732421875, -4.7833251953125, -4.44091796875, -4.0985107421875, -3.756103515625, -3.4136962890625, -3.0712890625, -2.7288818359375, -2.386474609375, -2.0440673828125, -1.70166015625, -1.3592529296875, -1.016845703125, -0.6744384765625, -0.33203125, 0.0103759765625, 0.352783203125, 0.6951904296875, 1.03759765625, 1.3800048828125, 1.722412109375, 2.0648193359375, 2.4072265625, 2.7496337890625, 3.092041015625, 3.4344482421875, 3.77685546875, 4.1192626953125, 4.461669921875, 4.8040771484375, 5.146484375, 5.4888916015625, 5.831298828125, 6.1737060546875, 6.51611328125, 6.8585205078125, 7.200927734375, 7.5433349609375, 7.8857421875, 8.2281494140625, 8.570556640625, 8.9129638671875, 9.25537109375, 9.5977783203125, 9.940185546875, 10.2825927734375, 10.625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 4.0, 11.0, 11.0, 4.0, 14.0, 22.0, 28.0, 41.0, 38.0, 54.0, 71.0, 107.0, 165.0, 228.0, 463.0, 1219.0, 3885.0, 25041.0, 782205.0, 2262337.0, 60165.0, 6404.0, 1626.0, 618.0, 306.0, 183.0, 120.0, 73.0, 65.0, 44.0, 35.0, 19.0, 22.0, 21.0, 14.0, 13.0, 9.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.625, -16.07373046875, -15.5224609375, -14.97119140625, -14.419921875, -13.86865234375, -13.3173828125, -12.76611328125, -12.21484375, -11.66357421875, -11.1123046875, -10.56103515625, -10.009765625, -9.45849609375, -8.9072265625, -8.35595703125, -7.8046875, -7.25341796875, -6.7021484375, -6.15087890625, -5.599609375, -5.04833984375, -4.4970703125, -3.94580078125, -3.39453125, -2.84326171875, -2.2919921875, -1.74072265625, -1.189453125, -0.63818359375, -0.0869140625, 0.46435546875, 1.015625, 1.56689453125, 2.1181640625, 2.66943359375, 3.220703125, 3.77197265625, 4.3232421875, 4.87451171875, 5.42578125, 5.97705078125, 6.5283203125, 7.07958984375, 7.630859375, 8.18212890625, 8.7333984375, 9.28466796875, 9.8359375, 10.38720703125, 10.9384765625, 11.48974609375, 12.041015625, 12.59228515625, 13.1435546875, 13.69482421875, 14.24609375, 14.79736328125, 15.3486328125, 15.89990234375, 16.451171875, 17.00244140625, 17.5537109375, 18.10498046875, 18.65625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 13.0, 325.0, 639.0, 42.0, 1.0], "bins": [-458.5304870605469, -451.0351867675781, -443.5398864746094, -436.0445556640625, -428.54925537109375, -421.053955078125, -413.55865478515625, -406.0633239746094, -398.5680236816406, -391.0727233886719, -383.5774230957031, -376.08209228515625, -368.5867919921875, -361.09149169921875, -353.59619140625, -346.1008605957031, -338.6055603027344, -331.1102600097656, -323.6149597167969, -316.11962890625, -308.62432861328125, -301.1290283203125, -293.63372802734375, -286.1383972167969, -278.6430969238281, -271.1477966308594, -263.6524963378906, -256.15716552734375, -248.661865234375, -241.16656494140625, -233.67124938964844, -226.1759490966797, -218.68063354492188, -211.18533325195312, -203.6900177001953, -196.19471740722656, -188.69940185546875, -181.2041015625, -173.7087860107422, -166.21348571777344, -158.7181854248047, -151.22288513183594, -143.72756958007812, -136.23226928710938, -128.73695373535156, -121.24165344238281, -113.746337890625, -106.25103759765625, -98.75572204589844, -91.26041412353516, -83.76510620117188, -76.2697982788086, -68.77449035644531, -61.2791862487793, -53.783878326416016, -46.288570404052734, -38.79326248168945, -31.297954559326172, -23.80264663696289, -16.307340621948242, -8.812032699584961, -1.3167266845703125, 6.178581237792969, 13.67388916015625, 21.16919708251953]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 11.0, 8.0, 5.0, 12.0, 18.0, 16.0, 17.0, 18.0, 20.0, 19.0, 33.0, 37.0, 38.0, 39.0, 45.0, 41.0, 58.0, 40.0, 45.0, 38.0, 39.0, 33.0, 51.0, 32.0, 32.0, 31.0, 30.0, 25.0, 27.0, 23.0, 32.0, 18.0, 12.0, 17.0, 11.0, 9.0, 3.0, 4.0, 5.0, 1.0, 0.0, 3.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.43394470214844, -32.4145393371582, -31.395137786865234, -30.375734329223633, -29.35633087158203, -28.336925506591797, -27.317522048950195, -26.298118591308594, -25.278715133666992, -24.25931167602539, -23.23990821838379, -22.220504760742188, -21.201099395751953, -20.181697845458984, -19.16229248046875, -18.14288902282715, -17.123485565185547, -16.104082107543945, -15.084678649902344, -14.065274238586426, -13.045870780944824, -12.026467323303223, -11.007062911987305, -9.987659454345703, -8.968255996704102, -7.9488525390625, -6.92944860458374, -5.9100446701049805, -4.890641212463379, -3.8712377548217773, -2.8518338203430176, -1.8324298858642578, -0.8130302429199219, 0.2063734531402588, 1.2257771492004395, 2.24518084526062, 3.264584541320801, 4.283987998962402, 5.303391933441162, 6.322795867919922, 7.342199325561523, 8.361602783203125, 9.381006240844727, 10.400410652160645, 11.419814109802246, 12.439217567443848, 13.458621978759766, 14.478025436401367, 15.497428894042969, 16.51683235168457, 17.536235809326172, 18.555639266967773, 19.575042724609375, 20.59444808959961, 21.61385154724121, 22.633255004882812, 23.652658462524414, 24.672061920166016, 25.691465377807617, 26.71086883544922, 27.730274200439453, 28.749675750732422, 29.769081115722656, 30.788484573364258, 31.80788803100586]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 2.0, 2.0, 4.0, 9.0, 11.0, 6.0, 6.0, 15.0, 12.0, 20.0, 17.0, 22.0, 28.0, 27.0, 30.0, 38.0, 25.0, 40.0, 45.0, 44.0, 51.0, 45.0, 36.0, 39.0, 51.0, 46.0, 36.0, 35.0, 41.0, 38.0, 37.0, 26.0, 20.0, 18.0, 17.0, 13.0, 12.0, 10.0, 7.0, 6.0, 10.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.404296875, -3.298065185546875, -3.19183349609375, -3.085601806640625, -2.9793701171875, -2.873138427734375, -2.76690673828125, -2.660675048828125, -2.554443359375, -2.448211669921875, -2.34197998046875, -2.235748291015625, -2.1295166015625, -2.023284912109375, -1.91705322265625, -1.810821533203125, -1.70458984375, -1.598358154296875, -1.49212646484375, -1.385894775390625, -1.2796630859375, -1.173431396484375, -1.06719970703125, -0.960968017578125, -0.854736328125, -0.748504638671875, -0.64227294921875, -0.536041259765625, -0.4298095703125, -0.323577880859375, -0.21734619140625, -0.111114501953125, -0.0048828125, 0.101348876953125, 0.20758056640625, 0.313812255859375, 0.4200439453125, 0.526275634765625, 0.63250732421875, 0.738739013671875, 0.844970703125, 0.951202392578125, 1.05743408203125, 1.163665771484375, 1.2698974609375, 1.376129150390625, 1.48236083984375, 1.588592529296875, 1.69482421875, 1.801055908203125, 1.90728759765625, 2.013519287109375, 2.1197509765625, 2.225982666015625, 2.33221435546875, 2.438446044921875, 2.544677734375, 2.650909423828125, 2.75714111328125, 2.863372802734375, 2.9696044921875, 3.075836181640625, 3.18206787109375, 3.288299560546875, 3.39453125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 8.0, 6.0, 9.0, 12.0, 24.0, 47.0, 56.0, 97.0, 169.0, 234.0, 452.0, 883.0, 1849.0, 3893.0, 10331.0, 37207.0, 369706.0, 2999431.0, 692840.0, 55603.0, 12653.0, 4565.0, 2034.0, 1001.0, 489.0, 259.0, 153.0, 95.0, 67.0, 29.0, 28.0, 17.0, 17.0, 5.0, 7.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.53125, -11.1776123046875, -10.823974609375, -10.4703369140625, -10.11669921875, -9.7630615234375, -9.409423828125, -9.0557861328125, -8.7021484375, -8.3485107421875, -7.994873046875, -7.6412353515625, -7.28759765625, -6.9339599609375, -6.580322265625, -6.2266845703125, -5.873046875, -5.5194091796875, -5.165771484375, -4.8121337890625, -4.45849609375, -4.1048583984375, -3.751220703125, -3.3975830078125, -3.0439453125, -2.6903076171875, -2.336669921875, -1.9830322265625, -1.62939453125, -1.2757568359375, -0.922119140625, -0.5684814453125, -0.21484375, 0.1387939453125, 0.492431640625, 0.8460693359375, 1.19970703125, 1.5533447265625, 1.906982421875, 2.2606201171875, 2.6142578125, 2.9678955078125, 3.321533203125, 3.6751708984375, 4.02880859375, 4.3824462890625, 4.736083984375, 5.0897216796875, 5.443359375, 5.7969970703125, 6.150634765625, 6.5042724609375, 6.85791015625, 7.2115478515625, 7.565185546875, 7.9188232421875, 8.2724609375, 8.6260986328125, 8.979736328125, 9.3333740234375, 9.68701171875, 10.0406494140625, 10.394287109375, 10.7479248046875, 11.1015625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 12.0, 20.0, 31.0, 40.0, 64.0, 123.0, 151.0, 277.0, 453.0, 713.0, 794.0, 557.0, 358.0, 201.0, 105.0, 63.0, 41.0, 17.0, 23.0, 11.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.203125, -11.845703125, -11.48828125, -11.130859375, -10.7734375, -10.416015625, -10.05859375, -9.701171875, -9.34375, -8.986328125, -8.62890625, -8.271484375, -7.9140625, -7.556640625, -7.19921875, -6.841796875, -6.484375, -6.126953125, -5.76953125, -5.412109375, -5.0546875, -4.697265625, -4.33984375, -3.982421875, -3.625, -3.267578125, -2.91015625, -2.552734375, -2.1953125, -1.837890625, -1.48046875, -1.123046875, -0.765625, -0.408203125, -0.05078125, 0.306640625, 0.6640625, 1.021484375, 1.37890625, 1.736328125, 2.09375, 2.451171875, 2.80859375, 3.166015625, 3.5234375, 3.880859375, 4.23828125, 4.595703125, 4.953125, 5.310546875, 5.66796875, 6.025390625, 6.3828125, 6.740234375, 7.09765625, 7.455078125, 7.8125, 8.169921875, 8.52734375, 8.884765625, 9.2421875, 9.599609375, 9.95703125, 10.314453125, 10.671875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 7.0, 20.0, 25.0, 38.0, 67.0, 159.0, 255.0, 792.0, 2887.0, 28037.0, 3335165.0, 811808.0, 12016.0, 1859.0, 553.0, 277.0, 126.0, 69.0, 45.0, 27.0, 13.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.9375, -31.7958984375, -30.654296875, -29.5126953125, -28.37109375, -27.2294921875, -26.087890625, -24.9462890625, -23.8046875, -22.6630859375, -21.521484375, -20.3798828125, -19.23828125, -18.0966796875, -16.955078125, -15.8134765625, -14.671875, -13.5302734375, -12.388671875, -11.2470703125, -10.10546875, -8.9638671875, -7.822265625, -6.6806640625, -5.5390625, -4.3974609375, -3.255859375, -2.1142578125, -0.97265625, 0.1689453125, 1.310546875, 2.4521484375, 3.59375, 4.7353515625, 5.876953125, 7.0185546875, 8.16015625, 9.3017578125, 10.443359375, 11.5849609375, 12.7265625, 13.8681640625, 15.009765625, 16.1513671875, 17.29296875, 18.4345703125, 19.576171875, 20.7177734375, 21.859375, 23.0009765625, 24.142578125, 25.2841796875, 26.42578125, 27.5673828125, 28.708984375, 29.8505859375, 30.9921875, 32.1337890625, 33.275390625, 34.4169921875, 35.55859375, 36.7001953125, 37.841796875, 38.9833984375, 40.125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 5.0, 5.0, 10.0, 16.0, 20.0, 25.0, 38.0, 54.0, 76.0, 95.0, 108.0, 113.0, 90.0, 90.0, 73.0, 61.0, 35.0, 34.0, 17.0, 13.0, 8.0, 13.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.78776168823242, -36.51385498046875, -35.23994445800781, -33.96603775024414, -32.69213104248047, -31.418222427368164, -30.14431381225586, -28.870407104492188, -27.596500396728516, -26.32259178161621, -25.04868507385254, -23.774776458740234, -22.500869750976562, -21.226961135864258, -19.953052520751953, -18.67914581298828, -17.405237197875977, -16.131328582763672, -14.857421875, -13.583513259887695, -12.309606552124023, -11.035697937011719, -9.76179027557373, -8.487882614135742, -7.213974952697754, -5.940067291259766, -4.666159629821777, -3.392251491546631, -2.1183438301086426, -0.8444361686706543, 0.4294719696044922, 1.7033796310424805, 2.9772872924804688, 4.251194953918457, 5.525102615356445, 6.799010753631592, 8.072917938232422, 9.346826553344727, 10.620734214782715, 11.894641876220703, 13.168549537658691, 14.44245719909668, 15.716364860534668, 16.990272521972656, 18.26418113708496, 19.538087844848633, 20.811996459960938, 22.08590316772461, 23.359811782836914, 24.63372039794922, 25.90762710571289, 27.181535720825195, 28.455442428588867, 29.729351043701172, 31.003257751464844, 32.27716827392578, 33.55107498168945, 34.824981689453125, 36.09889221191406, 37.372798919677734, 38.646705627441406, 39.92061233520508, 41.194522857666016, 42.46842956542969, 43.74233627319336]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 1.0, 1.0, 5.0, 7.0, 15.0, 6.0, 15.0, 13.0, 22.0, 18.0, 28.0, 28.0, 21.0, 25.0, 28.0, 35.0, 25.0, 46.0, 35.0, 33.0, 33.0, 47.0, 39.0, 30.0, 34.0, 30.0, 32.0, 35.0, 37.0, 32.0, 31.0, 26.0, 28.0, 17.0, 22.0, 18.0, 13.0, 7.0, 18.0, 10.0, 13.0, 7.0, 6.0, 6.0, 3.0, 4.0, 3.0, 5.0, 6.0, 3.0, 0.0, 5.0, 0.0, 0.0, 1.0], "bins": [-20.617080688476562, -19.964778900146484, -19.312477111816406, -18.660175323486328, -18.00787353515625, -17.355571746826172, -16.703269958496094, -16.050968170166016, -15.398666381835938, -14.74636459350586, -14.094062805175781, -13.441761016845703, -12.789459228515625, -12.137157440185547, -11.484855651855469, -10.83255386352539, -10.180252075195312, -9.527950286865234, -8.875648498535156, -8.223346710205078, -7.571044921875, -6.918743133544922, -6.266441345214844, -5.614139556884766, -4.9618377685546875, -4.309535980224609, -3.6572341918945312, -3.004932403564453, -2.352630615234375, -1.7003288269042969, -1.0480270385742188, -0.3957252502441406, 0.2565765380859375, 0.9088783264160156, 1.5611801147460938, 2.213481903076172, 2.86578369140625, 3.518085479736328, 4.170387268066406, 4.822689056396484, 5.4749908447265625, 6.127292633056641, 6.779594421386719, 7.431896209716797, 8.084197998046875, 8.736499786376953, 9.388801574707031, 10.04110336303711, 10.693405151367188, 11.345706939697266, 11.998008728027344, 12.650310516357422, 13.3026123046875, 13.954914093017578, 14.607215881347656, 15.259517669677734, 15.911819458007812, 16.56412124633789, 17.21642303466797, 17.868724822998047, 18.521026611328125, 19.173328399658203, 19.82563018798828, 20.47793197631836, 21.130233764648438]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 1.0, 5.0, 7.0, 3.0, 12.0, 5.0, 10.0, 9.0, 14.0, 14.0, 18.0, 18.0, 28.0, 26.0, 30.0, 30.0, 37.0, 37.0, 39.0, 38.0, 54.0, 38.0, 39.0, 44.0, 47.0, 38.0, 41.0, 38.0, 33.0, 36.0, 35.0, 28.0, 28.0, 23.0, 13.0, 15.0, 17.0, 13.0, 9.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.5078125, -3.403350830078125, -3.29888916015625, -3.194427490234375, -3.0899658203125, -2.985504150390625, -2.88104248046875, -2.776580810546875, -2.672119140625, -2.567657470703125, -2.46319580078125, -2.358734130859375, -2.2542724609375, -2.149810791015625, -2.04534912109375, -1.940887451171875, -1.83642578125, -1.731964111328125, -1.62750244140625, -1.523040771484375, -1.4185791015625, -1.314117431640625, -1.20965576171875, -1.105194091796875, -1.000732421875, -0.896270751953125, -0.79180908203125, -0.687347412109375, -0.5828857421875, -0.478424072265625, -0.37396240234375, -0.269500732421875, -0.1650390625, -0.060577392578125, 0.04388427734375, 0.148345947265625, 0.2528076171875, 0.357269287109375, 0.46173095703125, 0.566192626953125, 0.670654296875, 0.775115966796875, 0.87957763671875, 0.984039306640625, 1.0885009765625, 1.192962646484375, 1.29742431640625, 1.401885986328125, 1.50634765625, 1.610809326171875, 1.71527099609375, 1.819732666015625, 1.9241943359375, 2.028656005859375, 2.13311767578125, 2.237579345703125, 2.342041015625, 2.446502685546875, 2.55096435546875, 2.655426025390625, 2.7598876953125, 2.864349365234375, 2.96881103515625, 3.073272705078125, 3.177734375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 8.0, 2.0, 12.0, 16.0, 37.0, 44.0, 65.0, 65.0, 139.0, 199.0, 267.0, 428.0, 615.0, 857.0, 1327.0, 2132.0, 3340.0, 5147.0, 8506.0, 13864.0, 23269.0, 40812.0, 74616.0, 159974.0, 372954.0, 162192.0, 75524.0, 41149.0, 23777.0, 13865.0, 8476.0, 5177.0, 3396.0, 2109.0, 1424.0, 939.0, 560.0, 405.0, 310.0, 178.0, 105.0, 100.0, 63.0, 34.0, 34.0, 19.0, 14.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.203369140625, -0.19729995727539062, -0.19123077392578125, -0.18516159057617188, -0.1790924072265625, -0.17302322387695312, -0.16695404052734375, -0.16088485717773438, -0.154815673828125, -0.14874649047851562, -0.14267730712890625, -0.13660812377929688, -0.1305389404296875, -0.12446975708007812, -0.11840057373046875, -0.11233139038085938, -0.10626220703125, -0.10019302368164062, -0.09412384033203125, -0.08805465698242188, -0.0819854736328125, -0.07591629028320312, -0.06984710693359375, -0.06377792358398438, -0.057708740234375, -0.051639556884765625, -0.04557037353515625, -0.039501190185546875, -0.0334320068359375, -0.027362823486328125, -0.02129364013671875, -0.015224456787109375, -0.0091552734375, -0.003086090087890625, 0.00298309326171875, 0.009052276611328125, 0.0151214599609375, 0.021190643310546875, 0.02725982666015625, 0.033329010009765625, 0.039398193359375, 0.045467376708984375, 0.05153656005859375, 0.057605743408203125, 0.0636749267578125, 0.06974411010742188, 0.07581329345703125, 0.08188247680664062, 0.08795166015625, 0.09402084350585938, 0.10009002685546875, 0.10615921020507812, 0.1122283935546875, 0.11829757690429688, 0.12436676025390625, 0.13043594360351562, 0.136505126953125, 0.14257431030273438, 0.14864349365234375, 0.15471267700195312, 0.1607818603515625, 0.16685104370117188, 0.17292022705078125, 0.17898941040039062, 0.18505859375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 6.0, 4.0, 10.0, 4.0, 11.0, 7.0, 19.0, 16.0, 23.0, 27.0, 20.0, 22.0, 31.0, 30.0, 28.0, 33.0, 32.0, 31.0, 44.0, 31.0, 39.0, 1070.0, 44.0, 51.0, 33.0, 43.0, 40.0, 35.0, 29.0, 30.0, 34.0, 27.0, 19.0, 15.0, 15.0, 14.0, 9.0, 15.0, 12.0, 6.0, 3.0, 4.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.8984375, -2.811279296875, -2.72412109375, -2.636962890625, -2.5498046875, -2.462646484375, -2.37548828125, -2.288330078125, -2.201171875, -2.114013671875, -2.02685546875, -1.939697265625, -1.8525390625, -1.765380859375, -1.67822265625, -1.591064453125, -1.50390625, -1.416748046875, -1.32958984375, -1.242431640625, -1.1552734375, -1.068115234375, -0.98095703125, -0.893798828125, -0.806640625, -0.719482421875, -0.63232421875, -0.545166015625, -0.4580078125, -0.370849609375, -0.28369140625, -0.196533203125, -0.109375, -0.022216796875, 0.06494140625, 0.152099609375, 0.2392578125, 0.326416015625, 0.41357421875, 0.500732421875, 0.587890625, 0.675048828125, 0.76220703125, 0.849365234375, 0.9365234375, 1.023681640625, 1.11083984375, 1.197998046875, 1.28515625, 1.372314453125, 1.45947265625, 1.546630859375, 1.6337890625, 1.720947265625, 1.80810546875, 1.895263671875, 1.982421875, 2.069580078125, 2.15673828125, 2.243896484375, 2.3310546875, 2.418212890625, 2.50537109375, 2.592529296875, 2.6796875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 2.0, 10.0, 6.0, 14.0, 20.0, 36.0, 46.0, 58.0, 92.0, 107.0, 200.0, 283.0, 372.0, 569.0, 801.0, 1213.0, 1775.0, 2722.0, 4082.0, 6403.0, 9795.0, 15047.0, 23948.0, 37636.0, 62233.0, 113683.0, 520384.0, 1008119.0, 116570.0, 63608.0, 38210.0, 24113.0, 15651.0, 9924.0, 6619.0, 4262.0, 2808.0, 1921.0, 1191.0, 820.0, 547.0, 394.0, 261.0, 184.0, 124.0, 85.0, 64.0, 29.0, 30.0, 20.0, 19.0, 9.0, 10.0, 3.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.06573486328125, -0.06374406814575195, -0.061753273010253906, -0.05976247787475586, -0.05777168273925781, -0.055780887603759766, -0.05379009246826172, -0.05179929733276367, -0.049808502197265625, -0.04781770706176758, -0.04582691192626953, -0.043836116790771484, -0.04184532165527344, -0.03985452651977539, -0.037863731384277344, -0.0358729362487793, -0.03388214111328125, -0.0318913459777832, -0.029900550842285156, -0.02790975570678711, -0.025918960571289062, -0.023928165435791016, -0.02193737030029297, -0.019946575164794922, -0.017955780029296875, -0.015964984893798828, -0.013974189758300781, -0.011983394622802734, -0.009992599487304688, -0.00800180435180664, -0.006011009216308594, -0.004020214080810547, -0.0020294189453125, -3.8623809814453125e-05, 0.0019521713256835938, 0.003942966461181641, 0.0059337615966796875, 0.007924556732177734, 0.009915351867675781, 0.011906147003173828, 0.013896942138671875, 0.015887737274169922, 0.01787853240966797, 0.019869327545166016, 0.021860122680664062, 0.02385091781616211, 0.025841712951660156, 0.027832508087158203, 0.02982330322265625, 0.0318140983581543, 0.033804893493652344, 0.03579568862915039, 0.03778648376464844, 0.039777278900146484, 0.04176807403564453, 0.04375886917114258, 0.045749664306640625, 0.04774045944213867, 0.04973125457763672, 0.051722049713134766, 0.05371284484863281, 0.05570363998413086, 0.057694435119628906, 0.05968523025512695, 0.061676025390625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 4.0, 8.0, 11.0, 6.0, 8.0, 18.0, 15.0, 19.0, 24.0, 19.0, 32.0, 30.0, 59.0, 29.0, 50.0, 66.0, 106.0, 79.0, 65.0, 50.0, 43.0, 44.0, 36.0, 34.0, 26.0, 22.0, 20.0, 12.0, 9.0, 12.0, 3.0, 7.0, 3.0, 3.0, 2.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007395744323730469, -0.0007162019610404968, -0.0006928294897079468, -0.0006694570183753967, -0.0006460845470428467, -0.0006227120757102966, -0.0005993396043777466, -0.0005759671330451965, -0.0005525946617126465, -0.0005292221903800964, -0.0005058497190475464, -0.00048247724771499634, -0.0004591047763824463, -0.00043573230504989624, -0.0004123598337173462, -0.00038898736238479614, -0.0003656148910522461, -0.00034224241971969604, -0.000318869948387146, -0.00029549747705459595, -0.0002721250057220459, -0.00024875253438949585, -0.0002253800630569458, -0.00020200759172439575, -0.0001786351203918457, -0.00015526264905929565, -0.0001318901777267456, -0.00010851770639419556, -8.514523506164551e-05, -6.177276372909546e-05, -3.840029239654541e-05, -1.5027821063995361e-05, 8.344650268554688e-06, 3.1717121601104736e-05, 5.5089592933654785e-05, 7.846206426620483e-05, 0.00010183453559875488, 0.00012520700693130493, 0.00014857947826385498, 0.00017195194959640503, 0.00019532442092895508, 0.00021869689226150513, 0.00024206936359405518, 0.0002654418349266052, 0.0002888143062591553, 0.0003121867775917053, 0.00033555924892425537, 0.0003589317202568054, 0.00038230419158935547, 0.0004056766629219055, 0.00042904913425445557, 0.0004524216055870056, 0.00047579407691955566, 0.0004991665482521057, 0.0005225390195846558, 0.0005459114909172058, 0.0005692839622497559, 0.0005926564335823059, 0.000616028904914856, 0.000639401376247406, 0.0006627738475799561, 0.0006861463189125061, 0.0007095187902450562, 0.0007328912615776062, 0.0007562637329101562]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 9.0, 2.0, 3.0, 1.0, 4.0, 6.0, 6.0, 10.0, 12.0, 29.0, 33.0, 39.0, 49.0, 74.0, 105.0, 185.0, 581.0, 4876.0, 102722.0, 905777.0, 31211.0, 2026.0, 346.0, 146.0, 75.0, 62.0, 40.0, 28.0, 20.0, 16.0, 11.0, 10.0, 4.0, 12.0, 6.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 4.0], "bins": [-0.0151519775390625, -0.014683246612548828, -0.014214515686035156, -0.013745784759521484, -0.013277053833007812, -0.01280832290649414, -0.012339591979980469, -0.011870861053466797, -0.011402130126953125, -0.010933399200439453, -0.010464668273925781, -0.00999593734741211, -0.009527206420898438, -0.009058475494384766, -0.008589744567871094, -0.008121013641357422, -0.00765228271484375, -0.007183551788330078, -0.006714820861816406, -0.006246089935302734, -0.0057773590087890625, -0.005308628082275391, -0.004839897155761719, -0.004371166229248047, -0.003902435302734375, -0.003433704376220703, -0.0029649734497070312, -0.0024962425231933594, -0.0020275115966796875, -0.0015587806701660156, -0.0010900497436523438, -0.0006213188171386719, -0.000152587890625, 0.0003161430358886719, 0.0007848739624023438, 0.0012536048889160156, 0.0017223358154296875, 0.0021910667419433594, 0.0026597976684570312, 0.003128528594970703, 0.003597259521484375, 0.004065990447998047, 0.004534721374511719, 0.005003452301025391, 0.0054721832275390625, 0.005940914154052734, 0.006409645080566406, 0.006878376007080078, 0.00734710693359375, 0.007815837860107422, 0.008284568786621094, 0.008753299713134766, 0.009222030639648438, 0.00969076156616211, 0.010159492492675781, 0.010628223419189453, 0.011096954345703125, 0.011565685272216797, 0.012034416198730469, 0.01250314712524414, 0.012971878051757812, 0.013440608978271484, 0.013909339904785156, 0.014378070831298828, 0.0148468017578125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 58.0, 937.0, 21.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020125017035752535, -0.0014199453871697187, -0.0008273891871795058, -0.0002348329871892929, 0.00035772332921624184, 0.0009502796456217766, 0.0015428357291966677, 0.0021353920456022024, 0.002727948362007737, 0.003320504678413272, 0.003913060761988163, 0.004505617078393698, 0.0050981733947992325, 0.005690729711204767, 0.006283286027610302, 0.006875841878354549, 0.0074683986604213715, 0.008060954511165619, 0.008653511293232441, 0.009246067143976688, 0.00983862392604351, 0.010431179776787758, 0.011023735627532005, 0.011616292409598827, 0.012208848260343075, 0.012801404111087322, 0.013393960893154144, 0.013986516743898392, 0.014579073525965214, 0.015171629376709461, 0.015764186158776283, 0.01635674200952053, 0.016949297860264778, 0.017541853711009026, 0.018134409561753273, 0.01872696727514267, 0.019319523125886917, 0.019912078976631165, 0.020504634827375412, 0.02109719067811966, 0.021689748391509056, 0.022282304242253304, 0.02287486009299755, 0.023467417806386948, 0.024059973657131195, 0.024652529507875443, 0.02524508535861969, 0.025837641209363937, 0.026430197060108185, 0.027022752910852432, 0.02761530876159668, 0.028207866474986076, 0.028800422325730324, 0.02939297817647457, 0.02998553402721882, 0.030578091740608215, 0.031170647591352463, 0.03176320344209671, 0.03235575929284096, 0.032948315143585205, 0.03354087099432945, 0.034133430570364, 0.034725986421108246, 0.03531854227185249, 0.03591109812259674]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 6.0, 11.0, 22.0, 25.0, 40.0, 59.0, 79.0, 65.0, 105.0, 103.0, 84.0, 94.0, 88.0, 64.0, 49.0, 52.0, 21.0, 15.0, 7.0, 9.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018720626831054688, -0.0018301485106348991, -0.0017882343381643295, -0.00174632016569376, -0.0017044059932231903, -0.0016624918207526207, -0.001620577648282051, -0.0015786634758114815, -0.0015367493033409119, -0.0014948351308703423, -0.0014529209583997726, -0.001411006785929203, -0.0013690926134586334, -0.0013271784409880638, -0.0012852642685174942, -0.0012433500960469246, -0.001201435923576355, -0.0011595217511057854, -0.0011176075786352158, -0.0010756934061646461, -0.0010337792336940765, -0.000991865061223507, -0.0009499508887529373, -0.0009080367162823677, -0.0008661225438117981, -0.0008242083713412285, -0.0007822941988706589, -0.0007403800264000893, -0.0006984658539295197, -0.00065655168145895, -0.0006146375089883804, -0.0005727233365178108, -0.0005308091640472412, -0.0004888949915766716, -0.000446980819106102, -0.0004050666466355324, -0.00036315247416496277, -0.00032123830169439316, -0.00027932412922382355, -0.00023740995675325394, -0.00019549578428268433, -0.00015358161181211472, -0.0001116674393415451, -6.97532668709755e-05, -2.7839094400405884e-05, 1.4075078070163727e-05, 5.598925054073334e-05, 9.790342301130295e-05, 0.00013981759548187256, 0.00018173176795244217, 0.00022364594042301178, 0.0002655601128935814, 0.000307474285364151, 0.0003493884578347206, 0.0003913026303052902, 0.00043321680277585983, 0.00047513097524642944, 0.000517045147716999, 0.0005589593201875687, 0.0006008734926581383, 0.0006427876651287079, 0.0006847018375992775, 0.0007266160100698471, 0.0007685301825404167, 0.0008104443550109863]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 1.0, 5.0, 7.0, 4.0, 11.0, 5.0, 10.0, 9.0, 14.0, 14.0, 18.0, 18.0, 28.0, 26.0, 30.0, 30.0, 37.0, 37.0, 39.0, 38.0, 54.0, 38.0, 39.0, 44.0, 47.0, 38.0, 41.0, 38.0, 33.0, 36.0, 35.0, 28.0, 28.0, 23.0, 13.0, 15.0, 17.0, 13.0, 9.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.5078125, -3.403350830078125, -3.29888916015625, -3.194427490234375, -3.0899658203125, -2.985504150390625, -2.88104248046875, -2.776580810546875, -2.672119140625, -2.567657470703125, -2.46319580078125, -2.358734130859375, -2.2542724609375, -2.149810791015625, -2.04534912109375, -1.940887451171875, -1.83642578125, -1.731964111328125, -1.62750244140625, -1.523040771484375, -1.4185791015625, -1.314117431640625, -1.20965576171875, -1.105194091796875, -1.000732421875, -0.896270751953125, -0.79180908203125, -0.687347412109375, -0.5828857421875, -0.478424072265625, -0.37396240234375, -0.269500732421875, -0.1650390625, -0.060577392578125, 0.04388427734375, 0.148345947265625, 0.2528076171875, 0.357269287109375, 0.46173095703125, 0.566192626953125, 0.670654296875, 0.775115966796875, 0.87957763671875, 0.984039306640625, 1.0885009765625, 1.192962646484375, 1.29742431640625, 1.401885986328125, 1.50634765625, 1.610809326171875, 1.71527099609375, 1.819732666015625, 1.9241943359375, 2.028656005859375, 2.13311767578125, 2.237579345703125, 2.342041015625, 2.446502685546875, 2.55096435546875, 2.655426025390625, 2.7598876953125, 2.864349365234375, 2.96881103515625, 3.073272705078125, 3.177734375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 13.0, 10.0, 15.0, 25.0, 27.0, 56.0, 80.0, 112.0, 186.0, 278.0, 418.0, 680.0, 1120.0, 1896.0, 3546.0, 6606.0, 14382.0, 34509.0, 93444.0, 308098.0, 389377.0, 117773.0, 41652.0, 16943.0, 7741.0, 3997.0, 2230.0, 1212.0, 776.0, 471.0, 304.0, 183.0, 121.0, 90.0, 61.0, 40.0, 30.0, 15.0, 9.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.84765625, -6.62750244140625, -6.4073486328125, -6.18719482421875, -5.967041015625, -5.74688720703125, -5.5267333984375, -5.30657958984375, -5.08642578125, -4.86627197265625, -4.6461181640625, -4.42596435546875, -4.205810546875, -3.98565673828125, -3.7655029296875, -3.54534912109375, -3.3251953125, -3.10504150390625, -2.8848876953125, -2.66473388671875, -2.444580078125, -2.22442626953125, -2.0042724609375, -1.78411865234375, -1.56396484375, -1.34381103515625, -1.1236572265625, -0.90350341796875, -0.683349609375, -0.46319580078125, -0.2430419921875, -0.02288818359375, 0.197265625, 0.41741943359375, 0.6375732421875, 0.85772705078125, 1.077880859375, 1.29803466796875, 1.5181884765625, 1.73834228515625, 1.95849609375, 2.17864990234375, 2.3988037109375, 2.61895751953125, 2.839111328125, 3.05926513671875, 3.2794189453125, 3.49957275390625, 3.7197265625, 3.93988037109375, 4.1600341796875, 4.38018798828125, 4.600341796875, 4.82049560546875, 5.0406494140625, 5.26080322265625, 5.48095703125, 5.70111083984375, 5.9212646484375, 6.14141845703125, 6.361572265625, 6.58172607421875, 6.8018798828125, 7.02203369140625, 7.2421875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 7.0, 10.0, 6.0, 9.0, 8.0, 14.0, 17.0, 12.0, 24.0, 22.0, 29.0, 37.0, 20.0, 45.0, 41.0, 52.0, 61.0, 98.0, 135.0, 200.0, 1294.0, 218.0, 152.0, 94.0, 72.0, 55.0, 49.0, 41.0, 40.0, 30.0, 26.0, 29.0, 23.0, 16.0, 12.0, 10.0, 6.0, 7.0, 3.0, 4.0, 1.0, 4.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-11.1796875, -10.85693359375, -10.5341796875, -10.21142578125, -9.888671875, -9.56591796875, -9.2431640625, -8.92041015625, -8.59765625, -8.27490234375, -7.9521484375, -7.62939453125, -7.306640625, -6.98388671875, -6.6611328125, -6.33837890625, -6.015625, -5.69287109375, -5.3701171875, -5.04736328125, -4.724609375, -4.40185546875, -4.0791015625, -3.75634765625, -3.43359375, -3.11083984375, -2.7880859375, -2.46533203125, -2.142578125, -1.81982421875, -1.4970703125, -1.17431640625, -0.8515625, -0.52880859375, -0.2060546875, 0.11669921875, 0.439453125, 0.76220703125, 1.0849609375, 1.40771484375, 1.73046875, 2.05322265625, 2.3759765625, 2.69873046875, 3.021484375, 3.34423828125, 3.6669921875, 3.98974609375, 4.3125, 4.63525390625, 4.9580078125, 5.28076171875, 5.603515625, 5.92626953125, 6.2490234375, 6.57177734375, 6.89453125, 7.21728515625, 7.5400390625, 7.86279296875, 8.185546875, 8.50830078125, 8.8310546875, 9.15380859375, 9.4765625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 8.0, 4.0, 8.0, 9.0, 7.0, 4.0, 11.0, 17.0, 20.0, 23.0, 40.0, 56.0, 78.0, 102.0, 142.0, 233.0, 433.0, 933.0, 2373.0, 7585.0, 43016.0, 724148.0, 2235220.0, 110875.0, 13990.0, 3539.0, 1356.0, 566.0, 278.0, 183.0, 103.0, 82.0, 67.0, 44.0, 39.0, 25.0, 19.0, 20.0, 11.0, 9.0, 6.0, 10.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.6875, -16.115966796875, -15.54443359375, -14.972900390625, -14.4013671875, -13.829833984375, -13.25830078125, -12.686767578125, -12.115234375, -11.543701171875, -10.97216796875, -10.400634765625, -9.8291015625, -9.257568359375, -8.68603515625, -8.114501953125, -7.54296875, -6.971435546875, -6.39990234375, -5.828369140625, -5.2568359375, -4.685302734375, -4.11376953125, -3.542236328125, -2.970703125, -2.399169921875, -1.82763671875, -1.256103515625, -0.6845703125, -0.113037109375, 0.45849609375, 1.030029296875, 1.6015625, 2.173095703125, 2.74462890625, 3.316162109375, 3.8876953125, 4.459228515625, 5.03076171875, 5.602294921875, 6.173828125, 6.745361328125, 7.31689453125, 7.888427734375, 8.4599609375, 9.031494140625, 9.60302734375, 10.174560546875, 10.74609375, 11.317626953125, 11.88916015625, 12.460693359375, 13.0322265625, 13.603759765625, 14.17529296875, 14.746826171875, 15.318359375, 15.889892578125, 16.46142578125, 17.032958984375, 17.6044921875, 18.176025390625, 18.74755859375, 19.319091796875, 19.890625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 12.0, 34.0, 75.0, 212.0, 287.0, 246.0, 97.0, 34.0, 16.0, 3.0, 3.0], "bins": [-139.24452209472656, -136.82455444335938, -134.40460205078125, -131.98464965820312, -129.56468200683594, -127.14472198486328, -124.72476196289062, -122.30480194091797, -119.88484191894531, -117.46488189697266, -115.044921875, -112.62496185302734, -110.20500183105469, -107.78504180908203, -105.36508178710938, -102.94512176513672, -100.52516174316406, -98.1052017211914, -95.68524169921875, -93.2652816772461, -90.84532165527344, -88.42536163330078, -86.00540161132812, -83.58544158935547, -81.16548156738281, -78.74552154541016, -76.3255615234375, -73.90560150146484, -71.48564147949219, -69.06568145751953, -66.64572143554688, -64.22576141357422, -61.80579376220703, -59.385833740234375, -56.96587371826172, -54.54591369628906, -52.125953674316406, -49.70599365234375, -47.286033630371094, -44.86607360839844, -42.44611358642578, -40.026153564453125, -37.60619354248047, -35.18623352050781, -32.766273498535156, -30.3463134765625, -27.926353454589844, -25.506393432617188, -23.086435317993164, -20.666475296020508, -18.24651527404785, -15.826555252075195, -13.406595230102539, -10.986635208129883, -8.566675186157227, -6.14671516418457, -3.726755142211914, -1.3067951202392578, 1.1131649017333984, 3.5331249237060547, 5.953084945678711, 8.373044967651367, 10.793004989624023, 13.21296501159668, 15.632925033569336]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 8.0, 4.0, 13.0, 13.0, 22.0, 20.0, 23.0, 22.0, 31.0, 23.0, 29.0, 30.0, 37.0, 44.0, 48.0, 50.0, 39.0, 39.0, 48.0, 42.0, 35.0, 37.0, 34.0, 43.0, 36.0, 31.0, 25.0, 28.0, 15.0, 22.0, 17.0, 19.0, 17.0, 14.0, 5.0, 7.0, 7.0, 5.0, 4.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.509851455688477, -27.478479385375977, -26.447107315063477, -25.415735244750977, -24.384363174438477, -23.352991104125977, -22.321619033813477, -21.290246963500977, -20.258874893188477, -19.227502822875977, -18.196130752563477, -17.164758682250977, -16.133386611938477, -15.102014541625977, -14.070642471313477, -13.039270401000977, -12.007898330688477, -10.976526260375977, -9.945154190063477, -8.913782119750977, -7.882410049438477, -6.851037979125977, -5.819665908813477, -4.788293838500977, -3.7569217681884766, -2.7255496978759766, -1.6941776275634766, -0.6628055572509766, 0.36856651306152344, 1.3999385833740234, 2.4313106536865234, 3.4626827239990234, 4.494052886962891, 5.525424957275391, 6.556797027587891, 7.588169097900391, 8.61954116821289, 9.65091323852539, 10.68228530883789, 11.71365737915039, 12.74502944946289, 13.77640151977539, 14.80777359008789, 15.83914566040039, 16.87051773071289, 17.90188980102539, 18.93326187133789, 19.96463394165039, 20.99600601196289, 22.02737808227539, 23.05875015258789, 24.09012222290039, 25.12149429321289, 26.15286636352539, 27.18423843383789, 28.21561050415039, 29.24698257446289, 30.27835464477539, 31.30972671508789, 32.34109878540039, 33.37247085571289, 34.40384292602539, 35.43521499633789, 36.46658706665039, 37.49795913696289]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 5.0, 4.0, 8.0, 5.0, 10.0, 6.0, 13.0, 18.0, 17.0, 17.0, 21.0, 22.0, 32.0, 33.0, 27.0, 32.0, 28.0, 44.0, 47.0, 44.0, 34.0, 46.0, 49.0, 39.0, 39.0, 44.0, 49.0, 31.0, 28.0, 28.0, 25.0, 28.0, 17.0, 25.0, 9.0, 9.0, 12.0, 18.0, 2.0, 9.0, 4.0, 3.0, 5.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.5546875, -3.44476318359375, -3.3348388671875, -3.22491455078125, -3.114990234375, -3.00506591796875, -2.8951416015625, -2.78521728515625, -2.67529296875, -2.56536865234375, -2.4554443359375, -2.34552001953125, -2.235595703125, -2.12567138671875, -2.0157470703125, -1.90582275390625, -1.7958984375, -1.68597412109375, -1.5760498046875, -1.46612548828125, -1.356201171875, -1.24627685546875, -1.1363525390625, -1.02642822265625, -0.91650390625, -0.80657958984375, -0.6966552734375, -0.58673095703125, -0.476806640625, -0.36688232421875, -0.2569580078125, -0.14703369140625, -0.037109375, 0.07281494140625, 0.1827392578125, 0.29266357421875, 0.402587890625, 0.51251220703125, 0.6224365234375, 0.73236083984375, 0.84228515625, 0.95220947265625, 1.0621337890625, 1.17205810546875, 1.281982421875, 1.39190673828125, 1.5018310546875, 1.61175537109375, 1.7216796875, 1.83160400390625, 1.9415283203125, 2.05145263671875, 2.161376953125, 2.27130126953125, 2.3812255859375, 2.49114990234375, 2.60107421875, 2.71099853515625, 2.8209228515625, 2.93084716796875, 3.040771484375, 3.15069580078125, 3.2606201171875, 3.37054443359375, 3.48046875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 8.0, 8.0, 10.0, 16.0, 24.0, 42.0, 70.0, 90.0, 144.0, 246.0, 448.0, 914.0, 1681.0, 3807.0, 9888.0, 37363.0, 320521.0, 2743810.0, 967320.0, 80734.0, 16426.0, 5712.0, 2459.0, 1115.0, 587.0, 292.0, 205.0, 105.0, 77.0, 54.0, 43.0, 20.0, 17.0, 10.0, 7.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6875, -10.3394775390625, -9.991455078125, -9.6434326171875, -9.29541015625, -8.9473876953125, -8.599365234375, -8.2513427734375, -7.9033203125, -7.5552978515625, -7.207275390625, -6.8592529296875, -6.51123046875, -6.1632080078125, -5.815185546875, -5.4671630859375, -5.119140625, -4.7711181640625, -4.423095703125, -4.0750732421875, -3.72705078125, -3.3790283203125, -3.031005859375, -2.6829833984375, -2.3349609375, -1.9869384765625, -1.638916015625, -1.2908935546875, -0.94287109375, -0.5948486328125, -0.246826171875, 0.1011962890625, 0.44921875, 0.7972412109375, 1.145263671875, 1.4932861328125, 1.84130859375, 2.1893310546875, 2.537353515625, 2.8853759765625, 3.2333984375, 3.5814208984375, 3.929443359375, 4.2774658203125, 4.62548828125, 4.9735107421875, 5.321533203125, 5.6695556640625, 6.017578125, 6.3656005859375, 6.713623046875, 7.0616455078125, 7.40966796875, 7.7576904296875, 8.105712890625, 8.4537353515625, 8.8017578125, 9.1497802734375, 9.497802734375, 9.8458251953125, 10.19384765625, 10.5418701171875, 10.889892578125, 11.2379150390625, 11.5859375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 9.0, 10.0, 5.0, 18.0, 23.0, 11.0, 30.0, 33.0, 49.0, 72.0, 98.0, 147.0, 220.0, 312.0, 453.0, 544.0, 564.0, 417.0, 343.0, 228.0, 145.0, 94.0, 74.0, 43.0, 37.0, 24.0, 18.0, 12.0, 12.0, 4.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.6796875, -8.416259765625, -8.15283203125, -7.889404296875, -7.6259765625, -7.362548828125, -7.09912109375, -6.835693359375, -6.572265625, -6.308837890625, -6.04541015625, -5.781982421875, -5.5185546875, -5.255126953125, -4.99169921875, -4.728271484375, -4.46484375, -4.201416015625, -3.93798828125, -3.674560546875, -3.4111328125, -3.147705078125, -2.88427734375, -2.620849609375, -2.357421875, -2.093994140625, -1.83056640625, -1.567138671875, -1.3037109375, -1.040283203125, -0.77685546875, -0.513427734375, -0.25, 0.013427734375, 0.27685546875, 0.540283203125, 0.8037109375, 1.067138671875, 1.33056640625, 1.593994140625, 1.857421875, 2.120849609375, 2.38427734375, 2.647705078125, 2.9111328125, 3.174560546875, 3.43798828125, 3.701416015625, 3.96484375, 4.228271484375, 4.49169921875, 4.755126953125, 5.0185546875, 5.281982421875, 5.54541015625, 5.808837890625, 6.072265625, 6.335693359375, 6.59912109375, 6.862548828125, 7.1259765625, 7.389404296875, 7.65283203125, 7.916259765625, 8.1796875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 4.0, 7.0, 12.0, 12.0, 14.0, 20.0, 27.0, 45.0, 42.0, 97.0, 143.0, 252.0, 604.0, 2460.0, 26530.0, 3408415.0, 742719.0, 10380.0, 1415.0, 462.0, 204.0, 121.0, 79.0, 56.0, 36.0, 26.0, 18.0, 23.0, 17.0, 6.0, 6.0, 12.0, 5.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.75, -36.564453125, -35.37890625, -34.193359375, -33.0078125, -31.822265625, -30.63671875, -29.451171875, -28.265625, -27.080078125, -25.89453125, -24.708984375, -23.5234375, -22.337890625, -21.15234375, -19.966796875, -18.78125, -17.595703125, -16.41015625, -15.224609375, -14.0390625, -12.853515625, -11.66796875, -10.482421875, -9.296875, -8.111328125, -6.92578125, -5.740234375, -4.5546875, -3.369140625, -2.18359375, -0.998046875, 0.1875, 1.373046875, 2.55859375, 3.744140625, 4.9296875, 6.115234375, 7.30078125, 8.486328125, 9.671875, 10.857421875, 12.04296875, 13.228515625, 14.4140625, 15.599609375, 16.78515625, 17.970703125, 19.15625, 20.341796875, 21.52734375, 22.712890625, 23.8984375, 25.083984375, 26.26953125, 27.455078125, 28.640625, 29.826171875, 31.01171875, 32.197265625, 33.3828125, 34.568359375, 35.75390625, 36.939453125, 38.125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 2.0, 6.0, 16.0, 21.0, 23.0, 36.0, 58.0, 53.0, 68.0, 73.0, 78.0, 89.0, 99.0, 85.0, 77.0, 54.0, 39.0, 28.0, 30.0, 20.0, 12.0, 10.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.624752044677734, -40.56349182128906, -39.502227783203125, -38.44096755981445, -37.37970733642578, -36.31844711303711, -35.25718307495117, -34.1959228515625, -33.13466262817383, -32.073402404785156, -31.01214027404785, -29.950878143310547, -28.889617919921875, -27.82835578918457, -26.767093658447266, -25.705833435058594, -24.64457130432129, -23.583309173583984, -22.522048950195312, -21.460786819458008, -20.399526596069336, -19.33826446533203, -18.27700424194336, -17.215742111206055, -16.15447998046875, -15.093218803405762, -14.031957626342773, -12.970695495605469, -11.909435272216797, -10.848173141479492, -9.786911964416504, -8.725650787353516, -7.664388656616211, -6.603127479553223, -5.541866302490234, -4.480604648590088, -3.4193434715270996, -2.3580822944641113, -1.2968206405639648, -0.23555946350097656, 0.8257017135620117, 1.8869630098342896, 2.9482243061065674, 4.009485721588135, 5.070746898651123, 6.132008075714111, 7.193269729614258, 8.254530906677246, 9.315792083740234, 10.377053260803223, 11.438314437866211, 12.499576568603516, 13.560836791992188, 14.622098922729492, 15.68336009979248, 16.74462127685547, 17.80588150024414, 18.867143630981445, 19.928403854370117, 20.989665985107422, 22.050926208496094, 23.1121883392334, 24.173450469970703, 25.234710693359375, 26.29597282409668]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 0.0, 6.0, 6.0, 8.0, 7.0, 12.0, 10.0, 9.0, 21.0, 20.0, 35.0, 17.0, 29.0, 27.0, 39.0, 40.0, 39.0, 47.0, 35.0, 38.0, 30.0, 39.0, 41.0, 41.0, 44.0, 40.0, 40.0, 34.0, 27.0, 28.0, 29.0, 28.0, 32.0, 23.0, 11.0, 17.0, 10.0, 7.0, 5.0, 12.0, 9.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-29.379417419433594, -28.551237106323242, -27.723058700561523, -26.894878387451172, -26.066699981689453, -25.2385196685791, -24.41033935546875, -23.58216094970703, -22.75398063659668, -21.925800323486328, -21.09762191772461, -20.269441604614258, -19.441261291503906, -18.613082885742188, -17.784902572631836, -16.956722259521484, -16.128543853759766, -15.30036449432373, -14.472185134887695, -13.644004821777344, -12.815825462341309, -11.987646102905273, -11.159465789794922, -10.331286430358887, -9.503107070922852, -8.674927711486816, -7.846747875213623, -7.01856803894043, -6.1903886795043945, -5.362209320068359, -4.534029483795166, -3.7058496475219727, -2.8776721954345703, -2.049492597579956, -1.2213129997253418, -0.39313340187072754, 0.4350461959838867, 1.2632255554199219, 2.0914053916931152, 2.9195852279663086, 3.7477645874023438, 4.575943946838379, 5.404123783111572, 6.232303619384766, 7.060482978820801, 7.888662338256836, 8.716842651367188, 9.545022010803223, 10.373201370239258, 11.201380729675293, 12.029560089111328, 12.85774040222168, 13.685919761657715, 14.51409912109375, 15.342279434204102, 16.170459747314453, 16.998638153076172, 17.826818466186523, 18.654996871948242, 19.483177185058594, 20.311355590820312, 21.139535903930664, 21.967716217041016, 22.795894622802734, 23.624074935913086]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 8.0, 6.0, 7.0, 9.0, 12.0, 12.0, 13.0, 19.0, 21.0, 23.0, 19.0, 25.0, 29.0, 29.0, 37.0, 33.0, 36.0, 42.0, 41.0, 53.0, 38.0, 49.0, 46.0, 43.0, 49.0, 32.0, 27.0, 25.0, 29.0, 28.0, 23.0, 22.0, 21.0, 13.0, 12.0, 14.0, 10.0, 14.0, 3.0, 4.0, 7.0, 2.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.30078125, -3.192108154296875, -3.08343505859375, -2.974761962890625, -2.8660888671875, -2.757415771484375, -2.64874267578125, -2.540069580078125, -2.431396484375, -2.322723388671875, -2.21405029296875, -2.105377197265625, -1.9967041015625, -1.888031005859375, -1.77935791015625, -1.670684814453125, -1.56201171875, -1.453338623046875, -1.34466552734375, -1.235992431640625, -1.1273193359375, -1.018646240234375, -0.90997314453125, -0.801300048828125, -0.692626953125, -0.583953857421875, -0.47528076171875, -0.366607666015625, -0.2579345703125, -0.149261474609375, -0.04058837890625, 0.068084716796875, 0.1767578125, 0.285430908203125, 0.39410400390625, 0.502777099609375, 0.6114501953125, 0.720123291015625, 0.82879638671875, 0.937469482421875, 1.046142578125, 1.154815673828125, 1.26348876953125, 1.372161865234375, 1.4808349609375, 1.589508056640625, 1.69818115234375, 1.806854248046875, 1.91552734375, 2.024200439453125, 2.13287353515625, 2.241546630859375, 2.3502197265625, 2.458892822265625, 2.56756591796875, 2.676239013671875, 2.784912109375, 2.893585205078125, 3.00225830078125, 3.110931396484375, 3.2196044921875, 3.328277587890625, 3.43695068359375, 3.545623779296875, 3.654296875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 8.0, 11.0, 15.0, 29.0, 33.0, 53.0, 83.0, 120.0, 162.0, 228.0, 338.0, 503.0, 715.0, 1068.0, 1619.0, 2398.0, 3720.0, 5652.0, 8930.0, 14046.0, 22945.0, 38002.0, 66224.0, 122581.0, 314410.0, 212692.0, 94900.0, 53442.0, 31328.0, 18958.0, 11664.0, 7432.0, 4784.0, 3113.0, 2068.0, 1376.0, 927.0, 584.0, 429.0, 323.0, 212.0, 135.0, 84.0, 76.0, 54.0, 30.0, 18.0, 14.0, 10.0, 8.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1890869140625, -0.18294906616210938, -0.17681121826171875, -0.17067337036132812, -0.1645355224609375, -0.15839767456054688, -0.15225982666015625, -0.14612197875976562, -0.139984130859375, -0.13384628295898438, -0.12770843505859375, -0.12157058715820312, -0.1154327392578125, -0.10929489135742188, -0.10315704345703125, -0.09701919555664062, -0.09088134765625, -0.08474349975585938, -0.07860565185546875, -0.07246780395507812, -0.0663299560546875, -0.060192108154296875, -0.05405426025390625, -0.047916412353515625, -0.041778564453125, -0.035640716552734375, -0.02950286865234375, -0.023365020751953125, -0.0172271728515625, -0.011089324951171875, -0.00495147705078125, 0.001186370849609375, 0.00732421875, 0.013462066650390625, 0.01959991455078125, 0.025737762451171875, 0.0318756103515625, 0.038013458251953125, 0.04415130615234375, 0.050289154052734375, 0.056427001953125, 0.06256484985351562, 0.06870269775390625, 0.07484054565429688, 0.0809783935546875, 0.08711624145507812, 0.09325408935546875, 0.09939193725585938, 0.10552978515625, 0.11166763305664062, 0.11780548095703125, 0.12394332885742188, 0.1300811767578125, 0.13621902465820312, 0.14235687255859375, 0.14849472045898438, 0.154632568359375, 0.16077041625976562, 0.16690826416015625, 0.17304611206054688, 0.1791839599609375, 0.18532180786132812, 0.19145965576171875, 0.19759750366210938, 0.2037353515625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 6.0, 6.0, 5.0, 10.0, 8.0, 9.0, 11.0, 19.0, 17.0, 15.0, 9.0, 19.0, 24.0, 28.0, 32.0, 32.0, 30.0, 41.0, 39.0, 33.0, 44.0, 31.0, 44.0, 1056.0, 33.0, 31.0, 40.0, 43.0, 31.0, 33.0, 30.0, 33.0, 27.0, 18.0, 26.0, 17.0, 15.0, 12.0, 12.0, 10.0, 8.0, 9.0, 8.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.90234375, -2.815399169921875, -2.72845458984375, -2.641510009765625, -2.5545654296875, -2.467620849609375, -2.38067626953125, -2.293731689453125, -2.206787109375, -2.119842529296875, -2.03289794921875, -1.945953369140625, -1.8590087890625, -1.772064208984375, -1.68511962890625, -1.598175048828125, -1.51123046875, -1.424285888671875, -1.33734130859375, -1.250396728515625, -1.1634521484375, -1.076507568359375, -0.98956298828125, -0.902618408203125, -0.815673828125, -0.728729248046875, -0.64178466796875, -0.554840087890625, -0.4678955078125, -0.380950927734375, -0.29400634765625, -0.207061767578125, -0.1201171875, -0.033172607421875, 0.05377197265625, 0.140716552734375, 0.2276611328125, 0.314605712890625, 0.40155029296875, 0.488494873046875, 0.575439453125, 0.662384033203125, 0.74932861328125, 0.836273193359375, 0.9232177734375, 1.010162353515625, 1.09710693359375, 1.184051513671875, 1.27099609375, 1.357940673828125, 1.44488525390625, 1.531829833984375, 1.6187744140625, 1.705718994140625, 1.79266357421875, 1.879608154296875, 1.966552734375, 2.053497314453125, 2.14044189453125, 2.227386474609375, 2.3143310546875, 2.401275634765625, 2.48822021484375, 2.575164794921875, 2.662109375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 8.0, 13.0, 17.0, 20.0, 40.0, 44.0, 69.0, 97.0, 166.0, 212.0, 330.0, 484.0, 728.0, 1118.0, 1618.0, 2386.0, 3736.0, 5950.0, 9205.0, 14501.0, 23140.0, 38395.0, 63919.0, 120484.0, 1282399.0, 273595.0, 104591.0, 56894.0, 34110.0, 21072.0, 13216.0, 8484.0, 5481.0, 3542.0, 2297.0, 1486.0, 1039.0, 670.0, 495.0, 313.0, 224.0, 161.0, 110.0, 93.0, 51.0, 45.0, 28.0, 12.0, 13.0, 13.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0692138671875, -0.06697368621826172, -0.06473350524902344, -0.062493324279785156, -0.060253143310546875, -0.058012962341308594, -0.05577278137207031, -0.05353260040283203, -0.05129241943359375, -0.04905223846435547, -0.04681205749511719, -0.044571876525878906, -0.042331695556640625, -0.040091514587402344, -0.03785133361816406, -0.03561115264892578, -0.0333709716796875, -0.03113079071044922, -0.028890609741210938, -0.026650428771972656, -0.024410247802734375, -0.022170066833496094, -0.019929885864257812, -0.01768970489501953, -0.01544952392578125, -0.013209342956542969, -0.010969161987304688, -0.008728981018066406, -0.006488800048828125, -0.004248619079589844, -0.0020084381103515625, 0.00023174285888671875, 0.002471923828125, 0.004712104797363281, 0.0069522857666015625, 0.009192466735839844, 0.011432647705078125, 0.013672828674316406, 0.015913009643554688, 0.01815319061279297, 0.02039337158203125, 0.02263355255126953, 0.024873733520507812, 0.027113914489746094, 0.029354095458984375, 0.031594276428222656, 0.03383445739746094, 0.03607463836669922, 0.0383148193359375, 0.04055500030517578, 0.04279518127441406, 0.045035362243652344, 0.047275543212890625, 0.049515724182128906, 0.05175590515136719, 0.05399608612060547, 0.05623626708984375, 0.05847644805908203, 0.06071662902832031, 0.0629568099975586, 0.06519699096679688, 0.06743717193603516, 0.06967735290527344, 0.07191753387451172, 0.07415771484375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 2.0, 7.0, 14.0, 13.0, 17.0, 17.0, 14.0, 17.0, 24.0, 27.0, 38.0, 27.0, 39.0, 42.0, 51.0, 44.0, 62.0, 48.0, 72.0, 55.0, 50.0, 37.0, 43.0, 33.0, 35.0, 25.0, 25.0, 25.0, 15.0, 11.0, 14.0, 9.0, 15.0, 7.0, 4.0, 2.0, 3.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0008521080017089844, -0.0008273199200630188, -0.0008025318384170532, -0.0007777437567710876, -0.0007529556751251221, -0.0007281675934791565, -0.0007033795118331909, -0.0006785914301872253, -0.0006538033485412598, -0.0006290152668952942, -0.0006042271852493286, -0.000579439103603363, -0.0005546510219573975, -0.0005298629403114319, -0.0005050748586654663, -0.00048028677701950073, -0.00045549869537353516, -0.0004307106137275696, -0.000405922532081604, -0.00038113445043563843, -0.00035634636878967285, -0.0003315582871437073, -0.0003067702054977417, -0.0002819821238517761, -0.00025719404220581055, -0.00023240596055984497, -0.0002076178789138794, -0.00018282979726791382, -0.00015804171562194824, -0.00013325363397598267, -0.00010846555233001709, -8.367747068405151e-05, -5.888938903808594e-05, -3.410130739212036e-05, -9.313225746154785e-06, 1.547485589981079e-05, 4.026293754577637e-05, 6.505101919174194e-05, 8.983910083770752e-05, 0.0001146271824836731, 0.00013941526412963867, 0.00016420334577560425, 0.00018899142742156982, 0.0002137795090675354, 0.00023856759071350098, 0.00026335567235946655, 0.00028814375400543213, 0.0003129318356513977, 0.0003377199172973633, 0.00036250799894332886, 0.00038729608058929443, 0.00041208416223526, 0.0004368722438812256, 0.00046166032552719116, 0.00048644840717315674, 0.0005112364888191223, 0.0005360245704650879, 0.0005608126521110535, 0.000585600733757019, 0.0006103888154029846, 0.0006351768970489502, 0.0006599649786949158, 0.0006847530603408813, 0.0007095411419868469, 0.0007343292236328125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 2.0, 2.0, 5.0, 11.0, 10.0, 8.0, 8.0, 15.0, 21.0, 23.0, 27.0, 33.0, 39.0, 42.0, 92.0, 138.0, 386.0, 2134.0, 34680.0, 934023.0, 72376.0, 3417.0, 523.0, 165.0, 98.0, 52.0, 49.0, 28.0, 31.0, 14.0, 16.0, 15.0, 13.0, 18.0, 10.0, 8.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01458740234375, -0.01409459114074707, -0.01360177993774414, -0.013108968734741211, -0.012616157531738281, -0.012123346328735352, -0.011630535125732422, -0.011137723922729492, -0.010644912719726562, -0.010152101516723633, -0.009659290313720703, -0.009166479110717773, -0.008673667907714844, -0.008180856704711914, -0.007688045501708984, -0.007195234298706055, -0.006702423095703125, -0.006209611892700195, -0.005716800689697266, -0.005223989486694336, -0.004731178283691406, -0.0042383670806884766, -0.003745555877685547, -0.003252744674682617, -0.0027599334716796875, -0.002267122268676758, -0.0017743110656738281, -0.0012814998626708984, -0.0007886886596679688, -0.00029587745666503906, 0.00019693374633789062, 0.0006897449493408203, 0.00118255615234375, 0.0016753673553466797, 0.0021681785583496094, 0.002660989761352539, 0.0031538009643554688, 0.0036466121673583984, 0.004139423370361328, 0.004632234573364258, 0.0051250457763671875, 0.005617856979370117, 0.006110668182373047, 0.0066034793853759766, 0.007096290588378906, 0.007589101791381836, 0.008081912994384766, 0.008574724197387695, 0.009067535400390625, 0.009560346603393555, 0.010053157806396484, 0.010545969009399414, 0.011038780212402344, 0.011531591415405273, 0.012024402618408203, 0.012517213821411133, 0.013010025024414062, 0.013502836227416992, 0.013995647430419922, 0.014488458633422852, 0.014981269836425781, 0.015474081039428711, 0.01596689224243164, 0.01645970344543457, 0.0169525146484375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 861.0, 155.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002205475000664592, -0.001434606732800603, -0.0006637385813519359, 0.00010712957009673119, 0.0008779978379607201, 0.001648866105824709, 0.002419734140858054, 0.003190602408722043, 0.003961470909416676, 0.0047323391772806644, 0.005503207445144653, 0.006274075247347355, 0.007044943980872631, 0.007815811783075333, 0.008586680516600609, 0.00935754831880331, 0.010128416121006012, 0.010899283923208714, 0.01167015265673399, 0.012441020458936691, 0.013211889192461967, 0.013982756994664669, 0.01475362479686737, 0.015524493530392647, 0.016295362263917923, 0.0170662309974432, 0.017837097868323326, 0.018607966601848602, 0.01937883533537388, 0.020149704068899155, 0.02092057093977928, 0.021691439673304558, 0.022462306544184685, 0.02323317527770996, 0.024004042148590088, 0.024774910882115364, 0.02554577961564064, 0.026316648349165916, 0.027087515220046043, 0.02785838395357132, 0.028629252687096596, 0.029400121420621872, 0.030170988291502, 0.030941857025027275, 0.03171272575855255, 0.03248359262943268, 0.033254463225603104, 0.03402533009648323, 0.03479619696736336, 0.035567063838243484, 0.03633793443441391, 0.03710880130529404, 0.037879668176174164, 0.03865053877234459, 0.039421405643224716, 0.04019227623939514, 0.04096314311027527, 0.041734009981155396, 0.04250488057732582, 0.04327574744820595, 0.044046614319086075, 0.0448174849152565, 0.04558835178613663, 0.046359218657016754, 0.04713008925318718]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 8.0, 19.0, 17.0, 36.0, 44.0, 71.0, 87.0, 99.0, 97.0, 75.0, 93.0, 77.0, 77.0, 50.0, 42.0, 49.0, 26.0, 14.0, 11.0, 7.0, 5.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.002314150333404541, -0.002266271971166134, -0.0022183936089277267, -0.0021705152466893196, -0.0021226368844509125, -0.0020747585222125053, -0.002026880159974098, -0.001979001797735691, -0.001931123435497284, -0.0018832450732588768, -0.0018353667110204697, -0.0017874883487820625, -0.0017396099865436554, -0.0016917316243052483, -0.0016438532620668411, -0.001595974899828434, -0.0015480965375900269, -0.0015002181753516197, -0.0014523398131132126, -0.0014044614508748055, -0.0013565830886363983, -0.0013087047263979912, -0.001260826364159584, -0.001212948001921177, -0.0011650696396827698, -0.0011171912774443626, -0.0010693129152059555, -0.0010214345529675484, -0.0009735561907291412, -0.0009256778284907341, -0.000877799466252327, -0.0008299211040139198, -0.0007820427417755127, -0.0007341643795371056, -0.0006862860172986984, -0.0006384076550602913, -0.0005905292928218842, -0.000542650930583477, -0.0004947725683450699, -0.00044689420610666275, -0.0003990158438682556, -0.0003511374816298485, -0.00030325911939144135, -0.0002553807571530342, -0.00020750239491462708, -0.00015962403267621994, -0.0001117456704378128, -6.386730819940567e-05, -1.5988945960998535e-05, 3.18894162774086e-05, 7.976777851581573e-05, 0.00012764614075422287, 0.00017552450299263, 0.00022340286523103714, 0.0002712812274694443, 0.0003191595897078514, 0.00036703795194625854, 0.0004149163141846657, 0.0004627946764230728, 0.00051067303866148, 0.0005585514008998871, 0.0006064297631382942, 0.0006543081253767014, 0.0007021864876151085, 0.0007500648498535156]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 8.0, 6.0, 7.0, 9.0, 12.0, 12.0, 13.0, 19.0, 22.0, 22.0, 19.0, 25.0, 29.0, 29.0, 37.0, 33.0, 36.0, 42.0, 41.0, 53.0, 38.0, 49.0, 46.0, 43.0, 49.0, 32.0, 27.0, 25.0, 29.0, 28.0, 23.0, 22.0, 21.0, 13.0, 12.0, 14.0, 10.0, 14.0, 3.0, 4.0, 7.0, 2.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.30078125, -3.192108154296875, -3.08343505859375, -2.974761962890625, -2.8660888671875, -2.757415771484375, -2.64874267578125, -2.540069580078125, -2.431396484375, -2.322723388671875, -2.21405029296875, -2.105377197265625, -1.9967041015625, -1.888031005859375, -1.77935791015625, -1.670684814453125, -1.56201171875, -1.453338623046875, -1.34466552734375, -1.235992431640625, -1.1273193359375, -1.018646240234375, -0.90997314453125, -0.801300048828125, -0.692626953125, -0.583953857421875, -0.47528076171875, -0.366607666015625, -0.2579345703125, -0.149261474609375, -0.04058837890625, 0.068084716796875, 0.1767578125, 0.285430908203125, 0.39410400390625, 0.502777099609375, 0.6114501953125, 0.720123291015625, 0.82879638671875, 0.937469482421875, 1.046142578125, 1.154815673828125, 1.26348876953125, 1.372161865234375, 1.4808349609375, 1.589508056640625, 1.69818115234375, 1.806854248046875, 1.91552734375, 2.024200439453125, 2.13287353515625, 2.241546630859375, 2.3502197265625, 2.458892822265625, 2.56756591796875, 2.676239013671875, 2.784912109375, 2.893585205078125, 3.00225830078125, 3.110931396484375, 3.2196044921875, 3.328277587890625, 3.43695068359375, 3.545623779296875, 3.654296875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 8.0, 10.0, 13.0, 18.0, 22.0, 38.0, 55.0, 80.0, 117.0, 190.0, 296.0, 441.0, 690.0, 1100.0, 1864.0, 3358.0, 6333.0, 12422.0, 25297.0, 64792.0, 317007.0, 460345.0, 90875.0, 31388.0, 14630.0, 7494.0, 3979.0, 2188.0, 1258.0, 808.0, 491.0, 309.0, 216.0, 145.0, 81.0, 63.0, 36.0, 32.0, 16.0, 15.0, 9.0, 7.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.078125, -7.83428955078125, -7.5904541015625, -7.34661865234375, -7.102783203125, -6.85894775390625, -6.6151123046875, -6.37127685546875, -6.12744140625, -5.88360595703125, -5.6397705078125, -5.39593505859375, -5.152099609375, -4.90826416015625, -4.6644287109375, -4.42059326171875, -4.1767578125, -3.93292236328125, -3.6890869140625, -3.44525146484375, -3.201416015625, -2.95758056640625, -2.7137451171875, -2.46990966796875, -2.22607421875, -1.98223876953125, -1.7384033203125, -1.49456787109375, -1.250732421875, -1.00689697265625, -0.7630615234375, -0.51922607421875, -0.275390625, -0.03155517578125, 0.2122802734375, 0.45611572265625, 0.699951171875, 0.94378662109375, 1.1876220703125, 1.43145751953125, 1.67529296875, 1.91912841796875, 2.1629638671875, 2.40679931640625, 2.650634765625, 2.89447021484375, 3.1383056640625, 3.38214111328125, 3.6259765625, 3.86981201171875, 4.1136474609375, 4.35748291015625, 4.601318359375, 4.84515380859375, 5.0889892578125, 5.33282470703125, 5.57666015625, 5.82049560546875, 6.0643310546875, 6.30816650390625, 6.552001953125, 6.79583740234375, 7.0396728515625, 7.28350830078125, 7.52734375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 5.0, 5.0, 8.0, 10.0, 9.0, 21.0, 17.0, 10.0, 14.0, 21.0, 21.0, 29.0, 38.0, 37.0, 62.0, 53.0, 84.0, 111.0, 237.0, 1437.0, 229.0, 131.0, 84.0, 60.0, 47.0, 49.0, 43.0, 33.0, 35.0, 28.0, 18.0, 18.0, 14.0, 4.0, 7.0, 6.0, 2.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.21875, -11.8046875, -11.390625, -10.9765625, -10.5625, -10.1484375, -9.734375, -9.3203125, -8.90625, -8.4921875, -8.078125, -7.6640625, -7.25, -6.8359375, -6.421875, -6.0078125, -5.59375, -5.1796875, -4.765625, -4.3515625, -3.9375, -3.5234375, -3.109375, -2.6953125, -2.28125, -1.8671875, -1.453125, -1.0390625, -0.625, -0.2109375, 0.203125, 0.6171875, 1.03125, 1.4453125, 1.859375, 2.2734375, 2.6875, 3.1015625, 3.515625, 3.9296875, 4.34375, 4.7578125, 5.171875, 5.5859375, 6.0, 6.4140625, 6.828125, 7.2421875, 7.65625, 8.0703125, 8.484375, 8.8984375, 9.3125, 9.7265625, 10.140625, 10.5546875, 10.96875, 11.3828125, 11.796875, 12.2109375, 12.625, 13.0390625, 13.453125, 13.8671875, 14.28125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 7.0, 7.0, 8.0, 12.0, 15.0, 23.0, 29.0, 50.0, 46.0, 65.0, 90.0, 158.0, 287.0, 767.0, 4076.0, 43965.0, 2597837.0, 479536.0, 15562.0, 1952.0, 507.0, 208.0, 130.0, 89.0, 64.0, 48.0, 40.0, 27.0, 19.0, 16.0, 16.0, 14.0, 9.0, 10.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.25, -27.4384765625, -26.626953125, -25.8154296875, -25.00390625, -24.1923828125, -23.380859375, -22.5693359375, -21.7578125, -20.9462890625, -20.134765625, -19.3232421875, -18.51171875, -17.7001953125, -16.888671875, -16.0771484375, -15.265625, -14.4541015625, -13.642578125, -12.8310546875, -12.01953125, -11.2080078125, -10.396484375, -9.5849609375, -8.7734375, -7.9619140625, -7.150390625, -6.3388671875, -5.52734375, -4.7158203125, -3.904296875, -3.0927734375, -2.28125, -1.4697265625, -0.658203125, 0.1533203125, 0.96484375, 1.7763671875, 2.587890625, 3.3994140625, 4.2109375, 5.0224609375, 5.833984375, 6.6455078125, 7.45703125, 8.2685546875, 9.080078125, 9.8916015625, 10.703125, 11.5146484375, 12.326171875, 13.1376953125, 13.94921875, 14.7607421875, 15.572265625, 16.3837890625, 17.1953125, 18.0068359375, 18.818359375, 19.6298828125, 20.44140625, 21.2529296875, 22.064453125, 22.8759765625, 23.6875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 62.0, 412.0, 460.0, 79.0, 4.0, 1.0, 1.0], "bins": [-264.3245544433594, -259.8451232910156, -255.3656768798828, -250.88624572753906, -246.40679931640625, -241.9273681640625, -237.44793701171875, -232.96849060058594, -228.4890594482422, -224.00962829589844, -219.53018188476562, -215.05075073242188, -210.57130432128906, -206.0918731689453, -201.6124267578125, -197.13299560546875, -192.653564453125, -188.17413330078125, -183.69468688964844, -179.2152557373047, -174.73580932617188, -170.25637817382812, -165.77694702148438, -161.29750061035156, -156.81805419921875, -152.338623046875, -147.8591766357422, -143.37974548339844, -138.90029907226562, -134.42086791992188, -129.94143676757812, -125.46199035644531, -120.98255920410156, -116.50312042236328, -112.023681640625, -107.54425048828125, -103.06481170654297, -98.58537292480469, -94.1059341430664, -89.62649536132812, -85.14705657958984, -80.66761779785156, -76.18817901611328, -71.708740234375, -67.22930908203125, -62.74987030029297, -58.27043151855469, -53.790992736816406, -49.31155776977539, -44.83211898803711, -40.352684020996094, -35.87324523925781, -31.393808364868164, -26.914371490478516, -22.434932708740234, -17.955495834350586, -13.476058959960938, -8.996622085571289, -4.517184257507324, -0.037746429443359375, 4.441690444946289, 8.921127319335938, 13.400566101074219, 17.880002975463867, 22.359439849853516]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 11.0, 7.0, 5.0, 10.0, 11.0, 8.0, 10.0, 18.0, 19.0, 17.0, 18.0, 33.0, 36.0, 39.0, 33.0, 32.0, 39.0, 44.0, 39.0, 36.0, 40.0, 46.0, 37.0, 40.0, 31.0, 29.0, 32.0, 28.0, 27.0, 30.0, 30.0, 18.0, 21.0, 15.0, 10.0, 13.0, 12.0, 13.0, 8.0, 12.0, 9.0, 6.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-28.69312858581543, -27.771778106689453, -26.850425720214844, -25.929075241088867, -25.00772476196289, -24.08637237548828, -23.165021896362305, -22.243671417236328, -21.32231903076172, -20.400968551635742, -19.479616165161133, -18.558265686035156, -17.636913299560547, -16.71556282043457, -15.794212341308594, -14.8728609085083, -13.951509475708008, -13.030158042907715, -12.108806610107422, -11.187456130981445, -10.266104698181152, -9.34475326538086, -8.423402786254883, -7.50205135345459, -6.580699920654297, -5.659348487854004, -4.737997531890869, -3.8166463375091553, -2.8952951431274414, -1.9739437103271484, -1.0525927543640137, -0.1312417984008789, 0.7901096343994141, 1.711460828781128, 2.632812023162842, 3.5541632175445557, 4.4755144119262695, 5.3968658447265625, 6.318216800689697, 7.239567756652832, 8.160919189453125, 9.082270622253418, 10.003622055053711, 10.924972534179688, 11.84632396697998, 12.767675399780273, 13.68902587890625, 14.610377311706543, 15.531728744506836, 16.453079223632812, 17.374431610107422, 18.2957820892334, 19.217132568359375, 20.138484954833984, 21.05983543395996, 21.981185913085938, 22.902538299560547, 23.823888778686523, 24.745241165161133, 25.66659164428711, 26.58794403076172, 27.509294509887695, 28.430644989013672, 29.35199737548828, 30.273347854614258]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 7.0, 6.0, 8.0, 5.0, 12.0, 17.0, 10.0, 13.0, 22.0, 21.0, 31.0, 26.0, 28.0, 26.0, 41.0, 36.0, 32.0, 50.0, 52.0, 51.0, 46.0, 56.0, 52.0, 44.0, 39.0, 27.0, 33.0, 29.0, 27.0, 14.0, 24.0, 27.0, 17.0, 14.0, 14.0, 7.0, 13.0, 4.0, 1.0, 7.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.619140625, -3.498321533203125, -3.37750244140625, -3.256683349609375, -3.1358642578125, -3.015045166015625, -2.89422607421875, -2.773406982421875, -2.652587890625, -2.531768798828125, -2.41094970703125, -2.290130615234375, -2.1693115234375, -2.048492431640625, -1.92767333984375, -1.806854248046875, -1.68603515625, -1.565216064453125, -1.44439697265625, -1.323577880859375, -1.2027587890625, -1.081939697265625, -0.96112060546875, -0.840301513671875, -0.719482421875, -0.598663330078125, -0.47784423828125, -0.357025146484375, -0.2362060546875, -0.115386962890625, 0.00543212890625, 0.126251220703125, 0.2470703125, 0.367889404296875, 0.48870849609375, 0.609527587890625, 0.7303466796875, 0.851165771484375, 0.97198486328125, 1.092803955078125, 1.213623046875, 1.334442138671875, 1.45526123046875, 1.576080322265625, 1.6968994140625, 1.817718505859375, 1.93853759765625, 2.059356689453125, 2.18017578125, 2.300994873046875, 2.42181396484375, 2.542633056640625, 2.6634521484375, 2.784271240234375, 2.90509033203125, 3.025909423828125, 3.146728515625, 3.267547607421875, 3.38836669921875, 3.509185791015625, 3.6300048828125, 3.750823974609375, 3.87164306640625, 3.992462158203125, 4.11328125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 6.0, 8.0, 11.0, 12.0, 21.0, 29.0, 37.0, 56.0, 108.0, 163.0, 334.0, 885.0, 2570.0, 12295.0, 195303.0, 3681141.0, 281830.0, 14652.0, 2955.0, 942.0, 403.0, 198.0, 112.0, 55.0, 39.0, 36.0, 15.0, 18.0, 14.0, 9.0, 6.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.09375, -16.494873046875, -15.89599609375, -15.297119140625, -14.6982421875, -14.099365234375, -13.50048828125, -12.901611328125, -12.302734375, -11.703857421875, -11.10498046875, -10.506103515625, -9.9072265625, -9.308349609375, -8.70947265625, -8.110595703125, -7.51171875, -6.912841796875, -6.31396484375, -5.715087890625, -5.1162109375, -4.517333984375, -3.91845703125, -3.319580078125, -2.720703125, -2.121826171875, -1.52294921875, -0.924072265625, -0.3251953125, 0.273681640625, 0.87255859375, 1.471435546875, 2.0703125, 2.669189453125, 3.26806640625, 3.866943359375, 4.4658203125, 5.064697265625, 5.66357421875, 6.262451171875, 6.861328125, 7.460205078125, 8.05908203125, 8.657958984375, 9.2568359375, 9.855712890625, 10.45458984375, 11.053466796875, 11.65234375, 12.251220703125, 12.85009765625, 13.448974609375, 14.0478515625, 14.646728515625, 15.24560546875, 15.844482421875, 16.443359375, 17.042236328125, 17.64111328125, 18.239990234375, 18.8388671875, 19.437744140625, 20.03662109375, 20.635498046875, 21.234375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 12.0, 12.0, 15.0, 22.0, 27.0, 69.0, 101.0, 142.0, 222.0, 393.0, 543.0, 784.0, 669.0, 425.0, 234.0, 161.0, 95.0, 50.0, 33.0, 16.0, 12.0, 11.0, 12.0, 5.0, 7.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.669677734375, -8.33154296875, -7.993408203125, -7.6552734375, -7.317138671875, -6.97900390625, -6.640869140625, -6.302734375, -5.964599609375, -5.62646484375, -5.288330078125, -4.9501953125, -4.612060546875, -4.27392578125, -3.935791015625, -3.59765625, -3.259521484375, -2.92138671875, -2.583251953125, -2.2451171875, -1.906982421875, -1.56884765625, -1.230712890625, -0.892578125, -0.554443359375, -0.21630859375, 0.121826171875, 0.4599609375, 0.798095703125, 1.13623046875, 1.474365234375, 1.8125, 2.150634765625, 2.48876953125, 2.826904296875, 3.1650390625, 3.503173828125, 3.84130859375, 4.179443359375, 4.517578125, 4.855712890625, 5.19384765625, 5.531982421875, 5.8701171875, 6.208251953125, 6.54638671875, 6.884521484375, 7.22265625, 7.560791015625, 7.89892578125, 8.237060546875, 8.5751953125, 8.913330078125, 9.25146484375, 9.589599609375, 9.927734375, 10.265869140625, 10.60400390625, 10.942138671875, 11.2802734375, 11.618408203125, 11.95654296875, 12.294677734375, 12.6328125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 6.0, 12.0, 6.0, 19.0, 12.0, 28.0, 41.0, 80.0, 172.0, 308.0, 966.0, 12364.0, 3949046.0, 227451.0, 2637.0, 547.0, 258.0, 117.0, 89.0, 43.0, 26.0, 18.0, 10.0, 17.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.8125, -60.17529296875, -58.5380859375, -56.90087890625, -55.263671875, -53.62646484375, -51.9892578125, -50.35205078125, -48.71484375, -47.07763671875, -45.4404296875, -43.80322265625, -42.166015625, -40.52880859375, -38.8916015625, -37.25439453125, -35.6171875, -33.97998046875, -32.3427734375, -30.70556640625, -29.068359375, -27.43115234375, -25.7939453125, -24.15673828125, -22.51953125, -20.88232421875, -19.2451171875, -17.60791015625, -15.970703125, -14.33349609375, -12.6962890625, -11.05908203125, -9.421875, -7.78466796875, -6.1474609375, -4.51025390625, -2.873046875, -1.23583984375, 0.4013671875, 2.03857421875, 3.67578125, 5.31298828125, 6.9501953125, 8.58740234375, 10.224609375, 11.86181640625, 13.4990234375, 15.13623046875, 16.7734375, 18.41064453125, 20.0478515625, 21.68505859375, 23.322265625, 24.95947265625, 26.5966796875, 28.23388671875, 29.87109375, 31.50830078125, 33.1455078125, 34.78271484375, 36.419921875, 38.05712890625, 39.6943359375, 41.33154296875, 42.96875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 10.0, 16.0, 20.0, 24.0, 39.0, 52.0, 78.0, 80.0, 106.0, 116.0, 98.0, 93.0, 75.0, 59.0, 39.0, 36.0, 30.0, 11.0, 8.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.172107696533203, -19.05388069152832, -17.935653686523438, -16.817428588867188, -15.699201583862305, -14.580974578857422, -13.462747573852539, -12.344520568847656, -11.22629451751709, -10.108067512512207, -8.98984146118164, -7.871614456176758, -6.753387928009033, -5.635161399841309, -4.516934394836426, -3.398707866668701, -2.2804813385009766, -1.1622546911239624, -0.04402804374694824, 1.0741987228393555, 2.19242525100708, 3.3106517791748047, 4.4288787841796875, 5.547105312347412, 6.665331840515137, 7.783558368682861, 8.901784896850586, 10.020011901855469, 11.138238906860352, 12.256464958190918, 13.3746919631958, 14.492918014526367, 15.61114501953125, 16.729372024536133, 17.847599029541016, 18.965824127197266, 20.08405113220215, 21.20227813720703, 22.320505142211914, 23.438732147216797, 24.556957244873047, 25.67518424987793, 26.793411254882812, 27.911636352539062, 29.029863357543945, 30.148090362548828, 31.26631736755371, 32.384544372558594, 33.502769470214844, 34.620994567871094, 35.73922348022461, 36.85744857788086, 37.975677490234375, 39.093902587890625, 40.212127685546875, 41.33035659790039, 42.448585510253906, 43.566810607910156, 44.68503952026367, 45.80326461791992, 46.92149353027344, 48.03971862792969, 49.15794372558594, 50.27617263793945, 51.3943977355957]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 4.0, 7.0, 5.0, 13.0, 11.0, 11.0, 15.0, 21.0, 20.0, 23.0, 25.0, 25.0, 33.0, 38.0, 45.0, 30.0, 47.0, 45.0, 47.0, 53.0, 45.0, 44.0, 46.0, 50.0, 40.0, 39.0, 34.0, 25.0, 27.0, 24.0, 28.0, 14.0, 19.0, 15.0, 10.0, 5.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-31.912277221679688, -31.053913116455078, -30.19554901123047, -29.337182998657227, -28.478818893432617, -27.620454788208008, -26.762088775634766, -25.903724670410156, -25.045360565185547, -24.186996459960938, -23.328632354736328, -22.470266342163086, -21.611902236938477, -20.753538131713867, -19.895172119140625, -19.036808013916016, -18.178443908691406, -17.320079803466797, -16.461715698242188, -15.603349685668945, -14.744985580444336, -13.886621475219727, -13.0282564163208, -12.169891357421875, -11.311527252197266, -10.453163146972656, -9.59479808807373, -8.736433029174805, -7.878068923950195, -7.019704341888428, -6.16133975982666, -5.302975177764893, -4.444612503051758, -3.5862479209899902, -2.7278833389282227, -1.869518756866455, -1.0111541748046875, -0.15278959274291992, 0.7055749893188477, 1.5639395713806152, 2.422304153442383, 3.2806687355041504, 4.139033317565918, 4.9973978996276855, 5.855762481689453, 6.714127063751221, 7.572491645812988, 8.430856704711914, 9.289220809936523, 10.147584915161133, 11.005949974060059, 11.864315032958984, 12.722679138183594, 13.581043243408203, 14.439408302307129, 15.297773361206055, 16.156137466430664, 17.014501571655273, 17.872867584228516, 18.731231689453125, 19.589595794677734, 20.447959899902344, 21.306324005126953, 22.164690017700195, 23.023054122924805]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 2.0, 4.0, 9.0, 2.0, 10.0, 12.0, 10.0, 23.0, 14.0, 24.0, 18.0, 31.0, 24.0, 19.0, 34.0, 39.0, 34.0, 34.0, 43.0, 46.0, 50.0, 41.0, 54.0, 51.0, 44.0, 34.0, 33.0, 33.0, 24.0, 28.0, 16.0, 25.0, 28.0, 20.0, 21.0, 11.0, 13.0, 8.0, 11.0, 1.0, 9.0, 2.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.521484375, -3.405242919921875, -3.28900146484375, -3.172760009765625, -3.0565185546875, -2.940277099609375, -2.82403564453125, -2.707794189453125, -2.591552734375, -2.475311279296875, -2.35906982421875, -2.242828369140625, -2.1265869140625, -2.010345458984375, -1.89410400390625, -1.777862548828125, -1.66162109375, -1.545379638671875, -1.42913818359375, -1.312896728515625, -1.1966552734375, -1.080413818359375, -0.96417236328125, -0.847930908203125, -0.731689453125, -0.615447998046875, -0.49920654296875, -0.382965087890625, -0.2667236328125, -0.150482177734375, -0.03424072265625, 0.082000732421875, 0.1982421875, 0.314483642578125, 0.43072509765625, 0.546966552734375, 0.6632080078125, 0.779449462890625, 0.89569091796875, 1.011932373046875, 1.128173828125, 1.244415283203125, 1.36065673828125, 1.476898193359375, 1.5931396484375, 1.709381103515625, 1.82562255859375, 1.941864013671875, 2.05810546875, 2.174346923828125, 2.29058837890625, 2.406829833984375, 2.5230712890625, 2.639312744140625, 2.75555419921875, 2.871795654296875, 2.988037109375, 3.104278564453125, 3.22052001953125, 3.336761474609375, 3.4530029296875, 3.569244384765625, 3.68548583984375, 3.801727294921875, 3.91796875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 11.0, 5.0, 20.0, 18.0, 25.0, 22.0, 45.0, 59.0, 90.0, 112.0, 114.0, 212.0, 342.0, 492.0, 571.0, 933.0, 1289.0, 1713.0, 2590.0, 3689.0, 5434.0, 7995.0, 12017.0, 17903.0, 26344.0, 40451.0, 64383.0, 114507.0, 261002.0, 217331.0, 98990.0, 57762.0, 36982.0, 24292.0, 16013.0, 10706.0, 7558.0, 5167.0, 3380.0, 2418.0, 1659.0, 1108.0, 791.0, 615.0, 364.0, 286.0, 221.0, 153.0, 112.0, 69.0, 46.0, 51.0, 28.0, 30.0, 14.0, 10.0, 8.0, 8.0, 4.0, 5.0], "bins": [-0.1783447265625, -0.17292213439941406, -0.16749954223632812, -0.1620769500732422, -0.15665435791015625, -0.1512317657470703, -0.14580917358398438, -0.14038658142089844, -0.1349639892578125, -0.12954139709472656, -0.12411880493164062, -0.11869621276855469, -0.11327362060546875, -0.10785102844238281, -0.10242843627929688, -0.09700584411621094, -0.091583251953125, -0.08616065979003906, -0.08073806762695312, -0.07531547546386719, -0.06989288330078125, -0.06447029113769531, -0.059047698974609375, -0.05362510681152344, -0.0482025146484375, -0.04277992248535156, -0.037357330322265625, -0.03193473815917969, -0.02651214599609375, -0.021089553833007812, -0.015666961669921875, -0.010244369506835938, -0.00482177734375, 0.0006008148193359375, 0.006023406982421875, 0.011445999145507812, 0.01686859130859375, 0.022291183471679688, 0.027713775634765625, 0.03313636779785156, 0.0385589599609375, 0.04398155212402344, 0.049404144287109375, 0.05482673645019531, 0.06024932861328125, 0.06567192077636719, 0.07109451293945312, 0.07651710510253906, 0.081939697265625, 0.08736228942871094, 0.09278488159179688, 0.09820747375488281, 0.10363006591796875, 0.10905265808105469, 0.11447525024414062, 0.11989784240722656, 0.1253204345703125, 0.13074302673339844, 0.13616561889648438, 0.1415882110595703, 0.14701080322265625, 0.1524333953857422, 0.15785598754882812, 0.16327857971191406, 0.168701171875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 6.0, 5.0, 12.0, 10.0, 14.0, 17.0, 14.0, 21.0, 23.0, 24.0, 25.0, 26.0, 43.0, 32.0, 40.0, 41.0, 33.0, 35.0, 53.0, 1070.0, 55.0, 56.0, 49.0, 32.0, 40.0, 39.0, 33.0, 34.0, 33.0, 23.0, 16.0, 21.0, 9.0, 9.0, 11.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.462890625, -3.35888671875, -3.2548828125, -3.15087890625, -3.046875, -2.94287109375, -2.8388671875, -2.73486328125, -2.630859375, -2.52685546875, -2.4228515625, -2.31884765625, -2.21484375, -2.11083984375, -2.0068359375, -1.90283203125, -1.798828125, -1.69482421875, -1.5908203125, -1.48681640625, -1.3828125, -1.27880859375, -1.1748046875, -1.07080078125, -0.966796875, -0.86279296875, -0.7587890625, -0.65478515625, -0.55078125, -0.44677734375, -0.3427734375, -0.23876953125, -0.134765625, -0.03076171875, 0.0732421875, 0.17724609375, 0.28125, 0.38525390625, 0.4892578125, 0.59326171875, 0.697265625, 0.80126953125, 0.9052734375, 1.00927734375, 1.11328125, 1.21728515625, 1.3212890625, 1.42529296875, 1.529296875, 1.63330078125, 1.7373046875, 1.84130859375, 1.9453125, 2.04931640625, 2.1533203125, 2.25732421875, 2.361328125, 2.46533203125, 2.5693359375, 2.67333984375, 2.77734375, 2.88134765625, 2.9853515625, 3.08935546875, 3.193359375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 11.0, 8.0, 12.0, 16.0, 24.0, 45.0, 51.0, 86.0, 115.0, 175.0, 236.0, 365.0, 500.0, 711.0, 1105.0, 1582.0, 2295.0, 3457.0, 4911.0, 6964.0, 10494.0, 15649.0, 23735.0, 36908.0, 60520.0, 107590.0, 301436.0, 1208540.0, 122648.0, 67216.0, 40913.0, 26180.0, 16784.0, 11308.0, 7702.0, 5199.0, 3534.0, 2515.0, 1664.0, 1224.0, 830.0, 579.0, 399.0, 313.0, 183.0, 145.0, 75.0, 63.0, 37.0, 30.0, 20.0, 17.0, 4.0, 8.0, 5.0, 2.0, 5.0, 1.0], "bins": [-0.05926513671875, -0.057474613189697266, -0.05568408966064453, -0.0538935661315918, -0.05210304260253906, -0.05031251907348633, -0.048521995544433594, -0.04673147201538086, -0.044940948486328125, -0.04315042495727539, -0.041359901428222656, -0.03956937789916992, -0.03777885437011719, -0.03598833084106445, -0.03419780731201172, -0.032407283782958984, -0.03061676025390625, -0.028826236724853516, -0.02703571319580078, -0.025245189666748047, -0.023454666137695312, -0.021664142608642578, -0.019873619079589844, -0.01808309555053711, -0.016292572021484375, -0.01450204849243164, -0.012711524963378906, -0.010921001434326172, -0.009130477905273438, -0.007339954376220703, -0.005549430847167969, -0.0037589073181152344, -0.0019683837890625, -0.00017786026000976562, 0.0016126632690429688, 0.003403186798095703, 0.0051937103271484375, 0.006984233856201172, 0.008774757385253906, 0.01056528091430664, 0.012355804443359375, 0.01414632797241211, 0.015936851501464844, 0.017727375030517578, 0.019517898559570312, 0.021308422088623047, 0.02309894561767578, 0.024889469146728516, 0.02667999267578125, 0.028470516204833984, 0.03026103973388672, 0.03205156326293945, 0.03384208679199219, 0.03563261032104492, 0.037423133850097656, 0.03921365737915039, 0.041004180908203125, 0.04279470443725586, 0.044585227966308594, 0.04637575149536133, 0.04816627502441406, 0.0499567985534668, 0.05174732208251953, 0.053537845611572266, 0.055328369140625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 11.0, 4.0, 6.0, 11.0, 17.0, 17.0, 25.0, 32.0, 32.0, 41.0, 60.0, 74.0, 73.0, 80.0, 90.0, 73.0, 68.0, 49.0, 45.0, 36.0, 29.0, 21.0, 22.0, 18.0, 16.0, 11.0, 8.0, 3.0, 6.0, 4.0, 1.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014886856079101562, -0.0014462918043136597, -0.001403898000717163, -0.0013615041971206665, -0.00131911039352417, -0.0012767165899276733, -0.0012343227863311768, -0.0011919289827346802, -0.0011495351791381836, -0.001107141375541687, -0.0010647475719451904, -0.0010223537683486938, -0.0009799599647521973, -0.0009375661611557007, -0.0008951723575592041, -0.0008527785539627075, -0.0008103847503662109, -0.0007679909467697144, -0.0007255971431732178, -0.0006832033395767212, -0.0006408095359802246, -0.000598415732383728, -0.0005560219287872314, -0.0005136281251907349, -0.0004712343215942383, -0.0004288405179977417, -0.0003864467144012451, -0.00034405291080474854, -0.00030165910720825195, -0.00025926530361175537, -0.0002168715000152588, -0.0001744776964187622, -0.00013208389282226562, -8.969008922576904e-05, -4.729628562927246e-05, -4.902482032775879e-06, 3.74913215637207e-05, 7.988512516021729e-05, 0.00012227892875671387, 0.00016467273235321045, 0.00020706653594970703, 0.0002494603395462036, 0.0002918541431427002, 0.0003342479467391968, 0.00037664175033569336, 0.00041903555393218994, 0.0004614293575286865, 0.0005038231611251831, 0.0005462169647216797, 0.0005886107683181763, 0.0006310045719146729, 0.0006733983755111694, 0.000715792179107666, 0.0007581859827041626, 0.0008005797863006592, 0.0008429735898971558, 0.0008853673934936523, 0.0009277611970901489, 0.0009701550006866455, 0.001012548804283142, 0.0010549426078796387, 0.0010973364114761353, 0.0011397302150726318, 0.0011821240186691284, 0.001224517822265625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 2.0, 3.0, 7.0, 2.0, 9.0, 9.0, 20.0, 18.0, 23.0, 25.0, 29.0, 43.0, 68.0, 120.0, 342.0, 3412.0, 882491.0, 160013.0, 1301.0, 261.0, 112.0, 57.0, 38.0, 40.0, 26.0, 17.0, 16.0, 10.0, 7.0, 4.0, 11.0, 3.0, 5.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0269775390625, -0.026042938232421875, -0.02510833740234375, -0.024173736572265625, -0.0232391357421875, -0.022304534912109375, -0.02136993408203125, -0.020435333251953125, -0.019500732421875, -0.018566131591796875, -0.01763153076171875, -0.016696929931640625, -0.0157623291015625, -0.014827728271484375, -0.01389312744140625, -0.012958526611328125, -0.01202392578125, -0.011089324951171875, -0.01015472412109375, -0.009220123291015625, -0.0082855224609375, -0.007350921630859375, -0.00641632080078125, -0.005481719970703125, -0.004547119140625, -0.003612518310546875, -0.00267791748046875, -0.001743316650390625, -0.0008087158203125, 0.000125885009765625, 0.00106048583984375, 0.001995086669921875, 0.0029296875, 0.003864288330078125, 0.00479888916015625, 0.005733489990234375, 0.0066680908203125, 0.007602691650390625, 0.00853729248046875, 0.009471893310546875, 0.010406494140625, 0.011341094970703125, 0.01227569580078125, 0.013210296630859375, 0.0141448974609375, 0.015079498291015625, 0.01601409912109375, 0.016948699951171875, 0.01788330078125, 0.018817901611328125, 0.01975250244140625, 0.020687103271484375, 0.0216217041015625, 0.022556304931640625, 0.02349090576171875, 0.024425506591796875, 0.025360107421875, 0.026294708251953125, 0.02722930908203125, 0.028163909912109375, 0.0290985107421875, 0.030033111572265625, 0.03096771240234375, 0.031902313232421875, 0.0328369140625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 61.0, 951.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002530066529288888, -0.001415963633917272, -0.0003018607385456562, 0.0008122420404106379, 0.0019263450521975756, 0.0030404480639845133, 0.004154550842940807, 0.005268653854727745, 0.006382756866514683, 0.0074968598783016205, 0.008610962890088558, 0.009725065901875496, 0.010839167982339859, 0.011953271925449371, 0.013067374005913734, 0.014181477017700672, 0.01529558002948761, 0.016409682109951973, 0.017523786053061485, 0.01863788813352585, 0.01975199207663536, 0.020866094157099724, 0.021980196237564087, 0.0230943001806736, 0.024208402261137962, 0.025322504341602325, 0.026436608284711838, 0.0275507103651762, 0.028664814308285713, 0.029778916388750076, 0.03089302033185959, 0.0320071205496788, 0.033121224492788315, 0.03423532843589783, 0.03534942865371704, 0.03646353259682655, 0.037577636539936066, 0.03869174048304558, 0.03980584070086479, 0.040919944643974304, 0.042034048587083817, 0.04314815253019333, 0.04426225274801254, 0.045376356691122055, 0.04649046063423157, 0.04760456457734108, 0.048718664795160294, 0.049832768738269806, 0.05094686895608902, 0.05206097289919853, 0.053175073117017746, 0.05428917706012726, 0.05540328100323677, 0.05651738494634628, 0.0576314851641655, 0.05874558910727501, 0.05985969305038452, 0.060973796993494034, 0.06208789721131325, 0.06320200115442276, 0.06431610137224197, 0.06543020904064178, 0.066544309258461, 0.06765840947628021, 0.06877251714468002]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 11.0, 20.0, 21.0, 26.0, 54.0, 69.0, 76.0, 80.0, 93.0, 102.0, 97.0, 84.0, 80.0, 49.0, 41.0, 32.0, 27.0, 18.0, 12.0, 10.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0030908584594726562, -0.00302241463214159, -0.002953970804810524, -0.002885526977479458, -0.0028170831501483917, -0.0027486393228173256, -0.0026801954954862595, -0.0026117516681551933, -0.002543307840824127, -0.002474864013493061, -0.002406420186161995, -0.002337976358830929, -0.0022695325314998627, -0.0022010887041687965, -0.0021326448768377304, -0.0020642010495066643, -0.001995757222175598, -0.001927313394844532, -0.0018588695675134659, -0.0017904257401823997, -0.0017219819128513336, -0.0016535380855202675, -0.0015850942581892014, -0.0015166504308581352, -0.001448206603527069, -0.001379762776196003, -0.0013113189488649368, -0.0012428751215338707, -0.0011744312942028046, -0.0011059874668717384, -0.0010375436395406723, -0.0009690998122096062, -0.00090065598487854, -0.0008322121575474739, -0.0007637683302164078, -0.0006953245028853416, -0.0006268806755542755, -0.0005584368482232094, -0.0004899930208921432, -0.0004215491935610771, -0.000353105366230011, -0.00028466153889894485, -0.00021621771156787872, -0.0001477738842368126, -7.933005690574646e-05, -1.0886229574680328e-05, 5.75575977563858e-05, 0.00012600142508745193, 0.00019444525241851807, 0.0002628890797495842, 0.00033133290708065033, 0.00039977673441171646, 0.0004682205617427826, 0.0005366643890738487, 0.0006051082164049149, 0.000673552043735981, 0.0007419958710670471, 0.0008104396983981133, 0.0008788835257291794, 0.0009473273530602455, 0.0010157711803913116, 0.0010842150077223778, 0.001152658835053444, 0.00122110266238451, 0.0012895464897155762]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 2.0, 4.0, 9.0, 2.0, 10.0, 12.0, 10.0, 23.0, 14.0, 24.0, 18.0, 31.0, 24.0, 19.0, 34.0, 39.0, 34.0, 34.0, 43.0, 46.0, 50.0, 41.0, 54.0, 51.0, 44.0, 34.0, 33.0, 33.0, 24.0, 28.0, 16.0, 25.0, 28.0, 20.0, 21.0, 11.0, 13.0, 8.0, 11.0, 1.0, 9.0, 2.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.521484375, -3.405242919921875, -3.28900146484375, -3.172760009765625, -3.0565185546875, -2.940277099609375, -2.82403564453125, -2.707794189453125, -2.591552734375, -2.475311279296875, -2.35906982421875, -2.242828369140625, -2.1265869140625, -2.010345458984375, -1.89410400390625, -1.777862548828125, -1.66162109375, -1.545379638671875, -1.42913818359375, -1.312896728515625, -1.1966552734375, -1.080413818359375, -0.96417236328125, -0.847930908203125, -0.731689453125, -0.615447998046875, -0.49920654296875, -0.382965087890625, -0.2667236328125, -0.150482177734375, -0.03424072265625, 0.082000732421875, 0.1982421875, 0.314483642578125, 0.43072509765625, 0.546966552734375, 0.6632080078125, 0.779449462890625, 0.89569091796875, 1.011932373046875, 1.128173828125, 1.244415283203125, 1.36065673828125, 1.476898193359375, 1.5931396484375, 1.709381103515625, 1.82562255859375, 1.941864013671875, 2.05810546875, 2.174346923828125, 2.29058837890625, 2.406829833984375, 2.5230712890625, 2.639312744140625, 2.75555419921875, 2.871795654296875, 2.988037109375, 3.104278564453125, 3.22052001953125, 3.336761474609375, 3.4530029296875, 3.569244384765625, 3.68548583984375, 3.801727294921875, 3.91796875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 1.0, 4.0, 3.0, 11.0, 9.0, 24.0, 24.0, 50.0, 63.0, 95.0, 182.0, 273.0, 403.0, 672.0, 1102.0, 1981.0, 3472.0, 6392.0, 12736.0, 25439.0, 58949.0, 178297.0, 448747.0, 192822.0, 61508.0, 26591.0, 12959.0, 6892.0, 3745.0, 2097.0, 1171.0, 721.0, 396.0, 241.0, 151.0, 112.0, 62.0, 45.0, 32.0, 31.0, 22.0, 9.0, 9.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.2109375, -6.9892578125, -6.767578125, -6.5458984375, -6.32421875, -6.1025390625, -5.880859375, -5.6591796875, -5.4375, -5.2158203125, -4.994140625, -4.7724609375, -4.55078125, -4.3291015625, -4.107421875, -3.8857421875, -3.6640625, -3.4423828125, -3.220703125, -2.9990234375, -2.77734375, -2.5556640625, -2.333984375, -2.1123046875, -1.890625, -1.6689453125, -1.447265625, -1.2255859375, -1.00390625, -0.7822265625, -0.560546875, -0.3388671875, -0.1171875, 0.1044921875, 0.326171875, 0.5478515625, 0.76953125, 0.9912109375, 1.212890625, 1.4345703125, 1.65625, 1.8779296875, 2.099609375, 2.3212890625, 2.54296875, 2.7646484375, 2.986328125, 3.2080078125, 3.4296875, 3.6513671875, 3.873046875, 4.0947265625, 4.31640625, 4.5380859375, 4.759765625, 4.9814453125, 5.203125, 5.4248046875, 5.646484375, 5.8681640625, 6.08984375, 6.3115234375, 6.533203125, 6.7548828125, 6.9765625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 5.0, 8.0, 6.0, 5.0, 21.0, 15.0, 18.0, 18.0, 20.0, 20.0, 26.0, 27.0, 37.0, 43.0, 44.0, 59.0, 75.0, 126.0, 196.0, 1320.0, 261.0, 152.0, 112.0, 75.0, 64.0, 37.0, 30.0, 26.0, 28.0, 33.0, 23.0, 26.0, 15.0, 9.0, 12.0, 9.0, 11.0, 11.0, 11.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8828125, -9.540771484375, -9.19873046875, -8.856689453125, -8.5146484375, -8.172607421875, -7.83056640625, -7.488525390625, -7.146484375, -6.804443359375, -6.46240234375, -6.120361328125, -5.7783203125, -5.436279296875, -5.09423828125, -4.752197265625, -4.41015625, -4.068115234375, -3.72607421875, -3.384033203125, -3.0419921875, -2.699951171875, -2.35791015625, -2.015869140625, -1.673828125, -1.331787109375, -0.98974609375, -0.647705078125, -0.3056640625, 0.036376953125, 0.37841796875, 0.720458984375, 1.0625, 1.404541015625, 1.74658203125, 2.088623046875, 2.4306640625, 2.772705078125, 3.11474609375, 3.456787109375, 3.798828125, 4.140869140625, 4.48291015625, 4.824951171875, 5.1669921875, 5.509033203125, 5.85107421875, 6.193115234375, 6.53515625, 6.877197265625, 7.21923828125, 7.561279296875, 7.9033203125, 8.245361328125, 8.58740234375, 8.929443359375, 9.271484375, 9.613525390625, 9.95556640625, 10.297607421875, 10.6396484375, 10.981689453125, 11.32373046875, 11.665771484375, 12.0078125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 3.0, 9.0, 10.0, 26.0, 17.0, 24.0, 38.0, 57.0, 82.0, 125.0, 177.0, 378.0, 867.0, 2956.0, 17889.0, 363015.0, 2652274.0, 95966.0, 8586.0, 1828.0, 611.0, 293.0, 141.0, 87.0, 54.0, 52.0, 45.0, 22.0, 17.0, 13.0, 4.0, 6.0, 7.0, 6.0, 3.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.953125, -22.30322265625, -21.6533203125, -21.00341796875, -20.353515625, -19.70361328125, -19.0537109375, -18.40380859375, -17.75390625, -17.10400390625, -16.4541015625, -15.80419921875, -15.154296875, -14.50439453125, -13.8544921875, -13.20458984375, -12.5546875, -11.90478515625, -11.2548828125, -10.60498046875, -9.955078125, -9.30517578125, -8.6552734375, -8.00537109375, -7.35546875, -6.70556640625, -6.0556640625, -5.40576171875, -4.755859375, -4.10595703125, -3.4560546875, -2.80615234375, -2.15625, -1.50634765625, -0.8564453125, -0.20654296875, 0.443359375, 1.09326171875, 1.7431640625, 2.39306640625, 3.04296875, 3.69287109375, 4.3427734375, 4.99267578125, 5.642578125, 6.29248046875, 6.9423828125, 7.59228515625, 8.2421875, 8.89208984375, 9.5419921875, 10.19189453125, 10.841796875, 11.49169921875, 12.1416015625, 12.79150390625, 13.44140625, 14.09130859375, 14.7412109375, 15.39111328125, 16.041015625, 16.69091796875, 17.3408203125, 17.99072265625, 18.640625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 12.0, 22.0, 50.0, 85.0, 115.0, 139.0, 150.0, 147.0, 110.0, 72.0, 50.0, 31.0, 18.0, 7.0, 3.0], "bins": [-60.706565856933594, -59.61306381225586, -58.51956558227539, -57.426063537597656, -56.33256530761719, -55.23906326293945, -54.14556121826172, -53.05206298828125, -51.958560943603516, -50.86505889892578, -49.77156066894531, -48.67805862426758, -47.584556579589844, -46.491058349609375, -45.39755630493164, -44.30405807495117, -43.21055603027344, -42.1170539855957, -41.023555755615234, -39.9300537109375, -38.83655548095703, -37.7430534362793, -36.64955139160156, -35.556053161621094, -34.46255111694336, -33.369049072265625, -32.275550842285156, -31.182048797607422, -30.08854866027832, -28.99504852294922, -27.901546478271484, -26.808046340942383, -25.714550018310547, -24.621049880981445, -23.527549743652344, -22.43404769897461, -21.340547561645508, -20.247047424316406, -19.153545379638672, -18.06004524230957, -16.96654510498047, -15.873044967651367, -14.77954387664795, -13.686042785644531, -12.59254264831543, -11.499042510986328, -10.40554141998291, -9.312040328979492, -8.21854019165039, -7.125039577484131, -6.031538963317871, -4.938038349151611, -3.8445377349853516, -2.751037120819092, -1.657536506652832, -0.5640358924865723, 0.5294647216796875, 1.6229653358459473, 2.716465950012207, 3.809966564178467, 4.903467178344727, 5.996967792510986, 7.090468406677246, 8.183969497680664, 9.277469635009766]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 11.0, 8.0, 9.0, 11.0, 13.0, 21.0, 16.0, 24.0, 31.0, 29.0, 31.0, 27.0, 28.0, 37.0, 41.0, 47.0, 46.0, 28.0, 50.0, 54.0, 47.0, 50.0, 33.0, 39.0, 33.0, 44.0, 22.0, 20.0, 21.0, 18.0, 19.0, 19.0, 7.0, 8.0, 21.0, 6.0, 11.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.46092987060547, -33.44132995605469, -32.421730041503906, -31.402130126953125, -30.382530212402344, -29.362930297851562, -28.34332847595215, -27.323728561401367, -26.304128646850586, -25.284528732299805, -24.264928817749023, -23.245328903198242, -22.225727081298828, -21.206127166748047, -20.186527252197266, -19.166927337646484, -18.147327423095703, -17.127727508544922, -16.10812759399414, -15.088526725769043, -14.068926811218262, -13.04932689666748, -12.029726028442383, -11.010126113891602, -9.99052619934082, -8.970926284790039, -7.9513258934021, -6.93172550201416, -5.912125587463379, -4.892525672912598, -3.872925281524658, -2.8533248901367188, -1.8337249755859375, -0.8141248226165771, 0.2054753303527832, 1.2250754833221436, 2.244675636291504, 3.264275550842285, 4.283875942230225, 5.303476333618164, 6.323076248168945, 7.342676162719727, 8.362276077270508, 9.381876945495605, 10.401476860046387, 11.421076774597168, 12.440677642822266, 13.460277557373047, 14.479877471923828, 15.49947738647461, 16.51907730102539, 17.538677215576172, 18.558277130126953, 19.577877044677734, 20.59747886657715, 21.61707878112793, 22.63667869567871, 23.656278610229492, 24.675878524780273, 25.695478439331055, 26.71508026123047, 27.73468017578125, 28.75428009033203, 29.773880004882812, 30.793479919433594]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 6.0, 11.0, 18.0, 12.0, 8.0, 17.0, 17.0, 21.0, 29.0, 20.0, 25.0, 36.0, 34.0, 42.0, 40.0, 53.0, 37.0, 51.0, 58.0, 49.0, 48.0, 29.0, 34.0, 27.0, 33.0, 29.0, 28.0, 30.0, 18.0, 27.0, 17.0, 13.0, 10.0, 22.0, 9.0, 8.0, 6.0, 6.0, 4.0, 7.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -4.035614013671875, -3.91107177734375, -3.786529541015625, -3.6619873046875, -3.537445068359375, -3.41290283203125, -3.288360595703125, -3.163818359375, -3.039276123046875, -2.91473388671875, -2.790191650390625, -2.6656494140625, -2.541107177734375, -2.41656494140625, -2.292022705078125, -2.16748046875, -2.042938232421875, -1.91839599609375, -1.793853759765625, -1.6693115234375, -1.544769287109375, -1.42022705078125, -1.295684814453125, -1.171142578125, -1.046600341796875, -0.92205810546875, -0.797515869140625, -0.6729736328125, -0.548431396484375, -0.42388916015625, -0.299346923828125, -0.1748046875, -0.050262451171875, 0.07427978515625, 0.198822021484375, 0.3233642578125, 0.447906494140625, 0.57244873046875, 0.696990966796875, 0.821533203125, 0.946075439453125, 1.07061767578125, 1.195159912109375, 1.3197021484375, 1.444244384765625, 1.56878662109375, 1.693328857421875, 1.81787109375, 1.942413330078125, 2.06695556640625, 2.191497802734375, 2.3160400390625, 2.440582275390625, 2.56512451171875, 2.689666748046875, 2.814208984375, 2.938751220703125, 3.06329345703125, 3.187835693359375, 3.3123779296875, 3.436920166015625, 3.56146240234375, 3.686004638671875, 3.810546875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 17.0, 15.0, 9.0, 19.0, 22.0, 30.0, 45.0, 53.0, 75.0, 142.0, 212.0, 361.0, 748.0, 1482.0, 3365.0, 8978.0, 31787.0, 191536.0, 1580116.0, 2048505.0, 267471.0, 40742.0, 10886.0, 3931.0, 1745.0, 839.0, 408.0, 229.0, 146.0, 87.0, 83.0, 38.0, 33.0, 29.0, 24.0, 24.0, 13.0, 5.0, 10.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6875, -8.398681640625, -8.10986328125, -7.821044921875, -7.5322265625, -7.243408203125, -6.95458984375, -6.665771484375, -6.376953125, -6.088134765625, -5.79931640625, -5.510498046875, -5.2216796875, -4.932861328125, -4.64404296875, -4.355224609375, -4.06640625, -3.777587890625, -3.48876953125, -3.199951171875, -2.9111328125, -2.622314453125, -2.33349609375, -2.044677734375, -1.755859375, -1.467041015625, -1.17822265625, -0.889404296875, -0.6005859375, -0.311767578125, -0.02294921875, 0.265869140625, 0.5546875, 0.843505859375, 1.13232421875, 1.421142578125, 1.7099609375, 1.998779296875, 2.28759765625, 2.576416015625, 2.865234375, 3.154052734375, 3.44287109375, 3.731689453125, 4.0205078125, 4.309326171875, 4.59814453125, 4.886962890625, 5.17578125, 5.464599609375, 5.75341796875, 6.042236328125, 6.3310546875, 6.619873046875, 6.90869140625, 7.197509765625, 7.486328125, 7.775146484375, 8.06396484375, 8.352783203125, 8.6416015625, 8.930419921875, 9.21923828125, 9.508056640625, 9.796875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 5.0, 16.0, 12.0, 26.0, 27.0, 45.0, 55.0, 78.0, 93.0, 141.0, 215.0, 279.0, 397.0, 524.0, 573.0, 446.0, 319.0, 247.0, 148.0, 129.0, 72.0, 62.0, 40.0, 35.0, 15.0, 15.0, 14.0, 10.0, 8.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.23828125, -7.006591796875, -6.77490234375, -6.543212890625, -6.3115234375, -6.079833984375, -5.84814453125, -5.616455078125, -5.384765625, -5.153076171875, -4.92138671875, -4.689697265625, -4.4580078125, -4.226318359375, -3.99462890625, -3.762939453125, -3.53125, -3.299560546875, -3.06787109375, -2.836181640625, -2.6044921875, -2.372802734375, -2.14111328125, -1.909423828125, -1.677734375, -1.446044921875, -1.21435546875, -0.982666015625, -0.7509765625, -0.519287109375, -0.28759765625, -0.055908203125, 0.17578125, 0.407470703125, 0.63916015625, 0.870849609375, 1.1025390625, 1.334228515625, 1.56591796875, 1.797607421875, 2.029296875, 2.260986328125, 2.49267578125, 2.724365234375, 2.9560546875, 3.187744140625, 3.41943359375, 3.651123046875, 3.8828125, 4.114501953125, 4.34619140625, 4.577880859375, 4.8095703125, 5.041259765625, 5.27294921875, 5.504638671875, 5.736328125, 5.968017578125, 6.19970703125, 6.431396484375, 6.6630859375, 6.894775390625, 7.12646484375, 7.358154296875, 7.58984375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 12.0, 14.0, 10.0, 12.0, 16.0, 25.0, 28.0, 48.0, 65.0, 87.0, 164.0, 218.0, 431.0, 1856.0, 53715.0, 4043571.0, 90323.0, 2389.0, 473.0, 288.0, 156.0, 101.0, 84.0, 60.0, 35.0, 28.0, 17.0, 19.0, 10.0, 9.0, 3.0, 5.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-45.125, -43.81884765625, -42.5126953125, -41.20654296875, -39.900390625, -38.59423828125, -37.2880859375, -35.98193359375, -34.67578125, -33.36962890625, -32.0634765625, -30.75732421875, -29.451171875, -28.14501953125, -26.8388671875, -25.53271484375, -24.2265625, -22.92041015625, -21.6142578125, -20.30810546875, -19.001953125, -17.69580078125, -16.3896484375, -15.08349609375, -13.77734375, -12.47119140625, -11.1650390625, -9.85888671875, -8.552734375, -7.24658203125, -5.9404296875, -4.63427734375, -3.328125, -2.02197265625, -0.7158203125, 0.59033203125, 1.896484375, 3.20263671875, 4.5087890625, 5.81494140625, 7.12109375, 8.42724609375, 9.7333984375, 11.03955078125, 12.345703125, 13.65185546875, 14.9580078125, 16.26416015625, 17.5703125, 18.87646484375, 20.1826171875, 21.48876953125, 22.794921875, 24.10107421875, 25.4072265625, 26.71337890625, 28.01953125, 29.32568359375, 30.6318359375, 31.93798828125, 33.244140625, 34.55029296875, 35.8564453125, 37.16259765625, 38.46875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 20.0, 53.0, 92.0, 138.0, 177.0, 168.0, 149.0, 105.0, 55.0, 24.0, 13.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.600791931152344, -17.844432830810547, -16.08807373046875, -14.33171558380127, -12.575357437133789, -10.818998336791992, -9.062639236450195, -7.306281089782715, -5.549921989440918, -3.7935633659362793, -2.0372045040130615, -0.28084564208984375, 1.475512981414795, 3.2318716049194336, 4.9882307052612305, 6.744588851928711, 8.500947952270508, 10.257307052612305, 12.013665199279785, 13.770024299621582, 15.526382446289062, 17.28274154663086, 19.039100646972656, 20.795459747314453, 22.55181884765625, 24.308177947998047, 26.064537048339844, 27.82089614868164, 29.577253341674805, 31.3336124420166, 33.08997344970703, 34.84632873535156, 36.60268783569336, 38.359046936035156, 40.11540603637695, 41.87176513671875, 43.62812423706055, 45.384483337402344, 47.140838623046875, 48.89719772338867, 50.65355682373047, 52.409915924072266, 54.16627502441406, 55.92263412475586, 57.678993225097656, 59.43534851074219, 61.19171142578125, 62.94806671142578, 64.70442962646484, 66.46078491210938, 68.21714782714844, 69.97350311279297, 71.72986602783203, 73.48622131347656, 75.24258422851562, 76.99893951416016, 78.75529479980469, 80.51165008544922, 82.26801300048828, 84.02436828613281, 85.78073120117188, 87.5370864868164, 89.29344940185547, 91.0498046875, 92.80616760253906]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 6.0, 10.0, 4.0, 7.0, 9.0, 8.0, 13.0, 24.0, 15.0, 23.0, 30.0, 28.0, 27.0, 28.0, 42.0, 38.0, 27.0, 35.0, 32.0, 33.0, 31.0, 32.0, 37.0, 35.0, 39.0, 41.0, 39.0, 29.0, 42.0, 25.0, 37.0, 25.0, 21.0, 17.0, 14.0, 12.0, 13.0, 13.0, 10.0, 10.0, 6.0, 12.0, 6.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 5.0, 1.0], "bins": [-22.695520401000977, -22.04084587097168, -21.386171340942383, -20.73149871826172, -20.076824188232422, -19.422149658203125, -18.767475128173828, -18.11280059814453, -17.458126068115234, -16.803451538085938, -16.14877700805664, -15.49410343170166, -14.83942985534668, -14.184755325317383, -13.530080795288086, -12.875406265258789, -12.220733642578125, -11.566059112548828, -10.911385536193848, -10.25671100616455, -9.60203742980957, -8.947362899780273, -8.292688369750977, -7.638014316558838, -6.983340263366699, -6.3286662101745605, -5.673992156982422, -5.019317626953125, -4.364643573760986, -3.7099695205688477, -3.05529522895813, -2.400620937347412, -1.7459487915039062, -1.091274619102478, -0.4366004467010498, 0.21807372570037842, 0.8727478981018066, 1.5274219512939453, 2.182096242904663, 2.836770534515381, 3.4914445877075195, 4.146118640899658, 4.800792694091797, 5.455467224121094, 6.110141277313232, 6.764815330505371, 7.419489860534668, 8.074163436889648, 8.728837966918945, 9.383512496948242, 10.038186073303223, 10.69286060333252, 11.3475341796875, 12.002208709716797, 12.656883239746094, 13.31155776977539, 13.966231346130371, 14.620905876159668, 15.275579452514648, 15.930253982543945, 16.584928512573242, 17.239601135253906, 17.894275665283203, 18.5489501953125, 19.203624725341797]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 8.0, 2.0, 7.0, 3.0, 9.0, 8.0, 11.0, 11.0, 12.0, 11.0, 19.0, 26.0, 24.0, 19.0, 38.0, 23.0, 38.0, 44.0, 39.0, 53.0, 38.0, 38.0, 37.0, 42.0, 45.0, 33.0, 45.0, 29.0, 33.0, 28.0, 24.0, 23.0, 25.0, 25.0, 13.0, 17.0, 17.0, 22.0, 17.0, 15.0, 7.0, 5.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.939453125, -3.82269287109375, -3.7059326171875, -3.58917236328125, -3.472412109375, -3.35565185546875, -3.2388916015625, -3.12213134765625, -3.00537109375, -2.88861083984375, -2.7718505859375, -2.65509033203125, -2.538330078125, -2.42156982421875, -2.3048095703125, -2.18804931640625, -2.0712890625, -1.95452880859375, -1.8377685546875, -1.72100830078125, -1.604248046875, -1.48748779296875, -1.3707275390625, -1.25396728515625, -1.13720703125, -1.02044677734375, -0.9036865234375, -0.78692626953125, -0.670166015625, -0.55340576171875, -0.4366455078125, -0.31988525390625, -0.203125, -0.08636474609375, 0.0303955078125, 0.14715576171875, 0.263916015625, 0.38067626953125, 0.4974365234375, 0.61419677734375, 0.73095703125, 0.84771728515625, 0.9644775390625, 1.08123779296875, 1.197998046875, 1.31475830078125, 1.4315185546875, 1.54827880859375, 1.6650390625, 1.78179931640625, 1.8985595703125, 2.01531982421875, 2.132080078125, 2.24884033203125, 2.3656005859375, 2.48236083984375, 2.59912109375, 2.71588134765625, 2.8326416015625, 2.94940185546875, 3.066162109375, 3.18292236328125, 3.2996826171875, 3.41644287109375, 3.533203125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 4.0, 8.0, 12.0, 12.0, 15.0, 32.0, 41.0, 70.0, 122.0, 168.0, 209.0, 354.0, 515.0, 822.0, 1201.0, 1686.0, 2515.0, 3845.0, 5872.0, 8390.0, 12648.0, 19356.0, 30151.0, 49108.0, 85605.0, 177136.0, 305986.0, 144983.0, 74906.0, 43469.0, 27036.0, 17387.0, 11355.0, 7623.0, 5209.0, 3494.0, 2367.0, 1602.0, 1083.0, 707.0, 486.0, 334.0, 209.0, 134.0, 95.0, 64.0, 57.0, 27.0, 21.0, 13.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.170654296875, -0.1650371551513672, -0.15942001342773438, -0.15380287170410156, -0.14818572998046875, -0.14256858825683594, -0.13695144653320312, -0.1313343048095703, -0.1257171630859375, -0.12010002136230469, -0.11448287963867188, -0.10886573791503906, -0.10324859619140625, -0.09763145446777344, -0.09201431274414062, -0.08639717102050781, -0.080780029296875, -0.07516288757324219, -0.06954574584960938, -0.06392860412597656, -0.05831146240234375, -0.05269432067871094, -0.047077178955078125, -0.04146003723144531, -0.0358428955078125, -0.030225753784179688, -0.024608612060546875, -0.018991470336914062, -0.01337432861328125, -0.0077571868896484375, -0.002140045166015625, 0.0034770965576171875, 0.00909423828125, 0.014711380004882812, 0.020328521728515625, 0.025945663452148438, 0.03156280517578125, 0.03717994689941406, 0.042797088623046875, 0.04841423034667969, 0.0540313720703125, 0.05964851379394531, 0.06526565551757812, 0.07088279724121094, 0.07649993896484375, 0.08211708068847656, 0.08773422241210938, 0.09335136413574219, 0.098968505859375, 0.10458564758300781, 0.11020278930664062, 0.11581993103027344, 0.12143707275390625, 0.12705421447753906, 0.13267135620117188, 0.1382884979248047, 0.1439056396484375, 0.1495227813720703, 0.15513992309570312, 0.16075706481933594, 0.16637420654296875, 0.17199134826660156, 0.17760848999023438, 0.1832256317138672, 0.1888427734375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 5.0, 9.0, 8.0, 10.0, 15.0, 15.0, 14.0, 19.0, 19.0, 26.0, 25.0, 23.0, 33.0, 37.0, 31.0, 33.0, 33.0, 36.0, 40.0, 40.0, 1061.0, 34.0, 30.0, 42.0, 56.0, 34.0, 30.0, 24.0, 26.0, 20.0, 21.0, 32.0, 18.0, 16.0, 13.0, 17.0, 10.0, 7.0, 6.0, 6.0, 10.0, 4.0, 5.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.822265625, -2.72857666015625, -2.6348876953125, -2.54119873046875, -2.447509765625, -2.35382080078125, -2.2601318359375, -2.16644287109375, -2.07275390625, -1.97906494140625, -1.8853759765625, -1.79168701171875, -1.697998046875, -1.60430908203125, -1.5106201171875, -1.41693115234375, -1.3232421875, -1.22955322265625, -1.1358642578125, -1.04217529296875, -0.948486328125, -0.85479736328125, -0.7611083984375, -0.66741943359375, -0.57373046875, -0.48004150390625, -0.3863525390625, -0.29266357421875, -0.198974609375, -0.10528564453125, -0.0115966796875, 0.08209228515625, 0.17578125, 0.26947021484375, 0.3631591796875, 0.45684814453125, 0.550537109375, 0.64422607421875, 0.7379150390625, 0.83160400390625, 0.92529296875, 1.01898193359375, 1.1126708984375, 1.20635986328125, 1.300048828125, 1.39373779296875, 1.4874267578125, 1.58111572265625, 1.6748046875, 1.76849365234375, 1.8621826171875, 1.95587158203125, 2.049560546875, 2.14324951171875, 2.2369384765625, 2.33062744140625, 2.42431640625, 2.51800537109375, 2.6116943359375, 2.70538330078125, 2.799072265625, 2.89276123046875, 2.9864501953125, 3.08013916015625, 3.173828125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 6.0, 1.0, 1.0, 6.0, 7.0, 12.0, 22.0, 13.0, 36.0, 48.0, 67.0, 95.0, 156.0, 211.0, 342.0, 475.0, 698.0, 965.0, 1561.0, 2176.0, 3274.0, 4992.0, 7461.0, 11118.0, 17063.0, 26337.0, 41901.0, 68749.0, 123315.0, 1250471.0, 259724.0, 107324.0, 61036.0, 37490.0, 23842.0, 15728.0, 9995.0, 6704.0, 4494.0, 2921.0, 1995.0, 1435.0, 904.0, 624.0, 402.0, 300.0, 188.0, 137.0, 95.0, 73.0, 52.0, 29.0, 22.0, 26.0, 7.0, 9.0, 3.0, 8.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.060638427734375, -0.058675289154052734, -0.05671215057373047, -0.0547490119934082, -0.05278587341308594, -0.05082273483276367, -0.048859596252441406, -0.04689645767211914, -0.044933319091796875, -0.04297018051147461, -0.041007041931152344, -0.03904390335083008, -0.03708076477050781, -0.03511762619018555, -0.03315448760986328, -0.031191349029541016, -0.02922821044921875, -0.027265071868896484, -0.02530193328857422, -0.023338794708251953, -0.021375656127929688, -0.019412517547607422, -0.017449378967285156, -0.01548624038696289, -0.013523101806640625, -0.01155996322631836, -0.009596824645996094, -0.007633686065673828, -0.0056705474853515625, -0.003707408905029297, -0.0017442703247070312, 0.00021886825561523438, 0.0021820068359375, 0.004145145416259766, 0.006108283996582031, 0.008071422576904297, 0.010034561157226562, 0.011997699737548828, 0.013960838317871094, 0.01592397689819336, 0.017887115478515625, 0.01985025405883789, 0.021813392639160156, 0.023776531219482422, 0.025739669799804688, 0.027702808380126953, 0.02966594696044922, 0.031629085540771484, 0.03359222412109375, 0.035555362701416016, 0.03751850128173828, 0.03948163986206055, 0.04144477844238281, 0.04340791702270508, 0.045371055603027344, 0.04733419418334961, 0.049297332763671875, 0.05126047134399414, 0.053223609924316406, 0.05518674850463867, 0.05714988708496094, 0.0591130256652832, 0.06107616424560547, 0.06303930282592773, 0.06500244140625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 2.0, 2.0, 9.0, 6.0, 4.0, 5.0, 10.0, 9.0, 17.0, 18.0, 27.0, 21.0, 29.0, 29.0, 49.0, 47.0, 56.0, 57.0, 76.0, 92.0, 70.0, 62.0, 43.0, 44.0, 38.0, 26.0, 29.0, 24.0, 15.0, 16.0, 9.0, 10.0, 13.0, 8.0, 7.0, 3.0, 0.0, 2.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0008101463317871094, -0.0007843151688575745, -0.0007584840059280396, -0.0007326528429985046, -0.0007068216800689697, -0.0006809905171394348, -0.0006551593542098999, -0.000629328191280365, -0.0006034970283508301, -0.0005776658654212952, -0.0005518347024917603, -0.0005260035395622253, -0.0005001723766326904, -0.0004743412137031555, -0.0004485100507736206, -0.0004226788878440857, -0.0003968477249145508, -0.00037101656198501587, -0.00034518539905548096, -0.00031935423612594604, -0.00029352307319641113, -0.0002676919102668762, -0.0002418607473373413, -0.0002160295844078064, -0.00019019842147827148, -0.00016436725854873657, -0.00013853609561920166, -0.00011270493268966675, -8.687376976013184e-05, -6.104260683059692e-05, -3.521144390106201e-05, -9.3802809715271e-06, 1.6450881958007812e-05, 4.2282044887542725e-05, 6.811320781707764e-05, 9.394437074661255e-05, 0.00011977553367614746, 0.00014560669660568237, 0.00017143785953521729, 0.0001972690224647522, 0.0002231001853942871, 0.000248931348323822, 0.00027476251125335693, 0.00030059367418289185, 0.00032642483711242676, 0.00035225600004196167, 0.0003780871629714966, 0.0004039183259010315, 0.0004297494888305664, 0.0004555806517601013, 0.00048141181468963623, 0.0005072429776191711, 0.0005330741405487061, 0.000558905303478241, 0.0005847364664077759, 0.0006105676293373108, 0.0006363987922668457, 0.0006622299551963806, 0.0006880611181259155, 0.0007138922810554504, 0.0007397234439849854, 0.0007655546069145203, 0.0007913857698440552, 0.0008172169327735901, 0.000843048095703125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 6.0, 3.0, 1.0, 3.0, 5.0, 6.0, 15.0, 8.0, 7.0, 20.0, 13.0, 24.0, 33.0, 29.0, 41.0, 70.0, 129.0, 275.0, 2429.0, 931986.0, 112052.0, 814.0, 181.0, 109.0, 74.0, 38.0, 32.0, 30.0, 26.0, 16.0, 21.0, 14.0, 6.0, 4.0, 4.0, 7.0, 8.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0198822021484375, -0.01927661895751953, -0.018671035766601562, -0.018065452575683594, -0.017459869384765625, -0.016854286193847656, -0.016248703002929688, -0.01564311981201172, -0.01503753662109375, -0.014431953430175781, -0.013826370239257812, -0.013220787048339844, -0.012615203857421875, -0.012009620666503906, -0.011404037475585938, -0.010798454284667969, -0.01019287109375, -0.009587287902832031, -0.008981704711914062, -0.008376121520996094, -0.007770538330078125, -0.007164955139160156, -0.0065593719482421875, -0.005953788757324219, -0.00534820556640625, -0.004742622375488281, -0.0041370391845703125, -0.0035314559936523438, -0.002925872802734375, -0.0023202896118164062, -0.0017147064208984375, -0.0011091232299804688, -0.0005035400390625, 0.00010204315185546875, 0.0007076263427734375, 0.0013132095336914062, 0.001918792724609375, 0.0025243759155273438, 0.0031299591064453125, 0.0037355422973632812, 0.00434112548828125, 0.004946708679199219, 0.0055522918701171875, 0.006157875061035156, 0.006763458251953125, 0.007369041442871094, 0.007974624633789062, 0.008580207824707031, 0.009185791015625, 0.009791374206542969, 0.010396957397460938, 0.011002540588378906, 0.011608123779296875, 0.012213706970214844, 0.012819290161132812, 0.013424873352050781, 0.01403045654296875, 0.014636039733886719, 0.015241622924804688, 0.015847206115722656, 0.016452789306640625, 0.017058372497558594, 0.017663955688476562, 0.01826953887939453, 0.0188751220703125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 940.0, 67.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034326589666306973, -0.003038111375644803, -0.002643563784658909, -0.002249015960842371, -0.0018544683698564768, -0.0014599207788705826, -0.0010653729550540447, -0.0006708253640681505, -0.0002762777730822563, 0.0001182698761112988, 0.0005128175253048539, 0.00090736523270607, 0.0013019128236919641, 0.0016964604146778584, 0.002091008238494396, 0.0024855558294802904, 0.0028801034204661846, 0.003274651011452079, 0.003669198602437973, 0.004063746426254511, 0.004458294250071049, 0.004852841608226299, 0.005247389432042837, 0.005641937255859375, 0.0060364846140146255, 0.006431032437831163, 0.006825579795986414, 0.007220127619802952, 0.007614674977958202, 0.008009223267436028, 0.008403770625591278, 0.008798317983746529, 0.00919286534190178, 0.00958741270005703, 0.009981960989534855, 0.010376508347690105, 0.010771055705845356, 0.011165603995323181, 0.011560151353478432, 0.011954698711633682, 0.012349246069788933, 0.012743793427944183, 0.013138341717422009, 0.013532889075577259, 0.01392743643373251, 0.014321984723210335, 0.014716532081365585, 0.015111079439520836, 0.015505627728998661, 0.015900176018476486, 0.016294723376631737, 0.016689270734786987, 0.017083818092942238, 0.01747836545109749, 0.017872914671897888, 0.01826746203005314, 0.01866200938820839, 0.01905655674636364, 0.01945110410451889, 0.01984565332531929, 0.02024020068347454, 0.02063474804162979, 0.021029295399785042, 0.021423842757940292, 0.021818390116095543]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 7.0, 5.0, 2.0, 8.0, 5.0, 2.0, 8.0, 13.0, 24.0, 21.0, 25.0, 26.0, 24.0, 27.0, 42.0, 40.0, 43.0, 44.0, 54.0, 49.0, 50.0, 42.0, 66.0, 68.0, 50.0, 42.0, 42.0, 30.0, 23.0, 32.0, 20.0, 19.0, 19.0, 12.0, 9.0, 3.0, 3.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009229183197021484, -0.0008987244218587875, -0.0008745305240154266, -0.0008503366261720657, -0.0008261427283287048, -0.0008019488304853439, -0.000777754932641983, -0.0007535610347986221, -0.0007293671369552612, -0.0007051732391119003, -0.0006809793412685394, -0.0006567854434251785, -0.0006325915455818176, -0.0006083976477384567, -0.0005842037498950958, -0.0005600098520517349, -0.000535815954208374, -0.0005116220563650131, -0.0004874281585216522, -0.0004632342606782913, -0.0004390403628349304, -0.0004148464649915695, -0.0003906525671482086, -0.0003664586693048477, -0.0003422647714614868, -0.0003180708736181259, -0.000293876975774765, -0.0002696830779314041, -0.0002454891800880432, -0.0002212952822446823, -0.0001971013844013214, -0.0001729074865579605, -0.0001487135887145996, -0.0001245196908712387, -0.00010032579302787781, -7.61318951845169e-05, -5.1937997341156006e-05, -2.7744099497795105e-05, -3.550201654434204e-06, 2.0643696188926697e-05, 4.48375940322876e-05, 6.90314918756485e-05, 9.32253897190094e-05, 0.0001174192875623703, 0.0001416131854057312, 0.0001658070832490921, 0.000190000981092453, 0.0002141948789358139, 0.0002383887767791748, 0.0002625826746225357, 0.0002867765724658966, 0.0003109704703092575, 0.0003351643681526184, 0.0003593582659959793, 0.0003835521638393402, 0.0004077460616827011, 0.000431939959526062, 0.0004561338573694229, 0.0004803277552127838, 0.0005045216530561447, 0.0005287155508995056, 0.0005529094487428665, 0.0005771033465862274, 0.0006012972444295883, 0.0006254911422729492]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 8.0, 2.0, 7.0, 3.0, 9.0, 8.0, 11.0, 11.0, 12.0, 11.0, 19.0, 26.0, 24.0, 19.0, 38.0, 23.0, 38.0, 44.0, 39.0, 53.0, 38.0, 38.0, 37.0, 42.0, 45.0, 33.0, 45.0, 29.0, 33.0, 28.0, 24.0, 23.0, 25.0, 25.0, 13.0, 17.0, 17.0, 22.0, 17.0, 15.0, 7.0, 5.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.939453125, -3.82269287109375, -3.7059326171875, -3.58917236328125, -3.472412109375, -3.35565185546875, -3.2388916015625, -3.12213134765625, -3.00537109375, -2.88861083984375, -2.7718505859375, -2.65509033203125, -2.538330078125, -2.42156982421875, -2.3048095703125, -2.18804931640625, -2.0712890625, -1.95452880859375, -1.8377685546875, -1.72100830078125, -1.604248046875, -1.48748779296875, -1.3707275390625, -1.25396728515625, -1.13720703125, -1.02044677734375, -0.9036865234375, -0.78692626953125, -0.670166015625, -0.55340576171875, -0.4366455078125, -0.31988525390625, -0.203125, -0.08636474609375, 0.0303955078125, 0.14715576171875, 0.263916015625, 0.38067626953125, 0.4974365234375, 0.61419677734375, 0.73095703125, 0.84771728515625, 0.9644775390625, 1.08123779296875, 1.197998046875, 1.31475830078125, 1.4315185546875, 1.54827880859375, 1.6650390625, 1.78179931640625, 1.8985595703125, 2.01531982421875, 2.132080078125, 2.24884033203125, 2.3656005859375, 2.48236083984375, 2.59912109375, 2.71588134765625, 2.8326416015625, 2.94940185546875, 3.066162109375, 3.18292236328125, 3.2996826171875, 3.41644287109375, 3.533203125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 2.0, 5.0, 11.0, 12.0, 19.0, 32.0, 37.0, 62.0, 91.0, 128.0, 232.0, 442.0, 682.0, 1142.0, 1971.0, 3624.0, 7217.0, 15408.0, 35202.0, 93157.0, 350008.0, 372525.0, 97460.0, 36383.0, 16312.0, 7617.0, 3892.0, 2030.0, 1125.0, 645.0, 388.0, 228.0, 175.0, 103.0, 62.0, 50.0, 31.0, 20.0, 8.0, 9.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.61328125, -6.39300537109375, -6.1727294921875, -5.95245361328125, -5.732177734375, -5.51190185546875, -5.2916259765625, -5.07135009765625, -4.85107421875, -4.63079833984375, -4.4105224609375, -4.19024658203125, -3.969970703125, -3.74969482421875, -3.5294189453125, -3.30914306640625, -3.0888671875, -2.86859130859375, -2.6483154296875, -2.42803955078125, -2.207763671875, -1.98748779296875, -1.7672119140625, -1.54693603515625, -1.32666015625, -1.10638427734375, -0.8861083984375, -0.66583251953125, -0.445556640625, -0.22528076171875, -0.0050048828125, 0.21527099609375, 0.435546875, 0.65582275390625, 0.8760986328125, 1.09637451171875, 1.316650390625, 1.53692626953125, 1.7572021484375, 1.97747802734375, 2.19775390625, 2.41802978515625, 2.6383056640625, 2.85858154296875, 3.078857421875, 3.29913330078125, 3.5194091796875, 3.73968505859375, 3.9599609375, 4.18023681640625, 4.4005126953125, 4.62078857421875, 4.841064453125, 5.06134033203125, 5.2816162109375, 5.50189208984375, 5.72216796875, 5.94244384765625, 6.1627197265625, 6.38299560546875, 6.603271484375, 6.82354736328125, 7.0438232421875, 7.26409912109375, 7.484375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 8.0, 4.0, 12.0, 10.0, 9.0, 8.0, 16.0, 11.0, 22.0, 18.0, 34.0, 37.0, 30.0, 36.0, 42.0, 43.0, 58.0, 55.0, 113.0, 191.0, 1405.0, 262.0, 126.0, 78.0, 66.0, 54.0, 38.0, 27.0, 46.0, 24.0, 28.0, 29.0, 21.0, 17.0, 13.0, 17.0, 10.0, 9.0, 5.0, 3.0, 5.0, 2.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.5703125, -12.1861572265625, -11.802001953125, -11.4178466796875, -11.03369140625, -10.6495361328125, -10.265380859375, -9.8812255859375, -9.4970703125, -9.1129150390625, -8.728759765625, -8.3446044921875, -7.96044921875, -7.5762939453125, -7.192138671875, -6.8079833984375, -6.423828125, -6.0396728515625, -5.655517578125, -5.2713623046875, -4.88720703125, -4.5030517578125, -4.118896484375, -3.7347412109375, -3.3505859375, -2.9664306640625, -2.582275390625, -2.1981201171875, -1.81396484375, -1.4298095703125, -1.045654296875, -0.6614990234375, -0.27734375, 0.1068115234375, 0.490966796875, 0.8751220703125, 1.25927734375, 1.6434326171875, 2.027587890625, 2.4117431640625, 2.7958984375, 3.1800537109375, 3.564208984375, 3.9483642578125, 4.33251953125, 4.7166748046875, 5.100830078125, 5.4849853515625, 5.869140625, 6.2532958984375, 6.637451171875, 7.0216064453125, 7.40576171875, 7.7899169921875, 8.174072265625, 8.5582275390625, 8.9423828125, 9.3265380859375, 9.710693359375, 10.0948486328125, 10.47900390625, 10.8631591796875, 11.247314453125, 11.6314697265625, 12.015625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 10.0, 9.0, 25.0, 22.0, 27.0, 26.0, 45.0, 44.0, 70.0, 102.0, 159.0, 357.0, 775.0, 2267.0, 8140.0, 57964.0, 1946268.0, 1076769.0, 42504.0, 6701.0, 1889.0, 690.0, 278.0, 159.0, 94.0, 65.0, 50.0, 37.0, 33.0, 23.0, 18.0, 16.0, 10.0, 10.0, 8.0, 7.0, 3.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.921875, -19.27783203125, -18.6337890625, -17.98974609375, -17.345703125, -16.70166015625, -16.0576171875, -15.41357421875, -14.76953125, -14.12548828125, -13.4814453125, -12.83740234375, -12.193359375, -11.54931640625, -10.9052734375, -10.26123046875, -9.6171875, -8.97314453125, -8.3291015625, -7.68505859375, -7.041015625, -6.39697265625, -5.7529296875, -5.10888671875, -4.46484375, -3.82080078125, -3.1767578125, -2.53271484375, -1.888671875, -1.24462890625, -0.6005859375, 0.04345703125, 0.6875, 1.33154296875, 1.9755859375, 2.61962890625, 3.263671875, 3.90771484375, 4.5517578125, 5.19580078125, 5.83984375, 6.48388671875, 7.1279296875, 7.77197265625, 8.416015625, 9.06005859375, 9.7041015625, 10.34814453125, 10.9921875, 11.63623046875, 12.2802734375, 12.92431640625, 13.568359375, 14.21240234375, 14.8564453125, 15.50048828125, 16.14453125, 16.78857421875, 17.4326171875, 18.07666015625, 18.720703125, 19.36474609375, 20.0087890625, 20.65283203125, 21.296875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [4.0, 41.0, 190.0, 412.0, 294.0, 71.0, 8.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.550666809082031, -8.441230773925781, -5.331793785095215, -2.2223567962646484, 0.8870792388916016, 3.9965152740478516, 7.105953216552734, 10.215389251708984, 13.324825286865234, 16.434261322021484, 19.543697357177734, 22.653135299682617, 25.762571334838867, 28.872007369995117, 31.9814453125, 35.09088134765625, 38.2003173828125, 41.30975341796875, 44.419189453125, 47.52862548828125, 50.6380615234375, 53.74749755859375, 56.856937408447266, 59.966373443603516, 63.075809478759766, 66.18524932861328, 69.29468536376953, 72.40412139892578, 75.51355743408203, 78.62299346923828, 81.73242950439453, 84.84186553955078, 87.9512939453125, 91.06072998046875, 94.170166015625, 97.27960205078125, 100.3890380859375, 103.49847412109375, 106.60791015625, 109.71734619140625, 112.8267822265625, 115.93621826171875, 119.045654296875, 122.15509033203125, 125.2645263671875, 128.37396240234375, 131.4833984375, 134.59283447265625, 137.7022705078125, 140.81170654296875, 143.921142578125, 147.03057861328125, 150.1400146484375, 153.24945068359375, 156.35888671875, 159.46832275390625, 162.57777404785156, 165.6872100830078, 168.79664611816406, 171.9060821533203, 175.01551818847656, 178.1249542236328, 181.23439025878906, 184.3438262939453, 187.45326232910156]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 4.0, 8.0, 4.0, 4.0, 15.0, 12.0, 17.0, 12.0, 16.0, 16.0, 20.0, 27.0, 30.0, 31.0, 28.0, 25.0, 50.0, 46.0, 41.0, 40.0, 46.0, 48.0, 41.0, 38.0, 45.0, 33.0, 38.0, 35.0, 22.0, 23.0, 25.0, 30.0, 18.0, 22.0, 10.0, 19.0, 13.0, 15.0, 11.0, 6.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.978919982910156, -37.775390625, -36.571861267089844, -35.36833572387695, -34.1648063659668, -32.96127700805664, -31.757749557495117, -30.554222106933594, -29.350692749023438, -28.14716339111328, -26.943635940551758, -25.740108489990234, -24.536579132080078, -23.333049774169922, -22.1295223236084, -20.925994873046875, -19.72246551513672, -18.518936157226562, -17.31540870666504, -16.111881256103516, -14.90835189819336, -13.70482349395752, -12.50129508972168, -11.29776668548584, -10.09423828125, -8.89070987701416, -7.68718147277832, -6.4836530685424805, -5.280124664306641, -4.076596260070801, -2.873067855834961, -1.669539451599121, -0.4660148620605469, 0.737513542175293, 1.9410419464111328, 3.1445703506469727, 4.3480987548828125, 5.551627159118652, 6.755155563354492, 7.958683967590332, 9.162212371826172, 10.365740776062012, 11.569269180297852, 12.772797584533691, 13.976325988769531, 15.179854393005371, 16.38338279724121, 17.586910247802734, 18.79043960571289, 19.993968963623047, 21.19749641418457, 22.401023864746094, 23.60455322265625, 24.808082580566406, 26.01161003112793, 27.215137481689453, 28.41866683959961, 29.622196197509766, 30.82572364807129, 32.02925109863281, 33.23278045654297, 34.436309814453125, 35.63983917236328, 36.84336471557617, 38.04689407348633]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 2.0, 4.0, 8.0, 7.0, 8.0, 9.0, 5.0, 10.0, 15.0, 25.0, 15.0, 15.0, 26.0, 32.0, 33.0, 33.0, 34.0, 30.0, 45.0, 45.0, 55.0, 41.0, 39.0, 50.0, 24.0, 48.0, 36.0, 22.0, 20.0, 32.0, 24.0, 30.0, 25.0, 18.0, 16.0, 22.0, 23.0, 16.0, 11.0, 8.0, 13.0, 5.0, 5.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.3359375, -4.212860107421875, -4.08978271484375, -3.966705322265625, -3.8436279296875, -3.720550537109375, -3.59747314453125, -3.474395751953125, -3.351318359375, -3.228240966796875, -3.10516357421875, -2.982086181640625, -2.8590087890625, -2.735931396484375, -2.61285400390625, -2.489776611328125, -2.36669921875, -2.243621826171875, -2.12054443359375, -1.997467041015625, -1.8743896484375, -1.751312255859375, -1.62823486328125, -1.505157470703125, -1.382080078125, -1.259002685546875, -1.13592529296875, -1.012847900390625, -0.8897705078125, -0.766693115234375, -0.64361572265625, -0.520538330078125, -0.3974609375, -0.274383544921875, -0.15130615234375, -0.028228759765625, 0.0948486328125, 0.217926025390625, 0.34100341796875, 0.464080810546875, 0.587158203125, 0.710235595703125, 0.83331298828125, 0.956390380859375, 1.0794677734375, 1.202545166015625, 1.32562255859375, 1.448699951171875, 1.57177734375, 1.694854736328125, 1.81793212890625, 1.941009521484375, 2.0640869140625, 2.187164306640625, 2.31024169921875, 2.433319091796875, 2.556396484375, 2.679473876953125, 2.80255126953125, 2.925628662109375, 3.0487060546875, 3.171783447265625, 3.29486083984375, 3.417938232421875, 3.541015625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 3.0, 7.0, 11.0, 13.0, 11.0, 26.0, 29.0, 30.0, 61.0, 76.0, 139.0, 227.0, 503.0, 1390.0, 4773.0, 28063.0, 527902.0, 3220112.0, 381677.0, 22859.0, 4111.0, 1179.0, 440.0, 222.0, 129.0, 93.0, 46.0, 40.0, 31.0, 20.0, 19.0, 7.0, 12.0, 6.0, 3.0, 3.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7109375, -12.26416015625, -11.8173828125, -11.37060546875, -10.923828125, -10.47705078125, -10.0302734375, -9.58349609375, -9.13671875, -8.68994140625, -8.2431640625, -7.79638671875, -7.349609375, -6.90283203125, -6.4560546875, -6.00927734375, -5.5625, -5.11572265625, -4.6689453125, -4.22216796875, -3.775390625, -3.32861328125, -2.8818359375, -2.43505859375, -1.98828125, -1.54150390625, -1.0947265625, -0.64794921875, -0.201171875, 0.24560546875, 0.6923828125, 1.13916015625, 1.5859375, 2.03271484375, 2.4794921875, 2.92626953125, 3.373046875, 3.81982421875, 4.2666015625, 4.71337890625, 5.16015625, 5.60693359375, 6.0537109375, 6.50048828125, 6.947265625, 7.39404296875, 7.8408203125, 8.28759765625, 8.734375, 9.18115234375, 9.6279296875, 10.07470703125, 10.521484375, 10.96826171875, 11.4150390625, 11.86181640625, 12.30859375, 12.75537109375, 13.2021484375, 13.64892578125, 14.095703125, 14.54248046875, 14.9892578125, 15.43603515625, 15.8828125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 11.0, 12.0, 20.0, 32.0, 42.0, 30.0, 71.0, 113.0, 174.0, 243.0, 352.0, 535.0, 668.0, 515.0, 403.0, 248.0, 180.0, 130.0, 90.0, 62.0, 44.0, 25.0, 31.0, 12.0, 5.0, 4.0, 4.0, 1.0, 5.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.515625, -10.2432861328125, -9.970947265625, -9.6986083984375, -9.42626953125, -9.1539306640625, -8.881591796875, -8.6092529296875, -8.3369140625, -8.0645751953125, -7.792236328125, -7.5198974609375, -7.24755859375, -6.9752197265625, -6.702880859375, -6.4305419921875, -6.158203125, -5.8858642578125, -5.613525390625, -5.3411865234375, -5.06884765625, -4.7965087890625, -4.524169921875, -4.2518310546875, -3.9794921875, -3.7071533203125, -3.434814453125, -3.1624755859375, -2.89013671875, -2.6177978515625, -2.345458984375, -2.0731201171875, -1.80078125, -1.5284423828125, -1.256103515625, -0.9837646484375, -0.71142578125, -0.4390869140625, -0.166748046875, 0.1055908203125, 0.3779296875, 0.6502685546875, 0.922607421875, 1.1949462890625, 1.46728515625, 1.7396240234375, 2.011962890625, 2.2843017578125, 2.556640625, 2.8289794921875, 3.101318359375, 3.3736572265625, 3.64599609375, 3.9183349609375, 4.190673828125, 4.4630126953125, 4.7353515625, 5.0076904296875, 5.280029296875, 5.5523681640625, 5.82470703125, 6.0970458984375, 6.369384765625, 6.6417236328125, 6.9140625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 7.0, 2.0, 7.0, 16.0, 33.0, 34.0, 59.0, 97.0, 143.0, 260.0, 524.0, 1540.0, 15132.0, 3219881.0, 947011.0, 7383.0, 1176.0, 435.0, 211.0, 112.0, 64.0, 45.0, 43.0, 20.0, 15.0, 10.0, 5.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.734375, -28.585693359375, -27.43701171875, -26.288330078125, -25.1396484375, -23.990966796875, -22.84228515625, -21.693603515625, -20.544921875, -19.396240234375, -18.24755859375, -17.098876953125, -15.9501953125, -14.801513671875, -13.65283203125, -12.504150390625, -11.35546875, -10.206787109375, -9.05810546875, -7.909423828125, -6.7607421875, -5.612060546875, -4.46337890625, -3.314697265625, -2.166015625, -1.017333984375, 0.13134765625, 1.280029296875, 2.4287109375, 3.577392578125, 4.72607421875, 5.874755859375, 7.0234375, 8.172119140625, 9.32080078125, 10.469482421875, 11.6181640625, 12.766845703125, 13.91552734375, 15.064208984375, 16.212890625, 17.361572265625, 18.51025390625, 19.658935546875, 20.8076171875, 21.956298828125, 23.10498046875, 24.253662109375, 25.40234375, 26.551025390625, 27.69970703125, 28.848388671875, 29.9970703125, 31.145751953125, 32.29443359375, 33.443115234375, 34.591796875, 35.740478515625, 36.88916015625, 38.037841796875, 39.1865234375, 40.335205078125, 41.48388671875, 42.632568359375, 43.78125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 14.0, 65.0, 224.0, 365.0, 250.0, 84.0, 11.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.75772476196289, -38.14714431762695, -34.53656005859375, -30.925979614257812, -27.315399169921875, -23.704818725585938, -20.094236373901367, -16.483654022216797, -12.87307357788086, -9.262492179870605, -5.651910781860352, -2.0413293838500977, 1.5692520141601562, 5.179832458496094, 8.790414810180664, 12.400997161865234, 16.011577606201172, 19.62215805053711, 23.23274040222168, 26.84332275390625, 30.453903198242188, 34.064483642578125, 37.67506408691406, 41.285648345947266, 44.8962287902832, 48.50680923461914, 52.117393493652344, 55.72797393798828, 59.33855438232422, 62.949134826660156, 66.5597152709961, 70.17030334472656, 73.7808837890625, 77.39146423339844, 81.00204467773438, 84.61262512207031, 88.22320556640625, 91.83378601074219, 95.44437408447266, 99.0549545288086, 102.66553497314453, 106.27611541748047, 109.8866958618164, 113.49727630615234, 117.10786437988281, 120.71844482421875, 124.32902526855469, 127.93960571289062, 131.55018615722656, 135.1607666015625, 138.77134704589844, 142.38192749023438, 145.9925079345703, 149.60308837890625, 153.2136688232422, 156.82424926757812, 160.43484497070312, 164.04542541503906, 167.656005859375, 171.26658630371094, 174.87716674804688, 178.4877471923828, 182.09832763671875, 185.70892333984375, 189.31948852539062]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 7.0, 6.0, 8.0, 10.0, 14.0, 12.0, 18.0, 12.0, 16.0, 24.0, 34.0, 30.0, 21.0, 35.0, 37.0, 31.0, 42.0, 47.0, 46.0, 43.0, 35.0, 35.0, 36.0, 42.0, 34.0, 32.0, 35.0, 27.0, 38.0, 33.0, 23.0, 23.0, 8.0, 17.0, 23.0, 10.0, 10.0, 14.0, 9.0, 2.0, 5.0, 3.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.64120101928711, -23.8935489654541, -23.145896911621094, -22.39824676513672, -21.65059471130371, -20.902942657470703, -20.155290603637695, -19.407638549804688, -18.659988403320312, -17.912336349487305, -17.164684295654297, -16.417034149169922, -15.669382095336914, -14.921730041503906, -14.174077987670898, -13.426426887512207, -12.6787748336792, -11.931122779846191, -11.1834716796875, -10.435819625854492, -9.6881685256958, -8.940516471862793, -8.192865371704102, -7.445213317871094, -6.697561740875244, -5.9499101638793945, -5.202258586883545, -4.454607009887695, -3.7069551944732666, -2.959303617477417, -2.2116518020629883, -1.4640002250671387, -0.7163486480712891, 0.03130298852920532, 0.7789546251296997, 1.5266063213348389, 2.2742578983306885, 3.021909475326538, 3.769561290740967, 4.517212867736816, 5.264864444732666, 6.012516021728516, 6.760167598724365, 7.507819175720215, 8.255471229553223, 9.003122329711914, 9.750774383544922, 10.49842643737793, 11.246077537536621, 11.993729591369629, 12.74138069152832, 13.489032745361328, 14.23668384552002, 14.984335899353027, 15.731986999511719, 16.479639053344727, 17.227291107177734, 17.974943161010742, 18.72259521484375, 19.470245361328125, 20.217897415161133, 20.96554946899414, 21.71320152282715, 22.460853576660156, 23.20850372314453]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 8.0, 8.0, 2.0, 8.0, 15.0, 19.0, 19.0, 18.0, 28.0, 28.0, 28.0, 31.0, 39.0, 46.0, 48.0, 31.0, 45.0, 42.0, 46.0, 45.0, 38.0, 42.0, 33.0, 35.0, 32.0, 33.0, 36.0, 27.0, 22.0, 15.0, 23.0, 13.0, 20.0, 19.0, 6.0, 13.0, 7.0, 4.0, 5.0, 2.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.44921875, -4.320526123046875, -4.19183349609375, -4.063140869140625, -3.9344482421875, -3.805755615234375, -3.67706298828125, -3.548370361328125, -3.419677734375, -3.290985107421875, -3.16229248046875, -3.033599853515625, -2.9049072265625, -2.776214599609375, -2.64752197265625, -2.518829345703125, -2.39013671875, -2.261444091796875, -2.13275146484375, -2.004058837890625, -1.8753662109375, -1.746673583984375, -1.61798095703125, -1.489288330078125, -1.360595703125, -1.231903076171875, -1.10321044921875, -0.974517822265625, -0.8458251953125, -0.717132568359375, -0.58843994140625, -0.459747314453125, -0.3310546875, -0.202362060546875, -0.07366943359375, 0.055023193359375, 0.1837158203125, 0.312408447265625, 0.44110107421875, 0.569793701171875, 0.698486328125, 0.827178955078125, 0.95587158203125, 1.084564208984375, 1.2132568359375, 1.341949462890625, 1.47064208984375, 1.599334716796875, 1.72802734375, 1.856719970703125, 1.98541259765625, 2.114105224609375, 2.2427978515625, 2.371490478515625, 2.50018310546875, 2.628875732421875, 2.757568359375, 2.886260986328125, 3.01495361328125, 3.143646240234375, 3.2723388671875, 3.401031494140625, 3.52972412109375, 3.658416748046875, 3.787109375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 10.0, 14.0, 10.0, 16.0, 28.0, 45.0, 59.0, 110.0, 117.0, 210.0, 298.0, 475.0, 714.0, 1012.0, 1613.0, 2412.0, 3592.0, 5607.0, 8718.0, 13382.0, 20489.0, 33493.0, 56108.0, 101231.0, 208453.0, 277830.0, 131057.0, 70448.0, 40382.0, 25410.0, 15671.0, 10186.0, 6549.0, 4367.0, 2937.0, 1857.0, 1234.0, 783.0, 525.0, 362.0, 239.0, 170.0, 116.0, 71.0, 41.0, 40.0, 22.0, 18.0, 11.0, 6.0, 3.0, 5.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.1827392578125, -0.17723464965820312, -0.17173004150390625, -0.16622543334960938, -0.1607208251953125, -0.15521621704101562, -0.14971160888671875, -0.14420700073242188, -0.138702392578125, -0.13319778442382812, -0.12769317626953125, -0.12218856811523438, -0.1166839599609375, -0.11117935180664062, -0.10567474365234375, -0.10017013549804688, -0.09466552734375, -0.08916091918945312, -0.08365631103515625, -0.07815170288085938, -0.0726470947265625, -0.06714248657226562, -0.06163787841796875, -0.056133270263671875, -0.050628662109375, -0.045124053955078125, -0.03961944580078125, -0.034114837646484375, -0.0286102294921875, -0.023105621337890625, -0.01760101318359375, -0.012096405029296875, -0.006591796875, -0.001087188720703125, 0.00441741943359375, 0.009922027587890625, 0.0154266357421875, 0.020931243896484375, 0.02643585205078125, 0.031940460205078125, 0.037445068359375, 0.042949676513671875, 0.04845428466796875, 0.053958892822265625, 0.0594635009765625, 0.06496810913085938, 0.07047271728515625, 0.07597732543945312, 0.08148193359375, 0.08698654174804688, 0.09249114990234375, 0.09799575805664062, 0.1035003662109375, 0.10900497436523438, 0.11450958251953125, 0.12001419067382812, 0.125518798828125, 0.13102340698242188, 0.13652801513671875, 0.14203262329101562, 0.1475372314453125, 0.15304183959960938, 0.15854644775390625, 0.16405105590820312, 0.1695556640625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 4.0, 4.0, 4.0, 8.0, 5.0, 8.0, 10.0, 8.0, 16.0, 18.0, 16.0, 12.0, 22.0, 22.0, 25.0, 29.0, 36.0, 45.0, 26.0, 39.0, 48.0, 43.0, 27.0, 30.0, 1062.0, 34.0, 42.0, 38.0, 34.0, 34.0, 42.0, 30.0, 33.0, 29.0, 20.0, 24.0, 23.0, 13.0, 13.0, 8.0, 13.0, 12.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.587890625, -3.4722900390625, -3.356689453125, -3.2410888671875, -3.12548828125, -3.0098876953125, -2.894287109375, -2.7786865234375, -2.6630859375, -2.5474853515625, -2.431884765625, -2.3162841796875, -2.20068359375, -2.0850830078125, -1.969482421875, -1.8538818359375, -1.73828125, -1.6226806640625, -1.507080078125, -1.3914794921875, -1.27587890625, -1.1602783203125, -1.044677734375, -0.9290771484375, -0.8134765625, -0.6978759765625, -0.582275390625, -0.4666748046875, -0.35107421875, -0.2354736328125, -0.119873046875, -0.0042724609375, 0.111328125, 0.2269287109375, 0.342529296875, 0.4581298828125, 0.57373046875, 0.6893310546875, 0.804931640625, 0.9205322265625, 1.0361328125, 1.1517333984375, 1.267333984375, 1.3829345703125, 1.49853515625, 1.6141357421875, 1.729736328125, 1.8453369140625, 1.9609375, 2.0765380859375, 2.192138671875, 2.3077392578125, 2.42333984375, 2.5389404296875, 2.654541015625, 2.7701416015625, 2.8857421875, 3.0013427734375, 3.116943359375, 3.2325439453125, 3.34814453125, 3.4637451171875, 3.579345703125, 3.6949462890625, 3.810546875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 6.0, 9.0, 10.0, 11.0, 10.0, 18.0, 31.0, 63.0, 79.0, 100.0, 141.0, 217.0, 283.0, 394.0, 632.0, 851.0, 1354.0, 1786.0, 2623.0, 3815.0, 5628.0, 8140.0, 11710.0, 17467.0, 26299.0, 40533.0, 64305.0, 111075.0, 248333.0, 1223109.0, 123900.0, 71448.0, 44280.0, 28608.0, 18970.0, 12884.0, 8700.0, 5894.0, 4047.0, 2885.0, 1987.0, 1372.0, 969.0, 659.0, 465.0, 321.0, 221.0, 162.0, 94.0, 78.0, 56.0, 33.0, 26.0, 20.0, 9.0, 5.0, 7.0, 6.0, 5.0, 4.0], "bins": [-0.06500244140625, -0.06303834915161133, -0.061074256896972656, -0.059110164642333984, -0.05714607238769531, -0.05518198013305664, -0.05321788787841797, -0.0512537956237793, -0.049289703369140625, -0.04732561111450195, -0.04536151885986328, -0.04339742660522461, -0.04143333435058594, -0.039469242095947266, -0.037505149841308594, -0.03554105758666992, -0.03357696533203125, -0.03161287307739258, -0.029648780822753906, -0.027684688568115234, -0.025720596313476562, -0.02375650405883789, -0.02179241180419922, -0.019828319549560547, -0.017864227294921875, -0.015900135040283203, -0.013936042785644531, -0.01197195053100586, -0.010007858276367188, -0.008043766021728516, -0.006079673767089844, -0.004115581512451172, -0.0021514892578125, -0.00018739700317382812, 0.0017766952514648438, 0.0037407875061035156, 0.0057048797607421875, 0.007668972015380859, 0.009633064270019531, 0.011597156524658203, 0.013561248779296875, 0.015525341033935547, 0.01748943328857422, 0.01945352554321289, 0.021417617797851562, 0.023381710052490234, 0.025345802307128906, 0.027309894561767578, 0.02927398681640625, 0.031238079071044922, 0.033202171325683594, 0.035166263580322266, 0.03713035583496094, 0.03909444808959961, 0.04105854034423828, 0.04302263259887695, 0.044986724853515625, 0.0469508171081543, 0.04891490936279297, 0.05087900161743164, 0.05284309387207031, 0.054807186126708984, 0.056771278381347656, 0.05873537063598633, 0.060699462890625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 7.0, 4.0, 4.0, 4.0, 5.0, 6.0, 15.0, 9.0, 8.0, 17.0, 17.0, 21.0, 38.0, 52.0, 66.0, 88.0, 127.0, 124.0, 85.0, 70.0, 44.0, 40.0, 25.0, 19.0, 15.0, 16.0, 12.0, 13.0, 10.0, 6.0, 5.0, 7.0, 7.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.00091552734375, -0.0008915364742279053, -0.0008675456047058105, -0.0008435547351837158, -0.0008195638656616211, -0.0007955729961395264, -0.0007715821266174316, -0.0007475912570953369, -0.0007236003875732422, -0.0006996095180511475, -0.0006756186485290527, -0.000651627779006958, -0.0006276369094848633, -0.0006036460399627686, -0.0005796551704406738, -0.0005556643009185791, -0.0005316734313964844, -0.0005076825618743896, -0.0004836916923522949, -0.0004597008228302002, -0.00043570995330810547, -0.00041171908378601074, -0.000387728214263916, -0.0003637373447418213, -0.00033974647521972656, -0.00031575560569763184, -0.0002917647361755371, -0.0002677738666534424, -0.00024378299713134766, -0.00021979212760925293, -0.0001958012580871582, -0.00017181038856506348, -0.00014781951904296875, -0.00012382864952087402, -9.98377799987793e-05, -7.584691047668457e-05, -5.1856040954589844e-05, -2.7865171432495117e-05, -3.874301910400391e-06, 2.0116567611694336e-05, 4.410743713378906e-05, 6.809830665588379e-05, 9.208917617797852e-05, 0.00011608004570007324, 0.00014007091522216797, 0.0001640617847442627, 0.00018805265426635742, 0.00021204352378845215, 0.00023603439331054688, 0.0002600252628326416, 0.00028401613235473633, 0.00030800700187683105, 0.0003319978713989258, 0.0003559887409210205, 0.00037997961044311523, 0.00040397047996520996, 0.0004279613494873047, 0.0004519522190093994, 0.00047594308853149414, 0.0004999339580535889, 0.0005239248275756836, 0.0005479156970977783, 0.000571906566619873, 0.0005958974361419678, 0.0006198883056640625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 8.0, 5.0, 6.0, 5.0, 12.0, 12.0, 14.0, 16.0, 15.0, 22.0, 36.0, 61.0, 69.0, 197.0, 943.0, 931711.0, 114467.0, 512.0, 157.0, 85.0, 49.0, 37.0, 20.0, 15.0, 7.0, 12.0, 11.0, 8.0, 7.0, 3.0, 4.0, 5.0, 8.0, 1.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015228271484375, -0.014639616012573242, -0.014050960540771484, -0.013462305068969727, -0.012873649597167969, -0.012284994125366211, -0.011696338653564453, -0.011107683181762695, -0.010519027709960938, -0.00993037223815918, -0.009341716766357422, -0.008753061294555664, -0.008164405822753906, -0.0075757503509521484, -0.006987094879150391, -0.006398439407348633, -0.005809783935546875, -0.005221128463745117, -0.004632472991943359, -0.0040438175201416016, -0.0034551620483398438, -0.002866506576538086, -0.002277851104736328, -0.0016891956329345703, -0.0011005401611328125, -0.0005118846893310547, 7.677078247070312e-05, 0.0006654262542724609, 0.0012540817260742188, 0.0018427371978759766, 0.0024313926696777344, 0.003020048141479492, 0.00360870361328125, 0.004197359085083008, 0.004786014556884766, 0.0053746700286865234, 0.005963325500488281, 0.006551980972290039, 0.007140636444091797, 0.007729291915893555, 0.008317947387695312, 0.00890660285949707, 0.009495258331298828, 0.010083913803100586, 0.010672569274902344, 0.011261224746704102, 0.01184988021850586, 0.012438535690307617, 0.013027191162109375, 0.013615846633911133, 0.01420450210571289, 0.014793157577514648, 0.015381813049316406, 0.015970468521118164, 0.016559123992919922, 0.01714777946472168, 0.017736434936523438, 0.018325090408325195, 0.018913745880126953, 0.01950240135192871, 0.02009105682373047, 0.020679712295532227, 0.021268367767333984, 0.021857023239135742, 0.0224456787109375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 72.0, 884.0, 61.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002409297041594982, -0.0022169805597513914, -0.002024663845077157, -0.0018323473632335663, -0.001640030648559332, -0.0014477141667157412, -0.0012553975684568286, -0.001063080970197916, -0.0008707643719390035, -0.0006784477736800909, -0.0004861312045250088, -0.0002938146353699267, -0.00010149803711101413, 9.081856114789844e-05, 0.0002831351011991501, 0.00047545169945806265, 0.0006677682977169752, 0.0008600848959758878, 0.0010524014942348003, 0.001244717976078391, 0.0014370346907526255, 0.0016293511725962162, 0.0018216677708551288, 0.0020139843691140413, 0.002206300850957632, 0.002398617332801223, 0.002590934047475457, 0.002783250529319048, 0.0029755672439932823, 0.003167883725836873, 0.003360200207680464, 0.003552516922354698, 0.0037448336370289326, 0.003937150351703167, 0.004129466600716114, 0.0043217833153903484, 0.004514100030064583, 0.004706416744738817, 0.004898732993751764, 0.005091049708425999, 0.005283366423100233, 0.0054756831377744675, 0.0056679993867874146, 0.005860316101461649, 0.006052632816135883, 0.006244949530810118, 0.006437265779823065, 0.006629582494497299, 0.006821898743510246, 0.007014215458184481, 0.007206531707197428, 0.007398848421871662, 0.0075911651365458965, 0.007783481851220131, 0.007975798100233078, 0.008168114349246025, 0.008360431529581547, 0.008552747778594494, 0.008745064958930016, 0.008937381207942963, 0.00912969745695591, 0.009322014637291431, 0.009514330886304379, 0.0097066480666399, 0.009898964315652847]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 3.0, 6.0, 3.0, 8.0, 10.0, 10.0, 19.0, 15.0, 16.0, 23.0, 25.0, 25.0, 24.0, 32.0, 39.0, 39.0, 38.0, 38.0, 42.0, 45.0, 51.0, 46.0, 40.0, 39.0, 43.0, 37.0, 36.0, 35.0, 27.0, 35.0, 21.0, 23.0, 12.0, 10.0, 19.0, 15.0, 14.0, 10.0, 5.0, 9.0, 2.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0004904270172119141, -0.0004765978083014488, -0.0004627685993909836, -0.00044893939048051834, -0.0004351101815700531, -0.00042128097265958786, -0.0004074517637491226, -0.0003936225548386574, -0.00037979334592819214, -0.0003659641370177269, -0.00035213492810726166, -0.0003383057191967964, -0.0003244765102863312, -0.00031064730137586594, -0.0002968180924654007, -0.00028298888355493546, -0.0002691596746444702, -0.000255330465734005, -0.00024150125682353973, -0.0002276720479130745, -0.00021384283900260925, -0.000200013630092144, -0.00018618442118167877, -0.00017235521227121353, -0.0001585260033607483, -0.00014469679445028305, -0.0001308675855398178, -0.00011703837662935257, -0.00010320916771888733, -8.937995880842209e-05, -7.555074989795685e-05, -6.172154098749161e-05, -4.789233207702637e-05, -3.406312316656113e-05, -2.0233914256095886e-05, -6.404705345630646e-06, 7.424503564834595e-06, 2.1253712475299835e-05, 3.5082921385765076e-05, 4.8912130296230316e-05, 6.274133920669556e-05, 7.65705481171608e-05, 9.039975702762604e-05, 0.00010422896593809128, 0.00011805817484855652, 0.00013188738375902176, 0.000145716592669487, 0.00015954580157995224, 0.00017337501049041748, 0.00018720421940088272, 0.00020103342831134796, 0.0002148626372218132, 0.00022869184613227844, 0.00024252105504274368, 0.0002563502639532089, 0.00027017947286367416, 0.0002840086817741394, 0.00029783789068460464, 0.0003116670995950699, 0.0003254963085055351, 0.00033932551741600037, 0.0003531547263264656, 0.00036698393523693085, 0.0003808131441473961, 0.00039464235305786133]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 8.0, 8.0, 2.0, 8.0, 15.0, 19.0, 19.0, 18.0, 28.0, 28.0, 28.0, 31.0, 39.0, 46.0, 48.0, 31.0, 45.0, 42.0, 46.0, 45.0, 38.0, 42.0, 33.0, 35.0, 32.0, 33.0, 36.0, 27.0, 22.0, 15.0, 23.0, 13.0, 20.0, 19.0, 6.0, 13.0, 7.0, 4.0, 5.0, 2.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.44921875, -4.320526123046875, -4.19183349609375, -4.063140869140625, -3.9344482421875, -3.805755615234375, -3.67706298828125, -3.548370361328125, -3.419677734375, -3.290985107421875, -3.16229248046875, -3.033599853515625, -2.9049072265625, -2.776214599609375, -2.64752197265625, -2.518829345703125, -2.39013671875, -2.261444091796875, -2.13275146484375, -2.004058837890625, -1.8753662109375, -1.746673583984375, -1.61798095703125, -1.489288330078125, -1.360595703125, -1.231903076171875, -1.10321044921875, -0.974517822265625, -0.8458251953125, -0.717132568359375, -0.58843994140625, -0.459747314453125, -0.3310546875, -0.202362060546875, -0.07366943359375, 0.055023193359375, 0.1837158203125, 0.312408447265625, 0.44110107421875, 0.569793701171875, 0.698486328125, 0.827178955078125, 0.95587158203125, 1.084564208984375, 1.2132568359375, 1.341949462890625, 1.47064208984375, 1.599334716796875, 1.72802734375, 1.856719970703125, 1.98541259765625, 2.114105224609375, 2.2427978515625, 2.371490478515625, 2.50018310546875, 2.628875732421875, 2.757568359375, 2.886260986328125, 3.01495361328125, 3.143646240234375, 3.2723388671875, 3.401031494140625, 3.52972412109375, 3.658416748046875, 3.787109375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 10.0, 14.0, 27.0, 44.0, 57.0, 81.0, 140.0, 195.0, 290.0, 467.0, 694.0, 1078.0, 1615.0, 2686.0, 4119.0, 6863.0, 10796.0, 17771.0, 28542.0, 48818.0, 93650.0, 210939.0, 300369.0, 148193.0, 70398.0, 38848.0, 23248.0, 14204.0, 9056.0, 5638.0, 3548.0, 2202.0, 1398.0, 881.0, 536.0, 383.0, 255.0, 178.0, 114.0, 71.0, 46.0, 32.0, 21.0, 14.0, 7.0, 9.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-4.828125, -4.68310546875, -4.5380859375, -4.39306640625, -4.248046875, -4.10302734375, -3.9580078125, -3.81298828125, -3.66796875, -3.52294921875, -3.3779296875, -3.23291015625, -3.087890625, -2.94287109375, -2.7978515625, -2.65283203125, -2.5078125, -2.36279296875, -2.2177734375, -2.07275390625, -1.927734375, -1.78271484375, -1.6376953125, -1.49267578125, -1.34765625, -1.20263671875, -1.0576171875, -0.91259765625, -0.767578125, -0.62255859375, -0.4775390625, -0.33251953125, -0.1875, -0.04248046875, 0.1025390625, 0.24755859375, 0.392578125, 0.53759765625, 0.6826171875, 0.82763671875, 0.97265625, 1.11767578125, 1.2626953125, 1.40771484375, 1.552734375, 1.69775390625, 1.8427734375, 1.98779296875, 2.1328125, 2.27783203125, 2.4228515625, 2.56787109375, 2.712890625, 2.85791015625, 3.0029296875, 3.14794921875, 3.29296875, 3.43798828125, 3.5830078125, 3.72802734375, 3.873046875, 4.01806640625, 4.1630859375, 4.30810546875, 4.453125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 1.0, 7.0, 4.0, 5.0, 6.0, 9.0, 5.0, 16.0, 13.0, 12.0, 9.0, 11.0, 26.0, 23.0, 32.0, 37.0, 29.0, 44.0, 38.0, 54.0, 67.0, 81.0, 147.0, 211.0, 1346.0, 197.0, 127.0, 63.0, 75.0, 56.0, 43.0, 41.0, 37.0, 29.0, 16.0, 18.0, 25.0, 11.0, 10.0, 14.0, 14.0, 13.0, 4.0, 5.0, 8.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.5078125, -10.1380615234375, -9.768310546875, -9.3985595703125, -9.02880859375, -8.6590576171875, -8.289306640625, -7.9195556640625, -7.5498046875, -7.1800537109375, -6.810302734375, -6.4405517578125, -6.07080078125, -5.7010498046875, -5.331298828125, -4.9615478515625, -4.591796875, -4.2220458984375, -3.852294921875, -3.4825439453125, -3.11279296875, -2.7430419921875, -2.373291015625, -2.0035400390625, -1.6337890625, -1.2640380859375, -0.894287109375, -0.5245361328125, -0.15478515625, 0.2149658203125, 0.584716796875, 0.9544677734375, 1.32421875, 1.6939697265625, 2.063720703125, 2.4334716796875, 2.80322265625, 3.1729736328125, 3.542724609375, 3.9124755859375, 4.2822265625, 4.6519775390625, 5.021728515625, 5.3914794921875, 5.76123046875, 6.1309814453125, 6.500732421875, 6.8704833984375, 7.240234375, 7.6099853515625, 7.979736328125, 8.3494873046875, 8.71923828125, 9.0889892578125, 9.458740234375, 9.8284912109375, 10.1982421875, 10.5679931640625, 10.937744140625, 11.3074951171875, 11.67724609375, 12.0469970703125, 12.416748046875, 12.7864990234375, 13.15625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 0.0, 5.0, 3.0, 4.0, 11.0, 5.0, 12.0, 7.0, 18.0, 15.0, 20.0, 33.0, 42.0, 51.0, 57.0, 93.0, 110.0, 186.0, 330.0, 644.0, 1719.0, 6042.0, 26518.0, 153274.0, 1776731.0, 1049072.0, 103653.0, 19510.0, 4646.0, 1391.0, 536.0, 274.0, 165.0, 143.0, 98.0, 67.0, 51.0, 29.0, 28.0, 23.0, 18.0, 13.0, 11.0, 11.0, 15.0, 6.0, 8.0, 5.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-13.546875, -13.15869140625, -12.7705078125, -12.38232421875, -11.994140625, -11.60595703125, -11.2177734375, -10.82958984375, -10.44140625, -10.05322265625, -9.6650390625, -9.27685546875, -8.888671875, -8.50048828125, -8.1123046875, -7.72412109375, -7.3359375, -6.94775390625, -6.5595703125, -6.17138671875, -5.783203125, -5.39501953125, -5.0068359375, -4.61865234375, -4.23046875, -3.84228515625, -3.4541015625, -3.06591796875, -2.677734375, -2.28955078125, -1.9013671875, -1.51318359375, -1.125, -0.73681640625, -0.3486328125, 0.03955078125, 0.427734375, 0.81591796875, 1.2041015625, 1.59228515625, 1.98046875, 2.36865234375, 2.7568359375, 3.14501953125, 3.533203125, 3.92138671875, 4.3095703125, 4.69775390625, 5.0859375, 5.47412109375, 5.8623046875, 6.25048828125, 6.638671875, 7.02685546875, 7.4150390625, 7.80322265625, 8.19140625, 8.57958984375, 8.9677734375, 9.35595703125, 9.744140625, 10.13232421875, 10.5205078125, 10.90869140625, 11.296875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 10.0, 14.0, 34.0, 35.0, 58.0, 86.0, 103.0, 124.0, 113.0, 120.0, 93.0, 77.0, 58.0, 30.0, 23.0, 9.0, 7.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.431642532348633, -19.52145767211914, -18.61127471923828, -17.70108985900879, -16.79090690612793, -15.880722045898438, -14.970538139343262, -14.060354232788086, -13.15017032623291, -12.239986419677734, -11.329802513122559, -10.419618606567383, -9.50943374633789, -8.599250793457031, -7.689065933227539, -6.778882026672363, -5.8686981201171875, -4.958514213562012, -4.048330307006836, -3.138145923614502, -2.227962017059326, -1.3177781105041504, -0.4075937271118164, 0.5025901794433594, 1.4127740859985352, 2.322957992553711, 3.233142137527466, 4.143326282501221, 5.0535101890563965, 5.963694095611572, 6.873878479003906, 7.784062385559082, 8.694244384765625, 9.6044282913208, 10.514612197875977, 11.424797058105469, 12.334980010986328, 13.24516487121582, 14.155348777770996, 15.065532684326172, 15.975716590881348, 16.885900497436523, 17.796085357666016, 18.706268310546875, 19.616453170776367, 20.526636123657227, 21.43682098388672, 22.347003936767578, 23.25718879699707, 24.167373657226562, 25.077556610107422, 25.987741470336914, 26.897924423217773, 27.808109283447266, 28.718292236328125, 29.628477096557617, 30.53866195678711, 31.4488468170166, 32.359031677246094, 33.26921463012695, 34.17939758300781, 35.08958053588867, 35.9997673034668, 36.909950256347656, 37.820133209228516]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 4.0, 4.0, 9.0, 9.0, 11.0, 11.0, 15.0, 17.0, 23.0, 23.0, 26.0, 23.0, 31.0, 31.0, 46.0, 45.0, 34.0, 37.0, 51.0, 51.0, 52.0, 44.0, 33.0, 43.0, 34.0, 43.0, 44.0, 25.0, 19.0, 30.0, 15.0, 27.0, 13.0, 16.0, 12.0, 14.0, 9.0, 2.0, 11.0, 6.0, 1.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.04414367675781, -32.93817901611328, -31.832218170166016, -30.726255416870117, -29.62029266357422, -28.51432991027832, -27.408367156982422, -26.302404403686523, -25.196441650390625, -24.090478897094727, -22.984516143798828, -21.87855339050293, -20.77259063720703, -19.666627883911133, -18.560665130615234, -17.454702377319336, -16.348739624023438, -15.242776870727539, -14.13681411743164, -13.030851364135742, -11.924888610839844, -10.818925857543945, -9.712963104248047, -8.607000350952148, -7.50103759765625, -6.395074844360352, -5.289112091064453, -4.183149337768555, -3.0771865844726562, -1.9712238311767578, -0.8652610778808594, 0.24070167541503906, 1.3466682434082031, 2.4526309967041016, 3.55859375, 4.664556503295898, 5.770519256591797, 6.876482009887695, 7.982444763183594, 9.088407516479492, 10.19437026977539, 11.300333023071289, 12.406295776367188, 13.512258529663086, 14.618221282958984, 15.724184036254883, 16.83014678955078, 17.93610954284668, 19.042072296142578, 20.148035049438477, 21.253997802734375, 22.359960556030273, 23.465923309326172, 24.57188606262207, 25.67784881591797, 26.783811569213867, 27.889774322509766, 28.995737075805664, 30.101699829101562, 31.20766258239746, 32.31362533569336, 33.419586181640625, 34.525550842285156, 35.63151550292969, 36.73747634887695]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 5.0, 6.0, 6.0, 5.0, 7.0, 16.0, 15.0, 13.0, 19.0, 19.0, 20.0, 18.0, 36.0, 46.0, 33.0, 38.0, 42.0, 42.0, 42.0, 40.0, 42.0, 38.0, 46.0, 35.0, 39.0, 35.0, 37.0, 28.0, 30.0, 22.0, 30.0, 24.0, 26.0, 13.0, 15.0, 14.0, 19.0, 7.0, 6.0, 4.0, 6.0, 5.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0], "bins": [-4.6953125, -4.564361572265625, -4.43341064453125, -4.302459716796875, -4.1715087890625, -4.040557861328125, -3.90960693359375, -3.778656005859375, -3.647705078125, -3.516754150390625, -3.38580322265625, -3.254852294921875, -3.1239013671875, -2.992950439453125, -2.86199951171875, -2.731048583984375, -2.60009765625, -2.469146728515625, -2.33819580078125, -2.207244873046875, -2.0762939453125, -1.945343017578125, -1.81439208984375, -1.683441162109375, -1.552490234375, -1.421539306640625, -1.29058837890625, -1.159637451171875, -1.0286865234375, -0.897735595703125, -0.76678466796875, -0.635833740234375, -0.5048828125, -0.373931884765625, -0.24298095703125, -0.112030029296875, 0.0189208984375, 0.149871826171875, 0.28082275390625, 0.411773681640625, 0.542724609375, 0.673675537109375, 0.80462646484375, 0.935577392578125, 1.0665283203125, 1.197479248046875, 1.32843017578125, 1.459381103515625, 1.59033203125, 1.721282958984375, 1.85223388671875, 1.983184814453125, 2.1141357421875, 2.245086669921875, 2.37603759765625, 2.506988525390625, 2.637939453125, 2.768890380859375, 2.89984130859375, 3.030792236328125, 3.1617431640625, 3.292694091796875, 3.42364501953125, 3.554595947265625, 3.685546875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 11.0, 11.0, 12.0, 14.0, 22.0, 33.0, 42.0, 65.0, 59.0, 127.0, 184.0, 289.0, 493.0, 964.0, 2076.0, 5440.0, 20010.0, 116945.0, 1016475.0, 2528107.0, 429394.0, 54856.0, 11300.0, 3715.0, 1589.0, 824.0, 445.0, 225.0, 145.0, 115.0, 78.0, 54.0, 43.0, 25.0, 14.0, 18.0, 17.0, 3.0, 7.0, 11.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0], "bins": [-10.6875, -10.384765625, -10.08203125, -9.779296875, -9.4765625, -9.173828125, -8.87109375, -8.568359375, -8.265625, -7.962890625, -7.66015625, -7.357421875, -7.0546875, -6.751953125, -6.44921875, -6.146484375, -5.84375, -5.541015625, -5.23828125, -4.935546875, -4.6328125, -4.330078125, -4.02734375, -3.724609375, -3.421875, -3.119140625, -2.81640625, -2.513671875, -2.2109375, -1.908203125, -1.60546875, -1.302734375, -1.0, -0.697265625, -0.39453125, -0.091796875, 0.2109375, 0.513671875, 0.81640625, 1.119140625, 1.421875, 1.724609375, 2.02734375, 2.330078125, 2.6328125, 2.935546875, 3.23828125, 3.541015625, 3.84375, 4.146484375, 4.44921875, 4.751953125, 5.0546875, 5.357421875, 5.66015625, 5.962890625, 6.265625, 6.568359375, 6.87109375, 7.173828125, 7.4765625, 7.779296875, 8.08203125, 8.384765625, 8.6875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 5.0, 7.0, 14.0, 24.0, 18.0, 31.0, 45.0, 72.0, 117.0, 167.0, 253.0, 381.0, 519.0, 613.0, 545.0, 395.0, 292.0, 162.0, 127.0, 76.0, 62.0, 41.0, 28.0, 25.0, 19.0, 14.0, 7.0, 5.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.953125, -8.6866455078125, -8.420166015625, -8.1536865234375, -7.88720703125, -7.6207275390625, -7.354248046875, -7.0877685546875, -6.8212890625, -6.5548095703125, -6.288330078125, -6.0218505859375, -5.75537109375, -5.4888916015625, -5.222412109375, -4.9559326171875, -4.689453125, -4.4229736328125, -4.156494140625, -3.8900146484375, -3.62353515625, -3.3570556640625, -3.090576171875, -2.8240966796875, -2.5576171875, -2.2911376953125, -2.024658203125, -1.7581787109375, -1.49169921875, -1.2252197265625, -0.958740234375, -0.6922607421875, -0.42578125, -0.1593017578125, 0.107177734375, 0.3736572265625, 0.64013671875, 0.9066162109375, 1.173095703125, 1.4395751953125, 1.7060546875, 1.9725341796875, 2.239013671875, 2.5054931640625, 2.77197265625, 3.0384521484375, 3.304931640625, 3.5714111328125, 3.837890625, 4.1043701171875, 4.370849609375, 4.6373291015625, 4.90380859375, 5.1702880859375, 5.436767578125, 5.7032470703125, 5.9697265625, 6.2362060546875, 6.502685546875, 6.7691650390625, 7.03564453125, 7.3021240234375, 7.568603515625, 7.8350830078125, 8.1015625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 6.0, 18.0, 13.0, 23.0, 41.0, 49.0, 74.0, 103.0, 228.0, 386.0, 1093.0, 7105.0, 302912.0, 3806578.0, 70754.0, 3380.0, 740.0, 345.0, 163.0, 105.0, 46.0, 30.0, 30.0, 16.0, 15.0, 9.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.265625, -28.268310546875, -27.27099609375, -26.273681640625, -25.2763671875, -24.279052734375, -23.28173828125, -22.284423828125, -21.287109375, -20.289794921875, -19.29248046875, -18.295166015625, -17.2978515625, -16.300537109375, -15.30322265625, -14.305908203125, -13.30859375, -12.311279296875, -11.31396484375, -10.316650390625, -9.3193359375, -8.322021484375, -7.32470703125, -6.327392578125, -5.330078125, -4.332763671875, -3.33544921875, -2.338134765625, -1.3408203125, -0.343505859375, 0.65380859375, 1.651123046875, 2.6484375, 3.645751953125, 4.64306640625, 5.640380859375, 6.6376953125, 7.635009765625, 8.63232421875, 9.629638671875, 10.626953125, 11.624267578125, 12.62158203125, 13.618896484375, 14.6162109375, 15.613525390625, 16.61083984375, 17.608154296875, 18.60546875, 19.602783203125, 20.60009765625, 21.597412109375, 22.5947265625, 23.592041015625, 24.58935546875, 25.586669921875, 26.583984375, 27.581298828125, 28.57861328125, 29.575927734375, 30.5732421875, 31.570556640625, 32.56787109375, 33.565185546875, 34.5625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 18.0, 63.0, 159.0, 265.0, 251.0, 158.0, 68.0, 19.0, 9.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.928932189941406, -38.51460266113281, -36.10027313232422, -33.685943603515625, -31.27161407470703, -28.857284545898438, -26.44295310974121, -24.028623580932617, -21.614294052124023, -19.19996452331543, -16.785634994506836, -14.371304512023926, -11.956974983215332, -9.542645454406738, -7.128314971923828, -4.713985443115234, -2.2996559143066406, 0.11467385292053223, 2.529003620147705, 4.943333625793457, 7.357663154602051, 9.771992683410645, 12.186323165893555, 14.600652694702148, 17.014982223510742, 19.429311752319336, 21.84364128112793, 24.257972717285156, 26.67230224609375, 29.086631774902344, 31.500961303710938, 33.91529083251953, 36.329620361328125, 38.74394989013672, 41.15827941894531, 43.572608947753906, 45.9869384765625, 48.401268005371094, 50.81559753417969, 53.22992706298828, 55.644256591796875, 58.05858612060547, 60.47291564941406, 62.887245178222656, 65.30157470703125, 67.71590423583984, 70.13023376464844, 72.54456329345703, 74.95889282226562, 77.37322235107422, 79.78755187988281, 82.2018814086914, 84.6162109375, 87.0305404663086, 89.44486999511719, 91.85919952392578, 94.2735366821289, 96.6878662109375, 99.1021957397461, 101.51652526855469, 103.93085479736328, 106.34518432617188, 108.75951385498047, 111.17384338378906, 113.58817291259766]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 7.0, 10.0, 12.0, 11.0, 15.0, 11.0, 15.0, 23.0, 25.0, 25.0, 29.0, 32.0, 30.0, 34.0, 39.0, 34.0, 28.0, 37.0, 54.0, 45.0, 41.0, 42.0, 38.0, 29.0, 40.0, 39.0, 34.0, 32.0, 36.0, 18.0, 16.0, 22.0, 18.0, 12.0, 13.0, 11.0, 12.0, 6.0, 4.0, 8.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.781631469726562, -21.092193603515625, -20.402755737304688, -19.71331787109375, -19.023880004882812, -18.334442138671875, -17.645004272460938, -16.95556640625, -16.266128540039062, -15.576690673828125, -14.887252807617188, -14.19781494140625, -13.508377075195312, -12.818939208984375, -12.129501342773438, -11.4400634765625, -10.750624656677246, -10.061186790466309, -9.371748924255371, -8.682311058044434, -7.992873191833496, -7.303435325622559, -6.613996982574463, -5.924559116363525, -5.235121250152588, -4.54568338394165, -3.856245517730713, -3.1668074131011963, -2.477369546890259, -1.7879316806793213, -1.0984935760498047, -0.4090557098388672, 0.2803821563720703, 0.9698200821876526, 1.6592580080032349, 2.348695993423462, 3.0381338596343994, 3.727571725845337, 4.4170098304748535, 5.106447696685791, 5.7958855628967285, 6.485323429107666, 7.1747612953186035, 7.864199638366699, 8.553637504577637, 9.243075370788574, 9.932513236999512, 10.62195110321045, 11.311388969421387, 12.000826835632324, 12.690264701843262, 13.3797025680542, 14.069140434265137, 14.758578300476074, 15.448017120361328, 16.137454986572266, 16.826892852783203, 17.51633071899414, 18.205768585205078, 18.895206451416016, 19.584644317626953, 20.27408218383789, 20.963520050048828, 21.652957916259766, 22.342395782470703]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 9.0, 5.0, 4.0, 6.0, 7.0, 18.0, 16.0, 14.0, 12.0, 19.0, 24.0, 28.0, 22.0, 23.0, 34.0, 32.0, 44.0, 39.0, 33.0, 32.0, 33.0, 43.0, 45.0, 51.0, 30.0, 35.0, 42.0, 36.0, 30.0, 31.0, 28.0, 21.0, 24.0, 16.0, 19.0, 15.0, 12.0, 12.0, 14.0, 10.0, 11.0, 2.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.625, -4.498931884765625, -4.37286376953125, -4.246795654296875, -4.1207275390625, -3.994659423828125, -3.86859130859375, -3.742523193359375, -3.616455078125, -3.490386962890625, -3.36431884765625, -3.238250732421875, -3.1121826171875, -2.986114501953125, -2.86004638671875, -2.733978271484375, -2.60791015625, -2.481842041015625, -2.35577392578125, -2.229705810546875, -2.1036376953125, -1.977569580078125, -1.85150146484375, -1.725433349609375, -1.599365234375, -1.473297119140625, -1.34722900390625, -1.221160888671875, -1.0950927734375, -0.969024658203125, -0.84295654296875, -0.716888427734375, -0.5908203125, -0.464752197265625, -0.33868408203125, -0.212615966796875, -0.0865478515625, 0.039520263671875, 0.16558837890625, 0.291656494140625, 0.417724609375, 0.543792724609375, 0.66986083984375, 0.795928955078125, 0.9219970703125, 1.048065185546875, 1.17413330078125, 1.300201416015625, 1.42626953125, 1.552337646484375, 1.67840576171875, 1.804473876953125, 1.9305419921875, 2.056610107421875, 2.18267822265625, 2.308746337890625, 2.434814453125, 2.560882568359375, 2.68695068359375, 2.813018798828125, 2.9390869140625, 3.065155029296875, 3.19122314453125, 3.317291259765625, 3.443359375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 11.0, 17.0, 17.0, 24.0, 38.0, 59.0, 74.0, 130.0, 193.0, 255.0, 325.0, 540.0, 682.0, 1004.0, 1456.0, 2148.0, 3097.0, 4459.0, 6469.0, 9369.0, 13539.0, 19965.0, 29504.0, 43999.0, 71187.0, 129268.0, 256506.0, 189680.0, 94398.0, 56455.0, 36180.0, 24258.0, 16640.0, 11363.0, 7739.0, 5308.0, 3713.0, 2534.0, 1792.0, 1295.0, 866.0, 611.0, 415.0, 304.0, 199.0, 134.0, 104.0, 73.0, 61.0, 46.0, 25.0, 11.0, 6.0, 8.0, 3.0, 0.0, 0.0, 6.0], "bins": [-0.1502685546875, -0.14568138122558594, -0.14109420776367188, -0.1365070343017578, -0.13191986083984375, -0.1273326873779297, -0.12274551391601562, -0.11815834045410156, -0.1135711669921875, -0.10898399353027344, -0.10439682006835938, -0.09980964660644531, -0.09522247314453125, -0.09063529968261719, -0.08604812622070312, -0.08146095275878906, -0.076873779296875, -0.07228660583496094, -0.06769943237304688, -0.06311225891113281, -0.05852508544921875, -0.05393791198730469, -0.049350738525390625, -0.04476356506347656, -0.0401763916015625, -0.03558921813964844, -0.031002044677734375, -0.026414871215820312, -0.02182769775390625, -0.017240524291992188, -0.012653350830078125, -0.008066177368164062, -0.00347900390625, 0.0011081695556640625, 0.005695343017578125, 0.010282516479492188, 0.01486968994140625, 0.019456863403320312, 0.024044036865234375, 0.028631210327148438, 0.0332183837890625, 0.03780555725097656, 0.042392730712890625, 0.04697990417480469, 0.05156707763671875, 0.05615425109863281, 0.060741424560546875, 0.06532859802246094, 0.069915771484375, 0.07450294494628906, 0.07909011840820312, 0.08367729187011719, 0.08826446533203125, 0.09285163879394531, 0.09743881225585938, 0.10202598571777344, 0.1066131591796875, 0.11120033264160156, 0.11578750610351562, 0.12037467956542969, 0.12496185302734375, 0.1295490264892578, 0.13413619995117188, 0.13872337341308594, 0.143310546875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 5.0, 5.0, 8.0, 9.0, 11.0, 15.0, 13.0, 15.0, 22.0, 24.0, 24.0, 26.0, 29.0, 21.0, 27.0, 37.0, 36.0, 46.0, 33.0, 1067.0, 52.0, 36.0, 42.0, 49.0, 45.0, 37.0, 30.0, 44.0, 30.0, 29.0, 25.0, 13.0, 16.0, 25.0, 14.0, 10.0, 7.0, 8.0, 7.0, 6.0, 10.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.787109375, -3.668365478515625, -3.54962158203125, -3.430877685546875, -3.3121337890625, -3.193389892578125, -3.07464599609375, -2.955902099609375, -2.837158203125, -2.718414306640625, -2.59967041015625, -2.480926513671875, -2.3621826171875, -2.243438720703125, -2.12469482421875, -2.005950927734375, -1.88720703125, -1.768463134765625, -1.64971923828125, -1.530975341796875, -1.4122314453125, -1.293487548828125, -1.17474365234375, -1.055999755859375, -0.937255859375, -0.818511962890625, -0.69976806640625, -0.581024169921875, -0.4622802734375, -0.343536376953125, -0.22479248046875, -0.106048583984375, 0.0126953125, 0.131439208984375, 0.25018310546875, 0.368927001953125, 0.4876708984375, 0.606414794921875, 0.72515869140625, 0.843902587890625, 0.962646484375, 1.081390380859375, 1.20013427734375, 1.318878173828125, 1.4376220703125, 1.556365966796875, 1.67510986328125, 1.793853759765625, 1.91259765625, 2.031341552734375, 2.15008544921875, 2.268829345703125, 2.3875732421875, 2.506317138671875, 2.62506103515625, 2.743804931640625, 2.862548828125, 2.981292724609375, 3.10003662109375, 3.218780517578125, 3.3375244140625, 3.456268310546875, 3.57501220703125, 3.693756103515625, 3.8125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 6.0, 5.0, 15.0, 14.0, 30.0, 35.0, 51.0, 82.0, 109.0, 147.0, 219.0, 321.0, 461.0, 659.0, 1046.0, 1497.0, 2162.0, 3214.0, 4618.0, 6749.0, 10223.0, 15669.0, 24027.0, 36993.0, 60929.0, 107170.0, 214845.0, 1285791.0, 127578.0, 71110.0, 42447.0, 26862.0, 17252.0, 11402.0, 7629.0, 5060.0, 3420.0, 2257.0, 1517.0, 1102.0, 737.0, 515.0, 371.0, 252.0, 167.0, 116.0, 81.0, 50.0, 45.0, 33.0, 18.0, 13.0, 3.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.06304931640625, -0.06102466583251953, -0.05900001525878906, -0.056975364685058594, -0.054950714111328125, -0.052926063537597656, -0.05090141296386719, -0.04887676239013672, -0.04685211181640625, -0.04482746124267578, -0.04280281066894531, -0.040778160095214844, -0.038753509521484375, -0.036728858947753906, -0.03470420837402344, -0.03267955780029297, -0.0306549072265625, -0.02863025665283203, -0.026605606079101562, -0.024580955505371094, -0.022556304931640625, -0.020531654357910156, -0.018507003784179688, -0.01648235321044922, -0.01445770263671875, -0.012433052062988281, -0.010408401489257812, -0.008383750915527344, -0.006359100341796875, -0.004334449768066406, -0.0023097991943359375, -0.00028514862060546875, 0.001739501953125, 0.0037641525268554688, 0.0057888031005859375, 0.007813453674316406, 0.009838104248046875, 0.011862754821777344, 0.013887405395507812, 0.01591205596923828, 0.01793670654296875, 0.01996135711669922, 0.021986007690429688, 0.024010658264160156, 0.026035308837890625, 0.028059959411621094, 0.030084609985351562, 0.03210926055908203, 0.0341339111328125, 0.03615856170654297, 0.03818321228027344, 0.040207862854003906, 0.042232513427734375, 0.044257164001464844, 0.04628181457519531, 0.04830646514892578, 0.05033111572265625, 0.05235576629638672, 0.05438041687011719, 0.056405067443847656, 0.058429718017578125, 0.060454368591308594, 0.06247901916503906, 0.06450366973876953, 0.0665283203125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 6.0, 11.0, 6.0, 7.0, 9.0, 8.0, 13.0, 13.0, 25.0, 18.0, 43.0, 28.0, 56.0, 67.0, 71.0, 86.0, 86.0, 82.0, 65.0, 51.0, 40.0, 30.0, 25.0, 26.0, 17.0, 20.0, 11.0, 18.0, 8.0, 11.0, 7.0, 7.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0002872943878173828, -0.00027855485677719116, -0.0002698153257369995, -0.00026107579469680786, -0.0002523362636566162, -0.00024359673261642456, -0.0002348572015762329, -0.00022611767053604126, -0.0002173781394958496, -0.00020863860845565796, -0.0001998990774154663, -0.00019115954637527466, -0.000182420015335083, -0.00017368048429489136, -0.0001649409532546997, -0.00015620142221450806, -0.0001474618911743164, -0.00013872236013412476, -0.0001299828290939331, -0.00012124329805374146, -0.0001125037670135498, -0.00010376423597335815, -9.50247049331665e-05, -8.628517389297485e-05, -7.75456428527832e-05, -6.880611181259155e-05, -6.00665807723999e-05, -5.132704973220825e-05, -4.25875186920166e-05, -3.384798765182495e-05, -2.51084566116333e-05, -1.636892557144165e-05, -7.62939453125e-06, 1.1101365089416504e-06, 9.8496675491333e-06, 1.858919858932495e-05, 2.73287296295166e-05, 3.606826066970825e-05, 4.48077917098999e-05, 5.354732275009155e-05, 6.22868537902832e-05, 7.102638483047485e-05, 7.97659158706665e-05, 8.850544691085815e-05, 9.72449779510498e-05, 0.00010598450899124146, 0.0001147240400314331, 0.00012346357107162476, 0.0001322031021118164, 0.00014094263315200806, 0.0001496821641921997, 0.00015842169523239136, 0.000167161226272583, 0.00017590075731277466, 0.0001846402883529663, 0.00019337981939315796, 0.0002021193504333496, 0.00021085888147354126, 0.0002195984125137329, 0.00022833794355392456, 0.0002370774745941162, 0.00024581700563430786, 0.0002545565366744995, 0.00026329606771469116, 0.0002720355987548828]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 0.0, 3.0, 4.0, 5.0, 4.0, 9.0, 7.0, 10.0, 12.0, 21.0, 19.0, 24.0, 26.0, 38.0, 40.0, 92.0, 165.0, 648.0, 7752.0, 257446.0, 764361.0, 16240.0, 1117.0, 195.0, 104.0, 51.0, 29.0, 27.0, 19.0, 17.0, 7.0, 14.0, 7.0, 10.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0066375732421875, -0.006417214870452881, -0.006196856498718262, -0.005976498126983643, -0.0057561397552490234, -0.005535781383514404, -0.005315423011779785, -0.005095064640045166, -0.004874706268310547, -0.004654347896575928, -0.004433989524841309, -0.0042136311531066895, -0.00399327278137207, -0.003772914409637451, -0.003552556037902832, -0.003332197666168213, -0.0031118392944335938, -0.0028914809226989746, -0.0026711225509643555, -0.0024507641792297363, -0.002230405807495117, -0.002010047435760498, -0.001789689064025879, -0.0015693306922912598, -0.0013489723205566406, -0.0011286139488220215, -0.0009082555770874023, -0.0006878972053527832, -0.00046753883361816406, -0.0002471804618835449, -2.682209014892578e-05, 0.00019353628158569336, 0.0004138946533203125, 0.0006342530250549316, 0.0008546113967895508, 0.00107496976852417, 0.001295328140258789, 0.0015156865119934082, 0.0017360448837280273, 0.0019564032554626465, 0.0021767616271972656, 0.0023971199989318848, 0.002617478370666504, 0.002837836742401123, 0.003058195114135742, 0.0032785534858703613, 0.0034989118576049805, 0.0037192702293395996, 0.003939628601074219, 0.004159986972808838, 0.004380345344543457, 0.004600703716278076, 0.004821062088012695, 0.0050414204597473145, 0.005261778831481934, 0.005482137203216553, 0.005702495574951172, 0.005922853946685791, 0.00614321231842041, 0.006363570690155029, 0.0065839290618896484, 0.006804287433624268, 0.007024645805358887, 0.007245004177093506, 0.007465362548828125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 9.0, 4.0, 16.0, 13.0, 37.0, 46.0, 105.0, 189.0, 248.0, 148.0, 83.0, 40.0, 25.0, 17.0, 11.0, 2.0, 6.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.00111119425855577, -0.001089525525458157, -0.001067856908775866, -0.0010461881756782532, -0.0010245195589959621, -0.0010028508258983493, -0.0009811822092160583, -0.0009595134761184454, -0.0009378448012284935, -0.0009161761263385415, -0.0008945074514485896, -0.0008728387765586376, -0.0008511700434610248, -0.0008295013685710728, -0.0008078326936811209, -0.0007861640187911689, -0.000764495343901217, -0.000742826669011265, -0.0007211579941213131, -0.0006994893192313612, -0.0006778206443414092, -0.0006561519112437963, -0.0006344832363538444, -0.0006128145614638925, -0.0005911458865739405, -0.0005694772116839886, -0.0005478085367940366, -0.0005261398619040847, -0.0005044711288064718, -0.00048280248302035034, -0.00046113377902656794, -0.000439465104136616, -0.0004177964583504945, -0.00039612778346054256, -0.00037445907946676016, -0.0003527904045768082, -0.00033112172968685627, -0.0003094530547969043, -0.0002877843799069524, -0.00026611567591317, -0.00024444700102321804, -0.0002227783261332661, -0.00020110963669139892, -0.00017944094724953175, -0.0001577722723595798, -0.00013610359746962786, -0.00011443490802776068, -9.276621858589351e-05, -7.109754369594157e-05, -4.942886153003201e-05, -2.776017936412245e-05, -6.091497198212892e-06, 1.5577184967696667e-05, 3.7245867133606225e-05, 5.8914549299515784e-05, 8.058323874138296e-05, 0.0001022519136313349, 0.00012392058852128685, 0.00014558927796315402, 0.0001672579674050212, 0.00018892664229497313, 0.00021059531718492508, 0.00023226400662679225, 0.0002539326960686594, 0.00027560137095861137]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 12.0, 9.0, 6.0, 17.0, 21.0, 15.0, 27.0, 28.0, 33.0, 40.0, 48.0, 42.0, 40.0, 46.0, 58.0, 49.0, 54.0, 51.0, 46.0, 50.0, 37.0, 39.0, 43.0, 25.0, 32.0, 24.0, 28.0, 14.0, 13.0, 12.0, 9.0, 4.0, 11.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0001927018165588379, -0.00018705707043409348, -0.00018141232430934906, -0.00017576757818460464, -0.00017012283205986023, -0.00016447808593511581, -0.0001588333398103714, -0.00015318859368562698, -0.00014754384756088257, -0.00014189910143613815, -0.00013625435531139374, -0.00013060960918664932, -0.0001249648630619049, -0.00011932011693716049, -0.00011367537081241608, -0.00010803062468767166, -0.00010238587856292725, -9.674113243818283e-05, -9.109638631343842e-05, -8.5451640188694e-05, -7.980689406394958e-05, -7.416214793920517e-05, -6.851740181446075e-05, -6.287265568971634e-05, -5.7227909564971924e-05, -5.158316344022751e-05, -4.593841731548309e-05, -4.029367119073868e-05, -3.464892506599426e-05, -2.9004178941249847e-05, -2.3359432816505432e-05, -1.7714686691761017e-05, -1.2069940567016602e-05, -6.425194442272186e-06, -7.80448317527771e-07, 4.864297807216644e-06, 1.050904393196106e-05, 1.6153790056705475e-05, 2.179853618144989e-05, 2.7443282306194305e-05, 3.308802843093872e-05, 3.8732774555683136e-05, 4.437752068042755e-05, 5.0022266805171967e-05, 5.566701292991638e-05, 6.13117590546608e-05, 6.695650517940521e-05, 7.260125130414963e-05, 7.824599742889404e-05, 8.389074355363846e-05, 8.953548967838287e-05, 9.518023580312729e-05, 0.0001008249819278717, 0.00010646972805261612, 0.00011211447417736053, 0.00011775922030210495, 0.00012340396642684937, 0.00012904871255159378, 0.0001346934586763382, 0.0001403382048010826, 0.00014598295092582703, 0.00015162769705057144, 0.00015727244317531586, 0.00016291718930006027, 0.0001685619354248047]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 9.0, 5.0, 4.0, 6.0, 7.0, 18.0, 16.0, 14.0, 12.0, 19.0, 24.0, 28.0, 22.0, 23.0, 34.0, 32.0, 44.0, 39.0, 33.0, 32.0, 33.0, 43.0, 45.0, 51.0, 30.0, 35.0, 42.0, 36.0, 30.0, 31.0, 28.0, 21.0, 24.0, 16.0, 19.0, 15.0, 12.0, 12.0, 14.0, 10.0, 11.0, 2.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.625, -4.498931884765625, -4.37286376953125, -4.246795654296875, -4.1207275390625, -3.994659423828125, -3.86859130859375, -3.742523193359375, -3.616455078125, -3.490386962890625, -3.36431884765625, -3.238250732421875, -3.1121826171875, -2.986114501953125, -2.86004638671875, -2.733978271484375, -2.60791015625, -2.481842041015625, -2.35577392578125, -2.229705810546875, -2.1036376953125, -1.977569580078125, -1.85150146484375, -1.725433349609375, -1.599365234375, -1.473297119140625, -1.34722900390625, -1.221160888671875, -1.0950927734375, -0.969024658203125, -0.84295654296875, -0.716888427734375, -0.5908203125, -0.464752197265625, -0.33868408203125, -0.212615966796875, -0.0865478515625, 0.039520263671875, 0.16558837890625, 0.291656494140625, 0.417724609375, 0.543792724609375, 0.66986083984375, 0.795928955078125, 0.9219970703125, 1.048065185546875, 1.17413330078125, 1.300201416015625, 1.42626953125, 1.552337646484375, 1.67840576171875, 1.804473876953125, 1.9305419921875, 2.056610107421875, 2.18267822265625, 2.308746337890625, 2.434814453125, 2.560882568359375, 2.68695068359375, 2.813018798828125, 2.9390869140625, 3.065155029296875, 3.19122314453125, 3.317291259765625, 3.443359375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 8.0, 6.0, 12.0, 11.0, 27.0, 33.0, 49.0, 59.0, 82.0, 138.0, 216.0, 316.0, 512.0, 784.0, 1154.0, 1976.0, 3350.0, 5653.0, 10131.0, 19394.0, 43950.0, 116288.0, 303441.0, 321516.0, 125963.0, 47450.0, 20506.0, 10701.0, 5858.0, 3400.0, 2015.0, 1236.0, 813.0, 484.0, 318.0, 254.0, 141.0, 105.0, 72.0, 45.0, 34.0, 21.0, 11.0, 10.0, 7.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.75494384765625, -5.5567626953125, -5.35858154296875, -5.160400390625, -4.96221923828125, -4.7640380859375, -4.56585693359375, -4.36767578125, -4.16949462890625, -3.9713134765625, -3.77313232421875, -3.574951171875, -3.37677001953125, -3.1785888671875, -2.98040771484375, -2.7822265625, -2.58404541015625, -2.3858642578125, -2.18768310546875, -1.989501953125, -1.79132080078125, -1.5931396484375, -1.39495849609375, -1.19677734375, -0.99859619140625, -0.8004150390625, -0.60223388671875, -0.404052734375, -0.20587158203125, -0.0076904296875, 0.19049072265625, 0.388671875, 0.58685302734375, 0.7850341796875, 0.98321533203125, 1.181396484375, 1.37957763671875, 1.5777587890625, 1.77593994140625, 1.97412109375, 2.17230224609375, 2.3704833984375, 2.56866455078125, 2.766845703125, 2.96502685546875, 3.1632080078125, 3.36138916015625, 3.5595703125, 3.75775146484375, 3.9559326171875, 4.15411376953125, 4.352294921875, 4.55047607421875, 4.7486572265625, 4.94683837890625, 5.14501953125, 5.34320068359375, 5.5413818359375, 5.73956298828125, 5.937744140625, 6.13592529296875, 6.3341064453125, 6.53228759765625, 6.73046875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 9.0, 5.0, 10.0, 14.0, 15.0, 15.0, 20.0, 27.0, 23.0, 20.0, 31.0, 38.0, 40.0, 50.0, 63.0, 75.0, 139.0, 252.0, 1406.0, 248.0, 129.0, 62.0, 59.0, 40.0, 51.0, 33.0, 27.0, 22.0, 30.0, 15.0, 16.0, 13.0, 10.0, 8.0, 8.0, 6.0, 7.0, 1.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3671875, -12.9285888671875, -12.489990234375, -12.0513916015625, -11.61279296875, -11.1741943359375, -10.735595703125, -10.2969970703125, -9.8583984375, -9.4197998046875, -8.981201171875, -8.5426025390625, -8.10400390625, -7.6654052734375, -7.226806640625, -6.7882080078125, -6.349609375, -5.9110107421875, -5.472412109375, -5.0338134765625, -4.59521484375, -4.1566162109375, -3.718017578125, -3.2794189453125, -2.8408203125, -2.4022216796875, -1.963623046875, -1.5250244140625, -1.08642578125, -0.6478271484375, -0.209228515625, 0.2293701171875, 0.66796875, 1.1065673828125, 1.545166015625, 1.9837646484375, 2.42236328125, 2.8609619140625, 3.299560546875, 3.7381591796875, 4.1767578125, 4.6153564453125, 5.053955078125, 5.4925537109375, 5.93115234375, 6.3697509765625, 6.808349609375, 7.2469482421875, 7.685546875, 8.1241455078125, 8.562744140625, 9.0013427734375, 9.43994140625, 9.8785400390625, 10.317138671875, 10.7557373046875, 11.1943359375, 11.6329345703125, 12.071533203125, 12.5101318359375, 12.94873046875, 13.3873291015625, 13.825927734375, 14.2645263671875, 14.703125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 7.0, 13.0, 11.0, 17.0, 26.0, 31.0, 54.0, 81.0, 88.0, 162.0, 286.0, 514.0, 1076.0, 3235.0, 15708.0, 135203.0, 2454310.0, 491251.0, 34495.0, 5874.0, 1649.0, 633.0, 346.0, 200.0, 138.0, 78.0, 59.0, 37.0, 35.0, 25.0, 17.0, 11.0, 13.0, 4.0, 7.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -15.947509765625, -15.41064453125, -14.873779296875, -14.3369140625, -13.800048828125, -13.26318359375, -12.726318359375, -12.189453125, -11.652587890625, -11.11572265625, -10.578857421875, -10.0419921875, -9.505126953125, -8.96826171875, -8.431396484375, -7.89453125, -7.357666015625, -6.82080078125, -6.283935546875, -5.7470703125, -5.210205078125, -4.67333984375, -4.136474609375, -3.599609375, -3.062744140625, -2.52587890625, -1.989013671875, -1.4521484375, -0.915283203125, -0.37841796875, 0.158447265625, 0.6953125, 1.232177734375, 1.76904296875, 2.305908203125, 2.8427734375, 3.379638671875, 3.91650390625, 4.453369140625, 4.990234375, 5.527099609375, 6.06396484375, 6.600830078125, 7.1376953125, 7.674560546875, 8.21142578125, 8.748291015625, 9.28515625, 9.822021484375, 10.35888671875, 10.895751953125, 11.4326171875, 11.969482421875, 12.50634765625, 13.043212890625, 13.580078125, 14.116943359375, 14.65380859375, 15.190673828125, 15.7275390625, 16.264404296875, 16.80126953125, 17.338134765625, 17.875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 45.0, 275.0, 450.0, 212.0, 32.0, 1.0], "bins": [-228.4581756591797, -224.67642211914062, -220.89466857910156, -217.1129150390625, -213.33116149902344, -209.54940795898438, -205.76763916015625, -201.98590087890625, -198.20413208007812, -194.42237854003906, -190.640625, -186.85887145996094, -183.07711791992188, -179.2953643798828, -175.51361083984375, -171.73184204101562, -167.95010375976562, -164.16835021972656, -160.3865966796875, -156.60484313964844, -152.82308959960938, -149.0413360595703, -145.25958251953125, -141.47781372070312, -137.69606018066406, -133.914306640625, -130.13255310058594, -126.35079956054688, -122.56903839111328, -118.78728485107422, -115.00553131103516, -111.2237777709961, -107.44202423095703, -103.66027069091797, -99.8785171508789, -96.09675598144531, -92.31500244140625, -88.53324890136719, -84.75149536132812, -80.96974182128906, -77.18798828125, -73.40623474121094, -69.62448120117188, -65.84272766113281, -62.060970306396484, -58.279212951660156, -54.497459411621094, -50.71570587158203, -46.93395233154297, -43.152198791503906, -39.37044143676758, -35.588687896728516, -31.806934356689453, -28.025178909301758, -24.243423461914062, -20.461669921875, -16.679912567138672, -12.898158073425293, -9.116403579711914, -5.334648132324219, -1.5528936386108398, 2.228860855102539, 6.010616302490234, 9.792369842529297, 13.574124336242676]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 2.0, 11.0, 5.0, 12.0, 15.0, 11.0, 8.0, 16.0, 12.0, 28.0, 21.0, 20.0, 44.0, 36.0, 39.0, 35.0, 50.0, 43.0, 37.0, 50.0, 45.0, 46.0, 41.0, 37.0, 32.0, 41.0, 39.0, 32.0, 18.0, 28.0, 30.0, 15.0, 17.0, 8.0, 13.0, 6.0, 9.0, 15.0, 11.0, 9.0, 2.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.09288787841797, -35.01768493652344, -33.942481994628906, -32.867279052734375, -31.79207420349121, -30.71687126159668, -29.641666412353516, -28.566463470458984, -27.491260528564453, -26.416057586669922, -25.34085464477539, -24.265649795532227, -23.190446853637695, -22.115243911743164, -21.0400390625, -19.96483612060547, -18.889633178710938, -17.814430236816406, -16.739227294921875, -15.664022445678711, -14.58881950378418, -13.513616561889648, -12.4384126663208, -11.363208770751953, -10.288005828857422, -9.21280288696289, -8.137598991394043, -7.0623955726623535, -5.987192153930664, -4.911988735198975, -3.836785316467285, -2.7615818977355957, -1.6863784790039062, -0.6111750602722168, 0.46402835845947266, 1.539231777191162, 2.6144351959228516, 3.689638614654541, 4.7648420333862305, 5.84004545211792, 6.915248870849609, 7.990452289581299, 9.065655708312988, 10.140859603881836, 11.216062545776367, 12.291265487670898, 13.366469383239746, 14.441673278808594, 15.516876220703125, 16.592079162597656, 17.667282104492188, 18.74248695373535, 19.817689895629883, 20.892892837524414, 21.968097686767578, 23.04330062866211, 24.11850357055664, 25.193706512451172, 26.268909454345703, 27.344114303588867, 28.4193172454834, 29.49452018737793, 30.569725036621094, 31.644927978515625, 32.720130920410156]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 7.0, 1.0, 8.0, 5.0, 7.0, 5.0, 6.0, 13.0, 18.0, 14.0, 17.0, 18.0, 15.0, 21.0, 24.0, 25.0, 25.0, 39.0, 31.0, 37.0, 20.0, 50.0, 30.0, 50.0, 39.0, 46.0, 29.0, 39.0, 38.0, 34.0, 35.0, 37.0, 17.0, 21.0, 20.0, 30.0, 16.0, 21.0, 18.0, 15.0, 12.0, 9.0, 16.0, 9.0, 4.0, 5.0, 4.0, 2.0, 5.0, 2.0, 2.0], "bins": [-4.7265625, -4.599578857421875, -4.47259521484375, -4.345611572265625, -4.2186279296875, -4.091644287109375, -3.96466064453125, -3.837677001953125, -3.710693359375, -3.583709716796875, -3.45672607421875, -3.329742431640625, -3.2027587890625, -3.075775146484375, -2.94879150390625, -2.821807861328125, -2.69482421875, -2.567840576171875, -2.44085693359375, -2.313873291015625, -2.1868896484375, -2.059906005859375, -1.93292236328125, -1.805938720703125, -1.678955078125, -1.551971435546875, -1.42498779296875, -1.298004150390625, -1.1710205078125, -1.044036865234375, -0.91705322265625, -0.790069580078125, -0.6630859375, -0.536102294921875, -0.40911865234375, -0.282135009765625, -0.1551513671875, -0.028167724609375, 0.09881591796875, 0.225799560546875, 0.352783203125, 0.479766845703125, 0.60675048828125, 0.733734130859375, 0.8607177734375, 0.987701416015625, 1.11468505859375, 1.241668701171875, 1.36865234375, 1.495635986328125, 1.62261962890625, 1.749603271484375, 1.8765869140625, 2.003570556640625, 2.13055419921875, 2.257537841796875, 2.384521484375, 2.511505126953125, 2.63848876953125, 2.765472412109375, 2.8924560546875, 3.019439697265625, 3.14642333984375, 3.273406982421875, 3.400390625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 6.0, 8.0, 7.0, 5.0, 7.0, 14.0, 19.0, 29.0, 34.0, 47.0, 67.0, 135.0, 216.0, 452.0, 805.0, 1526.0, 3234.0, 7592.0, 21529.0, 79508.0, 361455.0, 1517815.0, 1652139.0, 415171.0, 91828.0, 24597.0, 8537.0, 3641.0, 1660.0, 919.0, 498.0, 307.0, 165.0, 115.0, 58.0, 43.0, 32.0, 15.0, 20.0, 8.0, 8.0, 4.0, 2.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.6640625, -7.44537353515625, -7.2266845703125, -7.00799560546875, -6.789306640625, -6.57061767578125, -6.3519287109375, -6.13323974609375, -5.91455078125, -5.69586181640625, -5.4771728515625, -5.25848388671875, -5.039794921875, -4.82110595703125, -4.6024169921875, -4.38372802734375, -4.1650390625, -3.94635009765625, -3.7276611328125, -3.50897216796875, -3.290283203125, -3.07159423828125, -2.8529052734375, -2.63421630859375, -2.41552734375, -2.19683837890625, -1.9781494140625, -1.75946044921875, -1.540771484375, -1.32208251953125, -1.1033935546875, -0.88470458984375, -0.666015625, -0.44732666015625, -0.2286376953125, -0.00994873046875, 0.208740234375, 0.42742919921875, 0.6461181640625, 0.86480712890625, 1.08349609375, 1.30218505859375, 1.5208740234375, 1.73956298828125, 1.958251953125, 2.17694091796875, 2.3956298828125, 2.61431884765625, 2.8330078125, 3.05169677734375, 3.2703857421875, 3.48907470703125, 3.707763671875, 3.92645263671875, 4.1451416015625, 4.36383056640625, 4.58251953125, 4.80120849609375, 5.0198974609375, 5.23858642578125, 5.457275390625, 5.67596435546875, 5.8946533203125, 6.11334228515625, 6.33203125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 8.0, 6.0, 16.0, 15.0, 19.0, 34.0, 40.0, 83.0, 108.0, 158.0, 212.0, 313.0, 410.0, 593.0, 568.0, 422.0, 348.0, 211.0, 153.0, 109.0, 79.0, 44.0, 26.0, 25.0, 15.0, 11.0, 7.0, 11.0, 10.0, 6.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.51171875, -7.25286865234375, -6.9940185546875, -6.73516845703125, -6.476318359375, -6.21746826171875, -5.9586181640625, -5.69976806640625, -5.44091796875, -5.18206787109375, -4.9232177734375, -4.66436767578125, -4.405517578125, -4.14666748046875, -3.8878173828125, -3.62896728515625, -3.3701171875, -3.11126708984375, -2.8524169921875, -2.59356689453125, -2.334716796875, -2.07586669921875, -1.8170166015625, -1.55816650390625, -1.29931640625, -1.04046630859375, -0.7816162109375, -0.52276611328125, -0.263916015625, -0.00506591796875, 0.2537841796875, 0.51263427734375, 0.771484375, 1.03033447265625, 1.2891845703125, 1.54803466796875, 1.806884765625, 2.06573486328125, 2.3245849609375, 2.58343505859375, 2.84228515625, 3.10113525390625, 3.3599853515625, 3.61883544921875, 3.877685546875, 4.13653564453125, 4.3953857421875, 4.65423583984375, 4.9130859375, 5.17193603515625, 5.4307861328125, 5.68963623046875, 5.948486328125, 6.20733642578125, 6.4661865234375, 6.72503662109375, 6.98388671875, 7.24273681640625, 7.5015869140625, 7.76043701171875, 8.019287109375, 8.27813720703125, 8.5369873046875, 8.79583740234375, 9.0546875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 9.0, 11.0, 17.0, 9.0, 22.0, 24.0, 46.0, 65.0, 113.0, 174.0, 350.0, 772.0, 2563.0, 13255.0, 212913.0, 3605022.0, 336952.0, 17146.0, 2937.0, 938.0, 402.0, 208.0, 107.0, 76.0, 62.0, 20.0, 18.0, 15.0, 15.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.59375, -24.8740234375, -24.154296875, -23.4345703125, -22.71484375, -21.9951171875, -21.275390625, -20.5556640625, -19.8359375, -19.1162109375, -18.396484375, -17.6767578125, -16.95703125, -16.2373046875, -15.517578125, -14.7978515625, -14.078125, -13.3583984375, -12.638671875, -11.9189453125, -11.19921875, -10.4794921875, -9.759765625, -9.0400390625, -8.3203125, -7.6005859375, -6.880859375, -6.1611328125, -5.44140625, -4.7216796875, -4.001953125, -3.2822265625, -2.5625, -1.8427734375, -1.123046875, -0.4033203125, 0.31640625, 1.0361328125, 1.755859375, 2.4755859375, 3.1953125, 3.9150390625, 4.634765625, 5.3544921875, 6.07421875, 6.7939453125, 7.513671875, 8.2333984375, 8.953125, 9.6728515625, 10.392578125, 11.1123046875, 11.83203125, 12.5517578125, 13.271484375, 13.9912109375, 14.7109375, 15.4306640625, 16.150390625, 16.8701171875, 17.58984375, 18.3095703125, 19.029296875, 19.7490234375, 20.46875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 44.0, 239.0, 458.0, 223.0, 40.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.15943145751953, -55.67448425292969, -51.18954086303711, -46.70459747314453, -42.21965026855469, -37.734703063964844, -33.249759674072266, -28.764814376831055, -24.279869079589844, -19.794923782348633, -15.309978485107422, -10.825033187866211, -6.340087890625, -1.855142593383789, 2.629802703857422, 7.114748001098633, 11.599693298339844, 16.084638595581055, 20.569583892822266, 25.054529190063477, 29.539474487304688, 34.02442169189453, 38.50936508178711, 42.99430847167969, 47.47925567626953, 51.964202880859375, 56.44914627075195, 60.93408966064453, 65.41903686523438, 69.90398406982422, 74.38893127441406, 78.87387084960938, 83.35881042480469, 87.84375762939453, 92.32870483398438, 96.81364440917969, 101.29859161376953, 105.78353881835938, 110.26847839355469, 114.75342559814453, 119.23837280273438, 123.72332000732422, 128.20826721191406, 132.69320678710938, 137.17816162109375, 141.66310119628906, 146.14804077148438, 150.63299560546875, 155.11793518066406, 159.60287475585938, 164.08782958984375, 168.57276916503906, 173.05770874023438, 177.54266357421875, 182.02760314941406, 186.51255798339844, 190.99749755859375, 195.48243713378906, 199.96739196777344, 204.45233154296875, 208.93728637695312, 213.42222595214844, 217.90716552734375, 222.39212036132812, 226.87705993652344]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 5.0, 5.0, 8.0, 7.0, 8.0, 7.0, 19.0, 16.0, 14.0, 13.0, 22.0, 20.0, 25.0, 28.0, 28.0, 35.0, 32.0, 39.0, 38.0, 30.0, 33.0, 37.0, 35.0, 42.0, 32.0, 41.0, 42.0, 32.0, 38.0, 38.0, 21.0, 30.0, 25.0, 20.0, 20.0, 22.0, 20.0, 8.0, 15.0, 13.0, 9.0, 8.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-24.05582618713379, -23.329723358154297, -22.603622436523438, -21.877519607543945, -21.151416778564453, -20.425315856933594, -19.6992130279541, -18.97311019897461, -18.24700927734375, -17.520906448364258, -16.7948055267334, -16.068702697753906, -15.342599868774414, -14.616497993469238, -13.890396118164062, -13.16429328918457, -12.438190460205078, -11.712088584899902, -10.98598575592041, -10.259883880615234, -9.533781051635742, -8.807679176330566, -8.08157730102539, -7.355474948883057, -6.629372596740723, -5.903270244598389, -5.177167892456055, -4.451066017150879, -3.724963665008545, -2.998861312866211, -2.272759437561035, -1.5466570854187012, -0.8205528259277344, -0.09445059299468994, 0.6316516399383545, 1.3577537536621094, 2.0838561058044434, 2.8099584579467773, 3.536060333251953, 4.262162685394287, 4.988265037536621, 5.714367389678955, 6.440469741821289, 7.166571617126465, 7.892673969268799, 8.618776321411133, 9.344878196716309, 10.070980072021484, 10.797082901000977, 11.523184776306152, 12.249287605285645, 12.97538948059082, 13.701492309570312, 14.427594184875488, 15.153696060180664, 15.879798889160156, 16.605899810791016, 17.332002639770508, 18.058103561401367, 18.78420639038086, 19.51030921936035, 20.236412048339844, 20.962512969970703, 21.688615798950195, 22.414718627929688]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 9.0, 8.0, 12.0, 9.0, 13.0, 9.0, 12.0, 16.0, 13.0, 19.0, 31.0, 19.0, 12.0, 31.0, 34.0, 33.0, 36.0, 33.0, 30.0, 39.0, 40.0, 47.0, 31.0, 31.0, 45.0, 32.0, 36.0, 35.0, 35.0, 29.0, 25.0, 19.0, 23.0, 26.0, 25.0, 21.0, 13.0, 12.0, 13.0, 10.0, 8.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.640625, -4.510589599609375, -4.38055419921875, -4.250518798828125, -4.1204833984375, -3.990447998046875, -3.86041259765625, -3.730377197265625, -3.600341796875, -3.470306396484375, -3.34027099609375, -3.210235595703125, -3.0802001953125, -2.950164794921875, -2.82012939453125, -2.690093994140625, -2.56005859375, -2.430023193359375, -2.29998779296875, -2.169952392578125, -2.0399169921875, -1.909881591796875, -1.77984619140625, -1.649810791015625, -1.519775390625, -1.389739990234375, -1.25970458984375, -1.129669189453125, -0.9996337890625, -0.869598388671875, -0.73956298828125, -0.609527587890625, -0.4794921875, -0.349456787109375, -0.21942138671875, -0.089385986328125, 0.0406494140625, 0.170684814453125, 0.30072021484375, 0.430755615234375, 0.560791015625, 0.690826416015625, 0.82086181640625, 0.950897216796875, 1.0809326171875, 1.210968017578125, 1.34100341796875, 1.471038818359375, 1.60107421875, 1.731109619140625, 1.86114501953125, 1.991180419921875, 2.1212158203125, 2.251251220703125, 2.38128662109375, 2.511322021484375, 2.641357421875, 2.771392822265625, 2.90142822265625, 3.031463623046875, 3.1614990234375, 3.291534423828125, 3.42156982421875, 3.551605224609375, 3.681640625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 8.0, 10.0, 16.0, 22.0, 39.0, 62.0, 65.0, 129.0, 163.0, 233.0, 401.0, 642.0, 912.0, 1355.0, 1977.0, 3016.0, 4568.0, 7157.0, 10657.0, 16430.0, 26320.0, 43260.0, 75871.0, 144626.0, 282185.0, 190852.0, 95884.0, 53646.0, 31573.0, 19703.0, 12554.0, 8239.0, 5368.0, 3477.0, 2425.0, 1610.0, 1073.0, 663.0, 435.0, 283.0, 231.0, 148.0, 94.0, 54.0, 42.0, 25.0, 17.0, 9.0, 13.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.156005859375, -0.1509227752685547, -0.14583969116210938, -0.14075660705566406, -0.13567352294921875, -0.13059043884277344, -0.12550735473632812, -0.12042427062988281, -0.1153411865234375, -0.11025810241699219, -0.10517501831054688, -0.10009193420410156, -0.09500885009765625, -0.08992576599121094, -0.08484268188476562, -0.07975959777832031, -0.074676513671875, -0.06959342956542969, -0.06451034545898438, -0.05942726135253906, -0.05434417724609375, -0.04926109313964844, -0.044178009033203125, -0.03909492492675781, -0.0340118408203125, -0.028928756713867188, -0.023845672607421875, -0.018762588500976562, -0.01367950439453125, -0.008596420288085938, -0.003513336181640625, 0.0015697479248046875, 0.00665283203125, 0.011735916137695312, 0.016819000244140625, 0.021902084350585938, 0.02698516845703125, 0.03206825256347656, 0.037151336669921875, 0.04223442077636719, 0.0473175048828125, 0.05240058898925781, 0.057483673095703125, 0.06256675720214844, 0.06764984130859375, 0.07273292541503906, 0.07781600952148438, 0.08289909362792969, 0.087982177734375, 0.09306526184082031, 0.09814834594726562, 0.10323143005371094, 0.10831451416015625, 0.11339759826660156, 0.11848068237304688, 0.12356376647949219, 0.1286468505859375, 0.1337299346923828, 0.13881301879882812, 0.14389610290527344, 0.14897918701171875, 0.15406227111816406, 0.15914535522460938, 0.1642284393310547, 0.1693115234375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 2.0, 4.0, 3.0, 8.0, 9.0, 12.0, 11.0, 8.0, 14.0, 21.0, 14.0, 22.0, 27.0, 19.0, 32.0, 28.0, 39.0, 34.0, 36.0, 41.0, 45.0, 38.0, 1072.0, 48.0, 42.0, 32.0, 30.0, 41.0, 24.0, 39.0, 33.0, 30.0, 25.0, 17.0, 23.0, 16.0, 21.0, 11.0, 14.0, 5.0, 10.0, 6.0, 10.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.662109375, -3.537933349609375, -3.41375732421875, -3.289581298828125, -3.1654052734375, -3.041229248046875, -2.91705322265625, -2.792877197265625, -2.668701171875, -2.544525146484375, -2.42034912109375, -2.296173095703125, -2.1719970703125, -2.047821044921875, -1.92364501953125, -1.799468994140625, -1.67529296875, -1.551116943359375, -1.42694091796875, -1.302764892578125, -1.1785888671875, -1.054412841796875, -0.93023681640625, -0.806060791015625, -0.681884765625, -0.557708740234375, -0.43353271484375, -0.309356689453125, -0.1851806640625, -0.061004638671875, 0.06317138671875, 0.187347412109375, 0.3115234375, 0.435699462890625, 0.55987548828125, 0.684051513671875, 0.8082275390625, 0.932403564453125, 1.05657958984375, 1.180755615234375, 1.304931640625, 1.429107666015625, 1.55328369140625, 1.677459716796875, 1.8016357421875, 1.925811767578125, 2.04998779296875, 2.174163818359375, 2.29833984375, 2.422515869140625, 2.54669189453125, 2.670867919921875, 2.7950439453125, 2.919219970703125, 3.04339599609375, 3.167572021484375, 3.291748046875, 3.415924072265625, 3.54010009765625, 3.664276123046875, 3.7884521484375, 3.912628173828125, 4.03680419921875, 4.160980224609375, 4.28515625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 10.0, 25.0, 34.0, 52.0, 67.0, 84.0, 130.0, 172.0, 246.0, 342.0, 459.0, 613.0, 886.0, 1247.0, 1631.0, 2326.0, 3319.0, 4559.0, 6274.0, 8840.0, 12787.0, 18205.0, 26840.0, 40401.0, 65178.0, 111778.0, 232978.0, 1225629.0, 122952.0, 70677.0, 43718.0, 28533.0, 19228.0, 13491.0, 9531.0, 6624.0, 4763.0, 3394.0, 2514.0, 1920.0, 1366.0, 958.0, 721.0, 455.0, 362.0, 222.0, 173.0, 115.0, 94.0, 61.0, 45.0, 33.0, 20.0, 17.0, 15.0, 5.0, 7.0, 4.0], "bins": [-0.062469482421875, -0.060581207275390625, -0.05869293212890625, -0.056804656982421875, -0.0549163818359375, -0.053028106689453125, -0.05113983154296875, -0.049251556396484375, -0.04736328125, -0.045475006103515625, -0.04358673095703125, -0.041698455810546875, -0.0398101806640625, -0.037921905517578125, -0.03603363037109375, -0.034145355224609375, -0.032257080078125, -0.030368804931640625, -0.02848052978515625, -0.026592254638671875, -0.0247039794921875, -0.022815704345703125, -0.02092742919921875, -0.019039154052734375, -0.01715087890625, -0.015262603759765625, -0.01337432861328125, -0.011486053466796875, -0.0095977783203125, -0.007709503173828125, -0.00582122802734375, -0.003932952880859375, -0.002044677734375, -0.000156402587890625, 0.00173187255859375, 0.003620147705078125, 0.0055084228515625, 0.007396697998046875, 0.00928497314453125, 0.011173248291015625, 0.0130615234375, 0.014949798583984375, 0.01683807373046875, 0.018726348876953125, 0.0206146240234375, 0.022502899169921875, 0.02439117431640625, 0.026279449462890625, 0.028167724609375, 0.030055999755859375, 0.03194427490234375, 0.033832550048828125, 0.0357208251953125, 0.037609100341796875, 0.03949737548828125, 0.041385650634765625, 0.04327392578125, 0.045162200927734375, 0.04705047607421875, 0.048938751220703125, 0.0508270263671875, 0.052715301513671875, 0.05460357666015625, 0.056491851806640625, 0.058380126953125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 10.0, 9.0, 7.0, 13.0, 25.0, 31.0, 34.0, 45.0, 62.0, 80.0, 122.0, 141.0, 104.0, 73.0, 51.0, 39.0, 26.0, 29.0, 13.0, 11.0, 9.0, 12.0, 8.0, 10.0, 3.0, 5.0, 3.0, 1.0, 1.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005860328674316406, -0.000567898154258728, -0.0005497634410858154, -0.0005316287279129028, -0.0005134940147399902, -0.0004953593015670776, -0.00047722458839416504, -0.00045908987522125244, -0.00044095516204833984, -0.00042282044887542725, -0.00040468573570251465, -0.00038655102252960205, -0.00036841630935668945, -0.00035028159618377686, -0.00033214688301086426, -0.00031401216983795166, -0.00029587745666503906, -0.00027774274349212646, -0.00025960803031921387, -0.00024147331714630127, -0.00022333860397338867, -0.00020520389080047607, -0.00018706917762756348, -0.00016893446445465088, -0.00015079975128173828, -0.00013266503810882568, -0.00011453032493591309, -9.639561176300049e-05, -7.826089859008789e-05, -6.012618541717529e-05, -4.1991472244262695e-05, -2.3856759071350098e-05, -5.7220458984375e-06, 1.2412667274475098e-05, 3.0547380447387695e-05, 4.868209362030029e-05, 6.681680679321289e-05, 8.495151996612549e-05, 0.00010308623313903809, 0.00012122094631195068, 0.00013935565948486328, 0.00015749037265777588, 0.00017562508583068848, 0.00019375979900360107, 0.00021189451217651367, 0.00023002922534942627, 0.00024816393852233887, 0.00026629865169525146, 0.00028443336486816406, 0.00030256807804107666, 0.00032070279121398926, 0.00033883750438690186, 0.00035697221755981445, 0.00037510693073272705, 0.00039324164390563965, 0.00041137635707855225, 0.00042951107025146484, 0.00044764578342437744, 0.00046578049659729004, 0.00048391520977020264, 0.0005020499229431152, 0.0005201846361160278, 0.0005383193492889404, 0.000556454062461853, 0.0005745887756347656]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 0.0, 1.0, 4.0, 3.0, 7.0, 8.0, 10.0, 7.0, 13.0, 12.0, 18.0, 21.0, 34.0, 49.0, 86.0, 197.0, 2066.0, 1012311.0, 33020.0, 331.0, 106.0, 82.0, 38.0, 39.0, 26.0, 12.0, 4.0, 11.0, 13.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01427459716796875, -0.01382458209991455, -0.013374567031860352, -0.012924551963806152, -0.012474536895751953, -0.012024521827697754, -0.011574506759643555, -0.011124491691589355, -0.010674476623535156, -0.010224461555480957, -0.009774446487426758, -0.009324431419372559, -0.00887441635131836, -0.00842440128326416, -0.007974386215209961, -0.007524371147155762, -0.0070743560791015625, -0.006624341011047363, -0.006174325942993164, -0.005724310874938965, -0.005274295806884766, -0.004824280738830566, -0.004374265670776367, -0.003924250602722168, -0.0034742355346679688, -0.0030242204666137695, -0.0025742053985595703, -0.002124190330505371, -0.0016741752624511719, -0.0012241601943969727, -0.0007741451263427734, -0.0003241300582885742, 0.000125885009765625, 0.0005759000778198242, 0.0010259151458740234, 0.0014759302139282227, 0.0019259452819824219, 0.002375960350036621, 0.0028259754180908203, 0.0032759904861450195, 0.0037260055541992188, 0.004176020622253418, 0.004626035690307617, 0.005076050758361816, 0.005526065826416016, 0.005976080894470215, 0.006426095962524414, 0.006876111030578613, 0.0073261260986328125, 0.007776141166687012, 0.008226156234741211, 0.00867617130279541, 0.00912618637084961, 0.009576201438903809, 0.010026216506958008, 0.010476231575012207, 0.010926246643066406, 0.011376261711120605, 0.011826276779174805, 0.012276291847229004, 0.012726306915283203, 0.013176321983337402, 0.013626337051391602, 0.0140763521194458, 0.0145263671875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 11.0, 101.0, 676.0, 209.0, 21.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00033415743382647634, -0.00026288485969416797, -0.0001916122855618596, -0.00012033971142955124, -4.906713729724288e-05, 2.2205436835065484e-05, 9.347801096737385e-05, 0.00016475055599585176, 0.00023602315923199058, 0.00030729573336429894, 0.0003785683074966073, 0.00044984088162891567, 0.000521113455761224, 0.0005923860007897019, 0.0006636586040258408, 0.0007349311490543187, 0.0008062037522904575, 0.0008774762973189354, 0.0009487489005550742, 0.001020021503791213, 0.00109129399061203, 0.0011625665938481688, 0.0012338391970843077, 0.0013051116839051247, 0.0013763844035565853, 0.0014476570067927241, 0.001518929610028863, 0.00159020209684968, 0.0016614747000858188, 0.0017327473033219576, 0.0018040197901427746, 0.0018752923933789134, 0.0019465647637844086, 0.0020178372506052256, 0.002089109970256686, 0.002160382457077503, 0.002231655176728964, 0.002302927663549781, 0.002374200150370598, 0.0024454728700220585, 0.0025167453568428755, 0.0025880178436636925, 0.002659290563315153, 0.00273056305013597, 0.002801835536956787, 0.0028731082566082478, 0.0029443807434290648, 0.0030156532302498817, 0.0030869259499013424, 0.0031581984367221594, 0.00322947115637362, 0.003300743643194437, 0.0033720163628458977, 0.0034432888496667147, 0.0035145613364875317, 0.0035858340561389923, 0.0036571065429598093, 0.0037283790297806263, 0.003799651749432087, 0.003870924236252904, 0.003942196723073721, 0.004013469442725182, 0.004084742162376642, 0.004156014416366816, 0.004227287136018276]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 10.0, 7.0, 9.0, 10.0, 11.0, 18.0, 15.0, 21.0, 25.0, 35.0, 27.0, 18.0, 31.0, 42.0, 34.0, 36.0, 55.0, 41.0, 48.0, 48.0, 43.0, 53.0, 33.0, 43.0, 38.0, 49.0, 26.0, 28.0, 29.0, 25.0, 10.0, 25.0, 12.0, 4.0, 9.0, 8.0, 6.0, 4.0, 3.0, 5.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002391338348388672, -0.0002312762662768364, -0.0002234186977148056, -0.0002155611291527748, -0.00020770356059074402, -0.00019984599202871323, -0.00019198842346668243, -0.00018413085490465164, -0.00017627328634262085, -0.00016841571778059006, -0.00016055814921855927, -0.00015270058065652847, -0.00014484301209449768, -0.0001369854435324669, -0.0001291278749704361, -0.0001212703064084053, -0.00011341273784637451, -0.00010555516928434372, -9.769760072231293e-05, -8.984003216028214e-05, -8.198246359825134e-05, -7.412489503622055e-05, -6.626732647418976e-05, -5.8409757912158966e-05, -5.0552189350128174e-05, -4.269462078809738e-05, -3.483705222606659e-05, -2.6979483664035797e-05, -1.9121915102005005e-05, -1.1264346539974213e-05, -3.4067779779434204e-06, 4.450790584087372e-06, 1.2308359146118164e-05, 2.0165927708148956e-05, 2.802349627017975e-05, 3.588106483221054e-05, 4.373863339424133e-05, 5.1596201956272125e-05, 5.945377051830292e-05, 6.731133908033371e-05, 7.51689076423645e-05, 8.30264762043953e-05, 9.088404476642609e-05, 9.874161332845688e-05, 0.00010659918189048767, 0.00011445675045251846, 0.00012231431901454926, 0.00013017188757658005, 0.00013802945613861084, 0.00014588702470064163, 0.00015374459326267242, 0.00016160216182470322, 0.000169459730386734, 0.0001773172989487648, 0.0001851748675107956, 0.00019303243607282639, 0.00020089000463485718, 0.00020874757319688797, 0.00021660514175891876, 0.00022446271032094955, 0.00023232027888298035, 0.00024017784744501114, 0.00024803541600704193, 0.0002558929845690727, 0.0002637505531311035]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 9.0, 8.0, 12.0, 9.0, 13.0, 9.0, 12.0, 16.0, 13.0, 19.0, 31.0, 19.0, 12.0, 31.0, 34.0, 33.0, 36.0, 33.0, 30.0, 39.0, 40.0, 47.0, 31.0, 31.0, 45.0, 32.0, 36.0, 35.0, 35.0, 29.0, 25.0, 19.0, 23.0, 26.0, 25.0, 21.0, 13.0, 12.0, 13.0, 10.0, 8.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.640625, -4.510589599609375, -4.38055419921875, -4.250518798828125, -4.1204833984375, -3.990447998046875, -3.86041259765625, -3.730377197265625, -3.600341796875, -3.470306396484375, -3.34027099609375, -3.210235595703125, -3.0802001953125, -2.950164794921875, -2.82012939453125, -2.690093994140625, -2.56005859375, -2.430023193359375, -2.29998779296875, -2.169952392578125, -2.0399169921875, -1.909881591796875, -1.77984619140625, -1.649810791015625, -1.519775390625, -1.389739990234375, -1.25970458984375, -1.129669189453125, -0.9996337890625, -0.869598388671875, -0.73956298828125, -0.609527587890625, -0.4794921875, -0.349456787109375, -0.21942138671875, -0.089385986328125, 0.0406494140625, 0.170684814453125, 0.30072021484375, 0.430755615234375, 0.560791015625, 0.690826416015625, 0.82086181640625, 0.950897216796875, 1.0809326171875, 1.210968017578125, 1.34100341796875, 1.471038818359375, 1.60107421875, 1.731109619140625, 1.86114501953125, 1.991180419921875, 2.1212158203125, 2.251251220703125, 2.38128662109375, 2.511322021484375, 2.641357421875, 2.771392822265625, 2.90142822265625, 3.031463623046875, 3.1614990234375, 3.291534423828125, 3.42156982421875, 3.551605224609375, 3.681640625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 6.0, 6.0, 6.0, 4.0, 12.0, 14.0, 14.0, 20.0, 21.0, 45.0, 46.0, 79.0, 125.0, 170.0, 228.0, 395.0, 701.0, 1140.0, 1935.0, 3716.0, 6685.0, 12810.0, 26560.0, 60354.0, 182171.0, 480187.0, 163080.0, 56389.0, 24782.0, 12206.0, 6268.0, 3503.0, 1921.0, 1142.0, 652.0, 388.0, 252.0, 168.0, 108.0, 71.0, 54.0, 34.0, 36.0, 20.0, 11.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.68359375, -6.45672607421875, -6.2298583984375, -6.00299072265625, -5.776123046875, -5.54925537109375, -5.3223876953125, -5.09552001953125, -4.86865234375, -4.64178466796875, -4.4149169921875, -4.18804931640625, -3.961181640625, -3.73431396484375, -3.5074462890625, -3.28057861328125, -3.0537109375, -2.82684326171875, -2.5999755859375, -2.37310791015625, -2.146240234375, -1.91937255859375, -1.6925048828125, -1.46563720703125, -1.23876953125, -1.01190185546875, -0.7850341796875, -0.55816650390625, -0.331298828125, -0.10443115234375, 0.1224365234375, 0.34930419921875, 0.576171875, 0.80303955078125, 1.0299072265625, 1.25677490234375, 1.483642578125, 1.71051025390625, 1.9373779296875, 2.16424560546875, 2.39111328125, 2.61798095703125, 2.8448486328125, 3.07171630859375, 3.298583984375, 3.52545166015625, 3.7523193359375, 3.97918701171875, 4.2060546875, 4.43292236328125, 4.6597900390625, 4.88665771484375, 5.113525390625, 5.34039306640625, 5.5672607421875, 5.79412841796875, 6.02099609375, 6.24786376953125, 6.4747314453125, 6.70159912109375, 6.928466796875, 7.15533447265625, 7.3822021484375, 7.60906982421875, 7.8359375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 8.0, 7.0, 11.0, 10.0, 10.0, 30.0, 22.0, 24.0, 40.0, 33.0, 36.0, 29.0, 54.0, 69.0, 69.0, 112.0, 201.0, 1392.0, 252.0, 121.0, 91.0, 76.0, 42.0, 39.0, 31.0, 42.0, 39.0, 25.0, 27.0, 14.0, 19.0, 18.0, 8.0, 14.0, 8.0, 6.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.7734375, -12.3699951171875, -11.966552734375, -11.5631103515625, -11.15966796875, -10.7562255859375, -10.352783203125, -9.9493408203125, -9.5458984375, -9.1424560546875, -8.739013671875, -8.3355712890625, -7.93212890625, -7.5286865234375, -7.125244140625, -6.7218017578125, -6.318359375, -5.9149169921875, -5.511474609375, -5.1080322265625, -4.70458984375, -4.3011474609375, -3.897705078125, -3.4942626953125, -3.0908203125, -2.6873779296875, -2.283935546875, -1.8804931640625, -1.47705078125, -1.0736083984375, -0.670166015625, -0.2667236328125, 0.13671875, 0.5401611328125, 0.943603515625, 1.3470458984375, 1.75048828125, 2.1539306640625, 2.557373046875, 2.9608154296875, 3.3642578125, 3.7677001953125, 4.171142578125, 4.5745849609375, 4.97802734375, 5.3814697265625, 5.784912109375, 6.1883544921875, 6.591796875, 6.9952392578125, 7.398681640625, 7.8021240234375, 8.20556640625, 8.6090087890625, 9.012451171875, 9.4158935546875, 9.8193359375, 10.2227783203125, 10.626220703125, 11.0296630859375, 11.43310546875, 11.8365478515625, 12.239990234375, 12.6434326171875, 13.046875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 4.0, 8.0, 10.0, 14.0, 10.0, 12.0, 27.0, 34.0, 53.0, 76.0, 126.0, 182.0, 264.0, 461.0, 827.0, 2060.0, 7056.0, 37158.0, 412344.0, 2486086.0, 170518.0, 20528.0, 4531.0, 1477.0, 692.0, 416.0, 239.0, 139.0, 97.0, 64.0, 58.0, 28.0, 24.0, 18.0, 12.0, 17.0, 10.0, 6.0, 1.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 4.0], "bins": [-18.9375, -18.4163818359375, -17.895263671875, -17.3741455078125, -16.85302734375, -16.3319091796875, -15.810791015625, -15.2896728515625, -14.7685546875, -14.2474365234375, -13.726318359375, -13.2052001953125, -12.68408203125, -12.1629638671875, -11.641845703125, -11.1207275390625, -10.599609375, -10.0784912109375, -9.557373046875, -9.0362548828125, -8.51513671875, -7.9940185546875, -7.472900390625, -6.9517822265625, -6.4306640625, -5.9095458984375, -5.388427734375, -4.8673095703125, -4.34619140625, -3.8250732421875, -3.303955078125, -2.7828369140625, -2.26171875, -1.7406005859375, -1.219482421875, -0.6983642578125, -0.17724609375, 0.3438720703125, 0.864990234375, 1.3861083984375, 1.9072265625, 2.4283447265625, 2.949462890625, 3.4705810546875, 3.99169921875, 4.5128173828125, 5.033935546875, 5.5550537109375, 6.076171875, 6.5972900390625, 7.118408203125, 7.6395263671875, 8.16064453125, 8.6817626953125, 9.202880859375, 9.7239990234375, 10.2451171875, 10.7662353515625, 11.287353515625, 11.8084716796875, 12.32958984375, 12.8507080078125, 13.371826171875, 13.8929443359375, 14.4140625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 87.0, 509.0, 368.0, 45.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-250.22364807128906, -245.8242950439453, -241.4249267578125, -237.02557373046875, -232.62620544433594, -228.2268524169922, -223.82748413085938, -219.42813110351562, -215.02877807617188, -210.62942504882812, -206.2300567626953, -201.83070373535156, -197.43133544921875, -193.031982421875, -188.6326141357422, -184.23326110839844, -179.83389282226562, -175.43453979492188, -171.03517150878906, -166.6358184814453, -162.2364501953125, -157.83709716796875, -153.43772888183594, -149.0383758544922, -144.63900756835938, -140.23965454101562, -135.8402862548828, -131.44093322753906, -127.04156494140625, -122.6422119140625, -118.24285125732422, -113.84349060058594, -109.44413757324219, -105.0447769165039, -100.64541625976562, -96.24605560302734, -91.84669494628906, -87.44734191894531, -83.04798126220703, -78.64862060546875, -74.24925994873047, -69.84989929199219, -65.4505386352539, -61.05118179321289, -56.65182113647461, -52.25246047973633, -47.85310363769531, -43.45374298095703, -39.05438232421875, -34.65502166748047, -30.25566291809082, -25.856304168701172, -21.45694351196289, -17.05758285522461, -12.658224105834961, -8.258865356445312, -3.8595046997070312, 0.5398550033569336, 4.939214706420898, 9.338574409484863, 13.737934112548828, 18.13729476928711, 22.536653518676758, 26.936012268066406, 31.335372924804688]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 7.0, 5.0, 6.0, 5.0, 6.0, 12.0, 10.0, 17.0, 30.0, 16.0, 20.0, 17.0, 21.0, 33.0, 29.0, 31.0, 17.0, 42.0, 28.0, 35.0, 44.0, 35.0, 37.0, 32.0, 33.0, 41.0, 38.0, 25.0, 46.0, 29.0, 31.0, 31.0, 26.0, 17.0, 17.0, 14.0, 21.0, 17.0, 5.0, 17.0, 12.0, 11.0, 6.0, 7.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0], "bins": [-30.363006591796875, -29.4329833984375, -28.502960205078125, -27.57293701171875, -26.642915725708008, -25.712892532348633, -24.782869338989258, -23.852846145629883, -22.922822952270508, -21.992799758911133, -21.062776565551758, -20.132755279541016, -19.20273208618164, -18.272708892822266, -17.34268569946289, -16.412662506103516, -15.482640266418457, -14.552617073059082, -13.622594833374023, -12.692571640014648, -11.762548446655273, -10.832525253295898, -9.90250301361084, -8.972479820251465, -8.042457580566406, -7.1124348640441895, -6.1824116706848145, -5.252388954162598, -4.322365760803223, -3.392343044281006, -2.462320327758789, -1.532297134399414, -0.6022739410400391, 0.32774895429611206, 1.2577718496322632, 2.1877946853637695, 3.1178176403045654, 4.047840595245361, 4.977863311767578, 5.907886505126953, 6.83790922164917, 7.767931938171387, 8.697955131530762, 9.62797737121582, 10.558000564575195, 11.48802375793457, 12.418046951293945, 13.34807014465332, 14.278092384338379, 15.208115577697754, 16.138137817382812, 17.068161010742188, 17.998184204101562, 18.928207397460938, 19.858230590820312, 20.788253784179688, 21.71827507019043, 22.648298263549805, 23.57832145690918, 24.508342742919922, 25.438365936279297, 26.368389129638672, 27.298412322998047, 28.228435516357422, 29.158458709716797]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 8.0, 11.0, 7.0, 6.0, 17.0, 15.0, 13.0, 13.0, 17.0, 19.0, 26.0, 20.0, 20.0, 36.0, 31.0, 24.0, 41.0, 31.0, 27.0, 37.0, 37.0, 36.0, 35.0, 38.0, 39.0, 39.0, 38.0, 32.0, 33.0, 21.0, 26.0, 19.0, 22.0, 27.0, 19.0, 17.0, 14.0, 13.0, 14.0, 11.0, 5.0, 9.0, 5.0, 5.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.2421875, -4.11468505859375, -3.9871826171875, -3.85968017578125, -3.732177734375, -3.60467529296875, -3.4771728515625, -3.34967041015625, -3.22216796875, -3.09466552734375, -2.9671630859375, -2.83966064453125, -2.712158203125, -2.58465576171875, -2.4571533203125, -2.32965087890625, -2.2021484375, -2.07464599609375, -1.9471435546875, -1.81964111328125, -1.692138671875, -1.56463623046875, -1.4371337890625, -1.30963134765625, -1.18212890625, -1.05462646484375, -0.9271240234375, -0.79962158203125, -0.672119140625, -0.54461669921875, -0.4171142578125, -0.28961181640625, -0.162109375, -0.03460693359375, 0.0928955078125, 0.22039794921875, 0.347900390625, 0.47540283203125, 0.6029052734375, 0.73040771484375, 0.85791015625, 0.98541259765625, 1.1129150390625, 1.24041748046875, 1.367919921875, 1.49542236328125, 1.6229248046875, 1.75042724609375, 1.8779296875, 2.00543212890625, 2.1329345703125, 2.26043701171875, 2.387939453125, 2.51544189453125, 2.6429443359375, 2.77044677734375, 2.89794921875, 3.02545166015625, 3.1529541015625, 3.28045654296875, 3.407958984375, 3.53546142578125, 3.6629638671875, 3.79046630859375, 3.91796875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 9.0, 10.0, 12.0, 24.0, 33.0, 44.0, 63.0, 83.0, 122.0, 187.0, 301.0, 487.0, 887.0, 1822.0, 4047.0, 10502.0, 36558.0, 208679.0, 1468096.0, 2044994.0, 340484.0, 53285.0, 13435.0, 5010.0, 2236.0, 1098.0, 638.0, 388.0, 236.0, 139.0, 93.0, 65.0, 47.0, 41.0, 23.0, 21.0, 12.0, 15.0, 10.0, 4.0, 4.0, 2.0, 7.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.078125, -8.7767333984375, -8.475341796875, -8.1739501953125, -7.87255859375, -7.5711669921875, -7.269775390625, -6.9683837890625, -6.6669921875, -6.3656005859375, -6.064208984375, -5.7628173828125, -5.46142578125, -5.1600341796875, -4.858642578125, -4.5572509765625, -4.255859375, -3.9544677734375, -3.653076171875, -3.3516845703125, -3.05029296875, -2.7489013671875, -2.447509765625, -2.1461181640625, -1.8447265625, -1.5433349609375, -1.241943359375, -0.9405517578125, -0.63916015625, -0.3377685546875, -0.036376953125, 0.2650146484375, 0.56640625, 0.8677978515625, 1.169189453125, 1.4705810546875, 1.77197265625, 2.0733642578125, 2.374755859375, 2.6761474609375, 2.9775390625, 3.2789306640625, 3.580322265625, 3.8817138671875, 4.18310546875, 4.4844970703125, 4.785888671875, 5.0872802734375, 5.388671875, 5.6900634765625, 5.991455078125, 6.2928466796875, 6.59423828125, 6.8956298828125, 7.197021484375, 7.4984130859375, 7.7998046875, 8.1011962890625, 8.402587890625, 8.7039794921875, 9.00537109375, 9.3067626953125, 9.608154296875, 9.9095458984375, 10.2109375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 3.0, 4.0, 12.0, 10.0, 13.0, 18.0, 23.0, 28.0, 26.0, 35.0, 47.0, 50.0, 97.0, 131.0, 180.0, 192.0, 281.0, 373.0, 422.0, 429.0, 422.0, 312.0, 246.0, 150.0, 129.0, 97.0, 67.0, 62.0, 50.0, 38.0, 26.0, 20.0, 16.0, 12.0, 17.0, 6.0, 5.0, 5.0, 7.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.80078125, -5.6025390625, -5.404296875, -5.2060546875, -5.0078125, -4.8095703125, -4.611328125, -4.4130859375, -4.21484375, -4.0166015625, -3.818359375, -3.6201171875, -3.421875, -3.2236328125, -3.025390625, -2.8271484375, -2.62890625, -2.4306640625, -2.232421875, -2.0341796875, -1.8359375, -1.6376953125, -1.439453125, -1.2412109375, -1.04296875, -0.8447265625, -0.646484375, -0.4482421875, -0.25, -0.0517578125, 0.146484375, 0.3447265625, 0.54296875, 0.7412109375, 0.939453125, 1.1376953125, 1.3359375, 1.5341796875, 1.732421875, 1.9306640625, 2.12890625, 2.3271484375, 2.525390625, 2.7236328125, 2.921875, 3.1201171875, 3.318359375, 3.5166015625, 3.71484375, 3.9130859375, 4.111328125, 4.3095703125, 4.5078125, 4.7060546875, 4.904296875, 5.1025390625, 5.30078125, 5.4990234375, 5.697265625, 5.8955078125, 6.09375, 6.2919921875, 6.490234375, 6.6884765625, 6.88671875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 0.0, 5.0, 4.0, 5.0, 9.0, 10.0, 12.0, 27.0, 16.0, 26.0, 30.0, 51.0, 80.0, 100.0, 168.0, 248.0, 411.0, 802.0, 1760.0, 5027.0, 21086.0, 139569.0, 1843245.0, 1999434.0, 150385.0, 22486.0, 5377.0, 1823.0, 860.0, 439.0, 250.0, 148.0, 104.0, 74.0, 54.0, 39.0, 36.0, 23.0, 14.0, 15.0, 8.0, 7.0, 3.0, 3.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-17.40625, -16.9229736328125, -16.439697265625, -15.9564208984375, -15.47314453125, -14.9898681640625, -14.506591796875, -14.0233154296875, -13.5400390625, -13.0567626953125, -12.573486328125, -12.0902099609375, -11.60693359375, -11.1236572265625, -10.640380859375, -10.1571044921875, -9.673828125, -9.1905517578125, -8.707275390625, -8.2239990234375, -7.74072265625, -7.2574462890625, -6.774169921875, -6.2908935546875, -5.8076171875, -5.3243408203125, -4.841064453125, -4.3577880859375, -3.87451171875, -3.3912353515625, -2.907958984375, -2.4246826171875, -1.94140625, -1.4581298828125, -0.974853515625, -0.4915771484375, -0.00830078125, 0.4749755859375, 0.958251953125, 1.4415283203125, 1.9248046875, 2.4080810546875, 2.891357421875, 3.3746337890625, 3.85791015625, 4.3411865234375, 4.824462890625, 5.3077392578125, 5.791015625, 6.2742919921875, 6.757568359375, 7.2408447265625, 7.72412109375, 8.2073974609375, 8.690673828125, 9.1739501953125, 9.6572265625, 10.1405029296875, 10.623779296875, 11.1070556640625, 11.59033203125, 12.0736083984375, 12.556884765625, 13.0401611328125, 13.5234375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 13.0, 63.0, 191.0, 350.0, 259.0, 102.0, 29.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.66197204589844, -52.304664611816406, -48.947357177734375, -45.59005355834961, -42.23274612426758, -38.87543869018555, -35.51813507080078, -32.16082763671875, -28.80352020263672, -25.446212768554688, -22.08890724182129, -18.73160171508789, -15.37429428100586, -12.016986846923828, -8.65968132019043, -5.302375793457031, -1.945068359375, 1.4122381210327148, 4.76954460144043, 8.126851081848145, 11.48415756225586, 14.84146499633789, 18.19877052307129, 21.556076049804688, 24.91338348388672, 28.27069091796875, 31.62799644470215, 34.98530197143555, 38.34260940551758, 41.69991683959961, 45.057220458984375, 48.414527893066406, 51.77183532714844, 55.12914276123047, 58.4864501953125, 61.843753814697266, 65.20106506347656, 68.55836486816406, 71.9156723022461, 75.27297973632812, 78.63028717041016, 81.98759460449219, 85.34490203857422, 88.70220947265625, 92.05950927734375, 95.41682434082031, 98.77412414550781, 102.13143157958984, 105.48873901367188, 108.8460464477539, 112.20335388183594, 115.56066131591797, 118.91796875, 122.2752685546875, 125.63257598876953, 128.98988342285156, 132.34719848632812, 135.70449829101562, 139.0618133544922, 142.4191131591797, 145.77642822265625, 149.13372802734375, 152.4910430908203, 155.8483428955078, 159.2056427001953]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 5.0, 6.0, 7.0, 5.0, 4.0, 9.0, 7.0, 15.0, 14.0, 21.0, 20.0, 19.0, 27.0, 26.0, 34.0, 27.0, 37.0, 34.0, 37.0, 38.0, 35.0, 48.0, 43.0, 38.0, 42.0, 35.0, 38.0, 52.0, 35.0, 31.0, 30.0, 27.0, 21.0, 24.0, 26.0, 12.0, 17.0, 9.0, 14.0, 9.0, 11.0, 5.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.901531219482422, -24.117189407348633, -23.33284568786621, -22.548503875732422, -21.76416015625, -20.97981834411621, -20.195476531982422, -19.4111328125, -18.626789093017578, -17.84244728088379, -17.058103561401367, -16.273761749267578, -15.489418029785156, -14.705076217651367, -13.920733451843262, -13.136390686035156, -12.352048873901367, -11.567706108093262, -10.783363342285156, -9.999021530151367, -9.214677810668945, -8.430335998535156, -7.645993232727051, -6.861650466918945, -6.07730770111084, -5.292964935302734, -4.508622169494629, -3.7242798805236816, -2.939937114715576, -2.1555943489074707, -1.3712520599365234, -0.586909294128418, 0.1974334716796875, 0.9817761182785034, 1.7661187648773193, 2.5504612922668457, 3.334804058074951, 4.119146823883057, 4.903489112854004, 5.687831878662109, 6.472174644470215, 7.25651741027832, 8.040860176086426, 8.825202941894531, 9.60954475402832, 10.393888473510742, 11.178230285644531, 11.962573051452637, 12.746915817260742, 13.531258583068848, 14.315601348876953, 15.099943161010742, 15.884286880493164, 16.668628692626953, 17.452972412109375, 18.237314224243164, 19.021656036376953, 19.805997848510742, 20.590341567993164, 21.374683380126953, 22.159027099609375, 22.943368911743164, 23.727710723876953, 24.512054443359375, 25.296398162841797]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 8.0, 13.0, 10.0, 5.0, 11.0, 9.0, 13.0, 18.0, 9.0, 21.0, 19.0, 17.0, 21.0, 32.0, 25.0, 32.0, 23.0, 44.0, 28.0, 31.0, 41.0, 40.0, 36.0, 42.0, 38.0, 36.0, 36.0, 40.0, 41.0, 19.0, 34.0, 28.0, 24.0, 22.0, 17.0, 15.0, 18.0, 16.0, 8.0, 13.0, 11.0, 9.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.56640625, -4.43212890625, -4.2978515625, -4.16357421875, -4.029296875, -3.89501953125, -3.7607421875, -3.62646484375, -3.4921875, -3.35791015625, -3.2236328125, -3.08935546875, -2.955078125, -2.82080078125, -2.6865234375, -2.55224609375, -2.41796875, -2.28369140625, -2.1494140625, -2.01513671875, -1.880859375, -1.74658203125, -1.6123046875, -1.47802734375, -1.34375, -1.20947265625, -1.0751953125, -0.94091796875, -0.806640625, -0.67236328125, -0.5380859375, -0.40380859375, -0.26953125, -0.13525390625, -0.0009765625, 0.13330078125, 0.267578125, 0.40185546875, 0.5361328125, 0.67041015625, 0.8046875, 0.93896484375, 1.0732421875, 1.20751953125, 1.341796875, 1.47607421875, 1.6103515625, 1.74462890625, 1.87890625, 2.01318359375, 2.1474609375, 2.28173828125, 2.416015625, 2.55029296875, 2.6845703125, 2.81884765625, 2.953125, 3.08740234375, 3.2216796875, 3.35595703125, 3.490234375, 3.62451171875, 3.7587890625, 3.89306640625, 4.02734375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 17.0, 19.0, 21.0, 36.0, 50.0, 70.0, 95.0, 134.0, 217.0, 349.0, 500.0, 642.0, 992.0, 1479.0, 2147.0, 3254.0, 4769.0, 7232.0, 10630.0, 16475.0, 24964.0, 39789.0, 66783.0, 120375.0, 252705.0, 221679.0, 107766.0, 60248.0, 36537.0, 23065.0, 15085.0, 9913.0, 6745.0, 4512.0, 2954.0, 1979.0, 1412.0, 908.0, 590.0, 466.0, 306.0, 191.0, 137.0, 103.0, 75.0, 37.0, 33.0, 22.0, 22.0, 5.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.156982421875, -0.15221214294433594, -0.14744186401367188, -0.1426715850830078, -0.13790130615234375, -0.1331310272216797, -0.12836074829101562, -0.12359046936035156, -0.1188201904296875, -0.11404991149902344, -0.10927963256835938, -0.10450935363769531, -0.09973907470703125, -0.09496879577636719, -0.09019851684570312, -0.08542823791503906, -0.080657958984375, -0.07588768005371094, -0.07111740112304688, -0.06634712219238281, -0.06157684326171875, -0.05680656433105469, -0.052036285400390625, -0.04726600646972656, -0.0424957275390625, -0.03772544860839844, -0.032955169677734375, -0.028184890747070312, -0.02341461181640625, -0.018644332885742188, -0.013874053955078125, -0.009103775024414062, -0.00433349609375, 0.0004367828369140625, 0.005207061767578125, 0.009977340698242188, 0.01474761962890625, 0.019517898559570312, 0.024288177490234375, 0.029058456420898438, 0.0338287353515625, 0.03859901428222656, 0.043369293212890625, 0.04813957214355469, 0.05290985107421875, 0.05768013000488281, 0.062450408935546875, 0.06722068786621094, 0.071990966796875, 0.07676124572753906, 0.08153152465820312, 0.08630180358886719, 0.09107208251953125, 0.09584236145019531, 0.10061264038085938, 0.10538291931152344, 0.1101531982421875, 0.11492347717285156, 0.11969375610351562, 0.12446403503417969, 0.12923431396484375, 0.1340045928955078, 0.13877487182617188, 0.14354515075683594, 0.1483154296875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 4.0, 3.0, 9.0, 14.0, 9.0, 10.0, 15.0, 19.0, 24.0, 15.0, 24.0, 24.0, 34.0, 39.0, 32.0, 32.0, 38.0, 34.0, 41.0, 29.0, 38.0, 1056.0, 38.0, 41.0, 47.0, 38.0, 41.0, 34.0, 28.0, 24.0, 17.0, 20.0, 21.0, 14.0, 15.0, 13.0, 16.0, 12.0, 13.0, 6.0, 9.0, 5.0, 12.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4921875, -3.383758544921875, -3.27532958984375, -3.166900634765625, -3.0584716796875, -2.950042724609375, -2.84161376953125, -2.733184814453125, -2.624755859375, -2.516326904296875, -2.40789794921875, -2.299468994140625, -2.1910400390625, -2.082611083984375, -1.97418212890625, -1.865753173828125, -1.75732421875, -1.648895263671875, -1.54046630859375, -1.432037353515625, -1.3236083984375, -1.215179443359375, -1.10675048828125, -0.998321533203125, -0.889892578125, -0.781463623046875, -0.67303466796875, -0.564605712890625, -0.4561767578125, -0.347747802734375, -0.23931884765625, -0.130889892578125, -0.0224609375, 0.085968017578125, 0.19439697265625, 0.302825927734375, 0.4112548828125, 0.519683837890625, 0.62811279296875, 0.736541748046875, 0.844970703125, 0.953399658203125, 1.06182861328125, 1.170257568359375, 1.2786865234375, 1.387115478515625, 1.49554443359375, 1.603973388671875, 1.71240234375, 1.820831298828125, 1.92926025390625, 2.037689208984375, 2.1461181640625, 2.254547119140625, 2.36297607421875, 2.471405029296875, 2.579833984375, 2.688262939453125, 2.79669189453125, 2.905120849609375, 3.0135498046875, 3.121978759765625, 3.23040771484375, 3.338836669921875, 3.447265625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 8.0, 4.0, 11.0, 21.0, 30.0, 46.0, 66.0, 87.0, 131.0, 201.0, 312.0, 411.0, 594.0, 903.0, 1406.0, 2067.0, 2996.0, 4286.0, 6288.0, 9321.0, 14073.0, 21696.0, 34385.0, 55239.0, 94115.0, 175796.0, 1300306.0, 150478.0, 83028.0, 49185.0, 30456.0, 19474.0, 13070.0, 8712.0, 6034.0, 3901.0, 2505.0, 1703.0, 1175.0, 827.0, 577.0, 408.0, 251.0, 174.0, 128.0, 74.0, 54.0, 42.0, 27.0, 15.0, 15.0, 9.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0], "bins": [-0.0672607421875, -0.06518363952636719, -0.06310653686523438, -0.06102943420410156, -0.05895233154296875, -0.05687522888183594, -0.054798126220703125, -0.05272102355957031, -0.0506439208984375, -0.04856681823730469, -0.046489715576171875, -0.04441261291503906, -0.04233551025390625, -0.04025840759277344, -0.038181304931640625, -0.03610420227050781, -0.034027099609375, -0.03194999694824219, -0.029872894287109375, -0.027795791625976562, -0.02571868896484375, -0.023641586303710938, -0.021564483642578125, -0.019487380981445312, -0.0174102783203125, -0.015333175659179688, -0.013256072998046875, -0.011178970336914062, -0.00910186767578125, -0.0070247650146484375, -0.004947662353515625, -0.0028705596923828125, -0.00079345703125, 0.0012836456298828125, 0.003360748291015625, 0.0054378509521484375, 0.00751495361328125, 0.009592056274414062, 0.011669158935546875, 0.013746261596679688, 0.0158233642578125, 0.017900466918945312, 0.019977569580078125, 0.022054672241210938, 0.02413177490234375, 0.026208877563476562, 0.028285980224609375, 0.030363082885742188, 0.032440185546875, 0.03451728820800781, 0.036594390869140625, 0.03867149353027344, 0.04074859619140625, 0.04282569885253906, 0.044902801513671875, 0.04697990417480469, 0.0490570068359375, 0.05113410949707031, 0.053211212158203125, 0.05528831481933594, 0.05736541748046875, 0.05944252014160156, 0.061519622802734375, 0.06359672546386719, 0.065673828125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 11.0, 5.0, 6.0, 7.0, 9.0, 13.0, 17.0, 16.0, 19.0, 17.0, 10.0, 33.0, 37.0, 56.0, 76.0, 108.0, 125.0, 127.0, 61.0, 52.0, 43.0, 27.0, 15.0, 16.0, 14.0, 12.0, 3.0, 9.0, 8.0, 4.0, 6.0, 4.0, 3.0, 3.0, 4.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0003745555877685547, -0.00036362186074256897, -0.00035268813371658325, -0.00034175440669059753, -0.0003308206796646118, -0.0003198869526386261, -0.0003089532256126404, -0.00029801949858665466, -0.00028708577156066895, -0.00027615204453468323, -0.0002652183175086975, -0.0002542845904827118, -0.00024335086345672607, -0.00023241713643074036, -0.00022148340940475464, -0.00021054968237876892, -0.0001996159553527832, -0.00018868222832679749, -0.00017774850130081177, -0.00016681477427482605, -0.00015588104724884033, -0.00014494732022285461, -0.0001340135931968689, -0.00012307986617088318, -0.00011214613914489746, -0.00010121241211891174, -9.027868509292603e-05, -7.934495806694031e-05, -6.841123104095459e-05, -5.747750401496887e-05, -4.6543776988983154e-05, -3.5610049962997437e-05, -2.467632293701172e-05, -1.3742595911026001e-05, -2.808868885040283e-06, 8.124858140945435e-06, 1.9058585166931152e-05, 2.999231219291687e-05, 4.092603921890259e-05, 5.1859766244888306e-05, 6.279349327087402e-05, 7.372722029685974e-05, 8.466094732284546e-05, 9.559467434883118e-05, 0.0001065284013748169, 0.00011746212840080261, 0.00012839585542678833, 0.00013932958245277405, 0.00015026330947875977, 0.00016119703650474548, 0.0001721307635307312, 0.00018306449055671692, 0.00019399821758270264, 0.00020493194460868835, 0.00021586567163467407, 0.0002267993986606598, 0.0002377331256866455, 0.0002486668527126312, 0.00025960057973861694, 0.00027053430676460266, 0.0002814680337905884, 0.0002924017608165741, 0.0003033354878425598, 0.00031426921486854553, 0.00032520294189453125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 5.0, 9.0, 7.0, 6.0, 18.0, 17.0, 22.0, 37.0, 67.0, 120.0, 244.0, 2139.0, 776753.0, 267178.0, 1378.0, 200.0, 104.0, 54.0, 26.0, 23.0, 18.0, 18.0, 17.0, 12.0, 9.0, 6.0, 5.0, 8.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00846099853515625, -0.008178353309631348, -0.007895708084106445, -0.007613062858581543, -0.007330417633056641, -0.007047772407531738, -0.006765127182006836, -0.006482481956481934, -0.006199836730957031, -0.005917191505432129, -0.0056345462799072266, -0.005351901054382324, -0.005069255828857422, -0.0047866106033325195, -0.004503965377807617, -0.004221320152282715, -0.0039386749267578125, -0.00365602970123291, -0.003373384475708008, -0.0030907392501831055, -0.002808094024658203, -0.0025254487991333008, -0.0022428035736083984, -0.001960158348083496, -0.0016775131225585938, -0.0013948678970336914, -0.001112222671508789, -0.0008295774459838867, -0.0005469322204589844, -0.00026428699493408203, 1.8358230590820312e-05, 0.00030100345611572266, 0.000583648681640625, 0.0008662939071655273, 0.0011489391326904297, 0.001431584358215332, 0.0017142295837402344, 0.0019968748092651367, 0.002279520034790039, 0.0025621652603149414, 0.0028448104858398438, 0.003127455711364746, 0.0034101009368896484, 0.0036927461624145508, 0.003975391387939453, 0.0042580366134643555, 0.004540681838989258, 0.00482332706451416, 0.0051059722900390625, 0.005388617515563965, 0.005671262741088867, 0.0059539079666137695, 0.006236553192138672, 0.006519198417663574, 0.0068018436431884766, 0.007084488868713379, 0.007367134094238281, 0.007649779319763184, 0.007932424545288086, 0.008215069770812988, 0.00849771499633789, 0.008780360221862793, 0.009063005447387695, 0.009345650672912598, 0.0096282958984375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 13.0, 32.0, 122.0, 371.0, 344.0, 97.0, 22.0, 10.0, 5.0, 0.0, 1.0], "bins": [-0.0019118670606985688, -0.001878263894468546, -0.001844660728238523, -0.0018110575620085, -0.0017774543957784772, -0.0017438512295484543, -0.0017102480633184314, -0.0016766448970884085, -0.0016430417308583856, -0.0016094385646283627, -0.0015758353983983397, -0.0015422322321683168, -0.001508629065938294, -0.001475025899708271, -0.0014414227334782481, -0.0014078195672482252, -0.0013742165174335241, -0.0013406133512035012, -0.0013070101849734783, -0.0012734070187434554, -0.0012398038525134325, -0.0012062006862834096, -0.0011725975200533867, -0.0011389943538233638, -0.0011053911875933409, -0.001071788021363318, -0.001038184855133295, -0.0010045816889032722, -0.0009709785226732492, -0.0009373753564432263, -0.0009037721902132034, -0.0008701690239831805, -0.0008365659159608185, -0.0008029627497307956, -0.0007693595835007727, -0.0007357564172707498, -0.0007021532510407269, -0.000668550084810704, -0.000634946976788342, -0.0006013438105583191, -0.0005677405861206353, -0.0005341374198906124, -0.0005005342536605895, -0.00046693108743056655, -0.00043332792120054364, -0.00039972475497052073, -0.0003661216178443283, -0.0003325184516143054, -0.0002989153144881129, -0.00026531214825809, -0.0002317089820280671, -0.00019810583034995943, -0.00016450266411993653, -0.00013089949788991362, -9.729634621180594e-05, -6.369317998178303e-05, -3.0089999199844897e-05, 3.5131633921992034e-06, 3.7116325984243304e-05, 7.07194849383086e-05, 0.0001043226511683315, 0.0001379258173983544, 0.0001715289690764621, 0.000205132135306485, 0.0002387353015365079]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 10.0, 11.0, 11.0, 18.0, 18.0, 18.0, 19.0, 26.0, 25.0, 32.0, 37.0, 36.0, 45.0, 36.0, 36.0, 34.0, 56.0, 44.0, 41.0, 38.0, 30.0, 45.0, 30.0, 29.0, 25.0, 29.0, 21.0, 23.0, 32.0, 23.0, 21.0, 12.0, 13.0, 10.0, 6.0, 8.0, 4.0, 8.0, 7.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.00018358230590820312, -0.00017814245074987411, -0.0001727025955915451, -0.0001672627404332161, -0.00016182288527488708, -0.00015638303011655807, -0.00015094317495822906, -0.00014550331979990005, -0.00014006346464157104, -0.00013462360948324203, -0.00012918375432491302, -0.00012374389916658401, -0.000118304044008255, -0.000112864188849926, -0.00010742433369159698, -0.00010198447853326797, -9.654462337493896e-05, -9.110476821660995e-05, -8.566491305828094e-05, -8.022505789995193e-05, -7.478520274162292e-05, -6.934534758329391e-05, -6.39054924249649e-05, -5.8465637266635895e-05, -5.3025782108306885e-05, -4.7585926949977875e-05, -4.2146071791648865e-05, -3.6706216633319855e-05, -3.1266361474990845e-05, -2.5826506316661835e-05, -2.0386651158332825e-05, -1.4946796000003815e-05, -9.506940841674805e-06, -4.067085683345795e-06, 1.3727694749832153e-06, 6.812624633312225e-06, 1.2252479791641235e-05, 1.7692334949970245e-05, 2.3132190108299255e-05, 2.8572045266628265e-05, 3.4011900424957275e-05, 3.9451755583286285e-05, 4.4891610741615295e-05, 5.0331465899944305e-05, 5.5771321058273315e-05, 6.121117621660233e-05, 6.665103137493134e-05, 7.209088653326035e-05, 7.753074169158936e-05, 8.297059684991837e-05, 8.841045200824738e-05, 9.385030716657639e-05, 9.92901623249054e-05, 0.0001047300174832344, 0.00011016987264156342, 0.00011560972779989243, 0.00012104958295822144, 0.00012648943811655045, 0.00013192929327487946, 0.00013736914843320847, 0.00014280900359153748, 0.00014824885874986649, 0.0001536887139081955, 0.0001591285690665245, 0.00016456842422485352]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 8.0, 13.0, 10.0, 5.0, 11.0, 9.0, 13.0, 18.0, 9.0, 21.0, 19.0, 17.0, 21.0, 32.0, 25.0, 32.0, 23.0, 44.0, 28.0, 31.0, 41.0, 40.0, 36.0, 42.0, 38.0, 36.0, 36.0, 40.0, 41.0, 19.0, 34.0, 28.0, 24.0, 22.0, 17.0, 16.0, 17.0, 16.0, 8.0, 13.0, 11.0, 9.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.56640625, -4.43212890625, -4.2978515625, -4.16357421875, -4.029296875, -3.89501953125, -3.7607421875, -3.62646484375, -3.4921875, -3.35791015625, -3.2236328125, -3.08935546875, -2.955078125, -2.82080078125, -2.6865234375, -2.55224609375, -2.41796875, -2.28369140625, -2.1494140625, -2.01513671875, -1.880859375, -1.74658203125, -1.6123046875, -1.47802734375, -1.34375, -1.20947265625, -1.0751953125, -0.94091796875, -0.806640625, -0.67236328125, -0.5380859375, -0.40380859375, -0.26953125, -0.13525390625, -0.0009765625, 0.13330078125, 0.267578125, 0.40185546875, 0.5361328125, 0.67041015625, 0.8046875, 0.93896484375, 1.0732421875, 1.20751953125, 1.341796875, 1.47607421875, 1.6103515625, 1.74462890625, 1.87890625, 2.01318359375, 2.1474609375, 2.28173828125, 2.416015625, 2.55029296875, 2.6845703125, 2.81884765625, 2.953125, 3.08740234375, 3.2216796875, 3.35595703125, 3.490234375, 3.62451171875, 3.7587890625, 3.89306640625, 4.02734375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 6.0, 21.0, 15.0, 32.0, 39.0, 51.0, 79.0, 145.0, 204.0, 270.0, 426.0, 576.0, 851.0, 1321.0, 1877.0, 2814.0, 4212.0, 6554.0, 10138.0, 15775.0, 25844.0, 41298.0, 69659.0, 119766.0, 189829.0, 205443.0, 139415.0, 81699.0, 48792.0, 29395.0, 18343.0, 11556.0, 7391.0, 4910.0, 3151.0, 2118.0, 1523.0, 971.0, 652.0, 437.0, 318.0, 222.0, 130.0, 104.0, 60.0, 39.0, 21.0, 19.0, 15.0, 12.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-5.125, -4.97039794921875, -4.8157958984375, -4.66119384765625, -4.506591796875, -4.35198974609375, -4.1973876953125, -4.04278564453125, -3.88818359375, -3.73358154296875, -3.5789794921875, -3.42437744140625, -3.269775390625, -3.11517333984375, -2.9605712890625, -2.80596923828125, -2.6513671875, -2.49676513671875, -2.3421630859375, -2.18756103515625, -2.032958984375, -1.87835693359375, -1.7237548828125, -1.56915283203125, -1.41455078125, -1.25994873046875, -1.1053466796875, -0.95074462890625, -0.796142578125, -0.64154052734375, -0.4869384765625, -0.33233642578125, -0.177734375, -0.02313232421875, 0.1314697265625, 0.28607177734375, 0.440673828125, 0.59527587890625, 0.7498779296875, 0.90447998046875, 1.05908203125, 1.21368408203125, 1.3682861328125, 1.52288818359375, 1.677490234375, 1.83209228515625, 1.9866943359375, 2.14129638671875, 2.2958984375, 2.45050048828125, 2.6051025390625, 2.75970458984375, 2.914306640625, 3.06890869140625, 3.2235107421875, 3.37811279296875, 3.53271484375, 3.68731689453125, 3.8419189453125, 3.99652099609375, 4.151123046875, 4.30572509765625, 4.4603271484375, 4.61492919921875, 4.76953125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 12.0, 1.0, 4.0, 9.0, 10.0, 7.0, 12.0, 7.0, 10.0, 15.0, 14.0, 24.0, 32.0, 31.0, 27.0, 34.0, 49.0, 48.0, 57.0, 70.0, 102.0, 139.0, 199.0, 1263.0, 193.0, 153.0, 104.0, 63.0, 54.0, 52.0, 41.0, 31.0, 28.0, 23.0, 19.0, 20.0, 11.0, 18.0, 10.0, 15.0, 8.0, 6.0, 7.0, 6.0, 4.0, 3.0, 3.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-12.296875, -11.9183349609375, -11.539794921875, -11.1612548828125, -10.78271484375, -10.4041748046875, -10.025634765625, -9.6470947265625, -9.2685546875, -8.8900146484375, -8.511474609375, -8.1329345703125, -7.75439453125, -7.3758544921875, -6.997314453125, -6.6187744140625, -6.240234375, -5.8616943359375, -5.483154296875, -5.1046142578125, -4.72607421875, -4.3475341796875, -3.968994140625, -3.5904541015625, -3.2119140625, -2.8333740234375, -2.454833984375, -2.0762939453125, -1.69775390625, -1.3192138671875, -0.940673828125, -0.5621337890625, -0.18359375, 0.1949462890625, 0.573486328125, 0.9520263671875, 1.33056640625, 1.7091064453125, 2.087646484375, 2.4661865234375, 2.8447265625, 3.2232666015625, 3.601806640625, 3.9803466796875, 4.35888671875, 4.7374267578125, 5.115966796875, 5.4945068359375, 5.873046875, 6.2515869140625, 6.630126953125, 7.0086669921875, 7.38720703125, 7.7657470703125, 8.144287109375, 8.5228271484375, 8.9013671875, 9.2799072265625, 9.658447265625, 10.0369873046875, 10.41552734375, 10.7940673828125, 11.172607421875, 11.5511474609375, 11.9296875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 7.0, 11.0, 12.0, 17.0, 19.0, 28.0, 33.0, 54.0, 78.0, 82.0, 126.0, 150.0, 228.0, 311.0, 450.0, 722.0, 1243.0, 2136.0, 4468.0, 10167.0, 27395.0, 94993.0, 506575.0, 1917699.0, 446380.0, 86990.0, 25913.0, 9643.0, 4216.0, 2175.0, 1150.0, 709.0, 440.0, 286.0, 215.0, 152.0, 110.0, 67.0, 61.0, 42.0, 36.0, 30.0, 15.0, 21.0, 16.0, 9.0, 5.0, 9.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.65625, -11.2972412109375, -10.938232421875, -10.5792236328125, -10.22021484375, -9.8612060546875, -9.502197265625, -9.1431884765625, -8.7841796875, -8.4251708984375, -8.066162109375, -7.7071533203125, -7.34814453125, -6.9891357421875, -6.630126953125, -6.2711181640625, -5.912109375, -5.5531005859375, -5.194091796875, -4.8350830078125, -4.47607421875, -4.1170654296875, -3.758056640625, -3.3990478515625, -3.0400390625, -2.6810302734375, -2.322021484375, -1.9630126953125, -1.60400390625, -1.2449951171875, -0.885986328125, -0.5269775390625, -0.16796875, 0.1910400390625, 0.550048828125, 0.9090576171875, 1.26806640625, 1.6270751953125, 1.986083984375, 2.3450927734375, 2.7041015625, 3.0631103515625, 3.422119140625, 3.7811279296875, 4.14013671875, 4.4991455078125, 4.858154296875, 5.2171630859375, 5.576171875, 5.9351806640625, 6.294189453125, 6.6531982421875, 7.01220703125, 7.3712158203125, 7.730224609375, 8.0892333984375, 8.4482421875, 8.8072509765625, 9.166259765625, 9.5252685546875, 9.88427734375, 10.2432861328125, 10.602294921875, 10.9613037109375, 11.3203125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 13.0, 107.0, 491.0, 338.0, 49.0, 13.0, 3.0, 0.0, 0.0, 1.0], "bins": [-445.2985534667969, -437.456787109375, -429.6150207519531, -421.7732238769531, -413.93145751953125, -406.0896911621094, -398.2479248046875, -390.4061279296875, -382.5643615722656, -374.72259521484375, -366.8808288574219, -359.0390319824219, -351.197265625, -343.3554992675781, -335.51373291015625, -327.67193603515625, -319.8301696777344, -311.9884033203125, -304.1466369628906, -296.3048400878906, -288.46307373046875, -280.6213073730469, -272.779541015625, -264.937744140625, -257.0959777832031, -249.25421142578125, -241.4124298095703, -233.57066345214844, -225.7288818359375, -217.88711547851562, -210.0453338623047, -202.2035675048828, -194.36180114746094, -186.52003479003906, -178.67825317382812, -170.83648681640625, -162.9947052001953, -155.15293884277344, -147.3111572265625, -139.46939086914062, -131.6276092529297, -123.78583526611328, -115.94406127929688, -108.10228729248047, -100.26051330566406, -92.41874694824219, -84.57696533203125, -76.73519897460938, -68.89341735839844, -61.05164337158203, -53.209869384765625, -45.36809539794922, -37.52632141113281, -29.684551239013672, -21.842777252197266, -14.00100326538086, -6.159233093261719, 1.6825404167175293, 9.524313926696777, 17.366086959838867, 25.207860946655273, 33.04963302612305, 40.89140701293945, 48.73318099975586, 56.574954986572266]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 8.0, 5.0, 13.0, 4.0, 6.0, 16.0, 11.0, 16.0, 12.0, 21.0, 24.0, 24.0, 27.0, 29.0, 18.0, 44.0, 31.0, 37.0, 29.0, 40.0, 34.0, 37.0, 37.0, 61.0, 38.0, 39.0, 47.0, 31.0, 38.0, 28.0, 30.0, 23.0, 23.0, 22.0, 21.0, 14.0, 9.0, 9.0, 13.0, 6.0, 7.0, 2.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.93986129760742, -31.80710792541504, -30.674354553222656, -29.54159927368164, -28.408845901489258, -27.276092529296875, -26.14333724975586, -25.010583877563477, -23.877830505371094, -22.74507713317871, -21.612323760986328, -20.479568481445312, -19.34681510925293, -18.214061737060547, -17.08130645751953, -15.948553085327148, -14.815799713134766, -13.683046340942383, -12.550292015075684, -11.417537689208984, -10.284784317016602, -9.152030944824219, -8.01927661895752, -6.8865227699279785, -5.7537689208984375, -4.6210150718688965, -3.4882612228393555, -2.3555073738098145, -1.2227535247802734, -0.08999967575073242, 1.0427541732788086, 2.1755080223083496, 3.308258056640625, 4.441011905670166, 5.573765754699707, 6.706519603729248, 7.839273452758789, 8.972026824951172, 10.104781150817871, 11.23753547668457, 12.370288848876953, 13.503042221069336, 14.635796546936035, 15.768550872802734, 16.901304244995117, 18.0340576171875, 19.166812896728516, 20.2995662689209, 21.43231964111328, 22.565073013305664, 23.697826385498047, 24.830581665039062, 25.963335037231445, 27.096088409423828, 28.228843688964844, 29.361597061157227, 30.49435043334961, 31.627103805541992, 32.759857177734375, 33.89261245727539, 35.025367736816406, 36.158119201660156, 37.29087448120117, 38.42362594604492, 39.55638122558594]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 6.0, 4.0, 6.0, 8.0, 10.0, 12.0, 8.0, 8.0, 9.0, 20.0, 18.0, 18.0, 21.0, 19.0, 28.0, 23.0, 21.0, 33.0, 36.0, 34.0, 37.0, 30.0, 43.0, 43.0, 31.0, 26.0, 33.0, 47.0, 30.0, 35.0, 22.0, 37.0, 21.0, 26.0, 26.0, 19.0, 27.0, 19.0, 17.0, 15.0, 8.0, 7.0, 6.0, 14.0, 7.0, 7.0, 6.0, 3.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-4.6640625, -4.52679443359375, -4.3895263671875, -4.25225830078125, -4.114990234375, -3.97772216796875, -3.8404541015625, -3.70318603515625, -3.56591796875, -3.42864990234375, -3.2913818359375, -3.15411376953125, -3.016845703125, -2.87957763671875, -2.7423095703125, -2.60504150390625, -2.4677734375, -2.33050537109375, -2.1932373046875, -2.05596923828125, -1.918701171875, -1.78143310546875, -1.6441650390625, -1.50689697265625, -1.36962890625, -1.23236083984375, -1.0950927734375, -0.95782470703125, -0.820556640625, -0.68328857421875, -0.5460205078125, -0.40875244140625, -0.271484375, -0.13421630859375, 0.0030517578125, 0.14031982421875, 0.277587890625, 0.41485595703125, 0.5521240234375, 0.68939208984375, 0.82666015625, 0.96392822265625, 1.1011962890625, 1.23846435546875, 1.375732421875, 1.51300048828125, 1.6502685546875, 1.78753662109375, 1.9248046875, 2.06207275390625, 2.1993408203125, 2.33660888671875, 2.473876953125, 2.61114501953125, 2.7484130859375, 2.88568115234375, 3.02294921875, 3.16021728515625, 3.2974853515625, 3.43475341796875, 3.572021484375, 3.70928955078125, 3.8465576171875, 3.98382568359375, 4.12109375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 11.0, 8.0, 14.0, 19.0, 28.0, 44.0, 54.0, 72.0, 119.0, 147.0, 203.0, 270.0, 423.0, 576.0, 818.0, 1190.0, 1882.0, 2849.0, 4956.0, 8802.0, 18863.0, 50128.0, 185571.0, 855820.0, 2080893.0, 734155.0, 162894.0, 44920.0, 17290.0, 8303.0, 4652.0, 2832.0, 1705.0, 1173.0, 787.0, 521.0, 376.0, 255.0, 185.0, 148.0, 100.0, 60.0, 52.0, 27.0, 24.0, 9.0, 18.0, 9.0, 8.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.703125, -7.45819091796875, -7.2132568359375, -6.96832275390625, -6.723388671875, -6.47845458984375, -6.2335205078125, -5.98858642578125, -5.74365234375, -5.49871826171875, -5.2537841796875, -5.00885009765625, -4.763916015625, -4.51898193359375, -4.2740478515625, -4.02911376953125, -3.7841796875, -3.53924560546875, -3.2943115234375, -3.04937744140625, -2.804443359375, -2.55950927734375, -2.3145751953125, -2.06964111328125, -1.82470703125, -1.57977294921875, -1.3348388671875, -1.08990478515625, -0.844970703125, -0.60003662109375, -0.3551025390625, -0.11016845703125, 0.134765625, 0.37969970703125, 0.6246337890625, 0.86956787109375, 1.114501953125, 1.35943603515625, 1.6043701171875, 1.84930419921875, 2.09423828125, 2.33917236328125, 2.5841064453125, 2.82904052734375, 3.073974609375, 3.31890869140625, 3.5638427734375, 3.80877685546875, 4.0537109375, 4.29864501953125, 4.5435791015625, 4.78851318359375, 5.033447265625, 5.27838134765625, 5.5233154296875, 5.76824951171875, 6.01318359375, 6.25811767578125, 6.5030517578125, 6.74798583984375, 6.992919921875, 7.23785400390625, 7.4827880859375, 7.72772216796875, 7.97265625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 6.0, 7.0, 14.0, 7.0, 11.0, 15.0, 18.0, 32.0, 54.0, 59.0, 74.0, 107.0, 179.0, 252.0, 393.0, 505.0, 682.0, 554.0, 379.0, 251.0, 127.0, 102.0, 65.0, 52.0, 31.0, 28.0, 16.0, 17.0, 10.0, 8.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8125, -9.5098876953125, -9.207275390625, -8.9046630859375, -8.60205078125, -8.2994384765625, -7.996826171875, -7.6942138671875, -7.3916015625, -7.0889892578125, -6.786376953125, -6.4837646484375, -6.18115234375, -5.8785400390625, -5.575927734375, -5.2733154296875, -4.970703125, -4.6680908203125, -4.365478515625, -4.0628662109375, -3.76025390625, -3.4576416015625, -3.155029296875, -2.8524169921875, -2.5498046875, -2.2471923828125, -1.944580078125, -1.6419677734375, -1.33935546875, -1.0367431640625, -0.734130859375, -0.4315185546875, -0.12890625, 0.1737060546875, 0.476318359375, 0.7789306640625, 1.08154296875, 1.3841552734375, 1.686767578125, 1.9893798828125, 2.2919921875, 2.5946044921875, 2.897216796875, 3.1998291015625, 3.50244140625, 3.8050537109375, 4.107666015625, 4.4102783203125, 4.712890625, 5.0155029296875, 5.318115234375, 5.6207275390625, 5.92333984375, 6.2259521484375, 6.528564453125, 6.8311767578125, 7.1337890625, 7.4364013671875, 7.739013671875, 8.0416259765625, 8.34423828125, 8.6468505859375, 8.949462890625, 9.2520751953125, 9.5546875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 5.0, 16.0, 30.0, 47.0, 75.0, 117.0, 188.0, 327.0, 628.0, 1079.0, 2504.0, 6608.0, 23828.0, 167610.0, 2979044.0, 928226.0, 62954.0, 13081.0, 4184.0, 1781.0, 861.0, 442.0, 267.0, 135.0, 91.0, 48.0, 37.0, 26.0, 10.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.96875, -20.3291015625, -19.689453125, -19.0498046875, -18.41015625, -17.7705078125, -17.130859375, -16.4912109375, -15.8515625, -15.2119140625, -14.572265625, -13.9326171875, -13.29296875, -12.6533203125, -12.013671875, -11.3740234375, -10.734375, -10.0947265625, -9.455078125, -8.8154296875, -8.17578125, -7.5361328125, -6.896484375, -6.2568359375, -5.6171875, -4.9775390625, -4.337890625, -3.6982421875, -3.05859375, -2.4189453125, -1.779296875, -1.1396484375, -0.5, 0.1396484375, 0.779296875, 1.4189453125, 2.05859375, 2.6982421875, 3.337890625, 3.9775390625, 4.6171875, 5.2568359375, 5.896484375, 6.5361328125, 7.17578125, 7.8154296875, 8.455078125, 9.0947265625, 9.734375, 10.3740234375, 11.013671875, 11.6533203125, 12.29296875, 12.9326171875, 13.572265625, 14.2119140625, 14.8515625, 15.4912109375, 16.130859375, 16.7705078125, 17.41015625, 18.0498046875, 18.689453125, 19.3291015625, 19.96875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [3.0, 16.0, 60.0, 348.0, 424.0, 137.0, 23.0, 7.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.02175521850586, -17.56312370300293, -12.104493141174316, -6.645862579345703, -1.1872310638427734, 4.271400451660156, 9.730030059814453, 15.188663482666016, 20.647293090820312, 26.105924606323242, 31.564556121826172, 37.02318572998047, 42.48181915283203, 47.94044876098633, 53.399078369140625, 58.85771179199219, 64.31634521484375, 69.77497863769531, 75.23360443115234, 80.6922378540039, 86.15087127685547, 91.6094970703125, 97.06813049316406, 102.52676391601562, 107.98538970947266, 113.44402313232422, 118.90264892578125, 124.36128234863281, 129.81991577148438, 135.27854919433594, 140.7371826171875, 146.19580078125, 151.65443420410156, 157.11306762695312, 162.5717010498047, 168.03033447265625, 173.48895263671875, 178.9475860595703, 184.40621948242188, 189.86485290527344, 195.323486328125, 200.78211975097656, 206.24075317382812, 211.69937133789062, 217.1580047607422, 222.61663818359375, 228.0752716064453, 233.53390502929688, 238.99252319335938, 244.45115661621094, 249.9097900390625, 255.368408203125, 260.8270568847656, 266.2856750488281, 271.74432373046875, 277.20294189453125, 282.6615905761719, 288.1202087402344, 293.578857421875, 299.0374755859375, 304.4961242675781, 309.9547424316406, 315.41339111328125, 320.87200927734375, 326.33062744140625]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 3.0, 7.0, 6.0, 7.0, 8.0, 9.0, 11.0, 20.0, 21.0, 20.0, 24.0, 28.0, 22.0, 27.0, 28.0, 38.0, 35.0, 43.0, 37.0, 49.0, 54.0, 38.0, 46.0, 44.0, 40.0, 35.0, 30.0, 36.0, 33.0, 25.0, 28.0, 28.0, 16.0, 11.0, 16.0, 10.0, 13.0, 8.0, 9.0, 7.0, 7.0, 9.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.29015350341797, -26.372365951538086, -25.454578399658203, -24.536788940429688, -23.619001388549805, -22.701213836669922, -21.78342628479004, -20.865638732910156, -19.94784927368164, -19.030061721801758, -18.112274169921875, -17.19448471069336, -16.276697158813477, -15.358909606933594, -14.441122055053711, -13.523334503173828, -12.605546951293945, -11.687759399414062, -10.769970893859863, -9.85218334197998, -8.934394836425781, -8.016607284545898, -7.098819732666016, -6.181031703948975, -5.263243675231934, -4.345455646514893, -3.4276678562164307, -2.5098800659179688, -1.5920920372009277, -0.6743040084838867, 0.2434835433959961, 1.161271572113037, 2.079059600830078, 2.996847629547119, 3.914635419845581, 4.832423210144043, 5.750211238861084, 6.667999267578125, 7.585786819458008, 8.50357437133789, 9.42136287689209, 10.339150428771973, 11.256938934326172, 12.174726486206055, 13.092514038085938, 14.010302543640137, 14.92809009552002, 15.845878601074219, 16.7636661529541, 17.681453704833984, 18.599241256713867, 19.51702880859375, 20.434818267822266, 21.35260581970215, 22.27039337158203, 23.188180923461914, 24.105968475341797, 25.02375602722168, 25.941543579101562, 26.859333038330078, 27.77712059020996, 28.694908142089844, 29.612695693969727, 30.53048324584961, 31.448272705078125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 7.0, 6.0, 9.0, 12.0, 21.0, 17.0, 23.0, 20.0, 35.0, 23.0, 30.0, 35.0, 35.0, 29.0, 41.0, 33.0, 41.0, 33.0, 51.0, 39.0, 37.0, 33.0, 38.0, 37.0, 36.0, 30.0, 26.0, 27.0, 32.0, 32.0, 21.0, 18.0, 16.0, 10.0, 10.0, 6.0, 12.0, 3.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5625, -5.400146484375, -5.23779296875, -5.075439453125, -4.9130859375, -4.750732421875, -4.58837890625, -4.426025390625, -4.263671875, -4.101318359375, -3.93896484375, -3.776611328125, -3.6142578125, -3.451904296875, -3.28955078125, -3.127197265625, -2.96484375, -2.802490234375, -2.64013671875, -2.477783203125, -2.3154296875, -2.153076171875, -1.99072265625, -1.828369140625, -1.666015625, -1.503662109375, -1.34130859375, -1.178955078125, -1.0166015625, -0.854248046875, -0.69189453125, -0.529541015625, -0.3671875, -0.204833984375, -0.04248046875, 0.119873046875, 0.2822265625, 0.444580078125, 0.60693359375, 0.769287109375, 0.931640625, 1.093994140625, 1.25634765625, 1.418701171875, 1.5810546875, 1.743408203125, 1.90576171875, 2.068115234375, 2.23046875, 2.392822265625, 2.55517578125, 2.717529296875, 2.8798828125, 3.042236328125, 3.20458984375, 3.366943359375, 3.529296875, 3.691650390625, 3.85400390625, 4.016357421875, 4.1787109375, 4.341064453125, 4.50341796875, 4.665771484375, 4.828125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 5.0, 5.0, 10.0, 20.0, 23.0, 47.0, 47.0, 66.0, 110.0, 146.0, 198.0, 281.0, 455.0, 673.0, 932.0, 1283.0, 1884.0, 2638.0, 3964.0, 5737.0, 8309.0, 11807.0, 17408.0, 25686.0, 38718.0, 59696.0, 94983.0, 161028.0, 221048.0, 142178.0, 85234.0, 53966.0, 35153.0, 23267.0, 15762.0, 11014.0, 7736.0, 5168.0, 3605.0, 2540.0, 1689.0, 1268.0, 871.0, 612.0, 404.0, 260.0, 184.0, 144.0, 99.0, 62.0, 49.0, 34.0, 17.0, 16.0, 14.0, 8.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.140380859375, -0.1359081268310547, -0.13143539428710938, -0.12696266174316406, -0.12248992919921875, -0.11801719665527344, -0.11354446411132812, -0.10907173156738281, -0.1045989990234375, -0.10012626647949219, -0.09565353393554688, -0.09118080139160156, -0.08670806884765625, -0.08223533630371094, -0.07776260375976562, -0.07328987121582031, -0.068817138671875, -0.06434440612792969, -0.059871673583984375, -0.05539894104003906, -0.05092620849609375, -0.04645347595214844, -0.041980743408203125, -0.03750801086425781, -0.0330352783203125, -0.028562545776367188, -0.024089813232421875, -0.019617080688476562, -0.01514434814453125, -0.010671615600585938, -0.006198883056640625, -0.0017261505126953125, 0.00274658203125, 0.0072193145751953125, 0.011692047119140625, 0.016164779663085938, 0.02063751220703125, 0.025110244750976562, 0.029582977294921875, 0.03405570983886719, 0.0385284423828125, 0.04300117492675781, 0.047473907470703125, 0.05194664001464844, 0.05641937255859375, 0.06089210510253906, 0.06536483764648438, 0.06983757019042969, 0.074310302734375, 0.07878303527832031, 0.08325576782226562, 0.08772850036621094, 0.09220123291015625, 0.09667396545410156, 0.10114669799804688, 0.10561943054199219, 0.1100921630859375, 0.11456489562988281, 0.11903762817382812, 0.12351036071777344, 0.12798309326171875, 0.13245582580566406, 0.13692855834960938, 0.1414012908935547, 0.1458740234375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 12.0, 9.0, 9.0, 8.0, 23.0, 7.0, 27.0, 21.0, 18.0, 19.0, 24.0, 36.0, 29.0, 22.0, 49.0, 25.0, 40.0, 35.0, 34.0, 1070.0, 56.0, 37.0, 42.0, 49.0, 36.0, 23.0, 35.0, 38.0, 33.0, 17.0, 25.0, 12.0, 17.0, 9.0, 13.0, 13.0, 6.0, 8.0, 11.0, 3.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0], "bins": [-4.46875, -4.33966064453125, -4.2105712890625, -4.08148193359375, -3.952392578125, -3.82330322265625, -3.6942138671875, -3.56512451171875, -3.43603515625, -3.30694580078125, -3.1778564453125, -3.04876708984375, -2.919677734375, -2.79058837890625, -2.6614990234375, -2.53240966796875, -2.4033203125, -2.27423095703125, -2.1451416015625, -2.01605224609375, -1.886962890625, -1.75787353515625, -1.6287841796875, -1.49969482421875, -1.37060546875, -1.24151611328125, -1.1124267578125, -0.98333740234375, -0.854248046875, -0.72515869140625, -0.5960693359375, -0.46697998046875, -0.337890625, -0.20880126953125, -0.0797119140625, 0.04937744140625, 0.178466796875, 0.30755615234375, 0.4366455078125, 0.56573486328125, 0.69482421875, 0.82391357421875, 0.9530029296875, 1.08209228515625, 1.211181640625, 1.34027099609375, 1.4693603515625, 1.59844970703125, 1.7275390625, 1.85662841796875, 1.9857177734375, 2.11480712890625, 2.243896484375, 2.37298583984375, 2.5020751953125, 2.63116455078125, 2.76025390625, 2.88934326171875, 3.0184326171875, 3.14752197265625, 3.276611328125, 3.40570068359375, 3.5347900390625, 3.66387939453125, 3.79296875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 10.0, 11.0, 22.0, 31.0, 23.0, 55.0, 77.0, 101.0, 153.0, 176.0, 282.0, 394.0, 523.0, 805.0, 1070.0, 1625.0, 2154.0, 3116.0, 4411.0, 6118.0, 8910.0, 12948.0, 19168.0, 28479.0, 44137.0, 71601.0, 123191.0, 1200283.0, 256551.0, 115251.0, 67271.0, 41893.0, 27159.0, 17954.0, 12331.0, 8596.0, 5958.0, 4213.0, 2830.0, 2080.0, 1478.0, 1073.0, 709.0, 572.0, 399.0, 287.0, 199.0, 141.0, 104.0, 64.0, 44.0, 36.0, 27.0, 19.0, 11.0, 6.0, 5.0, 2.0, 5.0], "bins": [-0.07073974609375, -0.06859207153320312, -0.06644439697265625, -0.06429672241210938, -0.0621490478515625, -0.060001373291015625, -0.05785369873046875, -0.055706024169921875, -0.053558349609375, -0.051410675048828125, -0.04926300048828125, -0.047115325927734375, -0.0449676513671875, -0.042819976806640625, -0.04067230224609375, -0.038524627685546875, -0.036376953125, -0.034229278564453125, -0.03208160400390625, -0.029933929443359375, -0.0277862548828125, -0.025638580322265625, -0.02349090576171875, -0.021343231201171875, -0.019195556640625, -0.017047882080078125, -0.01490020751953125, -0.012752532958984375, -0.0106048583984375, -0.008457183837890625, -0.00630950927734375, -0.004161834716796875, -0.00201416015625, 0.000133514404296875, 0.00228118896484375, 0.004428863525390625, 0.0065765380859375, 0.008724212646484375, 0.01087188720703125, 0.013019561767578125, 0.015167236328125, 0.017314910888671875, 0.01946258544921875, 0.021610260009765625, 0.0237579345703125, 0.025905609130859375, 0.02805328369140625, 0.030200958251953125, 0.0323486328125, 0.034496307373046875, 0.03664398193359375, 0.038791656494140625, 0.0409393310546875, 0.043087005615234375, 0.04523468017578125, 0.047382354736328125, 0.049530029296875, 0.051677703857421875, 0.05382537841796875, 0.055973052978515625, 0.0581207275390625, 0.060268402099609375, 0.06241607666015625, 0.06456375122070312, 0.06671142578125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 5.0, 7.0, 8.0, 6.0, 7.0, 12.0, 9.0, 18.0, 21.0, 46.0, 67.0, 92.0, 149.0, 169.0, 109.0, 84.0, 47.0, 32.0, 22.0, 10.0, 15.0, 12.0, 5.0, 5.0, 6.0, 5.0, 10.0, 2.0, 5.0, 3.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007557868957519531, -0.0007337108254432678, -0.0007116347551345825, -0.0006895586848258972, -0.0006674826145172119, -0.0006454065442085266, -0.0006233304738998413, -0.000601254403591156, -0.0005791783332824707, -0.0005571022629737854, -0.0005350261926651001, -0.0005129501223564148, -0.0004908740520477295, -0.0004687979817390442, -0.0004467219114303589, -0.0004246458411216736, -0.0004025697708129883, -0.000380493700504303, -0.0003584176301956177, -0.0003363415598869324, -0.00031426548957824707, -0.00029218941926956177, -0.00027011334896087646, -0.00024803727865219116, -0.00022596120834350586, -0.00020388513803482056, -0.00018180906772613525, -0.00015973299741744995, -0.00013765692710876465, -0.00011558085680007935, -9.350478649139404e-05, -7.142871618270874e-05, -4.935264587402344e-05, -2.7276575565338135e-05, -5.200505256652832e-06, 1.687556505203247e-05, 3.8951635360717773e-05, 6.1027705669403076e-05, 8.310377597808838e-05, 0.00010517984628677368, 0.00012725591659545898, 0.0001493319869041443, 0.0001714080572128296, 0.0001934841275215149, 0.0002155601978302002, 0.0002376362681388855, 0.0002597123384475708, 0.0002817884087562561, 0.0003038644790649414, 0.0003259405493736267, 0.000348016619682312, 0.0003700926899909973, 0.0003921687602996826, 0.0004142448306083679, 0.0004363209009170532, 0.0004583969712257385, 0.00048047304153442383, 0.0005025491118431091, 0.0005246251821517944, 0.0005467012524604797, 0.000568777322769165, 0.0005908533930778503, 0.0006129294633865356, 0.000635005533695221, 0.0006570816040039062]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 5.0, 2.0, 10.0, 2.0, 7.0, 7.0, 6.0, 11.0, 19.0, 17.0, 37.0, 75.0, 113.0, 304.0, 1730.0, 985389.0, 59750.0, 592.0, 209.0, 111.0, 47.0, 27.0, 16.0, 16.0, 7.0, 4.0, 9.0, 6.0, 7.0, 3.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01580810546875, -0.015277624130249023, -0.014747142791748047, -0.01421666145324707, -0.013686180114746094, -0.013155698776245117, -0.01262521743774414, -0.012094736099243164, -0.011564254760742188, -0.011033773422241211, -0.010503292083740234, -0.009972810745239258, -0.009442329406738281, -0.008911848068237305, -0.008381366729736328, -0.007850885391235352, -0.007320404052734375, -0.0067899227142333984, -0.006259441375732422, -0.005728960037231445, -0.005198478698730469, -0.004667997360229492, -0.004137516021728516, -0.003607034683227539, -0.0030765533447265625, -0.002546072006225586, -0.0020155906677246094, -0.0014851093292236328, -0.0009546279907226562, -0.0004241466522216797, 0.00010633468627929688, 0.0006368160247802734, 0.00116729736328125, 0.0016977787017822266, 0.002228260040283203, 0.0027587413787841797, 0.0032892227172851562, 0.003819704055786133, 0.004350185394287109, 0.004880666732788086, 0.0054111480712890625, 0.005941629409790039, 0.006472110748291016, 0.007002592086791992, 0.007533073425292969, 0.008063554763793945, 0.008594036102294922, 0.009124517440795898, 0.009654998779296875, 0.010185480117797852, 0.010715961456298828, 0.011246442794799805, 0.011776924133300781, 0.012307405471801758, 0.012837886810302734, 0.013368368148803711, 0.013898849487304688, 0.014429330825805664, 0.01495981216430664, 0.015490293502807617, 0.016020774841308594, 0.01655125617980957, 0.017081737518310547, 0.017612218856811523, 0.0181427001953125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 42.0, 599.0, 341.0, 28.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016375152627006173, -0.0015273196622729301, -0.001417124061845243, -0.0013069284614175558, -0.0011967328609898686, -0.0010865372605621815, -0.0009763416019268334, -0.0008661460014991462, -0.0007559504010714591, -0.0006457548006437719, -0.0005355592002160847, -0.0004253635706845671, -0.0003151679702568799, -0.0002049723407253623, -9.477674029767513e-05, 1.5418860130012035e-05, 0.0001256144605576992, 0.00023581006098538637, 0.00034600566141307354, 0.00045620129094459116, 0.0005663968622684479, 0.000676592520903796, 0.0007867881213314831, 0.0008969837217591703, 0.0010071792639791965, 0.0011173748644068837, 0.0012275704648345709, 0.001337766065262258, 0.0014479616656899452, 0.0015581573825329542, 0.0016683528665453196, 0.0017785485833883286, 0.0018887443002313375, 0.0019989400170743465, 0.002109135501086712, 0.002219331217929721, 0.0023295267019420862, 0.002439722418785095, 0.0025499179027974606, 0.0026601136196404696, 0.002770309103652835, 0.002880504820495844, 0.0029907003045082092, 0.0031008960213512182, 0.0032110915053635836, 0.0033212872222065926, 0.003431482706218958, 0.003541678423061967, 0.003651874139904976, 0.003762069856747985, 0.0038722653407603502, 0.003982461057603359, 0.0040926565416157246, 0.00420285202562809, 0.0043130479753017426, 0.004423243459314108, 0.004533438943326473, 0.004643634427338839, 0.004753830377012491, 0.004864025861024857, 0.004974221345037222, 0.005084416829049587, 0.00519461277872324, 0.005304808262735605, 0.005415003746747971]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 8.0, 10.0, 11.0, 15.0, 10.0, 17.0, 27.0, 32.0, 30.0, 49.0, 36.0, 47.0, 41.0, 45.0, 56.0, 51.0, 53.0, 55.0, 47.0, 41.0, 45.0, 41.0, 46.0, 42.0, 32.0, 20.0, 21.0, 20.0, 14.0, 8.0, 10.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002808570861816406, -0.0002685869112610817, -0.00025631673634052277, -0.00024404656141996384, -0.0002317763864994049, -0.00021950621157884598, -0.00020723603665828705, -0.00019496586173772812, -0.0001826956868171692, -0.00017042551189661026, -0.00015815533697605133, -0.0001458851620554924, -0.00013361498713493347, -0.00012134481221437454, -0.00010907463729381561, -9.680446237325668e-05, -8.453428745269775e-05, -7.226411253213882e-05, -5.9993937611579895e-05, -4.7723762691020966e-05, -3.5453587770462036e-05, -2.3183412849903107e-05, -1.0913237929344177e-05, 1.3569369912147522e-06, 1.3627111911773682e-05, 2.589728683233261e-05, 3.816746175289154e-05, 5.043763667345047e-05, 6.27078115940094e-05, 7.497798651456833e-05, 8.724816143512726e-05, 9.951833635568619e-05, 0.00011178851127624512, 0.00012405868619680405, 0.00013632886111736298, 0.0001485990360379219, 0.00016086921095848083, 0.00017313938587903976, 0.0001854095607995987, 0.00019767973572015762, 0.00020994991064071655, 0.00022222008556127548, 0.0002344902604818344, 0.00024676043540239334, 0.00025903061032295227, 0.0002713007852435112, 0.00028357096016407013, 0.00029584113508462906, 0.000308111310005188, 0.0003203814849257469, 0.00033265165984630585, 0.0003449218347668648, 0.0003571920096874237, 0.00036946218460798264, 0.00038173235952854156, 0.0003940025344491005, 0.0004062727093696594, 0.00041854288429021835, 0.0004308130592107773, 0.0004430832341313362, 0.00045535340905189514, 0.00046762358397245407, 0.000479893758893013, 0.0004921639338135719, 0.0005044341087341309]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 7.0, 6.0, 9.0, 12.0, 21.0, 17.0, 23.0, 20.0, 35.0, 23.0, 30.0, 35.0, 35.0, 29.0, 41.0, 33.0, 41.0, 33.0, 51.0, 39.0, 37.0, 33.0, 38.0, 37.0, 36.0, 30.0, 26.0, 27.0, 32.0, 32.0, 21.0, 18.0, 16.0, 10.0, 10.0, 6.0, 12.0, 3.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5625, -5.400146484375, -5.23779296875, -5.075439453125, -4.9130859375, -4.750732421875, -4.58837890625, -4.426025390625, -4.263671875, -4.101318359375, -3.93896484375, -3.776611328125, -3.6142578125, -3.451904296875, -3.28955078125, -3.127197265625, -2.96484375, -2.802490234375, -2.64013671875, -2.477783203125, -2.3154296875, -2.153076171875, -1.99072265625, -1.828369140625, -1.666015625, -1.503662109375, -1.34130859375, -1.178955078125, -1.0166015625, -0.854248046875, -0.69189453125, -0.529541015625, -0.3671875, -0.204833984375, -0.04248046875, 0.119873046875, 0.2822265625, 0.444580078125, 0.60693359375, 0.769287109375, 0.931640625, 1.093994140625, 1.25634765625, 1.418701171875, 1.5810546875, 1.743408203125, 1.90576171875, 2.068115234375, 2.23046875, 2.392822265625, 2.55517578125, 2.717529296875, 2.8798828125, 3.042236328125, 3.20458984375, 3.366943359375, 3.529296875, 3.691650390625, 3.85400390625, 4.016357421875, 4.1787109375, 4.341064453125, 4.50341796875, 4.665771484375, 4.828125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 11.0, 26.0, 23.0, 36.0, 69.0, 78.0, 132.0, 223.0, 320.0, 450.0, 709.0, 997.0, 1588.0, 2590.0, 3951.0, 6320.0, 10119.0, 15997.0, 24858.0, 40777.0, 71067.0, 142353.0, 288369.0, 204338.0, 96239.0, 52505.0, 31271.0, 19390.0, 12306.0, 7859.0, 4909.0, 3117.0, 1961.0, 1223.0, 844.0, 515.0, 335.0, 189.0, 145.0, 110.0, 67.0, 56.0, 34.0, 24.0, 12.0, 15.0, 9.0, 3.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.75286865234375, -5.5526123046875, -5.35235595703125, -5.152099609375, -4.95184326171875, -4.7515869140625, -4.55133056640625, -4.35107421875, -4.15081787109375, -3.9505615234375, -3.75030517578125, -3.550048828125, -3.34979248046875, -3.1495361328125, -2.94927978515625, -2.7490234375, -2.54876708984375, -2.3485107421875, -2.14825439453125, -1.947998046875, -1.74774169921875, -1.5474853515625, -1.34722900390625, -1.14697265625, -0.94671630859375, -0.7464599609375, -0.54620361328125, -0.345947265625, -0.14569091796875, 0.0545654296875, 0.25482177734375, 0.455078125, 0.65533447265625, 0.8555908203125, 1.05584716796875, 1.256103515625, 1.45635986328125, 1.6566162109375, 1.85687255859375, 2.05712890625, 2.25738525390625, 2.4576416015625, 2.65789794921875, 2.858154296875, 3.05841064453125, 3.2586669921875, 3.45892333984375, 3.6591796875, 3.85943603515625, 4.0596923828125, 4.25994873046875, 4.460205078125, 4.66046142578125, 4.8607177734375, 5.06097412109375, 5.26123046875, 5.46148681640625, 5.6617431640625, 5.86199951171875, 6.062255859375, 6.26251220703125, 6.4627685546875, 6.66302490234375, 6.86328125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 15.0, 10.0, 20.0, 11.0, 27.0, 35.0, 37.0, 30.0, 39.0, 45.0, 34.0, 60.0, 78.0, 112.0, 168.0, 231.0, 1293.0, 186.0, 121.0, 76.0, 68.0, 48.0, 47.0, 45.0, 28.0, 38.0, 28.0, 22.0, 19.0, 16.0, 17.0, 11.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.546875, -17.073974609375, -16.60107421875, -16.128173828125, -15.6552734375, -15.182373046875, -14.70947265625, -14.236572265625, -13.763671875, -13.290771484375, -12.81787109375, -12.344970703125, -11.8720703125, -11.399169921875, -10.92626953125, -10.453369140625, -9.98046875, -9.507568359375, -9.03466796875, -8.561767578125, -8.0888671875, -7.615966796875, -7.14306640625, -6.670166015625, -6.197265625, -5.724365234375, -5.25146484375, -4.778564453125, -4.3056640625, -3.832763671875, -3.35986328125, -2.886962890625, -2.4140625, -1.941162109375, -1.46826171875, -0.995361328125, -0.5224609375, -0.049560546875, 0.42333984375, 0.896240234375, 1.369140625, 1.842041015625, 2.31494140625, 2.787841796875, 3.2607421875, 3.733642578125, 4.20654296875, 4.679443359375, 5.15234375, 5.625244140625, 6.09814453125, 6.571044921875, 7.0439453125, 7.516845703125, 7.98974609375, 8.462646484375, 8.935546875, 9.408447265625, 9.88134765625, 10.354248046875, 10.8271484375, 11.300048828125, 11.77294921875, 12.245849609375, 12.71875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 7.0, 6.0, 3.0, 10.0, 10.0, 18.0, 22.0, 31.0, 54.0, 66.0, 110.0, 163.0, 223.0, 329.0, 462.0, 663.0, 1015.0, 1803.0, 3364.0, 7640.0, 22644.0, 92216.0, 897734.0, 1914844.0, 150484.0, 31920.0, 9869.0, 4151.0, 2104.0, 1292.0, 759.0, 518.0, 341.0, 244.0, 168.0, 126.0, 76.0, 70.0, 39.0, 28.0, 25.0, 16.0, 17.0, 9.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.671875, -16.136474609375, -15.60107421875, -15.065673828125, -14.5302734375, -13.994873046875, -13.45947265625, -12.924072265625, -12.388671875, -11.853271484375, -11.31787109375, -10.782470703125, -10.2470703125, -9.711669921875, -9.17626953125, -8.640869140625, -8.10546875, -7.570068359375, -7.03466796875, -6.499267578125, -5.9638671875, -5.428466796875, -4.89306640625, -4.357666015625, -3.822265625, -3.286865234375, -2.75146484375, -2.216064453125, -1.6806640625, -1.145263671875, -0.60986328125, -0.074462890625, 0.4609375, 0.996337890625, 1.53173828125, 2.067138671875, 2.6025390625, 3.137939453125, 3.67333984375, 4.208740234375, 4.744140625, 5.279541015625, 5.81494140625, 6.350341796875, 6.8857421875, 7.421142578125, 7.95654296875, 8.491943359375, 9.02734375, 9.562744140625, 10.09814453125, 10.633544921875, 11.1689453125, 11.704345703125, 12.23974609375, 12.775146484375, 13.310546875, 13.845947265625, 14.38134765625, 14.916748046875, 15.4521484375, 15.987548828125, 16.52294921875, 17.058349609375, 17.59375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 29.0, 46.0, 177.0, 383.0, 245.0, 86.0, 20.0, 17.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-220.758544921875, -214.1777801513672, -207.59701538085938, -201.01625061035156, -194.43548583984375, -187.854736328125, -181.2739715576172, -174.69320678710938, -168.11244201660156, -161.53167724609375, -154.95091247558594, -148.37014770507812, -141.78939819335938, -135.2086181640625, -128.62786865234375, -122.04710388183594, -115.46633911132812, -108.88557434082031, -102.3048095703125, -95.72405242919922, -89.1432876586914, -82.5625228881836, -75.98176574707031, -69.4010009765625, -62.82023620605469, -56.239471435546875, -49.65871047973633, -43.07794952392578, -36.49718475341797, -29.916419982910156, -23.33565902709961, -16.754898071289062, -10.174118041992188, -3.593355178833008, 2.987407684326172, 9.568170547485352, 16.14893341064453, 22.729698181152344, 29.31045913696289, 35.89122009277344, 42.47198486328125, 49.05274963378906, 55.63351058959961, 62.214271545410156, 68.79503631591797, 75.37580108642578, 81.95655822753906, 88.53732299804688, 95.11808776855469, 101.6988525390625, 108.27961730957031, 114.8603744506836, 121.4411392211914, 128.02191162109375, 134.6026611328125, 141.1834259033203, 147.76419067382812, 154.34495544433594, 160.92572021484375, 167.50648498535156, 174.08724975585938, 180.66799926757812, 187.24876403808594, 193.82952880859375, 200.41029357910156]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [5.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 8.0, 6.0, 4.0, 12.0, 20.0, 10.0, 14.0, 25.0, 24.0, 15.0, 29.0, 29.0, 20.0, 36.0, 38.0, 26.0, 50.0, 48.0, 43.0, 37.0, 23.0, 35.0, 38.0, 39.0, 34.0, 30.0, 29.0, 45.0, 32.0, 18.0, 37.0, 29.0, 25.0, 14.0, 18.0, 15.0, 8.0, 9.0, 5.0, 5.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.59511947631836, -36.26951599121094, -34.943912506103516, -33.618309020996094, -32.29270935058594, -30.967103958129883, -29.641502380371094, -28.315898895263672, -26.99029541015625, -25.664691925048828, -24.339088439941406, -23.013486862182617, -21.687883377075195, -20.362279891967773, -19.036678314208984, -17.711074829101562, -16.38547134399414, -15.059867858886719, -13.734265327453613, -12.408662796020508, -11.083059310913086, -9.757455825805664, -8.431853294372559, -7.106250762939453, -5.780647277832031, -4.455044269561768, -3.129441261291504, -1.8038382530212402, -0.47823524475097656, 0.8473677635192871, 2.172970771789551, 3.4985733032226562, 4.8241729736328125, 6.149775981903076, 7.47537899017334, 8.800981521606445, 10.126585006713867, 11.452188491821289, 12.777791023254395, 14.1033935546875, 15.428997039794922, 16.754600524902344, 18.080204010009766, 19.405805587768555, 20.731409072875977, 22.0570125579834, 23.382614135742188, 24.70821762084961, 26.03382110595703, 27.359424591064453, 28.685028076171875, 30.010629653930664, 31.336233139038086, 32.661834716796875, 33.9874382019043, 35.31304168701172, 36.63864517211914, 37.96424865722656, 39.289852142333984, 40.615455627441406, 41.94105529785156, 43.266658782958984, 44.592262268066406, 45.91786575317383, 47.24346923828125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 2.0, 3.0, 10.0, 7.0, 16.0, 6.0, 16.0, 16.0, 10.0, 23.0, 23.0, 25.0, 18.0, 36.0, 34.0, 32.0, 34.0, 31.0, 32.0, 34.0, 41.0, 42.0, 31.0, 32.0, 47.0, 39.0, 31.0, 31.0, 39.0, 39.0, 38.0, 18.0, 30.0, 24.0, 10.0, 16.0, 23.0, 15.0, 11.0, 6.0, 8.0, 1.0, 10.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.890625, -5.71673583984375, -5.5428466796875, -5.36895751953125, -5.195068359375, -5.02117919921875, -4.8472900390625, -4.67340087890625, -4.49951171875, -4.32562255859375, -4.1517333984375, -3.97784423828125, -3.803955078125, -3.63006591796875, -3.4561767578125, -3.28228759765625, -3.1083984375, -2.93450927734375, -2.7606201171875, -2.58673095703125, -2.412841796875, -2.23895263671875, -2.0650634765625, -1.89117431640625, -1.71728515625, -1.54339599609375, -1.3695068359375, -1.19561767578125, -1.021728515625, -0.84783935546875, -0.6739501953125, -0.50006103515625, -0.326171875, -0.15228271484375, 0.0216064453125, 0.19549560546875, 0.369384765625, 0.54327392578125, 0.7171630859375, 0.89105224609375, 1.06494140625, 1.23883056640625, 1.4127197265625, 1.58660888671875, 1.760498046875, 1.93438720703125, 2.1082763671875, 2.28216552734375, 2.4560546875, 2.62994384765625, 2.8038330078125, 2.97772216796875, 3.151611328125, 3.32550048828125, 3.4993896484375, 3.67327880859375, 3.84716796875, 4.02105712890625, 4.1949462890625, 4.36883544921875, 4.542724609375, 4.71661376953125, 4.8905029296875, 5.06439208984375, 5.23828125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 5.0, 5.0, 13.0, 15.0, 23.0, 23.0, 36.0, 45.0, 58.0, 86.0, 127.0, 189.0, 338.0, 647.0, 1914.0, 8705.0, 169969.0, 3963731.0, 40889.0, 4867.0, 1270.0, 501.0, 272.0, 179.0, 80.0, 76.0, 58.0, 46.0, 29.0, 17.0, 18.0, 13.0, 13.0, 9.0, 3.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.375, -45.81298828125, -44.2509765625, -42.68896484375, -41.126953125, -39.56494140625, -38.0029296875, -36.44091796875, -34.87890625, -33.31689453125, -31.7548828125, -30.19287109375, -28.630859375, -27.06884765625, -25.5068359375, -23.94482421875, -22.3828125, -20.82080078125, -19.2587890625, -17.69677734375, -16.134765625, -14.57275390625, -13.0107421875, -11.44873046875, -9.88671875, -8.32470703125, -6.7626953125, -5.20068359375, -3.638671875, -2.07666015625, -0.5146484375, 1.04736328125, 2.609375, 4.17138671875, 5.7333984375, 7.29541015625, 8.857421875, 10.41943359375, 11.9814453125, 13.54345703125, 15.10546875, 16.66748046875, 18.2294921875, 19.79150390625, 21.353515625, 22.91552734375, 24.4775390625, 26.03955078125, 27.6015625, 29.16357421875, 30.7255859375, 32.28759765625, 33.849609375, 35.41162109375, 36.9736328125, 38.53564453125, 40.09765625, 41.65966796875, 43.2216796875, 44.78369140625, 46.345703125, 47.90771484375, 49.4697265625, 51.03173828125, 52.59375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 21.0, 17.0, 58.0, 79.0, 164.0, 334.0, 715.0, 1436.0, 720.0, 249.0, 112.0, 75.0, 33.0, 21.0, 7.0, 8.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.328125, -13.593017578125, -12.85791015625, -12.122802734375, -11.3876953125, -10.652587890625, -9.91748046875, -9.182373046875, -8.447265625, -7.712158203125, -6.97705078125, -6.241943359375, -5.5068359375, -4.771728515625, -4.03662109375, -3.301513671875, -2.56640625, -1.831298828125, -1.09619140625, -0.361083984375, 0.3740234375, 1.109130859375, 1.84423828125, 2.579345703125, 3.314453125, 4.049560546875, 4.78466796875, 5.519775390625, 6.2548828125, 6.989990234375, 7.72509765625, 8.460205078125, 9.1953125, 9.930419921875, 10.66552734375, 11.400634765625, 12.1357421875, 12.870849609375, 13.60595703125, 14.341064453125, 15.076171875, 15.811279296875, 16.54638671875, 17.281494140625, 18.0166015625, 18.751708984375, 19.48681640625, 20.221923828125, 20.95703125, 21.692138671875, 22.42724609375, 23.162353515625, 23.8974609375, 24.632568359375, 25.36767578125, 26.102783203125, 26.837890625, 27.572998046875, 28.30810546875, 29.043212890625, 29.7783203125, 30.513427734375, 31.24853515625, 31.983642578125, 32.71875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 10.0, 12.0, 22.0, 27.0, 68.0, 163.0, 394.0, 938.0, 3039.0, 15951.0, 1631968.0, 2519084.0, 17629.0, 3273.0, 1018.0, 362.0, 150.0, 71.0, 44.0, 19.0, 18.0, 8.0, 10.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.71875, -41.81982421875, -39.9208984375, -38.02197265625, -36.123046875, -34.22412109375, -32.3251953125, -30.42626953125, -28.52734375, -26.62841796875, -24.7294921875, -22.83056640625, -20.931640625, -19.03271484375, -17.1337890625, -15.23486328125, -13.3359375, -11.43701171875, -9.5380859375, -7.63916015625, -5.740234375, -3.84130859375, -1.9423828125, -0.04345703125, 1.85546875, 3.75439453125, 5.6533203125, 7.55224609375, 9.451171875, 11.35009765625, 13.2490234375, 15.14794921875, 17.046875, 18.94580078125, 20.8447265625, 22.74365234375, 24.642578125, 26.54150390625, 28.4404296875, 30.33935546875, 32.23828125, 34.13720703125, 36.0361328125, 37.93505859375, 39.833984375, 41.73291015625, 43.6318359375, 45.53076171875, 47.4296875, 49.32861328125, 51.2275390625, 53.12646484375, 55.025390625, 56.92431640625, 58.8232421875, 60.72216796875, 62.62109375, 64.52001953125, 66.4189453125, 68.31787109375, 70.216796875, 72.11572265625, 74.0146484375, 75.91357421875, 77.8125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [2.0, 105.0, 740.0, 170.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.89746856689453, -22.230972290039062, -8.564477920532227, 5.102016448974609, 18.768512725830078, 32.43500518798828, 46.10150146484375, 59.76799774169922, 73.43449401855469, 87.10099029541016, 100.76748657226562, 114.43397521972656, 128.10047912597656, 141.7669677734375, 155.4334716796875, 169.09996032714844, 182.76644897460938, 196.4329376220703, 210.0994415283203, 223.76593017578125, 237.43243408203125, 251.0989227294922, 264.7654113769531, 278.4319152832031, 292.0984191894531, 305.7649230957031, 319.431396484375, 333.097900390625, 346.764404296875, 360.430908203125, 374.0973815917969, 387.7638854980469, 401.4303894042969, 415.0968933105469, 428.76336669921875, 442.42987060546875, 456.09637451171875, 469.76287841796875, 483.4293518066406, 497.0958557128906, 510.7623596191406, 524.4288330078125, 538.0953369140625, 551.7618408203125, 565.4283447265625, 579.0948486328125, 592.7613525390625, 606.4278564453125, 620.0942993164062, 633.7608032226562, 647.4273071289062, 661.0938110351562, 674.76025390625, 688.4267578125, 702.09326171875, 715.759765625, 729.42626953125, 743.0927734375, 756.75927734375, 770.42578125, 784.0922241210938, 797.7587280273438, 811.4252319335938, 825.0917358398438, 838.7582397460938]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 8.0, 7.0, 12.0, 10.0, 11.0, 10.0, 20.0, 26.0, 22.0, 30.0, 30.0, 42.0, 44.0, 38.0, 54.0, 51.0, 53.0, 44.0, 31.0, 36.0, 38.0, 34.0, 44.0, 45.0, 33.0, 38.0, 23.0, 29.0, 21.0, 31.0, 15.0, 16.0, 13.0, 6.0, 5.0, 11.0, 7.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.707557678222656, -38.42266845703125, -37.13777542114258, -35.852882385253906, -34.5679931640625, -33.283103942871094, -31.998210906982422, -30.713319778442383, -29.428428649902344, -28.143537521362305, -26.858646392822266, -25.573755264282227, -24.288864135742188, -23.00397300720215, -21.71908187866211, -20.43419075012207, -19.14929962158203, -17.864408493041992, -16.579517364501953, -15.294626235961914, -14.009735107421875, -12.724843978881836, -11.439952850341797, -10.155061721801758, -8.870170593261719, -7.58527946472168, -6.300388336181641, -5.015497207641602, -3.7306060791015625, -2.4457149505615234, -1.1608238220214844, 0.12406730651855469, 1.4089622497558594, 2.6938533782958984, 3.9787445068359375, 5.263635635375977, 6.548526763916016, 7.833417892456055, 9.118309020996094, 10.403200149536133, 11.688091278076172, 12.972982406616211, 14.25787353515625, 15.542764663696289, 16.827655792236328, 18.112546920776367, 19.397438049316406, 20.682329177856445, 21.967220306396484, 23.252111434936523, 24.537002563476562, 25.8218936920166, 27.10678482055664, 28.39167594909668, 29.67656707763672, 30.961458206176758, 32.2463493347168, 33.53124237060547, 34.816131591796875, 36.10102081298828, 37.38591384887695, 38.670806884765625, 39.95569610595703, 41.24058532714844, 42.52547836303711]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 5.0, 6.0, 6.0, 8.0, 17.0, 13.0, 19.0, 16.0, 28.0, 26.0, 30.0, 46.0, 30.0, 35.0, 34.0, 34.0, 35.0, 43.0, 41.0, 52.0, 50.0, 46.0, 44.0, 48.0, 31.0, 32.0, 20.0, 31.0, 32.0, 27.0, 20.0, 16.0, 13.0, 13.0, 16.0, 10.0, 5.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.7242431640625, -5.526611328125, -5.3289794921875, -5.13134765625, -4.9337158203125, -4.736083984375, -4.5384521484375, -4.3408203125, -4.1431884765625, -3.945556640625, -3.7479248046875, -3.55029296875, -3.3526611328125, -3.155029296875, -2.9573974609375, -2.759765625, -2.5621337890625, -2.364501953125, -2.1668701171875, -1.96923828125, -1.7716064453125, -1.573974609375, -1.3763427734375, -1.1787109375, -0.9810791015625, -0.783447265625, -0.5858154296875, -0.38818359375, -0.1905517578125, 0.007080078125, 0.2047119140625, 0.40234375, 0.5999755859375, 0.797607421875, 0.9952392578125, 1.19287109375, 1.3905029296875, 1.588134765625, 1.7857666015625, 1.9833984375, 2.1810302734375, 2.378662109375, 2.5762939453125, 2.77392578125, 2.9715576171875, 3.169189453125, 3.3668212890625, 3.564453125, 3.7620849609375, 3.959716796875, 4.1573486328125, 4.35498046875, 4.5526123046875, 4.750244140625, 4.9478759765625, 5.1455078125, 5.3431396484375, 5.540771484375, 5.7384033203125, 5.93603515625, 6.1336669921875, 6.331298828125, 6.5289306640625, 6.7265625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 5.0, 6.0, 10.0, 23.0, 28.0, 31.0, 73.0, 105.0, 149.0, 222.0, 352.0, 550.0, 871.0, 1376.0, 2100.0, 3465.0, 5733.0, 9373.0, 15598.0, 26042.0, 45571.0, 81833.0, 154295.0, 263621.0, 196452.0, 103565.0, 56464.0, 31967.0, 19120.0, 11473.0, 6814.0, 4158.0, 2655.0, 1645.0, 1020.0, 612.0, 378.0, 259.0, 188.0, 122.0, 82.0, 52.0, 31.0, 19.0, 13.0, 10.0, 12.0, 2.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2080078125, -0.20183372497558594, -0.19565963745117188, -0.1894855499267578, -0.18331146240234375, -0.1771373748779297, -0.17096328735351562, -0.16478919982910156, -0.1586151123046875, -0.15244102478027344, -0.14626693725585938, -0.1400928497314453, -0.13391876220703125, -0.1277446746826172, -0.12157058715820312, -0.11539649963378906, -0.109222412109375, -0.10304832458496094, -0.09687423706054688, -0.09070014953613281, -0.08452606201171875, -0.07835197448730469, -0.07217788696289062, -0.06600379943847656, -0.0598297119140625, -0.05365562438964844, -0.047481536865234375, -0.04130744934082031, -0.03513336181640625, -0.028959274291992188, -0.022785186767578125, -0.016611099243164062, -0.01043701171875, -0.0042629241943359375, 0.001911163330078125, 0.008085250854492188, 0.01425933837890625, 0.020433425903320312, 0.026607513427734375, 0.03278160095214844, 0.0389556884765625, 0.04512977600097656, 0.051303863525390625, 0.05747795104980469, 0.06365203857421875, 0.06982612609863281, 0.07600021362304688, 0.08217430114746094, 0.088348388671875, 0.09452247619628906, 0.10069656372070312, 0.10687065124511719, 0.11304473876953125, 0.11921882629394531, 0.12539291381835938, 0.13156700134277344, 0.1377410888671875, 0.14391517639160156, 0.15008926391601562, 0.1562633514404297, 0.16243743896484375, 0.1686115264892578, 0.17478561401367188, 0.18095970153808594, 0.1871337890625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 12.0, 11.0, 9.0, 11.0, 17.0, 21.0, 14.0, 24.0, 25.0, 25.0, 27.0, 30.0, 34.0, 33.0, 46.0, 48.0, 55.0, 45.0, 1079.0, 49.0, 43.0, 41.0, 28.0, 52.0, 31.0, 28.0, 19.0, 17.0, 26.0, 22.0, 20.0, 18.0, 10.0, 13.0, 12.0, 5.0, 8.0, 5.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.19921875, -6.02752685546875, -5.8558349609375, -5.68414306640625, -5.512451171875, -5.34075927734375, -5.1690673828125, -4.99737548828125, -4.82568359375, -4.65399169921875, -4.4822998046875, -4.31060791015625, -4.138916015625, -3.96722412109375, -3.7955322265625, -3.62384033203125, -3.4521484375, -3.28045654296875, -3.1087646484375, -2.93707275390625, -2.765380859375, -2.59368896484375, -2.4219970703125, -2.25030517578125, -2.07861328125, -1.90692138671875, -1.7352294921875, -1.56353759765625, -1.391845703125, -1.22015380859375, -1.0484619140625, -0.87677001953125, -0.705078125, -0.53338623046875, -0.3616943359375, -0.19000244140625, -0.018310546875, 0.15338134765625, 0.3250732421875, 0.49676513671875, 0.66845703125, 0.84014892578125, 1.0118408203125, 1.18353271484375, 1.355224609375, 1.52691650390625, 1.6986083984375, 1.87030029296875, 2.0419921875, 2.21368408203125, 2.3853759765625, 2.55706787109375, 2.728759765625, 2.90045166015625, 3.0721435546875, 3.24383544921875, 3.41552734375, 3.58721923828125, 3.7589111328125, 3.93060302734375, 4.102294921875, 4.27398681640625, 4.4456787109375, 4.61737060546875, 4.7890625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 2.0, 5.0, 7.0, 10.0, 11.0, 12.0, 21.0, 37.0, 52.0, 57.0, 96.0, 109.0, 178.0, 234.0, 373.0, 559.0, 850.0, 1253.0, 1891.0, 2841.0, 4538.0, 7006.0, 10963.0, 17213.0, 28047.0, 46035.0, 80060.0, 143195.0, 1290677.0, 195928.0, 107408.0, 60800.0, 35771.0, 21785.0, 13867.0, 8854.0, 5571.0, 3760.0, 2385.0, 1614.0, 999.0, 664.0, 486.0, 312.0, 193.0, 128.0, 86.0, 67.0, 43.0, 21.0, 14.0, 14.0, 12.0, 10.0, 2.0, 3.0, 5.0, 2.0, 2.0, 4.0], "bins": [-0.0875244140625, -0.08485221862792969, -0.08218002319335938, -0.07950782775878906, -0.07683563232421875, -0.07416343688964844, -0.07149124145507812, -0.06881904602050781, -0.0661468505859375, -0.06347465515136719, -0.060802459716796875, -0.05813026428222656, -0.05545806884765625, -0.05278587341308594, -0.050113677978515625, -0.04744148254394531, -0.044769287109375, -0.04209709167480469, -0.039424896240234375, -0.03675270080566406, -0.03408050537109375, -0.03140830993652344, -0.028736114501953125, -0.026063919067382812, -0.0233917236328125, -0.020719528198242188, -0.018047332763671875, -0.015375137329101562, -0.01270294189453125, -0.010030746459960938, -0.007358551025390625, -0.0046863555908203125, -0.00201416015625, 0.0006580352783203125, 0.003330230712890625, 0.0060024261474609375, 0.00867462158203125, 0.011346817016601562, 0.014019012451171875, 0.016691207885742188, 0.0193634033203125, 0.022035598754882812, 0.024707794189453125, 0.027379989624023438, 0.03005218505859375, 0.03272438049316406, 0.035396575927734375, 0.03806877136230469, 0.040740966796875, 0.04341316223144531, 0.046085357666015625, 0.04875755310058594, 0.05142974853515625, 0.05410194396972656, 0.056774139404296875, 0.05944633483886719, 0.0621185302734375, 0.06479072570800781, 0.06746292114257812, 0.07013511657714844, 0.07280731201171875, 0.07547950744628906, 0.07815170288085938, 0.08082389831542969, 0.08349609375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 3.0, 4.0, 5.0, 8.0, 5.0, 11.0, 14.0, 7.0, 11.0, 20.0, 12.0, 19.0, 24.0, 27.0, 39.0, 34.0, 72.0, 76.0, 107.0, 87.0, 78.0, 55.0, 43.0, 39.0, 48.0, 19.0, 16.0, 15.0, 16.0, 11.0, 16.0, 12.0, 7.0, 9.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0005183219909667969, -0.0005003586411476135, -0.0004823952913284302, -0.0004644319415092468, -0.0004464685916900635, -0.0004285052418708801, -0.0004105418920516968, -0.00039257854223251343, -0.0003746151924133301, -0.00035665184259414673, -0.0003386884927749634, -0.00032072514295578003, -0.0003027617931365967, -0.00028479844331741333, -0.00026683509349823, -0.00024887174367904663, -0.00023090839385986328, -0.00021294504404067993, -0.00019498169422149658, -0.00017701834440231323, -0.00015905499458312988, -0.00014109164476394653, -0.00012312829494476318, -0.00010516494512557983, -8.720159530639648e-05, -6.923824548721313e-05, -5.1274895668029785e-05, -3.3311545848846436e-05, -1.5348196029663086e-05, 2.6151537895202637e-06, 2.0578503608703613e-05, 3.854185342788696e-05, 5.650520324707031e-05, 7.446855306625366e-05, 9.243190288543701e-05, 0.00011039525270462036, 0.0001283586025238037, 0.00014632195234298706, 0.0001642853021621704, 0.00018224865198135376, 0.0002002120018005371, 0.00021817535161972046, 0.0002361387014389038, 0.00025410205125808716, 0.0002720654010772705, 0.00029002875089645386, 0.0003079921007156372, 0.00032595545053482056, 0.0003439188003540039, 0.00036188215017318726, 0.0003798454999923706, 0.00039780884981155396, 0.0004157721996307373, 0.00043373554944992065, 0.000451698899269104, 0.00046966224908828735, 0.0004876255989074707, 0.000505588948726654, 0.0005235522985458374, 0.0005415156483650208, 0.0005594789981842041, 0.0005774423480033875, 0.0005954056978225708, 0.0006133690476417542, 0.0006313323974609375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 4.0, 9.0, 7.0, 10.0, 17.0, 17.0, 20.0, 20.0, 28.0, 39.0, 74.0, 92.0, 194.0, 359.0, 1980.0, 264832.0, 776533.0, 3268.0, 489.0, 189.0, 110.0, 58.0, 34.0, 25.0, 18.0, 24.0, 11.0, 9.0, 16.0, 11.0, 8.0, 9.0, 4.0, 4.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.01486968994140625, -0.014445781707763672, -0.014021873474121094, -0.013597965240478516, -0.013174057006835938, -0.01275014877319336, -0.012326240539550781, -0.011902332305908203, -0.011478424072265625, -0.011054515838623047, -0.010630607604980469, -0.01020669937133789, -0.009782791137695312, -0.009358882904052734, -0.008934974670410156, -0.008511066436767578, -0.008087158203125, -0.007663249969482422, -0.007239341735839844, -0.006815433502197266, -0.0063915252685546875, -0.005967617034912109, -0.005543708801269531, -0.005119800567626953, -0.004695892333984375, -0.004271984100341797, -0.0038480758666992188, -0.0034241676330566406, -0.0030002593994140625, -0.0025763511657714844, -0.0021524429321289062, -0.0017285346984863281, -0.00130462646484375, -0.0008807182312011719, -0.00045680999755859375, -3.2901763916015625e-05, 0.0003910064697265625, 0.0008149147033691406, 0.0012388229370117188, 0.0016627311706542969, 0.002086639404296875, 0.002510547637939453, 0.0029344558715820312, 0.0033583641052246094, 0.0037822723388671875, 0.004206180572509766, 0.004630088806152344, 0.005053997039794922, 0.0054779052734375, 0.005901813507080078, 0.006325721740722656, 0.006749629974365234, 0.0071735382080078125, 0.007597446441650391, 0.008021354675292969, 0.008445262908935547, 0.008869171142578125, 0.009293079376220703, 0.009716987609863281, 0.01014089584350586, 0.010564804077148438, 0.010988712310791016, 0.011412620544433594, 0.011836528778076172, 0.01226043701171875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 33.0, 247.0, 601.0, 111.0, 15.0, 4.0], "bins": [-0.0061801765114068985, -0.006077658850699663, -0.0059751407243311405, -0.005872623063623905, -0.00577010540291667, -0.005667587276548147, -0.005565069615840912, -0.005462551489472389, -0.005360033828765154, -0.0052575161680579185, -0.005154998041689396, -0.005052480380982161, -0.004949962720274925, -0.004847444593906403, -0.004744926933199167, -0.004642409272491932, -0.004539891146123409, -0.004437373485416174, -0.004334855359047651, -0.004232337698340416, -0.004129820037633181, -0.004027301911264658, -0.003924784250557423, -0.0038222663570195436, -0.0037197486963123083, -0.0036172308027744293, -0.003514713142067194, -0.003412195248529315, -0.003309677354991436, -0.0032071596942842007, -0.0031046418007463217, -0.0030021239072084427, -0.0028996060136705637, -0.0027970881201326847, -0.0026945704594254494, -0.0025920525658875704, -0.0024895346723496914, -0.002387017011642456, -0.002284499118104577, -0.002181981224566698, -0.0020794635638594627, -0.0019769456703215837, -0.0018744278931990266, -0.0017719101160764694, -0.0016693922225385904, -0.0015668744454160333, -0.001464356668293476, -0.0013618387747555971, -0.0012593208812177181, -0.001156803104095161, -0.001054285210557282, -0.0009517674334347248, -0.0008492495398968458, -0.0007467317627742887, -0.0006442139274440706, -0.0005416960921138525, -0.00043917822767980397, -0.0003366603923495859, -0.00023414257157128304, -0.0001316247507929802, -2.9106915462762117e-05, 7.34108907636255e-05, 0.00017592872609384358, 0.00027844656142406166, 0.00038096439675427973]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 7.0, 7.0, 5.0, 16.0, 14.0, 11.0, 15.0, 22.0, 18.0, 30.0, 24.0, 28.0, 28.0, 36.0, 43.0, 41.0, 40.0, 37.0, 35.0, 57.0, 55.0, 46.0, 40.0, 41.0, 37.0, 43.0, 23.0, 20.0, 16.0, 28.0, 21.0, 19.0, 9.0, 14.0, 10.0, 10.0, 9.0, 8.0, 9.0, 6.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00036454200744628906, -0.0003531603142619133, -0.00034177862107753754, -0.0003303969278931618, -0.000319015234708786, -0.00030763354152441025, -0.0002962518483400345, -0.0002848701551556587, -0.00027348846197128296, -0.0002621067687869072, -0.00025072507560253143, -0.00023934338241815567, -0.0002279616892337799, -0.00021657999604940414, -0.00020519830286502838, -0.00019381660968065262, -0.00018243491649627686, -0.0001710532233119011, -0.00015967153012752533, -0.00014828983694314957, -0.0001369081437587738, -0.00012552645057439804, -0.00011414475739002228, -0.00010276306420564651, -9.138137102127075e-05, -7.999967783689499e-05, -6.861798465251923e-05, -5.723629146814346e-05, -4.58545982837677e-05, -3.447290509939194e-05, -2.3091211915016174e-05, -1.1709518730640411e-05, -3.2782554626464844e-07, 1.1053867638111115e-05, 2.2435560822486877e-05, 3.381725400686264e-05, 4.51989471912384e-05, 5.6580640375614166e-05, 6.796233355998993e-05, 7.934402674436569e-05, 9.072571992874146e-05, 0.00010210741311311722, 0.00011348910629749298, 0.00012487079948186874, 0.0001362524926662445, 0.00014763418585062027, 0.00015901587903499603, 0.0001703975722193718, 0.00018177926540374756, 0.00019316095858812332, 0.00020454265177249908, 0.00021592434495687485, 0.0002273060381412506, 0.00023868773132562637, 0.00025006942451000214, 0.0002614511176943779, 0.00027283281087875366, 0.0002842145040631294, 0.0002955961972475052, 0.00030697789043188095, 0.0003183595836162567, 0.0003297412768006325, 0.00034112296998500824, 0.000352504663169384, 0.00036388635635375977]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 5.0, 6.0, 6.0, 8.0, 17.0, 13.0, 19.0, 16.0, 28.0, 26.0, 30.0, 46.0, 30.0, 35.0, 34.0, 34.0, 35.0, 43.0, 41.0, 52.0, 50.0, 46.0, 44.0, 48.0, 31.0, 32.0, 20.0, 31.0, 32.0, 27.0, 20.0, 16.0, 13.0, 13.0, 16.0, 10.0, 5.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.7242431640625, -5.526611328125, -5.3289794921875, -5.13134765625, -4.9337158203125, -4.736083984375, -4.5384521484375, -4.3408203125, -4.1431884765625, -3.945556640625, -3.7479248046875, -3.55029296875, -3.3526611328125, -3.155029296875, -2.9573974609375, -2.759765625, -2.5621337890625, -2.364501953125, -2.1668701171875, -1.96923828125, -1.7716064453125, -1.573974609375, -1.3763427734375, -1.1787109375, -0.9810791015625, -0.783447265625, -0.5858154296875, -0.38818359375, -0.1905517578125, 0.007080078125, 0.2047119140625, 0.40234375, 0.5999755859375, 0.797607421875, 0.9952392578125, 1.19287109375, 1.3905029296875, 1.588134765625, 1.7857666015625, 1.9833984375, 2.1810302734375, 2.378662109375, 2.5762939453125, 2.77392578125, 2.9715576171875, 3.169189453125, 3.3668212890625, 3.564453125, 3.7620849609375, 3.959716796875, 4.1573486328125, 4.35498046875, 4.5526123046875, 4.750244140625, 4.9478759765625, 5.1455078125, 5.3431396484375, 5.540771484375, 5.7384033203125, 5.93603515625, 6.1336669921875, 6.331298828125, 6.5289306640625, 6.7265625]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 11.0, 8.0, 13.0, 14.0, 32.0, 63.0, 129.0, 258.0, 539.0, 1497.0, 4147.0, 16373.0, 83455.0, 490559.0, 372037.0, 61172.0, 12546.0, 3565.0, 1139.0, 506.0, 219.0, 107.0, 52.0, 35.0, 15.0, 12.0, 13.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-23.390625, -22.679931640625, -21.96923828125, -21.258544921875, -20.5478515625, -19.837158203125, -19.12646484375, -18.415771484375, -17.705078125, -16.994384765625, -16.28369140625, -15.572998046875, -14.8623046875, -14.151611328125, -13.44091796875, -12.730224609375, -12.01953125, -11.308837890625, -10.59814453125, -9.887451171875, -9.1767578125, -8.466064453125, -7.75537109375, -7.044677734375, -6.333984375, -5.623291015625, -4.91259765625, -4.201904296875, -3.4912109375, -2.780517578125, -2.06982421875, -1.359130859375, -0.6484375, 0.062255859375, 0.77294921875, 1.483642578125, 2.1943359375, 2.905029296875, 3.61572265625, 4.326416015625, 5.037109375, 5.747802734375, 6.45849609375, 7.169189453125, 7.8798828125, 8.590576171875, 9.30126953125, 10.011962890625, 10.72265625, 11.433349609375, 12.14404296875, 12.854736328125, 13.5654296875, 14.276123046875, 14.98681640625, 15.697509765625, 16.408203125, 17.118896484375, 17.82958984375, 18.540283203125, 19.2509765625, 19.961669921875, 20.67236328125, 21.383056640625, 22.09375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 9.0, 17.0, 16.0, 24.0, 23.0, 37.0, 30.0, 64.0, 63.0, 79.0, 109.0, 187.0, 293.0, 1342.0, 187.0, 131.0, 100.0, 71.0, 49.0, 54.0, 32.0, 28.0, 23.0, 20.0, 11.0, 8.0, 12.0, 5.0, 2.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.9375, -17.32177734375, -16.7060546875, -16.09033203125, -15.474609375, -14.85888671875, -14.2431640625, -13.62744140625, -13.01171875, -12.39599609375, -11.7802734375, -11.16455078125, -10.548828125, -9.93310546875, -9.3173828125, -8.70166015625, -8.0859375, -7.47021484375, -6.8544921875, -6.23876953125, -5.623046875, -5.00732421875, -4.3916015625, -3.77587890625, -3.16015625, -2.54443359375, -1.9287109375, -1.31298828125, -0.697265625, -0.08154296875, 0.5341796875, 1.14990234375, 1.765625, 2.38134765625, 2.9970703125, 3.61279296875, 4.228515625, 4.84423828125, 5.4599609375, 6.07568359375, 6.69140625, 7.30712890625, 7.9228515625, 8.53857421875, 9.154296875, 9.77001953125, 10.3857421875, 11.00146484375, 11.6171875, 12.23291015625, 12.8486328125, 13.46435546875, 14.080078125, 14.69580078125, 15.3115234375, 15.92724609375, 16.54296875, 17.15869140625, 17.7744140625, 18.39013671875, 19.005859375, 19.62158203125, 20.2373046875, 20.85302734375, 21.46875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 12.0, 12.0, 15.0, 35.0, 37.0, 53.0, 79.0, 114.0, 155.0, 213.0, 333.0, 571.0, 1068.0, 3763.0, 50418.0, 2942086.0, 137825.0, 5739.0, 1326.0, 668.0, 385.0, 263.0, 174.0, 113.0, 84.0, 53.0, 35.0, 33.0, 27.0, 5.0, 8.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.75, -39.4189453125, -38.087890625, -36.7568359375, -35.42578125, -34.0947265625, -32.763671875, -31.4326171875, -30.1015625, -28.7705078125, -27.439453125, -26.1083984375, -24.77734375, -23.4462890625, -22.115234375, -20.7841796875, -19.453125, -18.1220703125, -16.791015625, -15.4599609375, -14.12890625, -12.7978515625, -11.466796875, -10.1357421875, -8.8046875, -7.4736328125, -6.142578125, -4.8115234375, -3.48046875, -2.1494140625, -0.818359375, 0.5126953125, 1.84375, 3.1748046875, 4.505859375, 5.8369140625, 7.16796875, 8.4990234375, 9.830078125, 11.1611328125, 12.4921875, 13.8232421875, 15.154296875, 16.4853515625, 17.81640625, 19.1474609375, 20.478515625, 21.8095703125, 23.140625, 24.4716796875, 25.802734375, 27.1337890625, 28.46484375, 29.7958984375, 31.126953125, 32.4580078125, 33.7890625, 35.1201171875, 36.451171875, 37.7822265625, 39.11328125, 40.4443359375, 41.775390625, 43.1064453125, 44.4375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 21.0, 47.0, 122.0, 239.0, 286.0, 176.0, 77.0, 27.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.66944885253906, -95.56439971923828, -91.4593505859375, -87.35430145263672, -83.24925231933594, -79.14420318603516, -75.03915405273438, -70.9341049194336, -66.82905578613281, -62.72400665283203, -58.61895751953125, -54.51390838623047, -50.40885925292969, -46.303810119628906, -42.198760986328125, -38.093711853027344, -33.98866271972656, -29.88361358642578, -25.778564453125, -21.67351531982422, -17.568466186523438, -13.463417053222656, -9.358367919921875, -5.253318786621094, -1.1482696533203125, 2.9567794799804688, 7.06182861328125, 11.166877746582031, 15.271926879882812, 19.376976013183594, 23.482025146484375, 27.587074279785156, 31.692108154296875, 35.797157287597656, 39.90220642089844, 44.00725555419922, 48.1123046875, 52.21735382080078, 56.32240295410156, 60.427452087402344, 64.53250122070312, 68.6375503540039, 72.74259948730469, 76.84764862060547, 80.95269775390625, 85.05774688720703, 89.16279602050781, 93.2678451538086, 97.37289428710938, 101.47794342041016, 105.58299255371094, 109.68804168701172, 113.7930908203125, 117.89813995361328, 122.00318908691406, 126.10823822021484, 130.21328735351562, 134.31832885742188, 138.4233856201172, 142.5284423828125, 146.63348388671875, 150.738525390625, 154.8435821533203, 158.94863891601562, 163.05368041992188]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 10.0, 5.0, 7.0, 11.0, 12.0, 14.0, 18.0, 17.0, 31.0, 21.0, 28.0, 23.0, 27.0, 39.0, 39.0, 32.0, 27.0, 38.0, 40.0, 43.0, 50.0, 45.0, 38.0, 44.0, 32.0, 37.0, 35.0, 36.0, 25.0, 24.0, 23.0, 23.0, 13.0, 16.0, 11.0, 11.0, 11.0, 6.0, 5.0, 7.0, 7.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-50.98893356323242, -49.46489715576172, -47.94085693359375, -46.41682052612305, -44.892784118652344, -43.368743896484375, -41.84470748901367, -40.32067108154297, -38.796630859375, -37.2725944519043, -35.74855422973633, -34.224517822265625, -32.700477600097656, -31.176441192626953, -29.65240478515625, -28.128366470336914, -26.604328155517578, -25.080289840698242, -23.556251525878906, -22.032215118408203, -20.508176803588867, -18.98413848876953, -17.460102081298828, -15.936063766479492, -14.412025451660156, -12.88798713684082, -11.3639497756958, -9.839912414550781, -8.315874099731445, -6.791836261749268, -5.26779842376709, -3.7437610626220703, -2.2197265625, -0.6956887245178223, 0.8283491134643555, 2.352386951446533, 3.876424789428711, 5.400462627410889, 6.924500465393066, 8.448537826538086, 9.972576141357422, 11.496614456176758, 13.020651817321777, 14.544689178466797, 16.068727493286133, 17.59276580810547, 19.116802215576172, 20.640840530395508, 22.164878845214844, 23.68891716003418, 25.212955474853516, 26.73699188232422, 28.261030197143555, 29.78506851196289, 31.309104919433594, 32.83314514160156, 34.357181549072266, 35.88121795654297, 37.40525817871094, 38.92929458618164, 40.453330993652344, 41.97737121582031, 43.501407623291016, 45.02544403076172, 46.54948425292969]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 7.0, 6.0, 9.0, 13.0, 12.0, 13.0, 17.0, 25.0, 22.0, 28.0, 36.0, 29.0, 31.0, 33.0, 40.0, 40.0, 47.0, 43.0, 42.0, 45.0, 44.0, 49.0, 46.0, 39.0, 33.0, 28.0, 24.0, 32.0, 24.0, 24.0, 19.0, 10.0, 15.0, 18.0, 6.0, 9.0, 14.0, 3.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.71484375, -6.52154541015625, -6.3282470703125, -6.13494873046875, -5.941650390625, -5.74835205078125, -5.5550537109375, -5.36175537109375, -5.16845703125, -4.97515869140625, -4.7818603515625, -4.58856201171875, -4.395263671875, -4.20196533203125, -4.0086669921875, -3.81536865234375, -3.6220703125, -3.42877197265625, -3.2354736328125, -3.04217529296875, -2.848876953125, -2.65557861328125, -2.4622802734375, -2.26898193359375, -2.07568359375, -1.88238525390625, -1.6890869140625, -1.49578857421875, -1.302490234375, -1.10919189453125, -0.9158935546875, -0.72259521484375, -0.529296875, -0.33599853515625, -0.1427001953125, 0.05059814453125, 0.243896484375, 0.43719482421875, 0.6304931640625, 0.82379150390625, 1.01708984375, 1.21038818359375, 1.4036865234375, 1.59698486328125, 1.790283203125, 1.98358154296875, 2.1768798828125, 2.37017822265625, 2.5634765625, 2.75677490234375, 2.9500732421875, 3.14337158203125, 3.336669921875, 3.52996826171875, 3.7232666015625, 3.91656494140625, 4.10986328125, 4.30316162109375, 4.4964599609375, 4.68975830078125, 4.883056640625, 5.07635498046875, 5.2696533203125, 5.46295166015625, 5.65625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 8.0, 4.0, 11.0, 22.0, 38.0, 78.0, 112.0, 221.0, 382.0, 653.0, 1177.0, 2302.0, 5997.0, 23638.0, 404287.0, 3264174.0, 454559.0, 25200.0, 6208.0, 2456.0, 1172.0, 633.0, 407.0, 247.0, 119.0, 72.0, 45.0, 19.0, 14.0, 5.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.171875, -17.576416015625, -16.98095703125, -16.385498046875, -15.7900390625, -15.194580078125, -14.59912109375, -14.003662109375, -13.408203125, -12.812744140625, -12.21728515625, -11.621826171875, -11.0263671875, -10.430908203125, -9.83544921875, -9.239990234375, -8.64453125, -8.049072265625, -7.45361328125, -6.858154296875, -6.2626953125, -5.667236328125, -5.07177734375, -4.476318359375, -3.880859375, -3.285400390625, -2.68994140625, -2.094482421875, -1.4990234375, -0.903564453125, -0.30810546875, 0.287353515625, 0.8828125, 1.478271484375, 2.07373046875, 2.669189453125, 3.2646484375, 3.860107421875, 4.45556640625, 5.051025390625, 5.646484375, 6.241943359375, 6.83740234375, 7.432861328125, 8.0283203125, 8.623779296875, 9.21923828125, 9.814697265625, 10.41015625, 11.005615234375, 11.60107421875, 12.196533203125, 12.7919921875, 13.387451171875, 13.98291015625, 14.578369140625, 15.173828125, 15.769287109375, 16.36474609375, 16.960205078125, 17.5556640625, 18.151123046875, 18.74658203125, 19.342041015625, 19.9375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 6.0, 12.0, 9.0, 19.0, 22.0, 37.0, 44.0, 66.0, 136.0, 189.0, 300.0, 457.0, 740.0, 678.0, 447.0, 310.0, 180.0, 133.0, 85.0, 55.0, 35.0, 27.0, 20.0, 16.0, 10.0, 3.0, 6.0, 5.0, 8.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0703125, -10.688232421875, -10.30615234375, -9.924072265625, -9.5419921875, -9.159912109375, -8.77783203125, -8.395751953125, -8.013671875, -7.631591796875, -7.24951171875, -6.867431640625, -6.4853515625, -6.103271484375, -5.72119140625, -5.339111328125, -4.95703125, -4.574951171875, -4.19287109375, -3.810791015625, -3.4287109375, -3.046630859375, -2.66455078125, -2.282470703125, -1.900390625, -1.518310546875, -1.13623046875, -0.754150390625, -0.3720703125, 0.010009765625, 0.39208984375, 0.774169921875, 1.15625, 1.538330078125, 1.92041015625, 2.302490234375, 2.6845703125, 3.066650390625, 3.44873046875, 3.830810546875, 4.212890625, 4.594970703125, 4.97705078125, 5.359130859375, 5.7412109375, 6.123291015625, 6.50537109375, 6.887451171875, 7.26953125, 7.651611328125, 8.03369140625, 8.415771484375, 8.7978515625, 9.179931640625, 9.56201171875, 9.944091796875, 10.326171875, 10.708251953125, 11.09033203125, 11.472412109375, 11.8544921875, 12.236572265625, 12.61865234375, 13.000732421875, 13.3828125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 9.0, 5.0, 17.0, 33.0, 46.0, 63.0, 125.0, 192.0, 378.0, 792.0, 1869.0, 5212.0, 21332.0, 221749.0, 3631149.0, 278130.0, 23819.0, 5669.0, 1900.0, 833.0, 417.0, 233.0, 134.0, 56.0, 40.0, 29.0, 12.0, 13.0, 8.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.921875, -23.1865234375, -22.451171875, -21.7158203125, -20.98046875, -20.2451171875, -19.509765625, -18.7744140625, -18.0390625, -17.3037109375, -16.568359375, -15.8330078125, -15.09765625, -14.3623046875, -13.626953125, -12.8916015625, -12.15625, -11.4208984375, -10.685546875, -9.9501953125, -9.21484375, -8.4794921875, -7.744140625, -7.0087890625, -6.2734375, -5.5380859375, -4.802734375, -4.0673828125, -3.33203125, -2.5966796875, -1.861328125, -1.1259765625, -0.390625, 0.3447265625, 1.080078125, 1.8154296875, 2.55078125, 3.2861328125, 4.021484375, 4.7568359375, 5.4921875, 6.2275390625, 6.962890625, 7.6982421875, 8.43359375, 9.1689453125, 9.904296875, 10.6396484375, 11.375, 12.1103515625, 12.845703125, 13.5810546875, 14.31640625, 15.0517578125, 15.787109375, 16.5224609375, 17.2578125, 17.9931640625, 18.728515625, 19.4638671875, 20.19921875, 20.9345703125, 21.669921875, 22.4052734375, 23.140625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 14.0, 97.0, 381.0, 369.0, 131.0, 17.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.70587158203125, -128.3730926513672, -123.04029846191406, -117.70751190185547, -112.37472534179688, -107.04193878173828, -101.70915222167969, -96.37637329101562, -91.0435791015625, -85.7107925415039, -80.37800598144531, -75.04521942138672, -69.71243286132812, -64.37964630126953, -59.0468635559082, -53.71407699584961, -48.38129425048828, -43.04850769042969, -37.715721130371094, -32.3829345703125, -27.05014991760254, -21.717363357543945, -16.384578704833984, -11.05179214477539, -5.719005584716797, -0.38621950149536133, 4.946566581726074, 10.279352188110352, 15.612138748168945, 20.94492530822754, 26.2777099609375, 31.610496520996094, 36.94328308105469, 42.27606964111328, 47.608856201171875, 52.94164276123047, 58.27442932128906, 63.607215881347656, 68.94000244140625, 74.27278137207031, 79.60557556152344, 84.93836212158203, 90.27114868164062, 95.60393524169922, 100.93672180175781, 106.2695083618164, 111.602294921875, 116.93507385253906, 122.26786041259766, 127.60064697265625, 132.9334259033203, 138.26622009277344, 143.5989990234375, 148.93179321289062, 154.2645721435547, 159.5973663330078, 164.93014526367188, 170.26292419433594, 175.59571838378906, 180.92849731445312, 186.26129150390625, 191.5940704345703, 196.92686462402344, 202.2596435546875, 207.59243774414062]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 8.0, 11.0, 15.0, 23.0, 16.0, 26.0, 43.0, 55.0, 40.0, 57.0, 52.0, 63.0, 80.0, 85.0, 60.0, 60.0, 76.0, 60.0, 53.0, 44.0, 28.0, 26.0, 3.0, 6.0, 6.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.37450408935547, -67.34610748291016, -65.31771850585938, -63.28932189941406, -61.26092529296875, -59.23252868652344, -57.20413589477539, -55.175743103027344, -53.14734649658203, -51.11894989013672, -49.09055709838867, -47.062164306640625, -45.03376770019531, -43.00537109375, -40.97697830200195, -38.948585510253906, -36.920188903808594, -34.89179229736328, -32.863399505615234, -30.835004806518555, -28.806610107421875, -26.778215408325195, -24.749820709228516, -22.721426010131836, -20.693031311035156, -18.664636611938477, -16.636241912841797, -14.607847213745117, -12.579452514648438, -10.551057815551758, -8.522663116455078, -6.494268417358398, -4.465869903564453, -2.4374752044677734, -0.40908050537109375, 1.619314193725586, 3.6477088928222656, 5.676103591918945, 7.704498291015625, 9.732892990112305, 11.761287689208984, 13.789682388305664, 15.818077087402344, 17.846471786499023, 19.874866485595703, 21.903261184692383, 23.931655883789062, 25.960050582885742, 27.988445281982422, 30.0168399810791, 32.04523468017578, 34.073631286621094, 36.10202407836914, 38.13041687011719, 40.1588134765625, 42.18721008300781, 44.21560287475586, 46.243995666503906, 48.27239227294922, 50.30078887939453, 52.32918167114258, 54.357574462890625, 56.38597106933594, 58.41436767578125, 60.4427604675293]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 0.0, 1.0, 4.0, 5.0, 7.0, 6.0, 13.0, 7.0, 16.0, 11.0, 18.0, 25.0, 21.0, 28.0, 25.0, 39.0, 30.0, 38.0, 29.0, 35.0, 33.0, 36.0, 40.0, 36.0, 50.0, 34.0, 37.0, 28.0, 42.0, 28.0, 31.0, 35.0, 29.0, 28.0, 21.0, 21.0, 18.0, 19.0, 11.0, 11.0, 14.0, 8.0, 4.0, 11.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.14453125, -4.97686767578125, -4.8092041015625, -4.64154052734375, -4.473876953125, -4.30621337890625, -4.1385498046875, -3.97088623046875, -3.80322265625, -3.63555908203125, -3.4678955078125, -3.30023193359375, -3.132568359375, -2.96490478515625, -2.7972412109375, -2.62957763671875, -2.4619140625, -2.29425048828125, -2.1265869140625, -1.95892333984375, -1.791259765625, -1.62359619140625, -1.4559326171875, -1.28826904296875, -1.12060546875, -0.95294189453125, -0.7852783203125, -0.61761474609375, -0.449951171875, -0.28228759765625, -0.1146240234375, 0.05303955078125, 0.220703125, 0.38836669921875, 0.5560302734375, 0.72369384765625, 0.891357421875, 1.05902099609375, 1.2266845703125, 1.39434814453125, 1.56201171875, 1.72967529296875, 1.8973388671875, 2.06500244140625, 2.232666015625, 2.40032958984375, 2.5679931640625, 2.73565673828125, 2.9033203125, 3.07098388671875, 3.2386474609375, 3.40631103515625, 3.573974609375, 3.74163818359375, 3.9093017578125, 4.07696533203125, 4.24462890625, 4.41229248046875, 4.5799560546875, 4.74761962890625, 4.915283203125, 5.08294677734375, 5.2506103515625, 5.41827392578125, 5.5859375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 4.0, 9.0, 15.0, 22.0, 28.0, 50.0, 77.0, 97.0, 128.0, 226.0, 301.0, 488.0, 703.0, 1033.0, 1550.0, 2314.0, 3562.0, 5375.0, 8054.0, 12101.0, 18168.0, 27374.0, 43215.0, 71542.0, 125205.0, 228969.0, 207752.0, 111111.0, 64414.0, 39626.0, 25123.0, 16421.0, 11088.0, 7229.0, 4943.0, 3390.0, 2208.0, 1511.0, 985.0, 707.0, 475.0, 309.0, 205.0, 135.0, 106.0, 75.0, 45.0, 27.0, 26.0, 12.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.164794921875, -0.15978622436523438, -0.15477752685546875, -0.14976882934570312, -0.1447601318359375, -0.13975143432617188, -0.13474273681640625, -0.12973403930664062, -0.124725341796875, -0.11971664428710938, -0.11470794677734375, -0.10969924926757812, -0.1046905517578125, -0.09968185424804688, -0.09467315673828125, -0.08966445922851562, -0.08465576171875, -0.07964706420898438, -0.07463836669921875, -0.06962966918945312, -0.0646209716796875, -0.059612274169921875, -0.05460357666015625, -0.049594879150390625, -0.044586181640625, -0.039577484130859375, -0.03456878662109375, -0.029560089111328125, -0.0245513916015625, -0.019542694091796875, -0.01453399658203125, -0.009525299072265625, -0.0045166015625, 0.000492095947265625, 0.00550079345703125, 0.010509490966796875, 0.0155181884765625, 0.020526885986328125, 0.02553558349609375, 0.030544281005859375, 0.035552978515625, 0.040561676025390625, 0.04557037353515625, 0.050579071044921875, 0.0555877685546875, 0.060596466064453125, 0.06560516357421875, 0.07061386108398438, 0.07562255859375, 0.08063125610351562, 0.08563995361328125, 0.09064865112304688, 0.0956573486328125, 0.10066604614257812, 0.10567474365234375, 0.11068344116210938, 0.115692138671875, 0.12070083618164062, 0.12570953369140625, 0.13071823120117188, 0.1357269287109375, 0.14073562622070312, 0.14574432373046875, 0.15075302124023438, 0.15576171875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 6.0, 5.0, 9.0, 10.0, 14.0, 14.0, 21.0, 18.0, 29.0, 27.0, 25.0, 33.0, 30.0, 49.0, 41.0, 26.0, 41.0, 28.0, 45.0, 49.0, 1072.0, 40.0, 22.0, 28.0, 42.0, 28.0, 36.0, 20.0, 33.0, 21.0, 20.0, 15.0, 29.0, 7.0, 16.0, 18.0, 11.0, 10.0, 6.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4453125, -4.28656005859375, -4.1278076171875, -3.96905517578125, -3.810302734375, -3.65155029296875, -3.4927978515625, -3.33404541015625, -3.17529296875, -3.01654052734375, -2.8577880859375, -2.69903564453125, -2.540283203125, -2.38153076171875, -2.2227783203125, -2.06402587890625, -1.9052734375, -1.74652099609375, -1.5877685546875, -1.42901611328125, -1.270263671875, -1.11151123046875, -0.9527587890625, -0.79400634765625, -0.63525390625, -0.47650146484375, -0.3177490234375, -0.15899658203125, -0.000244140625, 0.15850830078125, 0.3172607421875, 0.47601318359375, 0.634765625, 0.79351806640625, 0.9522705078125, 1.11102294921875, 1.269775390625, 1.42852783203125, 1.5872802734375, 1.74603271484375, 1.90478515625, 2.06353759765625, 2.2222900390625, 2.38104248046875, 2.539794921875, 2.69854736328125, 2.8572998046875, 3.01605224609375, 3.1748046875, 3.33355712890625, 3.4923095703125, 3.65106201171875, 3.809814453125, 3.96856689453125, 4.1273193359375, 4.28607177734375, 4.44482421875, 4.60357666015625, 4.7623291015625, 4.92108154296875, 5.079833984375, 5.23858642578125, 5.3973388671875, 5.55609130859375, 5.71484375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 4.0, 7.0, 5.0, 14.0, 23.0, 32.0, 55.0, 89.0, 157.0, 225.0, 375.0, 669.0, 987.0, 1761.0, 2870.0, 4626.0, 7647.0, 12831.0, 22120.0, 39295.0, 73723.0, 149206.0, 1347233.0, 211501.0, 100252.0, 51773.0, 28340.0, 16374.0, 9950.0, 5949.0, 3504.0, 2101.0, 1293.0, 784.0, 496.0, 308.0, 190.0, 127.0, 79.0, 47.0, 33.0, 28.0, 11.0, 16.0, 4.0, 4.0, 7.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11102294921875, -0.10740947723388672, -0.10379600524902344, -0.10018253326416016, -0.09656906127929688, -0.0929555892944336, -0.08934211730957031, -0.08572864532470703, -0.08211517333984375, -0.07850170135498047, -0.07488822937011719, -0.0712747573852539, -0.06766128540039062, -0.06404781341552734, -0.06043434143066406, -0.05682086944580078, -0.0532073974609375, -0.04959392547607422, -0.04598045349121094, -0.042366981506347656, -0.038753509521484375, -0.035140037536621094, -0.03152656555175781, -0.02791309356689453, -0.02429962158203125, -0.02068614959716797, -0.017072677612304688, -0.013459205627441406, -0.009845733642578125, -0.006232261657714844, -0.0026187896728515625, 0.0009946823120117188, 0.004608154296875, 0.008221626281738281, 0.011835098266601562, 0.015448570251464844, 0.019062042236328125, 0.022675514221191406, 0.026288986206054688, 0.02990245819091797, 0.03351593017578125, 0.03712940216064453, 0.04074287414550781, 0.044356346130371094, 0.047969818115234375, 0.051583290100097656, 0.05519676208496094, 0.05881023406982422, 0.0624237060546875, 0.06603717803955078, 0.06965065002441406, 0.07326412200927734, 0.07687759399414062, 0.0804910659790039, 0.08410453796386719, 0.08771800994873047, 0.09133148193359375, 0.09494495391845703, 0.09855842590332031, 0.1021718978881836, 0.10578536987304688, 0.10939884185791016, 0.11301231384277344, 0.11662578582763672, 0.1202392578125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 8.0, 7.0, 9.0, 17.0, 35.0, 40.0, 56.0, 80.0, 96.0, 197.0, 164.0, 94.0, 57.0, 42.0, 27.0, 25.0, 14.0, 7.0, 7.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006814002990722656, -0.0006584897637367249, -0.0006355792284011841, -0.0006126686930656433, -0.0005897581577301025, -0.0005668476223945618, -0.000543937087059021, -0.0005210265517234802, -0.0004981160163879395, -0.0004752054810523987, -0.0004522949457168579, -0.00042938441038131714, -0.00040647387504577637, -0.0003835633397102356, -0.0003606528043746948, -0.00033774226903915405, -0.0003148317337036133, -0.0002919211983680725, -0.00026901066303253174, -0.00024610012769699097, -0.0002231895923614502, -0.00020027905702590942, -0.00017736852169036865, -0.00015445798635482788, -0.0001315474510192871, -0.00010863691568374634, -8.572638034820557e-05, -6.28158450126648e-05, -3.9905309677124023e-05, -1.6994774341583252e-05, 5.9157609939575195e-06, 2.882629632949829e-05, 5.173683166503906e-05, 7.464736700057983e-05, 9.75579023361206e-05, 0.00012046843767166138, 0.00014337897300720215, 0.00016628950834274292, 0.0001892000436782837, 0.00021211057901382446, 0.00023502111434936523, 0.000257931649684906, 0.0002808421850204468, 0.00030375272035598755, 0.0003266632556915283, 0.0003495737910270691, 0.00037248432636260986, 0.00039539486169815063, 0.0004183053970336914, 0.0004412159323692322, 0.00046412646770477295, 0.0004870370030403137, 0.0005099475383758545, 0.0005328580737113953, 0.000555768609046936, 0.0005786791443824768, 0.0006015896797180176, 0.0006245002150535583, 0.0006474107503890991, 0.0006703212857246399, 0.0006932318210601807, 0.0007161423563957214, 0.0007390528917312622, 0.000761963427066803, 0.0007848739624023438]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 9.0, 7.0, 11.0, 17.0, 25.0, 40.0, 53.0, 130.0, 396.0, 22311.0, 1023468.0, 1599.0, 214.0, 101.0, 60.0, 46.0, 20.0, 14.0, 9.0, 9.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.01800537109375, -0.017480134963989258, -0.016954898834228516, -0.016429662704467773, -0.01590442657470703, -0.015379190444946289, -0.014853954315185547, -0.014328718185424805, -0.013803482055664062, -0.01327824592590332, -0.012753009796142578, -0.012227773666381836, -0.011702537536621094, -0.011177301406860352, -0.01065206527709961, -0.010126829147338867, -0.009601593017578125, -0.009076356887817383, -0.00855112075805664, -0.008025884628295898, -0.007500648498535156, -0.006975412368774414, -0.006450176239013672, -0.00592494010925293, -0.0053997039794921875, -0.004874467849731445, -0.004349231719970703, -0.003823995590209961, -0.0032987594604492188, -0.0027735233306884766, -0.0022482872009277344, -0.0017230510711669922, -0.00119781494140625, -0.0006725788116455078, -0.00014734268188476562, 0.00037789344787597656, 0.0009031295776367188, 0.001428365707397461, 0.001953601837158203, 0.0024788379669189453, 0.0030040740966796875, 0.0035293102264404297, 0.004054546356201172, 0.004579782485961914, 0.005105018615722656, 0.0056302547454833984, 0.006155490875244141, 0.006680727005004883, 0.007205963134765625, 0.007731199264526367, 0.00825643539428711, 0.008781671524047852, 0.009306907653808594, 0.009832143783569336, 0.010357379913330078, 0.01088261604309082, 0.011407852172851562, 0.011933088302612305, 0.012458324432373047, 0.012983560562133789, 0.013508796691894531, 0.014034032821655273, 0.014559268951416016, 0.015084505081176758, 0.0156097412109375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 16.0, 156.0, 658.0, 160.0, 19.0, 3.0], "bins": [-0.004613654688000679, -0.004537419881671667, -0.004461185075342655, -0.004384950269013643, -0.004308715462684631, -0.004232480656355619, -0.0041562458500266075, -0.004080011043697596, -0.004003776237368584, -0.003927541431039572, -0.00385130662471056, -0.003775071818381548, -0.003698837012052536, -0.003622602205723524, -0.003546367399394512, -0.0034701325930655003, -0.0033938977867364883, -0.0033176629804074764, -0.0032414281740784645, -0.0031651933677494526, -0.0030889585614204407, -0.0030127237550914288, -0.002936488948762417, -0.002860254142433405, -0.002784019336104393, -0.002707784529775381, -0.002631549723446369, -0.0025553149171173573, -0.0024790801107883453, -0.0024028453044593334, -0.0023266104981303215, -0.0022503756918013096, -0.0021741408854722977, -0.0020979060791432858, -0.002021671272814274, -0.001945436466485262, -0.00186920166015625, -0.001792966853827238, -0.0017167320474982262, -0.0016404972411692142, -0.0015642623184248805, -0.0014880275120958686, -0.0014117927057668567, -0.0013355578994378448, -0.0012593230931088328, -0.001183088286779821, -0.001106853480450809, -0.001030618674121797, -0.0009543838677927852, -0.0008781490614637733, -0.0008019142551347613, -0.0007256794488057494, -0.0006494446424767375, -0.0005732098361477256, -0.0004969750298187137, -0.00042074022348970175, -0.00034450541716068983, -0.0002682706108316779, -0.000192035804502666, -0.00011580099817365408, -3.956619184464216e-05, 3.6668614484369755e-05, 0.00011290342081338167, 0.0001891382271423936, 0.0002653730334714055]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 4.0, 9.0, 8.0, 17.0, 15.0, 17.0, 16.0, 12.0, 21.0, 20.0, 17.0, 25.0, 31.0, 37.0, 39.0, 36.0, 40.0, 38.0, 41.0, 44.0, 38.0, 28.0, 46.0, 37.0, 43.0, 44.0, 32.0, 36.0, 26.0, 20.0, 25.0, 22.0, 16.0, 10.0, 13.0, 19.0, 14.0, 7.0, 7.0, 6.0, 7.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00025153160095214844, -0.0002434970811009407, -0.00023546256124973297, -0.00022742804139852524, -0.0002193935215473175, -0.00021135900169610977, -0.00020332448184490204, -0.0001952899619936943, -0.00018725544214248657, -0.00017922092229127884, -0.0001711864024400711, -0.00016315188258886337, -0.00015511736273765564, -0.0001470828428864479, -0.00013904832303524017, -0.00013101380318403244, -0.0001229792833328247, -0.00011494476348161697, -0.00010691024363040924, -9.887572377920151e-05, -9.084120392799377e-05, -8.280668407678604e-05, -7.477216422557831e-05, -6.673764437437057e-05, -5.870312452316284e-05, -5.066860467195511e-05, -4.2634084820747375e-05, -3.459956496953964e-05, -2.656504511833191e-05, -1.8530525267124176e-05, -1.0496005415916443e-05, -2.4614855647087097e-06, 5.5730342864990234e-06, 1.3607554137706757e-05, 2.164207398891449e-05, 2.9676593840122223e-05, 3.7711113691329956e-05, 4.574563354253769e-05, 5.378015339374542e-05, 6.181467324495316e-05, 6.984919309616089e-05, 7.788371294736862e-05, 8.591823279857635e-05, 9.395275264978409e-05, 0.00010198727250099182, 0.00011002179235219955, 0.00011805631220340729, 0.00012609083205461502, 0.00013412535190582275, 0.0001421598717570305, 0.00015019439160823822, 0.00015822891145944595, 0.0001662634313106537, 0.00017429795116186142, 0.00018233247101306915, 0.00019036699086427689, 0.00019840151071548462, 0.00020643603056669235, 0.00021447055041790009, 0.00022250507026910782, 0.00023053959012031555, 0.00023857410997152328, 0.000246608629822731, 0.00025464314967393875, 0.0002626776695251465]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 0.0, 1.0, 4.0, 5.0, 7.0, 6.0, 13.0, 6.0, 17.0, 11.0, 18.0, 25.0, 21.0, 28.0, 25.0, 39.0, 30.0, 38.0, 29.0, 35.0, 33.0, 36.0, 40.0, 36.0, 50.0, 34.0, 37.0, 28.0, 42.0, 28.0, 31.0, 35.0, 29.0, 28.0, 21.0, 21.0, 18.0, 19.0, 11.0, 11.0, 14.0, 8.0, 4.0, 11.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.14453125, -4.97686767578125, -4.8092041015625, -4.64154052734375, -4.473876953125, -4.30621337890625, -4.1385498046875, -3.97088623046875, -3.80322265625, -3.63555908203125, -3.4678955078125, -3.30023193359375, -3.132568359375, -2.96490478515625, -2.7972412109375, -2.62957763671875, -2.4619140625, -2.29425048828125, -2.1265869140625, -1.95892333984375, -1.791259765625, -1.62359619140625, -1.4559326171875, -1.28826904296875, -1.12060546875, -0.95294189453125, -0.7852783203125, -0.61761474609375, -0.449951171875, -0.28228759765625, -0.1146240234375, 0.05303955078125, 0.220703125, 0.38836669921875, 0.5560302734375, 0.72369384765625, 0.891357421875, 1.05902099609375, 1.2266845703125, 1.39434814453125, 1.56201171875, 1.72967529296875, 1.8973388671875, 2.06500244140625, 2.232666015625, 2.40032958984375, 2.5679931640625, 2.73565673828125, 2.9033203125, 3.07098388671875, 3.2386474609375, 3.40631103515625, 3.573974609375, 3.74163818359375, 3.9093017578125, 4.07696533203125, 4.24462890625, 4.41229248046875, 4.5799560546875, 4.74761962890625, 4.915283203125, 5.08294677734375, 5.2506103515625, 5.41827392578125, 5.5859375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 2.0, 3.0, 9.0, 5.0, 11.0, 21.0, 30.0, 50.0, 85.0, 107.0, 219.0, 420.0, 855.0, 1874.0, 4212.0, 10889.0, 31505.0, 112851.0, 496300.0, 288961.0, 66624.0, 20438.0, 7220.0, 3031.0, 1347.0, 662.0, 357.0, 172.0, 115.0, 55.0, 39.0, 20.0, 20.0, 10.0, 8.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.7059326171875, -11.325927734375, -10.9459228515625, -10.56591796875, -10.1859130859375, -9.805908203125, -9.4259033203125, -9.0458984375, -8.6658935546875, -8.285888671875, -7.9058837890625, -7.52587890625, -7.1458740234375, -6.765869140625, -6.3858642578125, -6.005859375, -5.6258544921875, -5.245849609375, -4.8658447265625, -4.48583984375, -4.1058349609375, -3.725830078125, -3.3458251953125, -2.9658203125, -2.5858154296875, -2.205810546875, -1.8258056640625, -1.44580078125, -1.0657958984375, -0.685791015625, -0.3057861328125, 0.07421875, 0.4542236328125, 0.834228515625, 1.2142333984375, 1.59423828125, 1.9742431640625, 2.354248046875, 2.7342529296875, 3.1142578125, 3.4942626953125, 3.874267578125, 4.2542724609375, 4.63427734375, 5.0142822265625, 5.394287109375, 5.7742919921875, 6.154296875, 6.5343017578125, 6.914306640625, 7.2943115234375, 7.67431640625, 8.0543212890625, 8.434326171875, 8.8143310546875, 9.1943359375, 9.5743408203125, 9.954345703125, 10.3343505859375, 10.71435546875, 11.0943603515625, 11.474365234375, 11.8543701171875, 12.234375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 4.0, 6.0, 12.0, 2.0, 10.0, 11.0, 11.0, 12.0, 15.0, 24.0, 33.0, 43.0, 40.0, 57.0, 81.0, 102.0, 188.0, 363.0, 1406.0, 175.0, 105.0, 78.0, 49.0, 49.0, 38.0, 31.0, 23.0, 21.0, 18.0, 17.0, 7.0, 8.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.9375, -18.398193359375, -17.85888671875, -17.319580078125, -16.7802734375, -16.240966796875, -15.70166015625, -15.162353515625, -14.623046875, -14.083740234375, -13.54443359375, -13.005126953125, -12.4658203125, -11.926513671875, -11.38720703125, -10.847900390625, -10.30859375, -9.769287109375, -9.22998046875, -8.690673828125, -8.1513671875, -7.612060546875, -7.07275390625, -6.533447265625, -5.994140625, -5.454833984375, -4.91552734375, -4.376220703125, -3.8369140625, -3.297607421875, -2.75830078125, -2.218994140625, -1.6796875, -1.140380859375, -0.60107421875, -0.061767578125, 0.4775390625, 1.016845703125, 1.55615234375, 2.095458984375, 2.634765625, 3.174072265625, 3.71337890625, 4.252685546875, 4.7919921875, 5.331298828125, 5.87060546875, 6.409912109375, 6.94921875, 7.488525390625, 8.02783203125, 8.567138671875, 9.1064453125, 9.645751953125, 10.18505859375, 10.724365234375, 11.263671875, 11.802978515625, 12.34228515625, 12.881591796875, 13.4208984375, 13.960205078125, 14.49951171875, 15.038818359375, 15.578125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 6.0, 7.0, 11.0, 14.0, 21.0, 30.0, 38.0, 72.0, 110.0, 159.0, 227.0, 388.0, 694.0, 1621.0, 5860.0, 1483335.0, 1643553.0, 6190.0, 1577.0, 687.0, 400.0, 239.0, 180.0, 91.0, 69.0, 42.0, 30.0, 21.0, 11.0, 11.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.53125, -32.28955078125, -31.0478515625, -29.80615234375, -28.564453125, -27.32275390625, -26.0810546875, -24.83935546875, -23.59765625, -22.35595703125, -21.1142578125, -19.87255859375, -18.630859375, -17.38916015625, -16.1474609375, -14.90576171875, -13.6640625, -12.42236328125, -11.1806640625, -9.93896484375, -8.697265625, -7.45556640625, -6.2138671875, -4.97216796875, -3.73046875, -2.48876953125, -1.2470703125, -0.00537109375, 1.236328125, 2.47802734375, 3.7197265625, 4.96142578125, 6.203125, 7.44482421875, 8.6865234375, 9.92822265625, 11.169921875, 12.41162109375, 13.6533203125, 14.89501953125, 16.13671875, 17.37841796875, 18.6201171875, 19.86181640625, 21.103515625, 22.34521484375, 23.5869140625, 24.82861328125, 26.0703125, 27.31201171875, 28.5537109375, 29.79541015625, 31.037109375, 32.27880859375, 33.5205078125, 34.76220703125, 36.00390625, 37.24560546875, 38.4873046875, 39.72900390625, 40.970703125, 42.21240234375, 43.4541015625, 44.69580078125, 45.9375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 22.0, 171.0, 518.0, 266.0, 31.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-221.76693725585938, -214.76980590820312, -207.77267456054688, -200.7755584716797, -193.77842712402344, -186.7812957763672, -179.78416442871094, -172.78704833984375, -165.7899169921875, -158.79278564453125, -151.795654296875, -144.7985382080078, -137.80140686035156, -130.8042755126953, -123.80714416503906, -116.81002044677734, -109.8128890991211, -102.81575775146484, -95.81863403320312, -88.82150268554688, -81.82437896728516, -74.8272476196289, -67.83012390136719, -60.83299255371094, -53.83586502075195, -46.83873748779297, -39.841609954833984, -32.844482421875, -25.847352981567383, -18.850223541259766, -11.853096008300781, -4.855968475341797, 2.1411590576171875, 9.138286590576172, 16.135414123535156, 23.132543563842773, 30.129671096801758, 37.126800537109375, 44.12392807006836, 51.121055603027344, 58.11818313598633, 65.11531066894531, 72.11244201660156, 79.10956573486328, 86.10669708251953, 93.10382080078125, 100.1009521484375, 107.09808349609375, 114.09520721435547, 121.09233856201172, 128.08946228027344, 135.0865936279297, 142.08372497558594, 149.08084106445312, 156.07797241210938, 163.07510375976562, 170.07223510742188, 177.06936645507812, 184.06649780273438, 191.06361389160156, 198.0607452392578, 205.05787658691406, 212.0550079345703, 219.0521240234375, 226.04925537109375]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 9.0, 4.0, 12.0, 18.0, 6.0, 17.0, 20.0, 15.0, 18.0, 23.0, 21.0, 26.0, 37.0, 30.0, 34.0, 30.0, 41.0, 40.0, 42.0, 29.0, 49.0, 42.0, 49.0, 40.0, 37.0, 44.0, 34.0, 25.0, 31.0, 29.0, 20.0, 23.0, 18.0, 20.0, 12.0, 11.0, 8.0, 5.0, 9.0, 5.0, 5.0, 1.0, 9.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.837921142578125, -37.444236755371094, -36.05055236816406, -34.65686798095703, -33.263179779052734, -31.869495391845703, -30.475811004638672, -29.08212661743164, -27.688440322875977, -26.294755935668945, -24.90106964111328, -23.50738525390625, -22.11370086669922, -20.720014572143555, -19.326330184936523, -17.93264389038086, -16.538959503173828, -15.14527416229248, -13.751588821411133, -12.357904434204102, -10.964219093322754, -9.570533752441406, -8.176849365234375, -6.783164024353027, -5.38947868347168, -3.995793581008911, -2.6021084785461426, -1.2084236145019531, 0.18526172637939453, 1.5789470672607422, 2.9726314544677734, 4.366316795349121, 5.760002136230469, 7.153687477111816, 8.547372817993164, 9.941057205200195, 11.334742546081543, 12.72842788696289, 14.122112274169922, 15.51579761505127, 16.909482955932617, 18.30316734313965, 19.696853637695312, 21.090538024902344, 22.484222412109375, 23.87790870666504, 25.27159309387207, 26.665279388427734, 28.058963775634766, 29.452648162841797, 30.84633445739746, 32.240020751953125, 33.633705139160156, 35.02738952636719, 36.42107391357422, 37.81475830078125, 39.20844268798828, 40.60212707519531, 41.995811462402344, 43.389495849609375, 44.78318405151367, 46.1768684387207, 47.570552825927734, 48.964237213134766, 50.35792541503906]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 7.0, 7.0, 12.0, 16.0, 17.0, 14.0, 20.0, 22.0, 20.0, 28.0, 33.0, 32.0, 36.0, 32.0, 32.0, 32.0, 39.0, 41.0, 32.0, 40.0, 38.0, 34.0, 38.0, 43.0, 33.0, 35.0, 32.0, 31.0, 25.0, 20.0, 22.0, 11.0, 19.0, 15.0, 13.0, 15.0, 8.0, 10.0, 8.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.484375, -5.31842041015625, -5.1524658203125, -4.98651123046875, -4.820556640625, -4.65460205078125, -4.4886474609375, -4.32269287109375, -4.15673828125, -3.99078369140625, -3.8248291015625, -3.65887451171875, -3.492919921875, -3.32696533203125, -3.1610107421875, -2.99505615234375, -2.8291015625, -2.66314697265625, -2.4971923828125, -2.33123779296875, -2.165283203125, -1.99932861328125, -1.8333740234375, -1.66741943359375, -1.50146484375, -1.33551025390625, -1.1695556640625, -1.00360107421875, -0.837646484375, -0.67169189453125, -0.5057373046875, -0.33978271484375, -0.173828125, -0.00787353515625, 0.1580810546875, 0.32403564453125, 0.489990234375, 0.65594482421875, 0.8218994140625, 0.98785400390625, 1.15380859375, 1.31976318359375, 1.4857177734375, 1.65167236328125, 1.817626953125, 1.98358154296875, 2.1495361328125, 2.31549072265625, 2.4814453125, 2.64739990234375, 2.8133544921875, 2.97930908203125, 3.145263671875, 3.31121826171875, 3.4771728515625, 3.64312744140625, 3.80908203125, 3.97503662109375, 4.1409912109375, 4.30694580078125, 4.472900390625, 4.63885498046875, 4.8048095703125, 4.97076416015625, 5.13671875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 5.0, 5.0, 9.0, 11.0, 14.0, 11.0, 33.0, 30.0, 40.0, 37.0, 68.0, 110.0, 131.0, 166.0, 223.0, 320.0, 453.0, 660.0, 1038.0, 1605.0, 2715.0, 4971.0, 9889.0, 26003.0, 141450.0, 1081529.0, 2331394.0, 495122.0, 61913.0, 16687.0, 7325.0, 3798.0, 2206.0, 1312.0, 894.0, 604.0, 383.0, 302.0, 205.0, 174.0, 103.0, 83.0, 63.0, 57.0, 39.0, 25.0, 26.0, 16.0, 9.0, 8.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.15625, -10.7879638671875, -10.419677734375, -10.0513916015625, -9.68310546875, -9.3148193359375, -8.946533203125, -8.5782470703125, -8.2099609375, -7.8416748046875, -7.473388671875, -7.1051025390625, -6.73681640625, -6.3685302734375, -6.000244140625, -5.6319580078125, -5.263671875, -4.8953857421875, -4.527099609375, -4.1588134765625, -3.79052734375, -3.4222412109375, -3.053955078125, -2.6856689453125, -2.3173828125, -1.9490966796875, -1.580810546875, -1.2125244140625, -0.84423828125, -0.4759521484375, -0.107666015625, 0.2606201171875, 0.62890625, 0.9971923828125, 1.365478515625, 1.7337646484375, 2.10205078125, 2.4703369140625, 2.838623046875, 3.2069091796875, 3.5751953125, 3.9434814453125, 4.311767578125, 4.6800537109375, 5.04833984375, 5.4166259765625, 5.784912109375, 6.1531982421875, 6.521484375, 6.8897705078125, 7.258056640625, 7.6263427734375, 7.99462890625, 8.3629150390625, 8.731201171875, 9.0994873046875, 9.4677734375, 9.8360595703125, 10.204345703125, 10.5726318359375, 10.94091796875, 11.3092041015625, 11.677490234375, 12.0457763671875, 12.4140625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 9.0, 21.0, 38.0, 49.0, 90.0, 127.0, 217.0, 340.0, 562.0, 852.0, 658.0, 433.0, 252.0, 156.0, 88.0, 63.0, 31.0, 22.0, 21.0, 13.0, 6.0, 3.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.4765625, -9.0594482421875, -8.642333984375, -8.2252197265625, -7.80810546875, -7.3909912109375, -6.973876953125, -6.5567626953125, -6.1396484375, -5.7225341796875, -5.305419921875, -4.8883056640625, -4.47119140625, -4.0540771484375, -3.636962890625, -3.2198486328125, -2.802734375, -2.3856201171875, -1.968505859375, -1.5513916015625, -1.13427734375, -0.7171630859375, -0.300048828125, 0.1170654296875, 0.5341796875, 0.9512939453125, 1.368408203125, 1.7855224609375, 2.20263671875, 2.6197509765625, 3.036865234375, 3.4539794921875, 3.87109375, 4.2882080078125, 4.705322265625, 5.1224365234375, 5.53955078125, 5.9566650390625, 6.373779296875, 6.7908935546875, 7.2080078125, 7.6251220703125, 8.042236328125, 8.4593505859375, 8.87646484375, 9.2935791015625, 9.710693359375, 10.1278076171875, 10.544921875, 10.9620361328125, 11.379150390625, 11.7962646484375, 12.21337890625, 12.6304931640625, 13.047607421875, 13.4647216796875, 13.8818359375, 14.2989501953125, 14.716064453125, 15.1331787109375, 15.55029296875, 15.9674072265625, 16.384521484375, 16.8016357421875, 17.21875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 9.0, 12.0, 9.0, 28.0, 31.0, 50.0, 57.0, 114.0, 162.0, 289.0, 526.0, 1436.0, 4722.0, 28356.0, 707687.0, 3349882.0, 87461.0, 9578.0, 2232.0, 753.0, 355.0, 199.0, 125.0, 75.0, 39.0, 29.0, 19.0, 15.0, 10.0, 2.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.640625, -19.9091796875, -19.177734375, -18.4462890625, -17.71484375, -16.9833984375, -16.251953125, -15.5205078125, -14.7890625, -14.0576171875, -13.326171875, -12.5947265625, -11.86328125, -11.1318359375, -10.400390625, -9.6689453125, -8.9375, -8.2060546875, -7.474609375, -6.7431640625, -6.01171875, -5.2802734375, -4.548828125, -3.8173828125, -3.0859375, -2.3544921875, -1.623046875, -0.8916015625, -0.16015625, 0.5712890625, 1.302734375, 2.0341796875, 2.765625, 3.4970703125, 4.228515625, 4.9599609375, 5.69140625, 6.4228515625, 7.154296875, 7.8857421875, 8.6171875, 9.3486328125, 10.080078125, 10.8115234375, 11.54296875, 12.2744140625, 13.005859375, 13.7373046875, 14.46875, 15.2001953125, 15.931640625, 16.6630859375, 17.39453125, 18.1259765625, 18.857421875, 19.5888671875, 20.3203125, 21.0517578125, 21.783203125, 22.5146484375, 23.24609375, 23.9775390625, 24.708984375, 25.4404296875, 26.171875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 70.0, 677.0, 261.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-499.9446105957031, -488.7540588378906, -477.5635070800781, -466.3729553222656, -455.1824035644531, -443.9918518066406, -432.8013000488281, -421.6107482910156, -410.4201965332031, -399.2296447753906, -388.0390930175781, -376.8485412597656, -365.6579895019531, -354.4674377441406, -343.2768859863281, -332.0863342285156, -320.895751953125, -309.7052001953125, -298.5146484375, -287.3240966796875, -276.133544921875, -264.9429931640625, -253.75244140625, -242.5618896484375, -231.371337890625, -220.1807861328125, -208.990234375, -197.7996826171875, -186.609130859375, -175.4185791015625, -164.22802734375, -153.0374755859375, -141.84693908691406, -130.65638732910156, -119.46583557128906, -108.27528381347656, -97.08473205566406, -85.89418029785156, -74.70362091064453, -63.51306915283203, -52.32251739501953, -41.13196563720703, -29.9414119720459, -18.750858306884766, -7.560306549072266, 3.6302452087402344, 14.82080078125, 26.0113525390625, 37.201904296875, 48.3924560546875, 59.5830078125, 70.7735595703125, 81.964111328125, 93.1546630859375, 104.34522247314453, 115.53577423095703, 126.72632598876953, 137.91688537597656, 149.10743713378906, 160.29798889160156, 171.48854064941406, 182.67909240722656, 193.86964416503906, 205.06019592285156, 216.25074768066406]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 3.0, 8.0, 15.0, 13.0, 12.0, 14.0, 23.0, 24.0, 22.0, 31.0, 33.0, 42.0, 33.0, 42.0, 45.0, 49.0, 52.0, 53.0, 61.0, 41.0, 41.0, 39.0, 36.0, 49.0, 38.0, 35.0, 16.0, 18.0, 17.0, 19.0, 16.0, 14.0, 9.0, 7.0, 6.0, 5.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-48.039894104003906, -46.751075744628906, -45.462257385253906, -44.173439025878906, -42.884620666503906, -41.595802307128906, -40.306983947753906, -39.018165588378906, -37.729347229003906, -36.440528869628906, -35.151710510253906, -33.862892150878906, -32.574073791503906, -31.285255432128906, -29.996435165405273, -28.707616806030273, -27.41879653930664, -26.12997817993164, -24.84115982055664, -23.55234146118164, -22.26352310180664, -20.97470474243164, -19.685884475708008, -18.397066116333008, -17.108247756958008, -15.819429397583008, -14.530611038208008, -13.241791725158691, -11.952973365783691, -10.664155006408691, -9.375335693359375, -8.086517333984375, -6.797698974609375, -5.508880615234375, -4.220061779022217, -2.9312431812286377, -1.6424245834350586, -0.3536062240600586, 0.9352126121520996, 2.224031448364258, 3.512849807739258, 4.801668167114258, 6.090487003326416, 7.379305839538574, 8.668124198913574, 9.956942558288574, 11.24576187133789, 12.53458023071289, 13.82339859008789, 15.11221694946289, 16.40103530883789, 17.68985366821289, 18.97867202758789, 20.26749038696289, 21.556310653686523, 22.845129013061523, 24.133947372436523, 25.422765731811523, 26.711584091186523, 28.000402450561523, 29.289222717285156, 30.578041076660156, 31.866859436035156, 33.155677795410156, 34.444496154785156]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 1.0, 8.0, 7.0, 10.0, 4.0, 8.0, 10.0, 6.0, 8.0, 14.0, 20.0, 12.0, 23.0, 21.0, 30.0, 24.0, 34.0, 35.0, 24.0, 37.0, 39.0, 32.0, 38.0, 50.0, 38.0, 36.0, 37.0, 41.0, 38.0, 33.0, 25.0, 40.0, 27.0, 28.0, 29.0, 16.0, 10.0, 20.0, 11.0, 10.0, 15.0, 11.0, 13.0, 10.0, 2.0, 3.0, 4.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.34375, -5.1767578125, -5.009765625, -4.8427734375, -4.67578125, -4.5087890625, -4.341796875, -4.1748046875, -4.0078125, -3.8408203125, -3.673828125, -3.5068359375, -3.33984375, -3.1728515625, -3.005859375, -2.8388671875, -2.671875, -2.5048828125, -2.337890625, -2.1708984375, -2.00390625, -1.8369140625, -1.669921875, -1.5029296875, -1.3359375, -1.1689453125, -1.001953125, -0.8349609375, -0.66796875, -0.5009765625, -0.333984375, -0.1669921875, 0.0, 0.1669921875, 0.333984375, 0.5009765625, 0.66796875, 0.8349609375, 1.001953125, 1.1689453125, 1.3359375, 1.5029296875, 1.669921875, 1.8369140625, 2.00390625, 2.1708984375, 2.337890625, 2.5048828125, 2.671875, 2.8388671875, 3.005859375, 3.1728515625, 3.33984375, 3.5068359375, 3.673828125, 3.8408203125, 4.0078125, 4.1748046875, 4.341796875, 4.5087890625, 4.67578125, 4.8427734375, 5.009765625, 5.1767578125, 5.34375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 11.0, 9.0, 14.0, 25.0, 28.0, 64.0, 67.0, 120.0, 152.0, 276.0, 414.0, 551.0, 780.0, 1175.0, 1751.0, 2468.0, 3739.0, 5378.0, 7953.0, 11753.0, 17426.0, 26033.0, 41394.0, 68597.0, 126762.0, 241114.0, 211937.0, 108364.0, 60361.0, 37100.0, 23621.0, 15783.0, 10468.0, 7232.0, 4957.0, 3405.0, 2302.0, 1638.0, 1070.0, 687.0, 517.0, 323.0, 224.0, 151.0, 127.0, 89.0, 52.0, 27.0, 30.0, 16.0, 15.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1663818359375, -0.16132164001464844, -0.15626144409179688, -0.1512012481689453, -0.14614105224609375, -0.1410808563232422, -0.13602066040039062, -0.13096046447753906, -0.1259002685546875, -0.12084007263183594, -0.11577987670898438, -0.11071968078613281, -0.10565948486328125, -0.10059928894042969, -0.09553909301757812, -0.09047889709472656, -0.085418701171875, -0.08035850524902344, -0.07529830932617188, -0.07023811340332031, -0.06517791748046875, -0.06011772155761719, -0.055057525634765625, -0.04999732971191406, -0.0449371337890625, -0.03987693786621094, -0.034816741943359375, -0.029756546020507812, -0.02469635009765625, -0.019636154174804688, -0.014575958251953125, -0.009515762329101562, -0.00445556640625, 0.0006046295166015625, 0.005664825439453125, 0.010725021362304688, 0.01578521728515625, 0.020845413208007812, 0.025905609130859375, 0.030965805053710938, 0.0360260009765625, 0.04108619689941406, 0.046146392822265625, 0.05120658874511719, 0.05626678466796875, 0.06132698059082031, 0.06638717651367188, 0.07144737243652344, 0.076507568359375, 0.08156776428222656, 0.08662796020507812, 0.09168815612792969, 0.09674835205078125, 0.10180854797363281, 0.10686874389648438, 0.11192893981933594, 0.1169891357421875, 0.12204933166503906, 0.12710952758789062, 0.1321697235107422, 0.13722991943359375, 0.1422901153564453, 0.14735031127929688, 0.15241050720214844, 0.157470703125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 0.0, 5.0, 6.0, 8.0, 5.0, 13.0, 10.0, 19.0, 19.0, 19.0, 20.0, 20.0, 19.0, 29.0, 32.0, 37.0, 36.0, 36.0, 35.0, 39.0, 38.0, 29.0, 1062.0, 37.0, 26.0, 56.0, 44.0, 48.0, 35.0, 32.0, 35.0, 13.0, 31.0, 24.0, 13.0, 14.0, 12.0, 17.0, 14.0, 4.0, 12.0, 5.0, 7.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.87109375, -4.71942138671875, -4.5677490234375, -4.41607666015625, -4.264404296875, -4.11273193359375, -3.9610595703125, -3.80938720703125, -3.65771484375, -3.50604248046875, -3.3543701171875, -3.20269775390625, -3.051025390625, -2.89935302734375, -2.7476806640625, -2.59600830078125, -2.4443359375, -2.29266357421875, -2.1409912109375, -1.98931884765625, -1.837646484375, -1.68597412109375, -1.5343017578125, -1.38262939453125, -1.23095703125, -1.07928466796875, -0.9276123046875, -0.77593994140625, -0.624267578125, -0.47259521484375, -0.3209228515625, -0.16925048828125, -0.017578125, 0.13409423828125, 0.2857666015625, 0.43743896484375, 0.589111328125, 0.74078369140625, 0.8924560546875, 1.04412841796875, 1.19580078125, 1.34747314453125, 1.4991455078125, 1.65081787109375, 1.802490234375, 1.95416259765625, 2.1058349609375, 2.25750732421875, 2.4091796875, 2.56085205078125, 2.7125244140625, 2.86419677734375, 3.015869140625, 3.16754150390625, 3.3192138671875, 3.47088623046875, 3.62255859375, 3.77423095703125, 3.9259033203125, 4.07757568359375, 4.229248046875, 4.38092041015625, 4.5325927734375, 4.68426513671875, 4.8359375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 6.0, 2.0, 12.0, 17.0, 9.0, 28.0, 28.0, 57.0, 79.0, 106.0, 177.0, 251.0, 370.0, 546.0, 841.0, 1126.0, 1674.0, 2428.0, 3455.0, 5184.0, 7621.0, 11771.0, 18063.0, 28643.0, 47428.0, 82636.0, 152420.0, 1301055.0, 183555.0, 98100.0, 55093.0, 33206.0, 20706.0, 13384.0, 8779.0, 5956.0, 3773.0, 2741.0, 1883.0, 1202.0, 804.0, 588.0, 405.0, 289.0, 209.0, 125.0, 106.0, 70.0, 48.0, 27.0, 25.0, 13.0, 10.0, 4.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.085693359375, -0.08289718627929688, -0.08010101318359375, -0.07730484008789062, -0.0745086669921875, -0.07171249389648438, -0.06891632080078125, -0.06612014770507812, -0.063323974609375, -0.060527801513671875, -0.05773162841796875, -0.054935455322265625, -0.0521392822265625, -0.049343109130859375, -0.04654693603515625, -0.043750762939453125, -0.04095458984375, -0.038158416748046875, -0.03536224365234375, -0.032566070556640625, -0.0297698974609375, -0.026973724365234375, -0.02417755126953125, -0.021381378173828125, -0.018585205078125, -0.015789031982421875, -0.01299285888671875, -0.010196685791015625, -0.0074005126953125, -0.004604339599609375, -0.00180816650390625, 0.000988006591796875, 0.0037841796875, 0.006580352783203125, 0.00937652587890625, 0.012172698974609375, 0.0149688720703125, 0.017765045166015625, 0.02056121826171875, 0.023357391357421875, 0.026153564453125, 0.028949737548828125, 0.03174591064453125, 0.034542083740234375, 0.0373382568359375, 0.040134429931640625, 0.04293060302734375, 0.045726776123046875, 0.04852294921875, 0.051319122314453125, 0.05411529541015625, 0.056911468505859375, 0.0597076416015625, 0.06250381469726562, 0.06529998779296875, 0.06809616088867188, 0.070892333984375, 0.07368850708007812, 0.07648468017578125, 0.07928085327148438, 0.0820770263671875, 0.08487319946289062, 0.08766937255859375, 0.09046554565429688, 0.09326171875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 7.0, 5.0, 2.0, 7.0, 11.0, 15.0, 20.0, 22.0, 34.0, 57.0, 89.0, 118.0, 166.0, 144.0, 81.0, 57.0, 41.0, 30.0, 28.0, 15.0, 13.0, 7.0, 2.0, 6.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011606216430664062, -0.001123964786529541, -0.0010873079299926758, -0.0010506510734558105, -0.0010139942169189453, -0.00097733736038208, -0.0009406805038452148, -0.0009040236473083496, -0.0008673667907714844, -0.0008307099342346191, -0.0007940530776977539, -0.0007573962211608887, -0.0007207393646240234, -0.0006840825080871582, -0.000647425651550293, -0.0006107687950134277, -0.0005741119384765625, -0.0005374550819396973, -0.000500798225402832, -0.0004641413688659668, -0.00042748451232910156, -0.00039082765579223633, -0.0003541707992553711, -0.00031751394271850586, -0.0002808570861816406, -0.0002442002296447754, -0.00020754337310791016, -0.00017088651657104492, -0.0001342296600341797, -9.757280349731445e-05, -6.091594696044922e-05, -2.4259090423583984e-05, 1.239776611328125e-05, 4.9054622650146484e-05, 8.571147918701172e-05, 0.00012236833572387695, 0.0001590251922607422, 0.00019568204879760742, 0.00023233890533447266, 0.0002689957618713379, 0.0003056526184082031, 0.00034230947494506836, 0.0003789663314819336, 0.00041562318801879883, 0.00045228004455566406, 0.0004889369010925293, 0.0005255937576293945, 0.0005622506141662598, 0.000598907470703125, 0.0006355643272399902, 0.0006722211837768555, 0.0007088780403137207, 0.0007455348968505859, 0.0007821917533874512, 0.0008188486099243164, 0.0008555054664611816, 0.0008921623229980469, 0.0009288191795349121, 0.0009654760360717773, 0.0010021328926086426, 0.0010387897491455078, 0.001075446605682373, 0.0011121034622192383, 0.0011487603187561035, 0.0011854171752929688]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 5.0, 2.0, 7.0, 6.0, 19.0, 21.0, 35.0, 44.0, 47.0, 115.0, 186.0, 479.0, 10880.0, 1033895.0, 1994.0, 368.0, 181.0, 75.0, 53.0, 38.0, 27.0, 16.0, 13.0, 10.0, 3.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023681640625, -0.022949695587158203, -0.022217750549316406, -0.02148580551147461, -0.020753860473632812, -0.020021915435791016, -0.01928997039794922, -0.018558025360107422, -0.017826080322265625, -0.017094135284423828, -0.01636219024658203, -0.015630245208740234, -0.014898300170898438, -0.01416635513305664, -0.013434410095214844, -0.012702465057373047, -0.01197052001953125, -0.011238574981689453, -0.010506629943847656, -0.00977468490600586, -0.009042739868164062, -0.008310794830322266, -0.007578849792480469, -0.006846904754638672, -0.006114959716796875, -0.005383014678955078, -0.004651069641113281, -0.003919124603271484, -0.0031871795654296875, -0.0024552345275878906, -0.0017232894897460938, -0.0009913444519042969, -0.0002593994140625, 0.0004725456237792969, 0.0012044906616210938, 0.0019364356994628906, 0.0026683807373046875, 0.0034003257751464844, 0.004132270812988281, 0.004864215850830078, 0.005596160888671875, 0.006328105926513672, 0.007060050964355469, 0.007791996002197266, 0.008523941040039062, 0.00925588607788086, 0.009987831115722656, 0.010719776153564453, 0.01145172119140625, 0.012183666229248047, 0.012915611267089844, 0.01364755630493164, 0.014379501342773438, 0.015111446380615234, 0.01584339141845703, 0.016575336456298828, 0.017307281494140625, 0.018039226531982422, 0.01877117156982422, 0.019503116607666016, 0.020235061645507812, 0.02096700668334961, 0.021698951721191406, 0.022430896759033203, 0.023162841796875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 67.0, 396.0, 436.0, 77.0, 19.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002718091243878007, -0.0026244448963552713, -0.0025307987816631794, -0.002437152434140444, -0.002343506319448352, -0.0022498599719256163, -0.0021562138572335243, -0.0020625675097107887, -0.001968921162188053, -0.0018752749310806394, -0.0017816286999732256, -0.00168798235245049, -0.001594336237758398, -0.0015006898902356625, -0.0014070436591282487, -0.001313397428020835, -0.001219751313328743, -0.0011261050822213292, -0.0010324588511139154, -0.0009388125617988408, -0.000845166330691427, -0.0007515200995840132, -0.0006578738102689385, -0.0005642275791615248, -0.000470581348054111, -0.00037693511694669724, -0.000283288856735453, -0.00018964259652420878, -9.599636541679502e-05, -2.3501343093812466e-06, 9.129615500569344e-05, 0.0001849423861131072, 0.000278588617220521, 0.00037223484832793474, 0.00046588110853917897, 0.0005595273687504232, 0.000653173599857837, 0.0007468198309652507, 0.0008404661202803254, 0.0009341123513877392, 0.001027758582495153, 0.0011214048136025667, 0.0012150510447099805, 0.0013086972758173943, 0.0014023436233401299, 0.0014959897380322218, 0.0015896360855549574, 0.0016832823166623712, 0.001776928547769785, 0.0018705747788771987, 0.0019642210099846125, 0.002057867357507348, 0.00215151347219944, 0.0022451598197221756, 0.002338806167244911, 0.002432452281937003, 0.002526098396629095, 0.0026197447441518307, 0.0027133908588439226, 0.002807037206366658, 0.00290068332105875, 0.0029943296685814857, 0.0030879760161042213, 0.0031816221307963133, 0.003275268478319049]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 7.0, 13.0, 13.0, 11.0, 19.0, 10.0, 23.0, 12.0, 18.0, 18.0, 29.0, 36.0, 40.0, 32.0, 34.0, 36.0, 36.0, 39.0, 42.0, 33.0, 34.0, 40.0, 37.0, 43.0, 37.0, 29.0, 34.0, 34.0, 32.0, 25.0, 24.0, 21.0, 24.0, 11.0, 16.0, 14.0, 7.0, 9.0, 7.0, 2.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005884170532226562, -0.0005696052685379982, -0.0005507934838533401, -0.0005319816991686821, -0.000513169914484024, -0.000494358129799366, -0.00047554634511470795, -0.0004567345604300499, -0.00043792277574539185, -0.0004191109910607338, -0.00040029920637607574, -0.0003814874216914177, -0.00036267563700675964, -0.0003438638523221016, -0.00032505206763744354, -0.0003062402829527855, -0.00028742849826812744, -0.0002686167135834694, -0.00024980492889881134, -0.0002309931442141533, -0.00021218135952949524, -0.0001933695748448372, -0.00017455779016017914, -0.0001557460054755211, -0.00013693422079086304, -0.00011812243610620499, -9.931065142154694e-05, -8.049886673688889e-05, -6.168708205223083e-05, -4.2875297367572784e-05, -2.4063512682914734e-05, -5.251727998256683e-06, 1.3560056686401367e-05, 3.237184137105942e-05, 5.118362605571747e-05, 6.999541074037552e-05, 8.880719542503357e-05, 0.00010761898010969162, 0.00012643076479434967, 0.00014524254947900772, 0.00016405433416366577, 0.00018286611884832382, 0.00020167790353298187, 0.00022048968821763992, 0.00023930147290229797, 0.000258113257586956, 0.0002769250422716141, 0.0002957368269562721, 0.0003145486116409302, 0.0003333603963255882, 0.0003521721810102463, 0.00037098396569490433, 0.0003897957503795624, 0.00040860753506422043, 0.0004274193197488785, 0.00044623110443353653, 0.0004650428891181946, 0.00048385467380285263, 0.0005026664584875107, 0.0005214782431721687, 0.0005402900278568268, 0.0005591018125414848, 0.0005779135972261429, 0.0005967253819108009, 0.000615537166595459]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 1.0, 8.0, 7.0, 10.0, 4.0, 8.0, 10.0, 6.0, 8.0, 14.0, 20.0, 12.0, 23.0, 21.0, 30.0, 24.0, 34.0, 35.0, 24.0, 37.0, 39.0, 32.0, 38.0, 50.0, 38.0, 36.0, 37.0, 41.0, 38.0, 33.0, 25.0, 40.0, 27.0, 28.0, 29.0, 15.0, 11.0, 20.0, 11.0, 10.0, 15.0, 11.0, 13.0, 10.0, 2.0, 3.0, 4.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.34375, -5.1767578125, -5.009765625, -4.8427734375, -4.67578125, -4.5087890625, -4.341796875, -4.1748046875, -4.0078125, -3.8408203125, -3.673828125, -3.5068359375, -3.33984375, -3.1728515625, -3.005859375, -2.8388671875, -2.671875, -2.5048828125, -2.337890625, -2.1708984375, -2.00390625, -1.8369140625, -1.669921875, -1.5029296875, -1.3359375, -1.1689453125, -1.001953125, -0.8349609375, -0.66796875, -0.5009765625, -0.333984375, -0.1669921875, 0.0, 0.1669921875, 0.333984375, 0.5009765625, 0.66796875, 0.8349609375, 1.001953125, 1.1689453125, 1.3359375, 1.5029296875, 1.669921875, 1.8369140625, 2.00390625, 2.1708984375, 2.337890625, 2.5048828125, 2.671875, 2.8388671875, 3.005859375, 3.1728515625, 3.33984375, 3.5068359375, 3.673828125, 3.8408203125, 4.0078125, 4.1748046875, 4.341796875, 4.5087890625, 4.67578125, 4.8427734375, 5.009765625, 5.1767578125, 5.34375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 4.0, 10.0, 13.0, 20.0, 25.0, 22.0, 35.0, 72.0, 71.0, 101.0, 153.0, 202.0, 293.0, 401.0, 566.0, 906.0, 1496.0, 2390.0, 4314.0, 7759.0, 14504.0, 27194.0, 53712.0, 106715.0, 209371.0, 276948.0, 166821.0, 83728.0, 41892.0, 21580.0, 11539.0, 6337.0, 3513.0, 2009.0, 1283.0, 826.0, 485.0, 370.0, 259.0, 186.0, 133.0, 84.0, 64.0, 41.0, 28.0, 23.0, 16.0, 15.0, 11.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.2734375, -5.11029052734375, -4.9471435546875, -4.78399658203125, -4.620849609375, -4.45770263671875, -4.2945556640625, -4.13140869140625, -3.96826171875, -3.80511474609375, -3.6419677734375, -3.47882080078125, -3.315673828125, -3.15252685546875, -2.9893798828125, -2.82623291015625, -2.6630859375, -2.49993896484375, -2.3367919921875, -2.17364501953125, -2.010498046875, -1.84735107421875, -1.6842041015625, -1.52105712890625, -1.35791015625, -1.19476318359375, -1.0316162109375, -0.86846923828125, -0.705322265625, -0.54217529296875, -0.3790283203125, -0.21588134765625, -0.052734375, 0.11041259765625, 0.2735595703125, 0.43670654296875, 0.599853515625, 0.76300048828125, 0.9261474609375, 1.08929443359375, 1.25244140625, 1.41558837890625, 1.5787353515625, 1.74188232421875, 1.905029296875, 2.06817626953125, 2.2313232421875, 2.39447021484375, 2.5576171875, 2.72076416015625, 2.8839111328125, 3.04705810546875, 3.210205078125, 3.37335205078125, 3.5364990234375, 3.69964599609375, 3.86279296875, 4.02593994140625, 4.1890869140625, 4.35223388671875, 4.515380859375, 4.67852783203125, 4.8416748046875, 5.00482177734375, 5.16796875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 7.0, 4.0, 9.0, 11.0, 7.0, 12.0, 25.0, 19.0, 30.0, 33.0, 51.0, 58.0, 78.0, 79.0, 149.0, 299.0, 1400.0, 267.0, 140.0, 77.0, 56.0, 50.0, 41.0, 25.0, 26.0, 24.0, 15.0, 13.0, 9.0, 16.0, 7.0, 7.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9609375, -13.3868408203125, -12.812744140625, -12.2386474609375, -11.66455078125, -11.0904541015625, -10.516357421875, -9.9422607421875, -9.3681640625, -8.7940673828125, -8.219970703125, -7.6458740234375, -7.07177734375, -6.4976806640625, -5.923583984375, -5.3494873046875, -4.775390625, -4.2012939453125, -3.627197265625, -3.0531005859375, -2.47900390625, -1.9049072265625, -1.330810546875, -0.7567138671875, -0.1826171875, 0.3914794921875, 0.965576171875, 1.5396728515625, 2.11376953125, 2.6878662109375, 3.261962890625, 3.8360595703125, 4.41015625, 4.9842529296875, 5.558349609375, 6.1324462890625, 6.70654296875, 7.2806396484375, 7.854736328125, 8.4288330078125, 9.0029296875, 9.5770263671875, 10.151123046875, 10.7252197265625, 11.29931640625, 11.8734130859375, 12.447509765625, 13.0216064453125, 13.595703125, 14.1697998046875, 14.743896484375, 15.3179931640625, 15.89208984375, 16.4661865234375, 17.040283203125, 17.6143798828125, 18.1884765625, 18.7625732421875, 19.336669921875, 19.9107666015625, 20.48486328125, 21.0589599609375, 21.633056640625, 22.2071533203125, 22.78125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 11.0, 12.0, 8.0, 12.0, 16.0, 14.0, 32.0, 46.0, 31.0, 48.0, 71.0, 102.0, 178.0, 312.0, 662.0, 3235.0, 86730.0, 2972088.0, 77559.0, 3015.0, 641.0, 308.0, 166.0, 114.0, 73.0, 64.0, 40.0, 25.0, 28.0, 16.0, 15.0, 11.0, 4.0, 5.0, 10.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-30.859375, -30.077880859375, -29.29638671875, -28.514892578125, -27.7333984375, -26.951904296875, -26.17041015625, -25.388916015625, -24.607421875, -23.825927734375, -23.04443359375, -22.262939453125, -21.4814453125, -20.699951171875, -19.91845703125, -19.136962890625, -18.35546875, -17.573974609375, -16.79248046875, -16.010986328125, -15.2294921875, -14.447998046875, -13.66650390625, -12.885009765625, -12.103515625, -11.322021484375, -10.54052734375, -9.759033203125, -8.9775390625, -8.196044921875, -7.41455078125, -6.633056640625, -5.8515625, -5.070068359375, -4.28857421875, -3.507080078125, -2.7255859375, -1.944091796875, -1.16259765625, -0.381103515625, 0.400390625, 1.181884765625, 1.96337890625, 2.744873046875, 3.5263671875, 4.307861328125, 5.08935546875, 5.870849609375, 6.65234375, 7.433837890625, 8.21533203125, 8.996826171875, 9.7783203125, 10.559814453125, 11.34130859375, 12.122802734375, 12.904296875, 13.685791015625, 14.46728515625, 15.248779296875, 16.0302734375, 16.811767578125, 17.59326171875, 18.374755859375, 19.15625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 12.0, 50.0, 118.0, 212.0, 241.0, 193.0, 111.0, 46.0, 15.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.87434768676758, -34.32606506347656, -31.777782440185547, -29.22949981689453, -26.681217193603516, -24.1329345703125, -21.584651947021484, -19.03636932373047, -16.488086700439453, -13.939804077148438, -11.391521453857422, -8.843238830566406, -6.294956207275391, -3.746673583984375, -1.1983909606933594, 1.3498916625976562, 3.898174285888672, 6.4464569091796875, 8.994739532470703, 11.543022155761719, 14.091304779052734, 16.63958740234375, 19.187870025634766, 21.73615264892578, 24.284435272216797, 26.832717895507812, 29.381000518798828, 31.929283142089844, 34.47756576538086, 37.025848388671875, 39.57413101196289, 42.122413635253906, 44.670692443847656, 47.21897506713867, 49.76725769042969, 52.3155403137207, 54.86382293701172, 57.412105560302734, 59.96038818359375, 62.508670806884766, 65.05695343017578, 67.60523986816406, 70.15351867675781, 72.70179748535156, 75.25008392333984, 77.79837036132812, 80.34664916992188, 82.89492797851562, 85.4432144165039, 87.99150085449219, 90.53977966308594, 93.08805847167969, 95.63634490966797, 98.18463134765625, 100.73291015625, 103.28118896484375, 105.82947540283203, 108.37776184082031, 110.92604064941406, 113.47431945800781, 116.0226058959961, 118.57089233398438, 121.11917114257812, 123.66744995117188, 126.21573638916016]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 4.0, 7.0, 8.0, 13.0, 22.0, 14.0, 14.0, 16.0, 25.0, 23.0, 26.0, 32.0, 34.0, 44.0, 45.0, 36.0, 48.0, 46.0, 38.0, 55.0, 34.0, 39.0, 43.0, 40.0, 41.0, 38.0, 28.0, 22.0, 24.0, 19.0, 19.0, 18.0, 15.0, 13.0, 11.0, 10.0, 11.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0], "bins": [-43.98972702026367, -42.67571258544922, -41.3616943359375, -40.04767990112305, -38.73366165161133, -37.419647216796875, -36.105628967285156, -34.7916145324707, -33.47760009765625, -32.1635856628418, -30.849567413330078, -29.535551071166992, -28.221534729003906, -26.907520294189453, -25.593503952026367, -24.27948760986328, -22.965469360351562, -21.651453018188477, -20.33743667602539, -19.023420333862305, -17.70940399169922, -16.395389556884766, -15.08137321472168, -13.767356872558594, -12.453340530395508, -11.139324188232422, -9.825307846069336, -8.511292457580566, -7.1972761154174805, -5.8832597732543945, -4.569243907928467, -3.255228042602539, -1.9412155151367188, -0.6271994113922119, 0.6868166923522949, 2.0008327960968018, 3.3148488998413086, 4.6288652420043945, 5.942881107330322, 7.25689697265625, 8.570913314819336, 9.884929656982422, 11.198945999145508, 12.512961387634277, 13.826977729797363, 15.14099407196045, 16.45500946044922, 17.769025802612305, 19.08304214477539, 20.397058486938477, 21.711074829101562, 23.02509117126465, 24.339107513427734, 25.653121948242188, 26.967138290405273, 28.28115463256836, 29.595170974731445, 30.90918731689453, 32.223201751708984, 33.5372200012207, 34.851234436035156, 36.165252685546875, 37.47926712036133, 38.79328155517578, 40.1072998046875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 4.0, 4.0, 4.0, 1.0, 4.0, 9.0, 11.0, 6.0, 7.0, 8.0, 12.0, 12.0, 18.0, 11.0, 16.0, 14.0, 22.0, 15.0, 29.0, 18.0, 31.0, 39.0, 40.0, 33.0, 42.0, 38.0, 27.0, 40.0, 42.0, 36.0, 34.0, 37.0, 37.0, 27.0, 33.0, 32.0, 25.0, 20.0, 17.0, 15.0, 13.0, 21.0, 22.0, 12.0, 14.0, 13.0, 8.0, 7.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.2578125, -5.0858154296875, -4.913818359375, -4.7418212890625, -4.56982421875, -4.3978271484375, -4.225830078125, -4.0538330078125, -3.8818359375, -3.7098388671875, -3.537841796875, -3.3658447265625, -3.19384765625, -3.0218505859375, -2.849853515625, -2.6778564453125, -2.505859375, -2.3338623046875, -2.161865234375, -1.9898681640625, -1.81787109375, -1.6458740234375, -1.473876953125, -1.3018798828125, -1.1298828125, -0.9578857421875, -0.785888671875, -0.6138916015625, -0.44189453125, -0.2698974609375, -0.097900390625, 0.0740966796875, 0.24609375, 0.4180908203125, 0.590087890625, 0.7620849609375, 0.93408203125, 1.1060791015625, 1.278076171875, 1.4500732421875, 1.6220703125, 1.7940673828125, 1.966064453125, 2.1380615234375, 2.31005859375, 2.4820556640625, 2.654052734375, 2.8260498046875, 2.998046875, 3.1700439453125, 3.342041015625, 3.5140380859375, 3.68603515625, 3.8580322265625, 4.030029296875, 4.2020263671875, 4.3740234375, 4.5460205078125, 4.718017578125, 4.8900146484375, 5.06201171875, 5.2340087890625, 5.406005859375, 5.5780029296875, 5.75]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 2.0, 5.0, 4.0, 6.0, 6.0, 17.0, 12.0, 7.0, 11.0, 13.0, 27.0, 32.0, 42.0, 59.0, 81.0, 150.0, 201.0, 359.0, 680.0, 1403.0, 3079.0, 8223.0, 28132.0, 167334.0, 2439550.0, 1411730.0, 100443.0, 20768.0, 6644.0, 2591.0, 1155.0, 610.0, 335.0, 177.0, 100.0, 67.0, 45.0, 37.0, 23.0, 27.0, 17.0, 16.0, 8.0, 15.0, 8.0, 10.0, 6.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-32.3125, -31.26611328125, -30.2197265625, -29.17333984375, -28.126953125, -27.08056640625, -26.0341796875, -24.98779296875, -23.94140625, -22.89501953125, -21.8486328125, -20.80224609375, -19.755859375, -18.70947265625, -17.6630859375, -16.61669921875, -15.5703125, -14.52392578125, -13.4775390625, -12.43115234375, -11.384765625, -10.33837890625, -9.2919921875, -8.24560546875, -7.19921875, -6.15283203125, -5.1064453125, -4.06005859375, -3.013671875, -1.96728515625, -0.9208984375, 0.12548828125, 1.171875, 2.21826171875, 3.2646484375, 4.31103515625, 5.357421875, 6.40380859375, 7.4501953125, 8.49658203125, 9.54296875, 10.58935546875, 11.6357421875, 12.68212890625, 13.728515625, 14.77490234375, 15.8212890625, 16.86767578125, 17.9140625, 18.96044921875, 20.0068359375, 21.05322265625, 22.099609375, 23.14599609375, 24.1923828125, 25.23876953125, 26.28515625, 27.33154296875, 28.3779296875, 29.42431640625, 30.470703125, 31.51708984375, 32.5634765625, 33.60986328125, 34.65625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 14.0, 15.0, 27.0, 46.0, 56.0, 101.0, 233.0, 417.0, 779.0, 930.0, 612.0, 379.0, 212.0, 114.0, 58.0, 37.0, 24.0, 5.0, 9.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.78125, -28.767578125, -27.75390625, -26.740234375, -25.7265625, -24.712890625, -23.69921875, -22.685546875, -21.671875, -20.658203125, -19.64453125, -18.630859375, -17.6171875, -16.603515625, -15.58984375, -14.576171875, -13.5625, -12.548828125, -11.53515625, -10.521484375, -9.5078125, -8.494140625, -7.48046875, -6.466796875, -5.453125, -4.439453125, -3.42578125, -2.412109375, -1.3984375, -0.384765625, 0.62890625, 1.642578125, 2.65625, 3.669921875, 4.68359375, 5.697265625, 6.7109375, 7.724609375, 8.73828125, 9.751953125, 10.765625, 11.779296875, 12.79296875, 13.806640625, 14.8203125, 15.833984375, 16.84765625, 17.861328125, 18.875, 19.888671875, 20.90234375, 21.916015625, 22.9296875, 23.943359375, 24.95703125, 25.970703125, 26.984375, 27.998046875, 29.01171875, 30.025390625, 31.0390625, 32.052734375, 33.06640625, 34.080078125, 35.09375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 4.0, 13.0, 14.0, 17.0, 24.0, 36.0, 46.0, 66.0, 66.0, 106.0, 182.0, 330.0, 718.0, 2214.0, 8853.0, 46328.0, 521715.0, 3272750.0, 298418.0, 32413.0, 6643.0, 1829.0, 609.0, 279.0, 184.0, 107.0, 77.0, 48.0, 39.0, 34.0, 32.0, 17.0, 19.0, 16.0, 6.0, 10.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.375, -35.2861328125, -34.197265625, -33.1083984375, -32.01953125, -30.9306640625, -29.841796875, -28.7529296875, -27.6640625, -26.5751953125, -25.486328125, -24.3974609375, -23.30859375, -22.2197265625, -21.130859375, -20.0419921875, -18.953125, -17.8642578125, -16.775390625, -15.6865234375, -14.59765625, -13.5087890625, -12.419921875, -11.3310546875, -10.2421875, -9.1533203125, -8.064453125, -6.9755859375, -5.88671875, -4.7978515625, -3.708984375, -2.6201171875, -1.53125, -0.4423828125, 0.646484375, 1.7353515625, 2.82421875, 3.9130859375, 5.001953125, 6.0908203125, 7.1796875, 8.2685546875, 9.357421875, 10.4462890625, 11.53515625, 12.6240234375, 13.712890625, 14.8017578125, 15.890625, 16.9794921875, 18.068359375, 19.1572265625, 20.24609375, 21.3349609375, 22.423828125, 23.5126953125, 24.6015625, 25.6904296875, 26.779296875, 27.8681640625, 28.95703125, 30.0458984375, 31.134765625, 32.2236328125, 33.3125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 5.0, 13.0, 27.0, 22.0, 16.0, 32.0, 45.0, 61.0, 69.0, 77.0, 77.0, 101.0, 80.0, 67.0, 77.0, 54.0, 40.0, 26.0, 30.0, 17.0, 15.0, 11.0, 2.0, 8.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-119.81044006347656, -115.21060180664062, -110.61077117919922, -106.01094055175781, -101.41110229492188, -96.81126403808594, -92.21143341064453, -87.61160278320312, -83.01176452636719, -78.41192626953125, -73.81209564208984, -69.21226501464844, -64.6124267578125, -60.01259231567383, -55.412757873535156, -50.812923431396484, -46.21308898925781, -41.61325454711914, -37.01342010498047, -32.4135856628418, -27.813751220703125, -23.213916778564453, -18.61408233642578, -14.01424789428711, -9.414413452148438, -4.814579010009766, -0.21474456787109375, 4.385089874267578, 8.98492431640625, 13.584758758544922, 18.184593200683594, 22.784427642822266, 27.384246826171875, 31.984081268310547, 36.58391571044922, 41.18375015258789, 45.78358459472656, 50.383419036865234, 54.983253479003906, 59.58308792114258, 64.18292236328125, 68.78276062011719, 73.3825912475586, 77.982421875, 82.58226013183594, 87.18209838867188, 91.78192901611328, 96.38175964355469, 100.98159790039062, 105.58143615722656, 110.18126678466797, 114.78109741210938, 119.38093566894531, 123.98077392578125, 128.58059692382812, 133.18043518066406, 137.7802734375, 142.38011169433594, 146.97994995117188, 151.57977294921875, 156.1796112060547, 160.77944946289062, 165.3792724609375, 169.97911071777344, 174.57894897460938]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 7.0, 9.0, 8.0, 13.0, 12.0, 9.0, 13.0, 22.0, 15.0, 18.0, 21.0, 26.0, 24.0, 35.0, 29.0, 28.0, 36.0, 43.0, 39.0, 44.0, 54.0, 37.0, 51.0, 29.0, 36.0, 41.0, 33.0, 31.0, 32.0, 39.0, 34.0, 23.0, 25.0, 18.0, 17.0, 13.0, 6.0, 8.0, 8.0, 3.0, 2.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0], "bins": [-103.0640869140625, -100.19120025634766, -97.31831359863281, -94.44542694091797, -91.57254028320312, -88.69965362548828, -85.82676696777344, -82.95388793945312, -80.08099365234375, -77.2081069946289, -74.33522033691406, -71.46233367919922, -68.58944702148438, -65.71656036376953, -62.84367752075195, -59.97079086303711, -57.09790802001953, -54.22502136230469, -51.352134704589844, -48.479248046875, -45.606361389160156, -42.73347473144531, -39.860591888427734, -36.98770523071289, -34.11481857299805, -31.241931915283203, -28.36904525756836, -25.49616050720215, -22.623273849487305, -19.75038719177246, -16.87750244140625, -14.004615783691406, -11.131729125976562, -8.258842468261719, -5.385956764221191, -2.513071060180664, 0.3598155975341797, 3.2327022552490234, 6.105587005615234, 8.978473663330078, 11.851360321044922, 14.724246978759766, 17.59713363647461, 20.47001838684082, 23.342905044555664, 26.215791702270508, 29.08867645263672, 31.961563110351562, 34.834449768066406, 37.70733642578125, 40.580223083496094, 43.45310974121094, 46.32599639892578, 49.198883056640625, 52.0717658996582, 54.94465255737305, 57.81753921508789, 60.690425872802734, 63.56331253051758, 66.43619537353516, 69.30908203125, 72.18196868896484, 75.05485534667969, 77.92774200439453, 80.80062866210938]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 7.0, 6.0, 16.0, 15.0, 15.0, 19.0, 18.0, 21.0, 26.0, 21.0, 31.0, 23.0, 35.0, 42.0, 43.0, 50.0, 44.0, 50.0, 43.0, 41.0, 47.0, 52.0, 37.0, 32.0, 38.0, 34.0, 39.0, 28.0, 31.0, 19.0, 17.0, 9.0, 10.0, 11.0, 4.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-250.625, -243.646484375, -236.66796875, -229.689453125, -222.7109375, -215.732421875, -208.75390625, -201.775390625, -194.796875, -187.818359375, -180.83984375, -173.861328125, -166.8828125, -159.904296875, -152.92578125, -145.947265625, -138.96875, -131.990234375, -125.01171875, -118.033203125, -111.0546875, -104.076171875, -97.09765625, -90.119140625, -83.140625, -76.162109375, -69.18359375, -62.205078125, -55.2265625, -48.248046875, -41.26953125, -34.291015625, -27.3125, -20.333984375, -13.35546875, -6.376953125, 0.6015625, 7.580078125, 14.55859375, 21.537109375, 28.515625, 35.494140625, 42.47265625, 49.451171875, 56.4296875, 63.408203125, 70.38671875, 77.365234375, 84.34375, 91.322265625, 98.30078125, 105.279296875, 112.2578125, 119.236328125, 126.21484375, 133.193359375, 140.171875, 147.150390625, 154.12890625, 161.107421875, 168.0859375, 175.064453125, 182.04296875, 189.021484375, 196.0]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 10.0, 18.0, 17.0, 21.0, 51.0, 87.0, 119.0, 142.0, 245.0, 428.0, 628.0, 964.0, 1668.0, 2590.0, 4469.0, 7540.0, 13304.0, 23379.0, 42008.0, 79523.0, 173573.0, 360450.0, 165376.0, 77008.0, 40903.0, 22577.0, 12837.0, 7327.0, 4410.0, 2580.0, 1628.0, 956.0, 579.0, 407.0, 239.0, 173.0, 129.0, 56.0, 41.0, 28.0, 23.0, 14.0, 16.0, 2.0, 8.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.5390625, -7.3138427734375, -7.088623046875, -6.8634033203125, -6.63818359375, -6.4129638671875, -6.187744140625, -5.9625244140625, -5.7373046875, -5.5120849609375, -5.286865234375, -5.0616455078125, -4.83642578125, -4.6112060546875, -4.385986328125, -4.1607666015625, -3.935546875, -3.7103271484375, -3.485107421875, -3.2598876953125, -3.03466796875, -2.8094482421875, -2.584228515625, -2.3590087890625, -2.1337890625, -1.9085693359375, -1.683349609375, -1.4581298828125, -1.23291015625, -1.0076904296875, -0.782470703125, -0.5572509765625, -0.33203125, -0.1068115234375, 0.118408203125, 0.3436279296875, 0.56884765625, 0.7940673828125, 1.019287109375, 1.2445068359375, 1.4697265625, 1.6949462890625, 1.920166015625, 2.1453857421875, 2.37060546875, 2.5958251953125, 2.821044921875, 3.0462646484375, 3.271484375, 3.4967041015625, 3.721923828125, 3.9471435546875, 4.17236328125, 4.3975830078125, 4.622802734375, 4.8480224609375, 5.0732421875, 5.2984619140625, 5.523681640625, 5.7489013671875, 5.97412109375, 6.1993408203125, 6.424560546875, 6.6497802734375, 6.875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 8.0, 5.0, 7.0, 13.0, 9.0, 15.0, 16.0, 17.0, 16.0, 25.0, 18.0, 27.0, 25.0, 38.0, 41.0, 30.0, 30.0, 34.0, 42.0, 44.0, 37.0, 1071.0, 29.0, 33.0, 42.0, 39.0, 30.0, 32.0, 32.0, 24.0, 28.0, 31.0, 12.0, 19.0, 12.0, 22.0, 14.0, 14.0, 14.0, 5.0, 6.0, 5.0, 3.0, 9.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.5, -133.83984375, -129.1796875, -124.51953125, -119.859375, -115.19921875, -110.5390625, -105.87890625, -101.21875, -96.55859375, -91.8984375, -87.23828125, -82.578125, -77.91796875, -73.2578125, -68.59765625, -63.9375, -59.27734375, -54.6171875, -49.95703125, -45.296875, -40.63671875, -35.9765625, -31.31640625, -26.65625, -21.99609375, -17.3359375, -12.67578125, -8.015625, -3.35546875, 1.3046875, 5.96484375, 10.625, 15.28515625, 19.9453125, 24.60546875, 29.265625, 33.92578125, 38.5859375, 43.24609375, 47.90625, 52.56640625, 57.2265625, 61.88671875, 66.546875, 71.20703125, 75.8671875, 80.52734375, 85.1875, 89.84765625, 94.5078125, 99.16796875, 103.828125, 108.48828125, 113.1484375, 117.80859375, 122.46875, 127.12890625, 131.7890625, 136.44921875, 141.109375, 145.76953125, 150.4296875, 155.08984375, 159.75]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 7.0, 12.0, 16.0, 13.0, 39.0, 44.0, 77.0, 101.0, 172.0, 254.0, 352.0, 550.0, 821.0, 1265.0, 1849.0, 2820.0, 4292.0, 6624.0, 10201.0, 15684.0, 25178.0, 40450.0, 67584.0, 124013.0, 1322280.0, 217783.0, 100715.0, 57103.0, 35064.0, 21866.0, 14004.0, 8888.0, 5835.0, 3855.0, 2526.0, 1654.0, 1054.0, 705.0, 462.0, 294.0, 215.0, 135.0, 95.0, 70.0, 39.0, 22.0, 16.0, 14.0, 6.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.95703125, -3.8365478515625, -3.716064453125, -3.5955810546875, -3.47509765625, -3.3546142578125, -3.234130859375, -3.1136474609375, -2.9931640625, -2.8726806640625, -2.752197265625, -2.6317138671875, -2.51123046875, -2.3907470703125, -2.270263671875, -2.1497802734375, -2.029296875, -1.9088134765625, -1.788330078125, -1.6678466796875, -1.54736328125, -1.4268798828125, -1.306396484375, -1.1859130859375, -1.0654296875, -0.9449462890625, -0.824462890625, -0.7039794921875, -0.58349609375, -0.4630126953125, -0.342529296875, -0.2220458984375, -0.1015625, 0.0189208984375, 0.139404296875, 0.2598876953125, 0.38037109375, 0.5008544921875, 0.621337890625, 0.7418212890625, 0.8623046875, 0.9827880859375, 1.103271484375, 1.2237548828125, 1.34423828125, 1.4647216796875, 1.585205078125, 1.7056884765625, 1.826171875, 1.9466552734375, 2.067138671875, 2.1876220703125, 2.30810546875, 2.4285888671875, 2.549072265625, 2.6695556640625, 2.7900390625, 2.9105224609375, 3.031005859375, 3.1514892578125, 3.27197265625, 3.3924560546875, 3.512939453125, 3.6334228515625, 3.75390625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 10.0, 6.0, 11.0, 15.0, 8.0, 16.0, 15.0, 24.0, 26.0, 39.0, 49.0, 58.0, 55.0, 79.0, 82.0, 84.0, 62.0, 55.0, 60.0, 54.0, 32.0, 28.0, 23.0, 24.0, 17.0, 12.0, 10.0, 8.0, 3.0, 5.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015625, -0.015136480331420898, -0.014647960662841797, -0.014159440994262695, -0.013670921325683594, -0.013182401657104492, -0.01269388198852539, -0.012205362319946289, -0.011716842651367188, -0.011228322982788086, -0.010739803314208984, -0.010251283645629883, -0.009762763977050781, -0.00927424430847168, -0.008785724639892578, -0.008297204971313477, -0.007808685302734375, -0.0073201656341552734, -0.006831645965576172, -0.00634312629699707, -0.005854606628417969, -0.005366086959838867, -0.004877567291259766, -0.004389047622680664, -0.0039005279541015625, -0.003412008285522461, -0.0029234886169433594, -0.002434968948364258, -0.0019464492797851562, -0.0014579296112060547, -0.0009694099426269531, -0.00048089027404785156, 7.62939453125e-06, 0.0004961490631103516, 0.0009846687316894531, 0.0014731884002685547, 0.0019617080688476562, 0.002450227737426758, 0.0029387474060058594, 0.003427267074584961, 0.0039157867431640625, 0.004404306411743164, 0.004892826080322266, 0.005381345748901367, 0.005869865417480469, 0.00635838508605957, 0.006846904754638672, 0.0073354244232177734, 0.007823944091796875, 0.008312463760375977, 0.008800983428955078, 0.00928950309753418, 0.009778022766113281, 0.010266542434692383, 0.010755062103271484, 0.011243581771850586, 0.011732101440429688, 0.012220621109008789, 0.01270914077758789, 0.013197660446166992, 0.013686180114746094, 0.014174699783325195, 0.014663219451904297, 0.015151739120483398, 0.0156402587890625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 5.0, 5.0, 4.0, 15.0, 19.0, 28.0, 49.0, 92.0, 112.0, 188.0, 374.0, 595.0, 1023.0, 1945.0, 3838.0, 8340.0, 18819.0, 48435.0, 152236.0, 500630.0, 208434.0, 60946.0, 23005.0, 9705.0, 4585.0, 2295.0, 1214.0, 656.0, 367.0, 232.0, 123.0, 75.0, 64.0, 41.0, 26.0, 9.0, 10.0, 8.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09222412109375, -0.08955955505371094, -0.08689498901367188, -0.08423042297363281, -0.08156585693359375, -0.07890129089355469, -0.07623672485351562, -0.07357215881347656, -0.0709075927734375, -0.06824302673339844, -0.06557846069335938, -0.06291389465332031, -0.06024932861328125, -0.05758476257324219, -0.054920196533203125, -0.05225563049316406, -0.049591064453125, -0.04692649841308594, -0.044261932373046875, -0.04159736633300781, -0.03893280029296875, -0.03626823425292969, -0.033603668212890625, -0.030939102172851562, -0.0282745361328125, -0.025609970092773438, -0.022945404052734375, -0.020280838012695312, -0.01761627197265625, -0.014951705932617188, -0.012287139892578125, -0.009622573852539062, -0.0069580078125, -0.0042934417724609375, -0.001628875732421875, 0.0010356903076171875, 0.00370025634765625, 0.0063648223876953125, 0.009029388427734375, 0.011693954467773438, 0.0143585205078125, 0.017023086547851562, 0.019687652587890625, 0.022352218627929688, 0.02501678466796875, 0.027681350708007812, 0.030345916748046875, 0.03301048278808594, 0.035675048828125, 0.03833961486816406, 0.041004180908203125, 0.04366874694824219, 0.04633331298828125, 0.04899787902832031, 0.051662445068359375, 0.05432701110839844, 0.0569915771484375, 0.05965614318847656, 0.062320709228515625, 0.06498527526855469, 0.06764984130859375, 0.07031440734863281, 0.07297897338867188, 0.07564353942871094, 0.07830810546875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 5.0, 3.0, 11.0, 7.0, 7.0, 9.0, 18.0, 20.0, 22.0, 29.0, 38.0, 55.0, 61.0, 67.0, 73.0, 74.0, 84.0, 72.0, 72.0, 47.0, 44.0, 44.0, 33.0, 25.0, 19.0, 15.0, 13.0, 3.0, 7.0, 3.0, 9.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0177143607288599, -0.017120180651545525, -0.016525998711586, -0.01593181863427162, -0.01533763762563467, -0.014743456616997719, -0.014149276539683342, -0.01355509553104639, -0.012960914522409439, -0.012366733513772488, -0.011772552505135536, -0.01117837242782116, -0.010584191419184208, -0.009990010410547256, -0.00939583033323288, -0.008801649324595928, -0.008207468315958977, -0.007613287307322025, -0.007019106764346361, -0.006424926221370697, -0.005830745212733746, -0.005236564204096794, -0.00464238366112113, -0.004048203118145466, -0.0034540221095085144, -0.0028598413337022066, -0.002265660557895899, -0.001671479782089591, -0.0010772990062832832, -0.00048311823047697544, 0.00011106254532933235, 0.0007052430883049965, 0.0012994222342967987, 0.0018936030101031065, 0.0024877837859094143, 0.003081964561715722, 0.00367614533752203, 0.004270326346158981, 0.0048645068891346455, 0.00545868743211031, 0.006052868440747261, 0.0066470494493842125, 0.007241229992359877, 0.00783541053533554, 0.008429591543972492, 0.009023772552609444, 0.00961795262992382, 0.010212133638560772, 0.010806314647197723, 0.011400495655834675, 0.011994676664471626, 0.012588856741786003, 0.013183037750422955, 0.013777218759059906, 0.014371398836374283, 0.014965579845011234, 0.015559760853648186, 0.016153940930962563, 0.01674812287092209, 0.017342302948236465, 0.017936483025550842, 0.01853066496551037, 0.019124845042824745, 0.01971902698278427, 0.020313207060098648]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 10.0, 14.0, 14.0, 13.0, 17.0, 10.0, 31.0, 21.0, 24.0, 35.0, 27.0, 34.0, 31.0, 36.0, 42.0, 46.0, 54.0, 37.0, 31.0, 39.0, 45.0, 46.0, 42.0, 33.0, 32.0, 23.0, 34.0, 22.0, 25.0, 24.0, 20.0, 15.0, 19.0, 8.0, 5.0, 6.0, 11.0, 5.0, 3.0, 0.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.011652886867523193, -0.011288831941783428, -0.010924777016043663, -0.010560722090303898, -0.010196667164564133, -0.009832612238824368, -0.009468557313084602, -0.009104502387344837, -0.008740447461605072, -0.008376392535865307, -0.008012337610125542, -0.0076482826843857765, -0.007284227758646011, -0.006920172832906246, -0.006556117907166481, -0.006192062981426716, -0.005828008055686951, -0.0054639531299471855, -0.00509989820420742, -0.004735843278467655, -0.00437178835272789, -0.004007733426988125, -0.0036436785012483597, -0.0032796235755085945, -0.0029155686497688293, -0.002551513724029064, -0.002187458798289299, -0.0018234038725495338, -0.0014593489468097687, -0.0010952940210700035, -0.0007312390953302383, -0.0003671841695904732, -3.129243850708008e-06, 0.00036092568188905716, 0.0007249806076288223, 0.0010890355333685875, 0.0014530904591083527, 0.0018171453848481178, 0.002181200310587883, 0.002545255236327648, 0.0029093101620674133, 0.0032733650878071785, 0.0036374200135469437, 0.004001474939286709, 0.004365529865026474, 0.004729584790766239, 0.005093639716506004, 0.0054576946422457695, 0.005821749567985535, 0.0061858044937253, 0.006549859419465065, 0.00691391434520483, 0.007277969270944595, 0.0076420241966843605, 0.008006079122424126, 0.00837013404816389, 0.008734188973903656, 0.009098243899643421, 0.009462298825383186, 0.009826353751122952, 0.010190408676862717, 0.010554463602602482, 0.010918518528342247, 0.011282573454082012, 0.011646628379821777]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 7.0, 6.0, 16.0, 15.0, 15.0, 19.0, 18.0, 21.0, 26.0, 21.0, 31.0, 23.0, 34.0, 43.0, 43.0, 50.0, 44.0, 49.0, 44.0, 41.0, 46.0, 53.0, 37.0, 31.0, 39.0, 33.0, 40.0, 28.0, 29.0, 21.0, 17.0, 9.0, 10.0, 11.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-250.625, -243.6484375, -236.671875, -229.6953125, -222.71875, -215.7421875, -208.765625, -201.7890625, -194.8125, -187.8359375, -180.859375, -173.8828125, -166.90625, -159.9296875, -152.953125, -145.9765625, -139.0, -132.0234375, -125.046875, -118.0703125, -111.09375, -104.1171875, -97.140625, -90.1640625, -83.1875, -76.2109375, -69.234375, -62.2578125, -55.28125, -48.3046875, -41.328125, -34.3515625, -27.375, -20.3984375, -13.421875, -6.4453125, 0.53125, 7.5078125, 14.484375, 21.4609375, 28.4375, 35.4140625, 42.390625, 49.3671875, 56.34375, 63.3203125, 70.296875, 77.2734375, 84.25, 91.2265625, 98.203125, 105.1796875, 112.15625, 119.1328125, 126.109375, 133.0859375, 140.0625, 147.0390625, 154.015625, 160.9921875, 167.96875, 174.9453125, 181.921875, 188.8984375, 195.875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 4.0, 4.0, 13.0, 6.0, 8.0, 19.0, 13.0, 22.0, 22.0, 22.0, 27.0, 41.0, 62.0, 87.0, 172.0, 270.0, 567.0, 1804.0, 14631.0, 440088.0, 567335.0, 19808.0, 1988.0, 651.0, 302.0, 184.0, 115.0, 62.0, 57.0, 42.0, 30.0, 28.0, 20.0, 7.0, 12.0, 10.0, 5.0, 6.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-49.65625, -48.27880859375, -46.9013671875, -45.52392578125, -44.146484375, -42.76904296875, -41.3916015625, -40.01416015625, -38.63671875, -37.25927734375, -35.8818359375, -34.50439453125, -33.126953125, -31.74951171875, -30.3720703125, -28.99462890625, -27.6171875, -26.23974609375, -24.8623046875, -23.48486328125, -22.107421875, -20.72998046875, -19.3525390625, -17.97509765625, -16.59765625, -15.22021484375, -13.8427734375, -12.46533203125, -11.087890625, -9.71044921875, -8.3330078125, -6.95556640625, -5.578125, -4.20068359375, -2.8232421875, -1.44580078125, -0.068359375, 1.30908203125, 2.6865234375, 4.06396484375, 5.44140625, 6.81884765625, 8.1962890625, 9.57373046875, 10.951171875, 12.32861328125, 13.7060546875, 15.08349609375, 16.4609375, 17.83837890625, 19.2158203125, 20.59326171875, 21.970703125, 23.34814453125, 24.7255859375, 26.10302734375, 27.48046875, 28.85791015625, 30.2353515625, 31.61279296875, 32.990234375, 34.36767578125, 35.7451171875, 37.12255859375, 38.5]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 8.0, 18.0, 19.0, 24.0, 20.0, 36.0, 33.0, 43.0, 65.0, 62.0, 79.0, 80.0, 2105.0, 75.0, 48.0, 63.0, 50.0, 46.0, 47.0, 25.0, 24.0, 14.0, 11.0, 10.0, 10.0, 10.0, 5.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-443.0, -429.23046875, -415.4609375, -401.69140625, -387.921875, -374.15234375, -360.3828125, -346.61328125, -332.84375, -319.07421875, -305.3046875, -291.53515625, -277.765625, -263.99609375, -250.2265625, -236.45703125, -222.6875, -208.91796875, -195.1484375, -181.37890625, -167.609375, -153.83984375, -140.0703125, -126.30078125, -112.53125, -98.76171875, -84.9921875, -71.22265625, -57.453125, -43.68359375, -29.9140625, -16.14453125, -2.375, 11.39453125, 25.1640625, 38.93359375, 52.703125, 66.47265625, 80.2421875, 94.01171875, 107.78125, 121.55078125, 135.3203125, 149.08984375, 162.859375, 176.62890625, 190.3984375, 204.16796875, 217.9375, 231.70703125, 245.4765625, 259.24609375, 273.015625, 286.78515625, 300.5546875, 314.32421875, 328.09375, 341.86328125, 355.6328125, 369.40234375, 383.171875, 396.94140625, 410.7109375, 424.48046875, 438.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 6.0, 12.0, 12.0, 19.0, 34.0, 75.0, 147.0, 333.0, 1014.0, 5484.0, 92770.0, 2982915.0, 57071.0, 4294.0, 929.0, 303.0, 135.0, 56.0, 31.0, 19.0, 5.0, 10.0, 9.0, 6.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.84375, -38.71923828125, -37.5947265625, -36.47021484375, -35.345703125, -34.22119140625, -33.0966796875, -31.97216796875, -30.84765625, -29.72314453125, -28.5986328125, -27.47412109375, -26.349609375, -25.22509765625, -24.1005859375, -22.97607421875, -21.8515625, -20.72705078125, -19.6025390625, -18.47802734375, -17.353515625, -16.22900390625, -15.1044921875, -13.97998046875, -12.85546875, -11.73095703125, -10.6064453125, -9.48193359375, -8.357421875, -7.23291015625, -6.1083984375, -4.98388671875, -3.859375, -2.73486328125, -1.6103515625, -0.48583984375, 0.638671875, 1.76318359375, 2.8876953125, 4.01220703125, 5.13671875, 6.26123046875, 7.3857421875, 8.51025390625, 9.634765625, 10.75927734375, 11.8837890625, 13.00830078125, 14.1328125, 15.25732421875, 16.3818359375, 17.50634765625, 18.630859375, 19.75537109375, 20.8798828125, 22.00439453125, 23.12890625, 24.25341796875, 25.3779296875, 26.50244140625, 27.626953125, 28.75146484375, 29.8759765625, 31.00048828125, 32.125]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 5.0, 5.0, 8.0, 14.0, 15.0, 22.0, 43.0, 51.0, 91.0, 196.0, 204.0, 153.0, 68.0, 29.0, 35.0, 15.0, 10.0, 7.0, 2.0, 6.0, 5.0, 10.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-559.679443359375, -539.1724853515625, -518.66552734375, -498.1585998535156, -477.6516418457031, -457.1446838378906, -436.63775634765625, -416.13079833984375, -395.62384033203125, -375.11688232421875, -354.60992431640625, -334.1029968261719, -313.5960388183594, -293.0890808105469, -272.5821533203125, -252.0751953125, -231.5682373046875, -211.061279296875, -190.55433654785156, -170.04739379882812, -149.54043579101562, -129.03347778320312, -108.52653503417969, -88.01959228515625, -67.51263427734375, -47.00568389892578, -26.498733520507812, -5.991783142089844, 14.515167236328125, 35.022117614746094, 55.52906799316406, 76.0360107421875, 96.54296875, 117.04991912841797, 137.55686950683594, 158.06381225585938, 178.57077026367188, 199.07772827148438, 219.5846710205078, 240.09161376953125, 260.59857177734375, 281.10552978515625, 301.61248779296875, 322.1194152832031, 342.6263732910156, 363.1333312988281, 383.6402587890625, 404.147216796875, 424.6541748046875, 445.1611328125, 465.6680908203125, 486.1750183105469, 506.6819763183594, 527.1889038085938, 547.6958618164062, 568.2028198242188, 588.7097778320312, 609.2167358398438, 629.7236938476562, 650.2306518554688, 670.737548828125, 691.2445068359375, 711.75146484375, 732.2584228515625, 752.765380859375]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 8.0, 9.0, 5.0, 7.0, 11.0, 17.0, 23.0, 16.0, 23.0, 18.0, 13.0, 26.0, 24.0, 27.0, 31.0, 55.0, 44.0, 43.0, 48.0, 49.0, 50.0, 40.0, 33.0, 34.0, 44.0, 29.0, 34.0, 27.0, 48.0, 29.0, 26.0, 18.0, 18.0, 12.0, 15.0, 7.0, 8.0, 9.0, 2.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-704.7015380859375, -684.605224609375, -664.5088500976562, -644.4125366210938, -624.316162109375, -604.2198486328125, -584.1234741210938, -564.0271606445312, -543.9307861328125, -523.83447265625, -503.73809814453125, -483.6417541503906, -463.54541015625, -443.4490661621094, -423.35272216796875, -403.25640869140625, -383.1600646972656, -363.063720703125, -342.9673767089844, -322.87103271484375, -302.7746887207031, -282.6783447265625, -262.58203125, -242.4856719970703, -222.3893280029297, -202.29298400878906, -182.19664001464844, -162.10031127929688, -142.00396728515625, -121.9076156616211, -101.811279296875, -81.71493530273438, -61.61859130859375, -41.522247314453125, -21.425907135009766, -1.3295669555664062, 18.76677703857422, 38.863121032714844, 58.95945739746094, 79.05580139160156, 99.15214538574219, 119.24848937988281, 139.34483337402344, 159.441162109375, 179.53750610351562, 199.63385009765625, 219.73019409179688, 239.8265380859375, 259.9228820800781, 280.01922607421875, 300.1155700683594, 320.2119140625, 340.3082580566406, 360.40460205078125, 380.50091552734375, 400.5972900390625, 420.693603515625, 440.7899475097656, 460.88629150390625, 480.9826354980469, 501.0789794921875, 521.17529296875, 541.2716674804688, 561.3679809570312, 581.46435546875]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 1.0, 4.0, 4.0, 4.0, 9.0, 8.0, 10.0, 9.0, 9.0, 12.0, 22.0, 24.0, 29.0, 37.0, 27.0, 51.0, 54.0, 109.0, 177.0, 263.0, 552.0, 1553.0, 5682.0, 1025233.0, 10269.0, 2567.0, 775.0, 362.0, 226.0, 138.0, 71.0, 51.0, 41.0, 27.0, 30.0, 12.0, 14.0, 17.0, 11.0, 18.0, 11.0, 7.0, 6.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-148.81954956054688, -144.12600708007812, -139.43246459960938, -134.73892211914062, -130.0453643798828, -125.35182189941406, -120.65827941894531, -115.96473693847656, -111.27119445800781, -106.57765197753906, -101.88410186767578, -97.19055938720703, -92.49701690673828, -87.803466796875, -83.10992431640625, -78.4163818359375, -73.72283172607422, -69.02928924560547, -64.33573913574219, -59.64219665527344, -54.94865417480469, -50.25510787963867, -45.561561584472656, -40.868019104003906, -36.17447280883789, -31.480928421020508, -26.787384033203125, -22.09383773803711, -17.400293350219727, -12.706748962402344, -8.013202667236328, -3.319660186767578, 1.3738861083984375, 6.0674309730529785, 10.76097583770752, 15.454521179199219, 20.1480655670166, 24.841609954833984, 29.53515625, 34.22869873046875, 38.922245025634766, 43.61579132080078, 48.30933380126953, 53.00288009643555, 57.69642639160156, 62.38996887207031, 67.08351135253906, 71.77705383300781, 76.4706039428711, 81.16414642333984, 85.85769653320312, 90.55123901367188, 95.24478149414062, 99.93832397460938, 104.63187408447266, 109.3254165649414, 114.01896667480469, 118.71250915527344, 123.40605926513672, 128.099609375, 132.79315185546875, 137.4866943359375, 142.18023681640625, 146.873779296875, 151.56732177734375]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 2.0, 5.0, 12.0, 12.0, 24.0, 30.0, 65.0, 85.0, 155.0, 286.0, 550.0, 2039.0, 49823.0, 51402116.0, 6298.0, 911.0, 310.0, 159.0, 93.0, 56.0, 30.0, 10.0, 15.0, 17.0, 15.0, 6.0, 8.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-407.26434326171875, -394.21893310546875, -381.1735534667969, -368.1281433105469, -355.082763671875, -342.037353515625, -328.991943359375, -315.9465637207031, -302.90118408203125, -289.85577392578125, -276.8103942871094, -263.7649841308594, -250.7196044921875, -237.6741943359375, -224.62879943847656, -211.58340454101562, -198.53799438476562, -185.4925994873047, -172.44720458984375, -159.40179443359375, -146.35641479492188, -133.31100463867188, -120.26560974121094, -107.22021484375, -94.17481994628906, -81.12942504882812, -68.08403015136719, -55.03862762451172, -41.99323272705078, -28.947837829589844, -15.902435302734375, -2.8570404052734375, 10.188385009765625, 23.233781814575195, 36.279178619384766, 49.32457733154297, 62.369972229003906, 75.41536712646484, 88.46076965332031, 101.50616455078125, 114.55155944824219, 127.59695434570312, 140.64234924316406, 153.687744140625, 166.733154296875, 179.77853393554688, 192.82394409179688, 205.8693389892578, 218.91473388671875, 231.9601287841797, 245.00552368164062, 258.0509338378906, 271.0963134765625, 284.1417236328125, 297.1871337890625, 310.2325134277344, 323.27789306640625, 336.32330322265625, 349.3686828613281, 362.4140930175781, 375.45947265625, 388.5048828125, 401.55029296875, 414.5956726074219, 427.6410827636719]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 2.0, 8.0, 21.0, 19.0, 33.0, 61.0, 75.0, 119.0, 196.0, 338.0, 471.0, 742.0, 1195.0, 1776.0, 2593.0, 3998.0, 6034.0, 9242.0, 14371.0, 23046.0, 36345.0, 58880.0, 99671.0, 175856.0, 340920.0, 783054.0, 3871106.0, 385483.0, 195006.0, 109252.0, 64453.0, 38800.0, 24846.0, 15508.0, 9789.0, 6259.0, 4011.0, 2649.0, 1727.0, 1129.0, 739.0, 530.0, 325.0, 246.0, 170.0, 116.0, 85.0, 42.0, 35.0, 29.0, 14.0, 5.0, 0.0, 2.0, 2.0, 1.0, 5.0], "bins": [-1.134765625, -1.1004638671875, -1.066162109375, -1.0318603515625, -0.99755859375, -0.9632568359375, -0.928955078125, -0.8946533203125, -0.8603515625, -0.8260498046875, -0.791748046875, -0.7574462890625, -0.72314453125, -0.6888427734375, -0.654541015625, -0.6202392578125, -0.5859375, -0.5516357421875, -0.517333984375, -0.4830322265625, -0.44873046875, -0.4144287109375, -0.380126953125, -0.3458251953125, -0.3115234375, -0.2772216796875, -0.242919921875, -0.2086181640625, -0.17431640625, -0.1400146484375, -0.105712890625, -0.0714111328125, -0.037109375, -0.0028076171875, 0.031494140625, 0.0657958984375, 0.10009765625, 0.1343994140625, 0.168701171875, 0.2030029296875, 0.2373046875, 0.2716064453125, 0.305908203125, 0.3402099609375, 0.37451171875, 0.4088134765625, 0.443115234375, 0.4774169921875, 0.51171875, 0.5460205078125, 0.580322265625, 0.6146240234375, 0.64892578125, 0.6832275390625, 0.717529296875, 0.7518310546875, 0.7861328125, 0.8204345703125, 0.854736328125, 0.8890380859375, 0.92333984375, 0.9576416015625, 0.991943359375, 1.0262451171875, 1.060546875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 11.0, 5.0, 7.0, 15.0, 12.0, 13.0, 24.0, 13.0, 36.0, 24.0, 32.0, 37.0, 35.0, 37.0, 41.0, 35.0, 39.0, 53.0, 1064.0, 41.0, 54.0, 44.0, 35.0, 35.0, 33.0, 32.0, 26.0, 27.0, 28.0, 12.0, 22.0, 17.0, 12.0, 9.0, 10.0, 11.0, 7.0, 6.0, 8.0, 6.0, 1.0, 3.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-68.0, -65.90234375, -63.8046875, -61.70703125, -59.609375, -57.51171875, -55.4140625, -53.31640625, -51.21875, -49.12109375, -47.0234375, -44.92578125, -42.828125, -40.73046875, -38.6328125, -36.53515625, -34.4375, -32.33984375, -30.2421875, -28.14453125, -26.046875, -23.94921875, -21.8515625, -19.75390625, -17.65625, -15.55859375, -13.4609375, -11.36328125, -9.265625, -7.16796875, -5.0703125, -2.97265625, -0.875, 1.22265625, 3.3203125, 5.41796875, 7.515625, 9.61328125, 11.7109375, 13.80859375, 15.90625, 18.00390625, 20.1015625, 22.19921875, 24.296875, 26.39453125, 28.4921875, 30.58984375, 32.6875, 34.78515625, 36.8828125, 38.98046875, 41.078125, 43.17578125, 45.2734375, 47.37109375, 49.46875, 51.56640625, 53.6640625, 55.76171875, 57.859375, 59.95703125, 62.0546875, 64.15234375, 66.25]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 4.0, 5.0, 1.0, 6.0, 9.0, 9.0, 9.0, 30.0, 38.0, 45.0, 68.0, 120.0, 158.0, 226.0, 349.0, 481.0, 754.0, 1175.0, 1732.0, 2617.0, 4137.0, 6467.0, 10102.0, 15675.0, 25011.0, 39961.0, 66043.0, 114546.0, 215911.0, 440240.0, 3932259.0, 674187.0, 332650.0, 168221.0, 92687.0, 54211.0, 33213.0, 20643.0, 13314.0, 8331.0, 5452.0, 3527.0, 2330.0, 1530.0, 971.0, 661.0, 425.0, 270.0, 190.0, 126.0, 78.0, 61.0, 54.0, 41.0, 29.0, 14.0, 15.0, 9.0, 10.0, 5.0, 4.0], "bins": [-0.94775390625, -0.9197235107421875, -0.891693115234375, -0.8636627197265625, -0.83563232421875, -0.8076019287109375, -0.779571533203125, -0.7515411376953125, -0.7235107421875, -0.6954803466796875, -0.667449951171875, -0.6394195556640625, -0.61138916015625, -0.5833587646484375, -0.555328369140625, -0.5272979736328125, -0.499267578125, -0.4712371826171875, -0.443206787109375, -0.4151763916015625, -0.38714599609375, -0.3591156005859375, -0.331085205078125, -0.3030548095703125, -0.2750244140625, -0.2469940185546875, -0.218963623046875, -0.1909332275390625, -0.16290283203125, -0.1348724365234375, -0.106842041015625, -0.0788116455078125, -0.05078125, -0.0227508544921875, 0.005279541015625, 0.0333099365234375, 0.06134033203125, 0.0893707275390625, 0.117401123046875, 0.1454315185546875, 0.1734619140625, 0.2014923095703125, 0.229522705078125, 0.2575531005859375, 0.28558349609375, 0.3136138916015625, 0.341644287109375, 0.3696746826171875, 0.397705078125, 0.4257354736328125, 0.453765869140625, 0.4817962646484375, 0.50982666015625, 0.5378570556640625, 0.565887451171875, 0.5939178466796875, 0.6219482421875, 0.6499786376953125, 0.678009033203125, 0.7060394287109375, 0.73406982421875, 0.7621002197265625, 0.790130615234375, 0.8181610107421875, 0.84619140625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 3.0, 11.0, 10.0, 10.0, 12.0, 11.0, 10.0, 13.0, 14.0, 23.0, 19.0, 20.0, 19.0, 29.0, 31.0, 38.0, 31.0, 30.0, 42.0, 30.0, 34.0, 1061.0, 33.0, 51.0, 36.0, 40.0, 37.0, 40.0, 31.0, 33.0, 23.0, 14.0, 25.0, 15.0, 21.0, 19.0, 11.0, 14.0, 14.0, 8.0, 8.0, 8.0, 6.0, 6.0, 5.0, 4.0, 1.0, 8.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-47.78125, -46.2177734375, -44.654296875, -43.0908203125, -41.52734375, -39.9638671875, -38.400390625, -36.8369140625, -35.2734375, -33.7099609375, -32.146484375, -30.5830078125, -29.01953125, -27.4560546875, -25.892578125, -24.3291015625, -22.765625, -21.2021484375, -19.638671875, -18.0751953125, -16.51171875, -14.9482421875, -13.384765625, -11.8212890625, -10.2578125, -8.6943359375, -7.130859375, -5.5673828125, -4.00390625, -2.4404296875, -0.876953125, 0.6865234375, 2.25, 3.8134765625, 5.376953125, 6.9404296875, 8.50390625, 10.0673828125, 11.630859375, 13.1943359375, 14.7578125, 16.3212890625, 17.884765625, 19.4482421875, 21.01171875, 22.5751953125, 24.138671875, 25.7021484375, 27.265625, 28.8291015625, 30.392578125, 31.9560546875, 33.51953125, 35.0830078125, 36.646484375, 38.2099609375, 39.7734375, 41.3369140625, 42.900390625, 44.4638671875, 46.02734375, 47.5908203125, 49.154296875, 50.7177734375, 52.28125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 11.0, 18.0, 12.0, 23.0, 31.0, 34.0, 50.0, 58.0, 69.0, 116.0, 127.0, 134.0, 199.0, 260.0, 333.0, 466.0, 702.0, 981.0, 1525.0, 2588.0, 5597.0, 14041.0, 42023.0, 198596.0, 5906098.0, 77368.0, 21565.0, 8411.0, 3772.0, 1990.0, 1154.0, 790.0, 535.0, 407.0, 308.0, 241.0, 218.0, 152.0, 101.0, 82.0, 52.0, 55.0, 40.0, 32.0, 19.0, 13.0, 13.0, 11.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.30078125, -4.16302490234375, -4.0252685546875, -3.88751220703125, -3.749755859375, -3.61199951171875, -3.4742431640625, -3.33648681640625, -3.19873046875, -3.06097412109375, -2.9232177734375, -2.78546142578125, -2.647705078125, -2.50994873046875, -2.3721923828125, -2.23443603515625, -2.0966796875, -1.95892333984375, -1.8211669921875, -1.68341064453125, -1.545654296875, -1.40789794921875, -1.2701416015625, -1.13238525390625, -0.99462890625, -0.85687255859375, -0.7191162109375, -0.58135986328125, -0.443603515625, -0.30584716796875, -0.1680908203125, -0.03033447265625, 0.107421875, 0.24517822265625, 0.3829345703125, 0.52069091796875, 0.658447265625, 0.79620361328125, 0.9339599609375, 1.07171630859375, 1.20947265625, 1.34722900390625, 1.4849853515625, 1.62274169921875, 1.760498046875, 1.89825439453125, 2.0360107421875, 2.17376708984375, 2.3115234375, 2.44927978515625, 2.5870361328125, 2.72479248046875, 2.862548828125, 3.00030517578125, 3.1380615234375, 3.27581787109375, 3.41357421875, 3.55133056640625, 3.6890869140625, 3.82684326171875, 3.964599609375, 4.10235595703125, 4.2401123046875, 4.37786865234375, 4.515625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 8.0, 9.0, 11.0, 10.0, 9.0, 21.0, 18.0, 15.0, 23.0, 19.0, 27.0, 23.0, 33.0, 35.0, 36.0, 27.0, 29.0, 33.0, 31.0, 41.0, 1073.0, 32.0, 47.0, 32.0, 37.0, 27.0, 32.0, 34.0, 36.0, 31.0, 18.0, 31.0, 14.0, 15.0, 14.0, 19.0, 16.0, 16.0, 10.0, 6.0, 7.0, 5.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-52.0625, -50.552734375, -49.04296875, -47.533203125, -46.0234375, -44.513671875, -43.00390625, -41.494140625, -39.984375, -38.474609375, -36.96484375, -35.455078125, -33.9453125, -32.435546875, -30.92578125, -29.416015625, -27.90625, -26.396484375, -24.88671875, -23.376953125, -21.8671875, -20.357421875, -18.84765625, -17.337890625, -15.828125, -14.318359375, -12.80859375, -11.298828125, -9.7890625, -8.279296875, -6.76953125, -5.259765625, -3.75, -2.240234375, -0.73046875, 0.779296875, 2.2890625, 3.798828125, 5.30859375, 6.818359375, 8.328125, 9.837890625, 11.34765625, 12.857421875, 14.3671875, 15.876953125, 17.38671875, 18.896484375, 20.40625, 21.916015625, 23.42578125, 24.935546875, 26.4453125, 27.955078125, 29.46484375, 30.974609375, 32.484375, 33.994140625, 35.50390625, 37.013671875, 38.5234375, 40.033203125, 41.54296875, 43.052734375, 44.5625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 13.0, 128.0, 808.0, 31.0, 9.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-701.2349853515625, -687.2791748046875, -673.3233032226562, -659.3674926757812, -645.4116821289062, -631.4558715820312, -617.5, -603.544189453125, -589.58837890625, -575.632568359375, -561.6766967773438, -547.7208862304688, -533.7650756835938, -519.8092651367188, -505.8533935546875, -491.8975830078125, -477.9417419433594, -463.98590087890625, -450.03009033203125, -436.0742492675781, -422.1184387207031, -408.16259765625, -394.206787109375, -380.2509460449219, -366.29510498046875, -352.3392639160156, -338.3834533691406, -324.4276123046875, -310.4718017578125, -296.5159606933594, -282.56011962890625, -268.60430908203125, -254.64846801757812, -240.69264221191406, -226.73681640625, -212.78097534179688, -198.82516479492188, -184.86932373046875, -170.9134979248047, -156.95767211914062, -143.00184631347656, -129.0460205078125, -115.09019470214844, -101.13436126708984, -87.17853546142578, -73.22270965576172, -59.266876220703125, -45.31105041503906, -31.355224609375, -17.399396896362305, -3.4435691833496094, 10.512260437011719, 24.46808624267578, 38.423912048339844, 52.37974548339844, 66.3355712890625, 80.29139709472656, 94.24722290039062, 108.20304870605469, 122.15888214111328, 136.11471557617188, 150.07052612304688, 164.0263671875, 177.98219299316406, 191.93801879882812]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 1.0, 4.0, 10.0, 10.0, 16.0, 15.0, 18.0, 22.0, 26.0, 33.0, 22.0, 37.0, 31.0, 44.0, 41.0, 40.0, 46.0, 42.0, 46.0, 48.0, 44.0, 45.0, 41.0, 39.0, 40.0, 35.0, 27.0, 24.0, 23.0, 20.0, 15.0, 15.0, 12.0, 12.0, 9.0, 9.0, 8.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-127.25540161132812, -123.369873046875, -119.48434448242188, -115.59882354736328, -111.71329498291016, -107.82776641845703, -103.94224548339844, -100.05671691894531, -96.17118835449219, -92.28565979003906, -88.40013122558594, -84.51461029052734, -80.62908172607422, -76.7435531616211, -72.8580322265625, -68.97250366210938, -65.08697509765625, -61.201446533203125, -57.315921783447266, -53.430397033691406, -49.54486846923828, -45.659339904785156, -41.7738151550293, -37.88829040527344, -34.00276184082031, -30.11723518371582, -26.231708526611328, -22.346181869506836, -18.460655212402344, -14.575128555297852, -10.68960189819336, -6.804075241088867, -2.918548583984375, 0.9669780731201172, 4.852504730224609, 8.738031387329102, 12.623558044433594, 16.509084701538086, 20.394611358642578, 24.28013801574707, 28.165664672851562, 32.05119323730469, 35.93671798706055, 39.822242736816406, 43.70777130126953, 47.593299865722656, 51.478824615478516, 55.364349365234375, 59.2498779296875, 63.135406494140625, 67.02093505859375, 70.90645599365234, 74.79198455810547, 78.6775131225586, 82.56303405761719, 86.44856262207031, 90.33409118652344, 94.21961975097656, 98.10514831542969, 101.99066925048828, 105.8761978149414, 109.76172637939453, 113.64724731445312, 117.53277587890625, 121.41830444335938]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 0.0, 6.0, 2.0, 6.0, 2.0, 1.0, 6.0, 0.0, 4.0, 3.0, 7.0, 18.0, 6.0, 3.0, 1.0, 16.0, 5.0, 14.0, 15.0, 11.0, 15.0, 14.0, 24.0, 26.0, 39.0, 76.0, 103.0, 360.0, 2873.0, 56601.0, 4117218.0, 14809.0, 1520.0, 213.0, 46.0, 30.0, 35.0, 33.0, 19.0, 15.0, 10.0, 18.0, 4.0, 12.0, 8.0, 8.0, 2.0, 6.0, 5.0, 8.0, 0.0, 4.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0], "bins": [-0.1676025390625, -0.1627063751220703, -0.15781021118164062, -0.15291404724121094, -0.14801788330078125, -0.14312171936035156, -0.13822555541992188, -0.1333293914794922, -0.1284332275390625, -0.12353706359863281, -0.11864089965820312, -0.11374473571777344, -0.10884857177734375, -0.10395240783691406, -0.09905624389648438, -0.09416007995605469, -0.089263916015625, -0.08436775207519531, -0.07947158813476562, -0.07457542419433594, -0.06967926025390625, -0.06478309631347656, -0.059886932373046875, -0.05499076843261719, -0.0500946044921875, -0.04519844055175781, -0.040302276611328125, -0.03540611267089844, -0.03050994873046875, -0.025613784790039062, -0.020717620849609375, -0.015821456909179688, -0.01092529296875, -0.0060291290283203125, -0.001132965087890625, 0.0037631988525390625, 0.00865936279296875, 0.013555526733398438, 0.018451690673828125, 0.023347854614257812, 0.0282440185546875, 0.03314018249511719, 0.038036346435546875, 0.04293251037597656, 0.04782867431640625, 0.05272483825683594, 0.057621002197265625, 0.06251716613769531, 0.067413330078125, 0.07230949401855469, 0.07720565795898438, 0.08210182189941406, 0.08699798583984375, 0.09189414978027344, 0.09679031372070312, 0.10168647766113281, 0.1065826416015625, 0.11147880554199219, 0.11637496948242188, 0.12127113342285156, 0.12616729736328125, 0.13106346130371094, 0.13595962524414062, 0.1408557891845703, 0.145751953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 5.0, 4.0, 10.0, 6.0, 7.0, 13.0, 13.0, 17.0, 715.0, 94.0, 20.0, 15.0, 6.0, 4.0, 10.0, 11.0, 2.0, 4.0, 4.0, 4.0, 3.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1058349609375, -0.10268402099609375, -0.0995330810546875, -0.09638214111328125, -0.093231201171875, -0.09008026123046875, -0.0869293212890625, -0.08377838134765625, -0.08062744140625, -0.07747650146484375, -0.0743255615234375, -0.07117462158203125, -0.068023681640625, -0.06487274169921875, -0.0617218017578125, -0.05857086181640625, -0.055419921875, -0.05226898193359375, -0.0491180419921875, -0.04596710205078125, -0.042816162109375, -0.03966522216796875, -0.0365142822265625, -0.03336334228515625, -0.03021240234375, -0.02706146240234375, -0.0239105224609375, -0.02075958251953125, -0.017608642578125, -0.01445770263671875, -0.0113067626953125, -0.00815582275390625, -0.0050048828125, -0.00185394287109375, 0.0012969970703125, 0.00444793701171875, 0.007598876953125, 0.01074981689453125, 0.0139007568359375, 0.01705169677734375, 0.02020263671875, 0.02335357666015625, 0.0265045166015625, 0.02965545654296875, 0.032806396484375, 0.03595733642578125, 0.0391082763671875, 0.04225921630859375, 0.04541015625, 0.04856109619140625, 0.0517120361328125, 0.05486297607421875, 0.058013916015625, 0.06116485595703125, 0.0643157958984375, 0.06746673583984375, 0.07061767578125, 0.07376861572265625, 0.0769195556640625, 0.08007049560546875, 0.083221435546875, 0.08637237548828125, 0.0895233154296875, 0.09267425537109375, 0.0958251953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 9.0, 2.0, 5.0, 14.0, 2.0, 12.0, 19.0, 21.0, 37.0, 71.0, 108.0, 138.0, 313.0, 537.0, 1440.0, 5015.0, 204959.0, 3970652.0, 8460.0, 1577.0, 458.0, 177.0, 83.0, 58.0, 39.0, 18.0, 19.0, 7.0, 7.0, 5.0, 5.0, 4.0, 7.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177490234375, -0.17196083068847656, -0.16643142700195312, -0.1609020233154297, -0.15537261962890625, -0.1498432159423828, -0.14431381225585938, -0.13878440856933594, -0.1332550048828125, -0.12772560119628906, -0.12219619750976562, -0.11666679382324219, -0.11113739013671875, -0.10560798645019531, -0.10007858276367188, -0.09454917907714844, -0.089019775390625, -0.08349037170410156, -0.07796096801757812, -0.07243156433105469, -0.06690216064453125, -0.06137275695800781, -0.055843353271484375, -0.05031394958496094, -0.0447845458984375, -0.03925514221191406, -0.033725738525390625, -0.028196334838867188, -0.02266693115234375, -0.017137527465820312, -0.011608123779296875, -0.0060787200927734375, -0.00054931640625, 0.0049800872802734375, 0.010509490966796875, 0.016038894653320312, 0.02156829833984375, 0.027097702026367188, 0.032627105712890625, 0.03815650939941406, 0.0436859130859375, 0.04921531677246094, 0.054744720458984375, 0.06027412414550781, 0.06580352783203125, 0.07133293151855469, 0.07686233520507812, 0.08239173889160156, 0.087921142578125, 0.09345054626464844, 0.09897994995117188, 0.10450935363769531, 0.11003875732421875, 0.11556816101074219, 0.12109756469726562, 0.12662696838378906, 0.1321563720703125, 0.13768577575683594, 0.14321517944335938, 0.1487445831298828, 0.15427398681640625, 0.1598033905029297, 0.16533279418945312, 0.17086219787597656, 0.1763916015625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 9.0, 7.0, 4.0, 24.0, 67.0, 290.0, 2684.0, 719.0, 151.0, 48.0, 22.0, 14.0, 3.0, 7.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1121826171875, -0.10921096801757812, -0.10623931884765625, -0.10326766967773438, -0.1002960205078125, -0.09732437133789062, -0.09435272216796875, -0.09138107299804688, -0.088409423828125, -0.08543777465820312, -0.08246612548828125, -0.07949447631835938, -0.0765228271484375, -0.07355117797851562, -0.07057952880859375, -0.06760787963867188, -0.06463623046875, -0.061664581298828125, -0.05869293212890625, -0.055721282958984375, -0.0527496337890625, -0.049777984619140625, -0.04680633544921875, -0.043834686279296875, -0.040863037109375, -0.037891387939453125, -0.03491973876953125, -0.031948089599609375, -0.0289764404296875, -0.026004791259765625, -0.02303314208984375, -0.020061492919921875, -0.01708984375, -0.014118194580078125, -0.01114654541015625, -0.008174896240234375, -0.0052032470703125, -0.002231597900390625, 0.00074005126953125, 0.003711700439453125, 0.006683349609375, 0.009654998779296875, 0.01262664794921875, 0.015598297119140625, 0.0185699462890625, 0.021541595458984375, 0.02451324462890625, 0.027484893798828125, 0.03045654296875, 0.033428192138671875, 0.03639984130859375, 0.039371490478515625, 0.0423431396484375, 0.045314788818359375, 0.04828643798828125, 0.051258087158203125, 0.054229736328125, 0.057201385498046875, 0.06017303466796875, 0.06314468383789062, 0.0661163330078125, 0.06908798217773438, 0.07205963134765625, 0.07503128051757812, 0.0780029296875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 7.0, 10.0, 27.0, 606.0, 305.0, 27.0, 9.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.5389622449874878, -0.5269617438316345, -0.5149612426757812, -0.502960741519928, -0.4909602701663971, -0.4789597690105438, -0.46695929765701294, -0.45495879650115967, -0.4429582953453064, -0.4309577941894531, -0.41895729303359985, -0.40695682168006897, -0.3949563205242157, -0.3829558193683624, -0.37095534801483154, -0.35895484685897827, -0.346954345703125, -0.33495384454727173, -0.32295334339141846, -0.3109528720378876, -0.2989523708820343, -0.28695186972618103, -0.27495139837265015, -0.2629508972167969, -0.2509503960609436, -0.23894989490509033, -0.22694940865039825, -0.21494892239570618, -0.2029484212398529, -0.19094792008399963, -0.17894743382930756, -0.16694694757461548, -0.1549464464187622, -0.14294594526290894, -0.13094545900821686, -0.11894496530294418, -0.10694447159767151, -0.09494397789239883, -0.08294348418712616, -0.07094299048185349, -0.05894249677658081, -0.046942003071308136, -0.03494150936603546, -0.022941015660762787, -0.010940521955490112, 0.0010599717497825623, 0.013060465455055237, 0.02506095916032791, 0.037061452865600586, 0.04906194657087326, 0.061062440276145935, 0.07306293398141861, 0.08506342768669128, 0.09706392139196396, 0.10906441509723663, 0.12106490880250931, 0.13306540250778198, 0.14506590366363525, 0.15706638991832733, 0.1690668761730194, 0.18106737732887268, 0.19306787848472595, 0.20506836473941803, 0.2170688509941101, 0.22906935214996338]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 4.0, 10.0, 7.0, 5.0, 9.0, 5.0, 13.0, 26.0, 44.0, 55.0, 101.0, 128.0, 132.0, 131.0, 96.0, 75.0, 42.0, 22.0, 16.0, 11.0, 7.0, 5.0, 10.0, 5.0, 5.0, 0.0, 7.0, 6.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.39849191904067993, -0.3884199559688568, -0.3783479928970337, -0.3682760000228882, -0.35820403695106506, -0.34813207387924194, -0.33806008100509644, -0.3279881179332733, -0.3179161548614502, -0.3078441917896271, -0.29777222871780396, -0.28770023584365845, -0.2776282727718353, -0.2675563097000122, -0.2574843168258667, -0.24741235375404358, -0.23734039068222046, -0.22726842761039734, -0.21719644963741302, -0.2071244716644287, -0.1970525085926056, -0.18698054552078247, -0.17690856754779816, -0.16683658957481384, -0.15676462650299072, -0.1466926634311676, -0.1366206854581833, -0.12654870748519897, -0.11647674441337585, -0.10640477389097214, -0.09633280336856842, -0.0862608328461647, -0.07618886232376099, -0.06611689180135727, -0.05604492127895355, -0.045972950756549835, -0.03590098023414612, -0.0258290097117424, -0.015757039189338684, -0.005685068666934967, 0.00438690185546875, 0.014458872377872467, 0.024530842900276184, 0.0346028134226799, 0.04467478394508362, 0.054746754467487335, 0.06481872498989105, 0.07489069551229477, 0.08496266603469849, 0.0950346365571022, 0.10510660707950592, 0.11517857760190964, 0.12525054812431335, 0.13532251119613647, 0.1453944891691208, 0.1554664671421051, 0.16553843021392822, 0.17561039328575134, 0.18568237125873566, 0.19575434923171997, 0.2058263123035431, 0.2158982753753662, 0.22597025334835052, 0.23604223132133484, 0.24611419439315796]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 6.0, 9.0, 18.0, 17.0, 36.0, 59.0, 73.0, 108.0, 184.0, 206.0, 343.0, 451.0, 765.0, 1075.0, 1660.0, 2695.0, 4454.0, 8430.0, 18642.0, 175983.0, 790616.0, 20833.0, 9017.0, 4853.0, 2737.0, 1818.0, 1130.0, 721.0, 504.0, 333.0, 204.0, 181.0, 122.0, 75.0, 58.0, 39.0, 20.0, 28.0, 21.0, 7.0, 6.0, 8.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.444580078125, -0.4297904968261719, -0.41500091552734375, -0.4002113342285156, -0.3854217529296875, -0.3706321716308594, -0.35584259033203125, -0.3410530090332031, -0.326263427734375, -0.3114738464355469, -0.29668426513671875, -0.2818946838378906, -0.2671051025390625, -0.2523155212402344, -0.23752593994140625, -0.22273635864257812, -0.20794677734375, -0.19315719604492188, -0.17836761474609375, -0.16357803344726562, -0.1487884521484375, -0.13399887084960938, -0.11920928955078125, -0.10441970825195312, -0.089630126953125, -0.07484054565429688, -0.06005096435546875, -0.045261383056640625, -0.0304718017578125, -0.015682220458984375, -0.00089263916015625, 0.013896942138671875, 0.0286865234375, 0.043476104736328125, 0.05826568603515625, 0.07305526733398438, 0.0878448486328125, 0.10263442993164062, 0.11742401123046875, 0.13221359252929688, 0.147003173828125, 0.16179275512695312, 0.17658233642578125, 0.19137191772460938, 0.2061614990234375, 0.22095108032226562, 0.23574066162109375, 0.2505302429199219, 0.26531982421875, 0.2801094055175781, 0.29489898681640625, 0.3096885681152344, 0.3244781494140625, 0.3392677307128906, 0.35405731201171875, 0.3688468933105469, 0.383636474609375, 0.3984260559082031, 0.41321563720703125, 0.4280052185058594, 0.4427947998046875, 0.4575843811035156, 0.47237396240234375, 0.4871635437011719, 0.501953125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 5.0, 6.0, 4.0, 5.0, 6.0, 8.0, 7.0, 11.0, 13.0, 10.0, 69.0, 739.0, 27.0, 14.0, 12.0, 3.0, 7.0, 10.0, 7.0, 3.0, 4.0, 6.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10589599609375, -0.10278129577636719, -0.09966659545898438, -0.09655189514160156, -0.09343719482421875, -0.09032249450683594, -0.08720779418945312, -0.08409309387207031, -0.0809783935546875, -0.07786369323730469, -0.07474899291992188, -0.07163429260253906, -0.06851959228515625, -0.06540489196777344, -0.062290191650390625, -0.05917549133300781, -0.056060791015625, -0.05294609069824219, -0.049831390380859375, -0.04671669006347656, -0.04360198974609375, -0.04048728942871094, -0.037372589111328125, -0.03425788879394531, -0.0311431884765625, -0.028028488159179688, -0.024913787841796875, -0.021799087524414062, -0.01868438720703125, -0.015569686889648438, -0.012454986572265625, -0.009340286254882812, -0.0062255859375, -0.0031108856201171875, 3.814697265625e-06, 0.0031185150146484375, 0.00623321533203125, 0.009347915649414062, 0.012462615966796875, 0.015577316284179688, 0.0186920166015625, 0.021806716918945312, 0.024921417236328125, 0.028036117553710938, 0.03115081787109375, 0.03426551818847656, 0.037380218505859375, 0.04049491882324219, 0.043609619140625, 0.04672431945800781, 0.049839019775390625, 0.05295372009277344, 0.05606842041015625, 0.05918312072753906, 0.062297821044921875, 0.06541252136230469, 0.0685272216796875, 0.07164192199707031, 0.07475662231445312, 0.07787132263183594, 0.08098602294921875, 0.08410072326660156, 0.08721542358398438, 0.09033012390136719, 0.09344482421875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 6.0, 8.0, 13.0, 20.0, 30.0, 32.0, 59.0, 49.0, 68.0, 86.0, 93.0, 135.0, 199.0, 353.0, 678.0, 1159.0, 2412.0, 5854.0, 16505.0, 63494.0, 549617.0, 339015.0, 46358.0, 12779.0, 4772.0, 2133.0, 1013.0, 577.0, 287.0, 173.0, 144.0, 82.0, 84.0, 67.0, 64.0, 36.0, 34.0, 15.0, 16.0, 10.0, 6.0, 11.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.251708984375, -0.24449729919433594, -0.23728561401367188, -0.2300739288330078, -0.22286224365234375, -0.2156505584716797, -0.20843887329101562, -0.20122718811035156, -0.1940155029296875, -0.18680381774902344, -0.17959213256835938, -0.1723804473876953, -0.16516876220703125, -0.1579570770263672, -0.15074539184570312, -0.14353370666503906, -0.136322021484375, -0.12911033630371094, -0.12189865112304688, -0.11468696594238281, -0.10747528076171875, -0.10026359558105469, -0.09305191040039062, -0.08584022521972656, -0.0786285400390625, -0.07141685485839844, -0.06420516967773438, -0.05699348449707031, -0.04978179931640625, -0.04257011413574219, -0.035358428955078125, -0.028146743774414062, -0.02093505859375, -0.013723373413085938, -0.006511688232421875, 0.0006999969482421875, 0.00791168212890625, 0.015123367309570312, 0.022335052490234375, 0.029546737670898438, 0.0367584228515625, 0.04397010803222656, 0.051181793212890625, 0.05839347839355469, 0.06560516357421875, 0.07281684875488281, 0.08002853393554688, 0.08724021911621094, 0.094451904296875, 0.10166358947753906, 0.10887527465820312, 0.11608695983886719, 0.12329864501953125, 0.1305103302001953, 0.13772201538085938, 0.14493370056152344, 0.1521453857421875, 0.15935707092285156, 0.16656875610351562, 0.1737804412841797, 0.18099212646484375, 0.1882038116455078, 0.19541549682617188, 0.20262718200683594, 0.2098388671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 2.0, 8.0, 7.0, 13.0, 18.0, 13.0, 21.0, 18.0, 18.0, 20.0, 21.0, 27.0, 26.0, 26.0, 36.0, 33.0, 36.0, 44.0, 29.0, 47.0, 36.0, 33.0, 43.0, 49.0, 38.0, 37.0, 33.0, 31.0, 35.0, 35.0, 23.0, 13.0, 23.0, 13.0, 15.0, 17.0, 9.0, 22.0, 4.0, 5.0, 3.0, 4.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.37841796875, -0.3673553466796875, -0.356292724609375, -0.3452301025390625, -0.33416748046875, -0.3231048583984375, -0.312042236328125, -0.3009796142578125, -0.2899169921875, -0.2788543701171875, -0.267791748046875, -0.2567291259765625, -0.24566650390625, -0.2346038818359375, -0.223541259765625, -0.2124786376953125, -0.201416015625, -0.1903533935546875, -0.179290771484375, -0.1682281494140625, -0.15716552734375, -0.1461029052734375, -0.135040283203125, -0.1239776611328125, -0.1129150390625, -0.1018524169921875, -0.090789794921875, -0.0797271728515625, -0.06866455078125, -0.0576019287109375, -0.046539306640625, -0.0354766845703125, -0.0244140625, -0.0133514404296875, -0.002288818359375, 0.0087738037109375, 0.01983642578125, 0.0308990478515625, 0.041961669921875, 0.0530242919921875, 0.0640869140625, 0.0751495361328125, 0.086212158203125, 0.0972747802734375, 0.10833740234375, 0.1194000244140625, 0.130462646484375, 0.1415252685546875, 0.152587890625, 0.1636505126953125, 0.174713134765625, 0.1857757568359375, 0.19683837890625, 0.2079010009765625, 0.218963623046875, 0.2300262451171875, 0.2410888671875, 0.2521514892578125, 0.263214111328125, 0.2742767333984375, 0.28533935546875, 0.2964019775390625, 0.307464599609375, 0.3185272216796875, 0.32958984375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 7.0, 8.0, 9.0, 17.0, 16.0, 36.0, 59.0, 108.0, 230.0, 476.0, 1163.0, 4851.0, 174406.0, 857683.0, 7082.0, 1422.0, 490.0, 205.0, 107.0, 61.0, 31.0, 24.0, 14.0, 8.0, 12.0, 8.0, 7.0, 2.0, 0.0, 5.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.114013671875, -0.11109733581542969, -0.10818099975585938, -0.10526466369628906, -0.10234832763671875, -0.09943199157714844, -0.09651565551757812, -0.09359931945800781, -0.0906829833984375, -0.08776664733886719, -0.08485031127929688, -0.08193397521972656, -0.07901763916015625, -0.07610130310058594, -0.07318496704101562, -0.07026863098144531, -0.067352294921875, -0.06443595886230469, -0.061519622802734375, -0.05860328674316406, -0.05568695068359375, -0.05277061462402344, -0.049854278564453125, -0.04693794250488281, -0.0440216064453125, -0.04110527038574219, -0.038188934326171875, -0.03527259826660156, -0.03235626220703125, -0.029439926147460938, -0.026523590087890625, -0.023607254028320312, -0.02069091796875, -0.017774581909179688, -0.014858245849609375, -0.011941909790039062, -0.00902557373046875, -0.0061092376708984375, -0.003192901611328125, -0.0002765655517578125, 0.0026397705078125, 0.0055561065673828125, 0.008472442626953125, 0.011388778686523438, 0.01430511474609375, 0.017221450805664062, 0.020137786865234375, 0.023054122924804688, 0.025970458984375, 0.028886795043945312, 0.031803131103515625, 0.03471946716308594, 0.03763580322265625, 0.04055213928222656, 0.043468475341796875, 0.04638481140136719, 0.0493011474609375, 0.05221748352050781, 0.055133819580078125, 0.05805015563964844, 0.06096649169921875, 0.06388282775878906, 0.06679916381835938, 0.06971549987792969, 0.0726318359375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 13.0, 10.0, 13.0, 22.0, 22.0, 54.0, 57.0, 78.0, 82.0, 102.0, 111.0, 92.0, 81.0, 76.0, 54.0, 43.0, 20.0, 18.0, 10.0, 7.0, 11.0, 4.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.329183578491211e-05, -1.2675300240516663e-05, -1.2058764696121216e-05, -1.1442229151725769e-05, -1.0825693607330322e-05, -1.0209158062934875e-05, -9.592622518539429e-06, -8.976086974143982e-06, -8.359551429748535e-06, -7.743015885353088e-06, -7.126480340957642e-06, -6.509944796562195e-06, -5.893409252166748e-06, -5.276873707771301e-06, -4.6603381633758545e-06, -4.043802618980408e-06, -3.427267074584961e-06, -2.810731530189514e-06, -2.1941959857940674e-06, -1.5776604413986206e-06, -9.611248970031738e-07, -3.4458935260772705e-07, 2.7194619178771973e-07, 8.884817361831665e-07, 1.5050172805786133e-06, 2.12155282497406e-06, 2.738088369369507e-06, 3.3546239137649536e-06, 3.9711594581604e-06, 4.587695002555847e-06, 5.204230546951294e-06, 5.820766091346741e-06, 6.4373016357421875e-06, 7.053837180137634e-06, 7.670372724533081e-06, 8.286908268928528e-06, 8.903443813323975e-06, 9.519979357719421e-06, 1.0136514902114868e-05, 1.0753050446510315e-05, 1.1369585990905762e-05, 1.1986121535301208e-05, 1.2602657079696655e-05, 1.3219192624092102e-05, 1.3835728168487549e-05, 1.4452263712882996e-05, 1.5068799257278442e-05, 1.568533480167389e-05, 1.6301870346069336e-05, 1.6918405890464783e-05, 1.753494143486023e-05, 1.8151476979255676e-05, 1.8768012523651123e-05, 1.938454806804657e-05, 2.0001083612442017e-05, 2.0617619156837463e-05, 2.123415470123291e-05, 2.1850690245628357e-05, 2.2467225790023804e-05, 2.308376133441925e-05, 2.3700296878814697e-05, 2.4316832423210144e-05, 2.493336796760559e-05, 2.5549903512001038e-05, 2.6166439056396484e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 8.0, 13.0, 14.0, 19.0, 29.0, 36.0, 55.0, 92.0, 127.0, 257.0, 494.0, 1062.0, 2937.0, 10760.0, 98576.0, 884489.0, 39317.0, 6505.0, 1997.0, 789.0, 426.0, 203.0, 102.0, 80.0, 48.0, 36.0, 22.0, 12.0, 13.0, 4.0, 7.0, 4.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06585693359375, -0.06388139724731445, -0.061905860900878906, -0.05993032455444336, -0.05795478820800781, -0.055979251861572266, -0.05400371551513672, -0.05202817916870117, -0.050052642822265625, -0.04807710647583008, -0.04610157012939453, -0.044126033782958984, -0.04215049743652344, -0.04017496109008789, -0.038199424743652344, -0.0362238883972168, -0.03424835205078125, -0.0322728157043457, -0.030297279357910156, -0.02832174301147461, -0.026346206665039062, -0.024370670318603516, -0.02239513397216797, -0.020419597625732422, -0.018444061279296875, -0.016468524932861328, -0.014492988586425781, -0.012517452239990234, -0.010541915893554688, -0.00856637954711914, -0.006590843200683594, -0.004615306854248047, -0.0026397705078125, -0.0006642341613769531, 0.0013113021850585938, 0.0032868385314941406, 0.0052623748779296875, 0.007237911224365234, 0.009213447570800781, 0.011188983917236328, 0.013164520263671875, 0.015140056610107422, 0.01711559295654297, 0.019091129302978516, 0.021066665649414062, 0.02304220199584961, 0.025017738342285156, 0.026993274688720703, 0.02896881103515625, 0.030944347381591797, 0.032919883728027344, 0.03489542007446289, 0.03687095642089844, 0.038846492767333984, 0.04082202911376953, 0.04279756546020508, 0.044773101806640625, 0.04674863815307617, 0.04872417449951172, 0.050699710845947266, 0.05267524719238281, 0.05465078353881836, 0.056626319885253906, 0.05860185623168945, 0.060577392578125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 8.0, 2.0, 9.0, 9.0, 8.0, 26.0, 14.0, 27.0, 36.0, 45.0, 78.0, 76.0, 110.0, 107.0, 108.0, 73.0, 63.0, 51.0, 31.0, 41.0, 24.0, 11.0, 14.0, 7.0, 5.0, 4.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1173095703125, -0.11426067352294922, -0.11121177673339844, -0.10816287994384766, -0.10511398315429688, -0.1020650863647461, -0.09901618957519531, -0.09596729278564453, -0.09291839599609375, -0.08986949920654297, -0.08682060241699219, -0.0837717056274414, -0.08072280883789062, -0.07767391204833984, -0.07462501525878906, -0.07157611846923828, -0.0685272216796875, -0.06547832489013672, -0.06242942810058594, -0.059380531311035156, -0.056331634521484375, -0.053282737731933594, -0.05023384094238281, -0.04718494415283203, -0.04413604736328125, -0.04108715057373047, -0.03803825378417969, -0.034989356994628906, -0.031940460205078125, -0.028891563415527344, -0.025842666625976562, -0.02279376983642578, -0.019744873046875, -0.01669597625732422, -0.013647079467773438, -0.010598182678222656, -0.007549285888671875, -0.004500389099121094, -0.0014514923095703125, 0.0015974044799804688, 0.00464630126953125, 0.007695198059082031, 0.010744094848632812, 0.013792991638183594, 0.016841888427734375, 0.019890785217285156, 0.022939682006835938, 0.02598857879638672, 0.0290374755859375, 0.03208637237548828, 0.03513526916503906, 0.038184165954589844, 0.041233062744140625, 0.044281959533691406, 0.04733085632324219, 0.05037975311279297, 0.05342864990234375, 0.05647754669189453, 0.05952644348144531, 0.0625753402709961, 0.06562423706054688, 0.06867313385009766, 0.07172203063964844, 0.07477092742919922, 0.07781982421875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 9.0, 37.0, 670.0, 261.0, 23.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.026463508605957, -12.754094123840332, -12.48172378540039, -12.209354400634766, -11.936984062194824, -11.6646146774292, -11.392244338989258, -11.119874954223633, -10.847505569458008, -10.575136184692383, -10.302765846252441, -10.030396461486816, -9.758026123046875, -9.48565673828125, -9.213286399841309, -8.940917015075684, -8.668546676635742, -8.396177291870117, -8.123806953430176, -7.851437091827393, -7.579067230224609, -7.306697845458984, -7.034327983856201, -6.761958122253418, -6.489588260650635, -6.217218399047852, -5.944848537445068, -5.672478675842285, -5.40010929107666, -5.127738952636719, -4.855369567871094, -4.5829997062683105, -4.310628890991211, -4.038259029388428, -3.7658891677856445, -3.4935195446014404, -3.2211496829986572, -2.948779821395874, -2.67641019821167, -2.4040403366088867, -2.1316704750061035, -1.8593006134033203, -1.5869308710098267, -1.314561128616333, -1.0421912670135498, -0.7698214054107666, -0.49745166301727295, -0.2250819206237793, 0.047287940979003906, 0.31965774297714233, 0.5920275449752808, 0.8643973469734192, 1.1367671489715576, 1.4091370105743408, 1.6815067529678345, 1.9538764953613281, 2.2262463569641113, 2.4986162185668945, 2.7709860801696777, 3.043355703353882, 3.315725564956665, 3.5880954265594482, 3.8604650497436523, 4.1328349113464355, 4.405204772949219]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 7.0, 9.0, 12.0, 20.0, 26.0, 54.0, 93.0, 110.0, 153.0, 158.0, 104.0, 71.0, 58.0, 26.0, 25.0, 8.0, 15.0, 5.0, 8.0, 3.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.521082878112793, -7.284963607788086, -7.048844337463379, -6.812725067138672, -6.576605796813965, -6.340486526489258, -6.104366779327393, -5.8682475090026855, -5.6321282386779785, -5.3960089683532715, -5.1598896980285645, -4.923770427703857, -4.687650680541992, -4.451531410217285, -4.215412139892578, -3.979292869567871, -3.743173599243164, -3.507054328918457, -3.27093505859375, -3.034815549850464, -2.798696279525757, -2.56257700920105, -2.3264575004577637, -2.0903382301330566, -1.8542189598083496, -1.6180996894836426, -1.381980299949646, -1.1458609104156494, -0.9097416400909424, -0.6736223697662354, -0.43750298023223877, -0.2013835906982422, 0.034735679626464844, 0.27085500955581665, 0.5069743394851685, 0.7430936694145203, 0.9792129993438721, 1.215332269668579, 1.4514516592025757, 1.6875710487365723, 1.9236903190612793, 2.1598095893859863, 2.3959288597106934, 2.6320483684539795, 2.8681676387786865, 3.1042869091033936, 3.3404064178466797, 3.5765256881713867, 3.8126449584960938, 4.048764228820801, 4.284883499145508, 4.521002769470215, 4.757122039794922, 4.993241310119629, 5.229361057281494, 5.465480327606201, 5.701599597930908, 5.937718868255615, 6.173838138580322, 6.409957408905029, 6.6460771560668945, 6.882196426391602, 7.118315696716309, 7.354434967041016, 7.590554237365723]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 13.0, 24.0, 22.0, 31.0, 56.0, 91.0, 163.0, 257.0, 476.0, 858.0, 1551.0, 3380.0, 7397.0, 22416.0, 4055415.0, 83882.0, 11475.0, 3939.0, 1548.0, 659.0, 298.0, 117.0, 71.0, 45.0, 29.0, 14.0, 14.0, 14.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0791015625, -1.0461883544921875, -1.013275146484375, -0.9803619384765625, -0.94744873046875, -0.9145355224609375, -0.881622314453125, -0.8487091064453125, -0.8157958984375, -0.7828826904296875, -0.749969482421875, -0.7170562744140625, -0.68414306640625, -0.6512298583984375, -0.618316650390625, -0.5854034423828125, -0.552490234375, -0.5195770263671875, -0.486663818359375, -0.4537506103515625, -0.42083740234375, -0.3879241943359375, -0.355010986328125, -0.3220977783203125, -0.2891845703125, -0.2562713623046875, -0.223358154296875, -0.1904449462890625, -0.15753173828125, -0.1246185302734375, -0.091705322265625, -0.0587921142578125, -0.02587890625, 0.0070343017578125, 0.039947509765625, 0.0728607177734375, 0.10577392578125, 0.1386871337890625, 0.171600341796875, 0.2045135498046875, 0.2374267578125, 0.2703399658203125, 0.303253173828125, 0.3361663818359375, 0.36907958984375, 0.4019927978515625, 0.434906005859375, 0.4678192138671875, 0.500732421875, 0.5336456298828125, 0.566558837890625, 0.5994720458984375, 0.63238525390625, 0.6652984619140625, 0.698211669921875, 0.7311248779296875, 0.7640380859375, 0.7969512939453125, 0.829864501953125, 0.8627777099609375, 0.89569091796875, 0.9286041259765625, 0.961517333984375, 0.9944305419921875, 1.02734375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 10.0, 3.0, 7.0, 7.0, 11.0, 9.0, 21.0, 18.0, 442.0, 355.0, 27.0, 7.0, 15.0, 10.0, 7.0, 11.0, 8.0, 4.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10113525390625, -0.0982208251953125, -0.095306396484375, -0.0923919677734375, -0.0894775390625, -0.0865631103515625, -0.083648681640625, -0.0807342529296875, -0.07781982421875, -0.0749053955078125, -0.071990966796875, -0.0690765380859375, -0.066162109375, -0.0632476806640625, -0.060333251953125, -0.0574188232421875, -0.05450439453125, -0.0515899658203125, -0.048675537109375, -0.0457611083984375, -0.0428466796875, -0.0399322509765625, -0.037017822265625, -0.0341033935546875, -0.03118896484375, -0.0282745361328125, -0.025360107421875, -0.0224456787109375, -0.01953125, -0.0166168212890625, -0.013702392578125, -0.0107879638671875, -0.00787353515625, -0.0049591064453125, -0.002044677734375, 0.0008697509765625, 0.0037841796875, 0.0066986083984375, 0.009613037109375, 0.0125274658203125, 0.01544189453125, 0.0183563232421875, 0.021270751953125, 0.0241851806640625, 0.027099609375, 0.0300140380859375, 0.032928466796875, 0.0358428955078125, 0.03875732421875, 0.0416717529296875, 0.044586181640625, 0.0475006103515625, 0.0504150390625, 0.0533294677734375, 0.056243896484375, 0.0591583251953125, 0.06207275390625, 0.0649871826171875, 0.067901611328125, 0.0708160400390625, 0.07373046875, 0.0766448974609375, 0.079559326171875, 0.0824737548828125, 0.08538818359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 12.0, 15.0, 16.0, 16.0, 33.0, 62.0, 74.0, 119.0, 279.0, 594.0, 1315.0, 4059.0, 18178.0, 224298.0, 3864296.0, 62010.0, 12017.0, 3791.0, 1532.0, 697.0, 357.0, 168.0, 111.0, 59.0, 38.0, 30.0, 18.0, 14.0, 13.0, 9.0, 10.0, 7.0, 8.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.457275390625, -0.44309234619140625, -0.4289093017578125, -0.41472625732421875, -0.400543212890625, -0.38636016845703125, -0.3721771240234375, -0.35799407958984375, -0.34381103515625, -0.32962799072265625, -0.3154449462890625, -0.30126190185546875, -0.287078857421875, -0.27289581298828125, -0.2587127685546875, -0.24452972412109375, -0.2303466796875, -0.21616363525390625, -0.2019805908203125, -0.18779754638671875, -0.173614501953125, -0.15943145751953125, -0.1452484130859375, -0.13106536865234375, -0.11688232421875, -0.10269927978515625, -0.0885162353515625, -0.07433319091796875, -0.060150146484375, -0.04596710205078125, -0.0317840576171875, -0.01760101318359375, -0.00341796875, 0.01076507568359375, 0.0249481201171875, 0.03913116455078125, 0.053314208984375, 0.06749725341796875, 0.0816802978515625, 0.09586334228515625, 0.11004638671875, 0.12422943115234375, 0.1384124755859375, 0.15259552001953125, 0.166778564453125, 0.18096160888671875, 0.1951446533203125, 0.20932769775390625, 0.2235107421875, 0.23769378662109375, 0.2518768310546875, 0.26605987548828125, 0.280242919921875, 0.29442596435546875, 0.3086090087890625, 0.32279205322265625, 0.33697509765625, 0.35115814208984375, 0.3653411865234375, 0.37952423095703125, 0.393707275390625, 0.40789031982421875, 0.4220733642578125, 0.43625640869140625, 0.450439453125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 6.0, 3.0, 7.0, 11.0, 9.0, 8.0, 8.0, 18.0, 32.0, 47.0, 59.0, 131.0, 724.0, 2162.0, 268.0, 122.0, 78.0, 58.0, 49.0, 43.0, 31.0, 26.0, 21.0, 17.0, 18.0, 16.0, 11.0, 11.0, 11.0, 7.0, 5.0, 10.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.0792236328125, -0.07650566101074219, -0.07378768920898438, -0.07106971740722656, -0.06835174560546875, -0.06563377380371094, -0.06291580200195312, -0.06019783020019531, -0.0574798583984375, -0.05476188659667969, -0.052043914794921875, -0.04932594299316406, -0.04660797119140625, -0.04388999938964844, -0.041172027587890625, -0.03845405578613281, -0.035736083984375, -0.03301811218261719, -0.030300140380859375, -0.027582168579101562, -0.02486419677734375, -0.022146224975585938, -0.019428253173828125, -0.016710281372070312, -0.0139923095703125, -0.011274337768554688, -0.008556365966796875, -0.0058383941650390625, -0.00312042236328125, -0.0004024505615234375, 0.002315521240234375, 0.0050334930419921875, 0.00775146484375, 0.010469436645507812, 0.013187408447265625, 0.015905380249023438, 0.01862335205078125, 0.021341323852539062, 0.024059295654296875, 0.026777267456054688, 0.0294952392578125, 0.03221321105957031, 0.034931182861328125, 0.03764915466308594, 0.04036712646484375, 0.04308509826660156, 0.045803070068359375, 0.04852104187011719, 0.051239013671875, 0.05395698547363281, 0.056674957275390625, 0.05939292907714844, 0.06211090087890625, 0.06482887268066406, 0.06754684448242188, 0.07026481628417969, 0.0729827880859375, 0.07570075988769531, 0.07841873168945312, 0.08113670349121094, 0.08385467529296875, 0.08657264709472656, 0.08929061889648438, 0.09200859069824219, 0.0947265625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 746.0, 246.0, 10.0, 4.0, 4.0, 1.0, 1.0], "bins": [-14.510116577148438, -14.259368896484375, -14.008621215820312, -13.75787353515625, -13.507124900817871, -13.256377220153809, -13.005629539489746, -12.754881858825684, -12.504134178161621, -12.253386497497559, -12.002638816833496, -11.751890182495117, -11.501142501831055, -11.250394821166992, -10.99964714050293, -10.748899459838867, -10.498151779174805, -10.247404098510742, -9.99665641784668, -9.745908737182617, -9.495160102844238, -9.244412422180176, -8.993664741516113, -8.74291706085205, -8.492168426513672, -8.24142074584961, -7.990672588348389, -7.739924907684326, -7.489177227020264, -7.238429069519043, -6.9876813888549805, -6.736933708190918, -6.486185073852539, -6.235437393188477, -5.984689235687256, -5.733941555023193, -5.483193874359131, -5.23244571685791, -4.981698036193848, -4.730950355529785, -4.480202674865723, -4.22945499420166, -3.9787070751190186, -3.727959156036377, -3.4772114753723145, -3.226463556289673, -2.9757156372070312, -2.7249679565429688, -2.474220037460327, -2.2234721183776855, -1.972724437713623, -1.7219765186309814, -1.4712287187576294, -1.2204809188842773, -0.9697329998016357, -0.7189851999282837, -0.46823740005493164, -0.2174895703792572, 0.033258259296417236, 0.28400611877441406, 0.5347539186477661, 0.7855017185211182, 1.0362496376037598, 1.2869974374771118, 1.5377452373504639]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 10.0, 12.0, 20.0, 27.0, 57.0, 72.0, 109.0, 100.0, 124.0, 104.0, 90.0, 95.0, 57.0, 45.0, 32.0, 18.0, 6.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5981602668762207, -1.5600923299789429, -1.5220245122909546, -1.4839565753936768, -1.4458887577056885, -1.4078208208084106, -1.3697530031204224, -1.3316850662231445, -1.2936172485351562, -1.2555493116378784, -1.2174814939498901, -1.1794135570526123, -1.141345739364624, -1.1032778024673462, -1.065209984779358, -1.02714204788208, -0.9890741109848022, -0.9510062336921692, -0.9129383563995361, -0.8748704791069031, -0.83680260181427, -0.7987346649169922, -0.7606667876243591, -0.7225989103317261, -0.684531033039093, -0.64646315574646, -0.6083952784538269, -0.5703274011611938, -0.532259464263916, -0.49419161677360535, -0.4561237096786499, -0.41805583238601685, -0.37998783588409424, -0.3419199585914612, -0.3038520812988281, -0.2657841742038727, -0.22771629691123962, -0.18964841961860657, -0.15158052742481232, -0.11351263523101807, -0.07544475793838501, -0.037376873195171356, 0.0006910115480422974, 0.03875889629125595, 0.0768267810344696, 0.11489465832710266, 0.1529625505208969, 0.19103044271469116, 0.22909832000732422, 0.2671661972999573, 0.30523407459259033, 0.3433019816875458, 0.38136985898017883, 0.4194377362728119, 0.45750564336776733, 0.4955735206604004, 0.5336413979530334, 0.5717092752456665, 0.6097771525382996, 0.6478450298309326, 0.6859129667282104, 0.7239807844161987, 0.7620487213134766, 0.8001165986061096, 0.8381844758987427]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 7.0, 12.0, 12.0, 17.0, 25.0, 34.0, 46.0, 83.0, 133.0, 178.0, 298.0, 510.0, 960.0, 1922.0, 4525.0, 11776.0, 43058.0, 915777.0, 47523.0, 12429.0, 4803.0, 2041.0, 949.0, 525.0, 339.0, 175.0, 119.0, 83.0, 55.0, 48.0, 27.0, 14.0, 7.0, 9.0, 8.0, 8.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.49951171875, -0.48314666748046875, -0.4667816162109375, -0.45041656494140625, -0.434051513671875, -0.41768646240234375, -0.4013214111328125, -0.38495635986328125, -0.36859130859375, -0.35222625732421875, -0.3358612060546875, -0.31949615478515625, -0.303131103515625, -0.28676605224609375, -0.2704010009765625, -0.25403594970703125, -0.2376708984375, -0.22130584716796875, -0.2049407958984375, -0.18857574462890625, -0.172210693359375, -0.15584564208984375, -0.1394805908203125, -0.12311553955078125, -0.10675048828125, -0.09038543701171875, -0.0740203857421875, -0.05765533447265625, -0.041290283203125, -0.02492523193359375, -0.0085601806640625, 0.00780487060546875, 0.024169921875, 0.04053497314453125, 0.0569000244140625, 0.07326507568359375, 0.089630126953125, 0.10599517822265625, 0.1223602294921875, 0.13872528076171875, 0.15509033203125, 0.17145538330078125, 0.1878204345703125, 0.20418548583984375, 0.220550537109375, 0.23691558837890625, 0.2532806396484375, 0.26964569091796875, 0.2860107421875, 0.30237579345703125, 0.3187408447265625, 0.33510589599609375, 0.351470947265625, 0.36783599853515625, 0.3842010498046875, 0.40056610107421875, 0.41693115234375, 0.43329620361328125, 0.4496612548828125, 0.46602630615234375, 0.482391357421875, 0.49875640869140625, 0.5151214599609375, 0.5314865112304688, 0.5478515625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 3.0, 8.0, 5.0, 9.0, 8.0, 12.0, 18.0, 13.0, 81.0, 429.0, 294.0, 46.0, 12.0, 12.0, 8.0, 10.0, 10.0, 6.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10565185546875, -0.10260200500488281, -0.09955215454101562, -0.09650230407714844, -0.09345245361328125, -0.09040260314941406, -0.08735275268554688, -0.08430290222167969, -0.0812530517578125, -0.07820320129394531, -0.07515335083007812, -0.07210350036621094, -0.06905364990234375, -0.06600379943847656, -0.06295394897460938, -0.05990409851074219, -0.056854248046875, -0.05380439758300781, -0.050754547119140625, -0.04770469665527344, -0.04465484619140625, -0.04160499572753906, -0.038555145263671875, -0.03550529479980469, -0.0324554443359375, -0.029405593872070312, -0.026355743408203125, -0.023305892944335938, -0.02025604248046875, -0.017206192016601562, -0.014156341552734375, -0.011106491088867188, -0.008056640625, -0.0050067901611328125, -0.001956939697265625, 0.0010929107666015625, 0.00414276123046875, 0.0071926116943359375, 0.010242462158203125, 0.013292312622070312, 0.0163421630859375, 0.019392013549804688, 0.022441864013671875, 0.025491714477539062, 0.02854156494140625, 0.03159141540527344, 0.034641265869140625, 0.03769111633300781, 0.040740966796875, 0.04379081726074219, 0.046840667724609375, 0.04989051818847656, 0.05294036865234375, 0.05599021911621094, 0.059040069580078125, 0.06208992004394531, 0.0651397705078125, 0.06818962097167969, 0.07123947143554688, 0.07428932189941406, 0.07733917236328125, 0.08038902282714844, 0.08343887329101562, 0.08648872375488281, 0.08953857421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 4.0, 3.0, 10.0, 9.0, 7.0, 11.0, 4.0, 12.0, 9.0, 21.0, 27.0, 32.0, 26.0, 39.0, 64.0, 98.0, 151.0, 256.0, 467.0, 900.0, 2171.0, 7366.0, 44771.0, 594949.0, 357426.0, 30581.0, 5546.0, 1735.0, 749.0, 392.0, 246.0, 115.0, 82.0, 50.0, 43.0, 25.0, 19.0, 26.0, 21.0, 14.0, 11.0, 12.0, 16.0, 10.0, 7.0, 9.0, 6.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.3134765625, -0.304229736328125, -0.29498291015625, -0.285736083984375, -0.2764892578125, -0.267242431640625, -0.25799560546875, -0.248748779296875, -0.239501953125, -0.230255126953125, -0.22100830078125, -0.211761474609375, -0.2025146484375, -0.193267822265625, -0.18402099609375, -0.174774169921875, -0.16552734375, -0.156280517578125, -0.14703369140625, -0.137786865234375, -0.1285400390625, -0.119293212890625, -0.11004638671875, -0.100799560546875, -0.091552734375, -0.082305908203125, -0.07305908203125, -0.063812255859375, -0.0545654296875, -0.045318603515625, -0.03607177734375, -0.026824951171875, -0.017578125, -0.008331298828125, 0.00091552734375, 0.010162353515625, 0.0194091796875, 0.028656005859375, 0.03790283203125, 0.047149658203125, 0.056396484375, 0.065643310546875, 0.07489013671875, 0.084136962890625, 0.0933837890625, 0.102630615234375, 0.11187744140625, 0.121124267578125, 0.13037109375, 0.139617919921875, 0.14886474609375, 0.158111572265625, 0.1673583984375, 0.176605224609375, 0.18585205078125, 0.195098876953125, 0.204345703125, 0.213592529296875, 0.22283935546875, 0.232086181640625, 0.2413330078125, 0.250579833984375, 0.25982666015625, 0.269073486328125, 0.2783203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 6.0, 4.0, 5.0, 7.0, 5.0, 11.0, 10.0, 9.0, 8.0, 9.0, 19.0, 24.0, 18.0, 25.0, 18.0, 30.0, 33.0, 34.0, 40.0, 29.0, 45.0, 44.0, 44.0, 36.0, 33.0, 39.0, 28.0, 51.0, 35.0, 38.0, 37.0, 25.0, 23.0, 24.0, 11.0, 23.0, 21.0, 17.0, 16.0, 11.0, 11.0, 17.0, 9.0, 13.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.220458984375, -0.21431541442871094, -0.20817184448242188, -0.2020282745361328, -0.19588470458984375, -0.1897411346435547, -0.18359756469726562, -0.17745399475097656, -0.1713104248046875, -0.16516685485839844, -0.15902328491210938, -0.1528797149658203, -0.14673614501953125, -0.1405925750732422, -0.13444900512695312, -0.12830543518066406, -0.122161865234375, -0.11601829528808594, -0.10987472534179688, -0.10373115539550781, -0.09758758544921875, -0.09144401550292969, -0.08530044555664062, -0.07915687561035156, -0.0730133056640625, -0.06686973571777344, -0.060726165771484375, -0.05458259582519531, -0.04843902587890625, -0.04229545593261719, -0.036151885986328125, -0.030008316040039062, -0.02386474609375, -0.017721176147460938, -0.011577606201171875, -0.0054340362548828125, 0.00070953369140625, 0.0068531036376953125, 0.012996673583984375, 0.019140243530273438, 0.0252838134765625, 0.03142738342285156, 0.037570953369140625, 0.04371452331542969, 0.04985809326171875, 0.05600166320800781, 0.062145233154296875, 0.06828880310058594, 0.074432373046875, 0.08057594299316406, 0.08671951293945312, 0.09286308288574219, 0.09900665283203125, 0.10515022277832031, 0.11129379272460938, 0.11743736267089844, 0.1235809326171875, 0.12972450256347656, 0.13586807250976562, 0.1420116424560547, 0.14815521240234375, 0.1542987823486328, 0.16044235229492188, 0.16658592224121094, 0.1727294921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 8.0, 13.0, 13.0, 8.0, 21.0, 28.0, 59.0, 76.0, 181.0, 386.0, 873.0, 2975.0, 17053.0, 977829.0, 42477.0, 4320.0, 1249.0, 451.0, 233.0, 108.0, 40.0, 32.0, 27.0, 24.0, 10.0, 15.0, 3.0, 5.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1954345703125, -0.18995094299316406, -0.18446731567382812, -0.1789836883544922, -0.17350006103515625, -0.1680164337158203, -0.16253280639648438, -0.15704917907714844, -0.1515655517578125, -0.14608192443847656, -0.14059829711914062, -0.1351146697998047, -0.12963104248046875, -0.12414741516113281, -0.11866378784179688, -0.11318016052246094, -0.107696533203125, -0.10221290588378906, -0.09672927856445312, -0.09124565124511719, -0.08576202392578125, -0.08027839660644531, -0.07479476928710938, -0.06931114196777344, -0.0638275146484375, -0.05834388732910156, -0.052860260009765625, -0.04737663269042969, -0.04189300537109375, -0.03640937805175781, -0.030925750732421875, -0.025442123413085938, -0.01995849609375, -0.014474868774414062, -0.008991241455078125, -0.0035076141357421875, 0.00197601318359375, 0.0074596405029296875, 0.012943267822265625, 0.018426895141601562, 0.0239105224609375, 0.029394149780273438, 0.034877777099609375, 0.04036140441894531, 0.04584503173828125, 0.05132865905761719, 0.056812286376953125, 0.06229591369628906, 0.067779541015625, 0.07326316833496094, 0.07874679565429688, 0.08423042297363281, 0.08971405029296875, 0.09519767761230469, 0.10068130493164062, 0.10616493225097656, 0.1116485595703125, 0.11713218688964844, 0.12261581420898438, 0.1280994415283203, 0.13358306884765625, 0.1390666961669922, 0.14455032348632812, 0.15003395080566406, 0.155517578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 7.0, 6.0, 4.0, 2.0, 8.0, 2.0, 12.0, 24.0, 445.0, 399.0, 37.0, 14.0, 8.0, 5.0, 6.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0002301931381225586, -0.00022413022816181183, -0.00021806731820106506, -0.0002120044082403183, -0.00020594149827957153, -0.00019987858831882477, -0.000193815678358078, -0.00018775276839733124, -0.00018168985843658447, -0.0001756269484758377, -0.00016956403851509094, -0.00016350112855434418, -0.0001574382185935974, -0.00015137530863285065, -0.00014531239867210388, -0.00013924948871135712, -0.00013318657875061035, -0.00012712366878986359, -0.00012106075882911682, -0.00011499784886837006, -0.00010893493890762329, -0.00010287202894687653, -9.680911898612976e-05, -9.0746209025383e-05, -8.468329906463623e-05, -7.862038910388947e-05, -7.25574791431427e-05, -6.649456918239594e-05, -6.043165922164917e-05, -5.4368749260902405e-05, -4.830583930015564e-05, -4.2242929339408875e-05, -3.618001937866211e-05, -3.0117109417915344e-05, -2.405419945716858e-05, -1.7991289496421814e-05, -1.1928379535675049e-05, -5.865469574928284e-06, 1.9744038581848145e-07, 6.260350346565247e-06, 1.2323260307312012e-05, 1.8386170268058777e-05, 2.4449080228805542e-05, 3.0511990189552307e-05, 3.657490015029907e-05, 4.263781011104584e-05, 4.87007200717926e-05, 5.476363003253937e-05, 6.082653999328613e-05, 6.68894499540329e-05, 7.295235991477966e-05, 7.901526987552643e-05, 8.50781798362732e-05, 9.114108979701996e-05, 9.720399975776672e-05, 0.00010326690971851349, 0.00010932981967926025, 0.00011539272964000702, 0.00012145563960075378, 0.00012751854956150055, 0.00013358145952224731, 0.00013964436948299408, 0.00014570727944374084, 0.0001517701894044876, 0.00015783309936523438]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 13.0, 30.0, 39.0, 42.0, 95.0, 198.0, 345.0, 894.0, 3145.0, 23462.0, 915796.0, 95150.0, 6617.0, 1541.0, 543.0, 275.0, 133.0, 91.0, 50.0, 32.0, 19.0, 6.0, 9.0, 3.0, 8.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1541748046875, -0.1491546630859375, -0.144134521484375, -0.1391143798828125, -0.13409423828125, -0.1290740966796875, -0.124053955078125, -0.1190338134765625, -0.114013671875, -0.1089935302734375, -0.103973388671875, -0.0989532470703125, -0.09393310546875, -0.0889129638671875, -0.083892822265625, -0.0788726806640625, -0.0738525390625, -0.0688323974609375, -0.063812255859375, -0.0587921142578125, -0.05377197265625, -0.0487518310546875, -0.043731689453125, -0.0387115478515625, -0.03369140625, -0.0286712646484375, -0.023651123046875, -0.0186309814453125, -0.01361083984375, -0.0085906982421875, -0.003570556640625, 0.0014495849609375, 0.0064697265625, 0.0114898681640625, 0.016510009765625, 0.0215301513671875, 0.02655029296875, 0.0315704345703125, 0.036590576171875, 0.0416107177734375, 0.046630859375, 0.0516510009765625, 0.056671142578125, 0.0616912841796875, 0.06671142578125, 0.0717315673828125, 0.076751708984375, 0.0817718505859375, 0.0867919921875, 0.0918121337890625, 0.096832275390625, 0.1018524169921875, 0.10687255859375, 0.1118927001953125, 0.116912841796875, 0.1219329833984375, 0.126953125, 0.1319732666015625, 0.136993408203125, 0.1420135498046875, 0.14703369140625, 0.1520538330078125, 0.157073974609375, 0.1620941162109375, 0.1671142578125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 8.0, 8.0, 17.0, 12.0, 16.0, 44.0, 39.0, 62.0, 86.0, 92.0, 133.0, 124.0, 109.0, 74.0, 45.0, 49.0, 20.0, 19.0, 14.0, 10.0, 2.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.087158203125, -0.08362388610839844, -0.08008956909179688, -0.07655525207519531, -0.07302093505859375, -0.06948661804199219, -0.06595230102539062, -0.06241798400878906, -0.0588836669921875, -0.05534934997558594, -0.051815032958984375, -0.04828071594238281, -0.04474639892578125, -0.04121208190917969, -0.037677764892578125, -0.03414344787597656, -0.030609130859375, -0.027074813842773438, -0.023540496826171875, -0.020006179809570312, -0.01647186279296875, -0.012937545776367188, -0.009403228759765625, -0.0058689117431640625, -0.0023345947265625, 0.0011997222900390625, 0.004734039306640625, 0.008268356323242188, 0.01180267333984375, 0.015336990356445312, 0.018871307373046875, 0.022405624389648438, 0.02593994140625, 0.029474258422851562, 0.033008575439453125, 0.03654289245605469, 0.04007720947265625, 0.04361152648925781, 0.047145843505859375, 0.05068016052246094, 0.0542144775390625, 0.05774879455566406, 0.061283111572265625, 0.06481742858886719, 0.06835174560546875, 0.07188606262207031, 0.07542037963867188, 0.07895469665527344, 0.082489013671875, 0.08602333068847656, 0.08955764770507812, 0.09309196472167969, 0.09662628173828125, 0.10016059875488281, 0.10369491577148438, 0.10722923278808594, 0.1107635498046875, 0.11429786682128906, 0.11783218383789062, 0.12136650085449219, 0.12490081787109375, 0.1284351348876953, 0.13196945190429688, 0.13550376892089844, 0.1390380859375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 22.0, 134.0, 503.0, 240.0, 54.0, 17.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.889031171798706, -2.817814588546753, -2.746598243713379, -2.675381660461426, -2.6041650772094727, -2.5329487323760986, -2.4617321491241455, -2.3905158042907715, -2.3192992210388184, -2.2480826377868652, -2.176866292953491, -2.105649709701538, -2.034433364868164, -1.963216781616211, -1.8920001983642578, -1.8207837343215942, -1.7495672702789307, -1.678350806236267, -1.6071343421936035, -1.5359177589416504, -1.4647012948989868, -1.3934848308563232, -1.3222682476043701, -1.2510517835617065, -1.179835319519043, -1.1086188554763794, -1.0374023914337158, -0.9661858081817627, -0.8949693441390991, -0.8237528800964355, -0.7525363564491272, -0.6813198328018188, -0.6101036071777344, -0.5388871431350708, -0.46767061948776245, -0.3964541256427765, -0.3252376317977905, -0.25402113795280457, -0.1828046441078186, -0.11158815026283264, -0.04037165641784668, 0.030844837427139282, 0.10206133127212524, 0.1732778251171112, 0.24449431896209717, 0.31571081280708313, 0.3869273066520691, 0.45814380049705505, 0.529360294342041, 0.6005767583847046, 0.6717932820320129, 0.7430098056793213, 0.8142262697219849, 0.8854427337646484, 0.9566592574119568, 1.0278757810592651, 1.0990922451019287, 1.1703087091445923, 1.2415251731872559, 1.312741756439209, 1.3839582204818726, 1.4551746845245361, 1.5263912677764893, 1.5976077318191528, 1.6688241958618164]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 10.0, 7.0, 9.0, 7.0, 11.0, 16.0, 24.0, 30.0, 42.0, 43.0, 54.0, 61.0, 69.0, 82.0, 73.0, 69.0, 56.0, 65.0, 57.0, 38.0, 38.0, 22.0, 21.0, 17.0, 20.0, 12.0, 7.0, 8.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.9664127826690674, -1.9060291051864624, -1.8456453084945679, -1.785261631011963, -1.7248778343200684, -1.6644941568374634, -1.6041104793548584, -1.5437266826629639, -1.4833428859710693, -1.4229592084884644, -1.3625754117965698, -1.3021917343139648, -1.2418079376220703, -1.1814242601394653, -1.1210405826568604, -1.0606567859649658, -1.0002731084823608, -0.9398893713951111, -0.8795056343078613, -0.8191219568252563, -0.7587381601333618, -0.6983544826507568, -0.6379707455635071, -0.5775870084762573, -0.5172032713890076, -0.4568195343017578, -0.39643579721450806, -0.3360520899295807, -0.27566835284233093, -0.21528461575508118, -0.1549009084701538, -0.09451717138290405, -0.0341334342956543, 0.026250295341014862, 0.08663402497768402, 0.14701774716377258, 0.20740148425102234, 0.2677852213382721, 0.32816892862319946, 0.3885526657104492, 0.448936402797699, 0.5093201398849487, 0.5697038769721985, 0.6300876140594482, 0.6904712915420532, 0.7508550882339478, 0.8112387657165527, 0.8716225028038025, 0.9320062398910522, 0.992389976978302, 1.0527737140655518, 1.1131573915481567, 1.1735411882400513, 1.2339248657226562, 1.2943086624145508, 1.3546923398971558, 1.4150760173797607, 1.4754596948623657, 1.5358434915542603, 1.5962271690368652, 1.6566109657287598, 1.7169946432113647, 1.7773783206939697, 1.8377621173858643, 1.8981459140777588]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 10.0, 12.0, 12.0, 18.0, 18.0, 28.0, 67.0, 59.0, 82.0, 120.0, 259.0, 521.0, 1201.0, 2664.0, 8070.0, 97311.0, 4065752.0, 13045.0, 2894.0, 1117.0, 505.0, 234.0, 93.0, 53.0, 35.0, 25.0, 15.0, 14.0, 8.0, 6.0, 11.0, 8.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.189453125, -1.1512908935546875, -1.113128662109375, -1.0749664306640625, -1.03680419921875, -0.9986419677734375, -0.960479736328125, -0.9223175048828125, -0.8841552734375, -0.8459930419921875, -0.807830810546875, -0.7696685791015625, -0.73150634765625, -0.6933441162109375, -0.655181884765625, -0.6170196533203125, -0.578857421875, -0.5406951904296875, -0.502532958984375, -0.4643707275390625, -0.42620849609375, -0.3880462646484375, -0.349884033203125, -0.3117218017578125, -0.2735595703125, -0.2353973388671875, -0.197235107421875, -0.1590728759765625, -0.12091064453125, -0.0827484130859375, -0.044586181640625, -0.0064239501953125, 0.03173828125, 0.0699005126953125, 0.108062744140625, 0.1462249755859375, 0.18438720703125, 0.2225494384765625, 0.260711669921875, 0.2988739013671875, 0.3370361328125, 0.3751983642578125, 0.413360595703125, 0.4515228271484375, 0.48968505859375, 0.5278472900390625, 0.566009521484375, 0.6041717529296875, 0.642333984375, 0.6804962158203125, 0.718658447265625, 0.7568206787109375, 0.79498291015625, 0.8331451416015625, 0.871307373046875, 0.9094696044921875, 0.9476318359375, 0.9857940673828125, 1.023956298828125, 1.0621185302734375, 1.10028076171875, 1.1384429931640625, 1.176605224609375, 1.2147674560546875, 1.2529296875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 1.0, 7.0, 9.0, 5.0, 12.0, 8.0, 19.0, 13.0, 28.0, 159.0, 418.0, 214.0, 47.0, 15.0, 12.0, 13.0, 9.0, 7.0, 1.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10174560546875, -0.09870433807373047, -0.09566307067871094, -0.0926218032836914, -0.08958053588867188, -0.08653926849365234, -0.08349800109863281, -0.08045673370361328, -0.07741546630859375, -0.07437419891357422, -0.07133293151855469, -0.06829166412353516, -0.06525039672851562, -0.062209129333496094, -0.05916786193847656, -0.05612659454345703, -0.0530853271484375, -0.05004405975341797, -0.04700279235839844, -0.043961524963378906, -0.040920257568359375, -0.037878990173339844, -0.03483772277832031, -0.03179645538330078, -0.02875518798828125, -0.02571392059326172, -0.022672653198242188, -0.019631385803222656, -0.016590118408203125, -0.013548851013183594, -0.010507583618164062, -0.007466316223144531, -0.004425048828125, -0.0013837814331054688, 0.0016574859619140625, 0.004698753356933594, 0.007740020751953125, 0.010781288146972656, 0.013822555541992188, 0.01686382293701172, 0.01990509033203125, 0.02294635772705078, 0.025987625122070312, 0.029028892517089844, 0.032070159912109375, 0.035111427307128906, 0.03815269470214844, 0.04119396209716797, 0.0442352294921875, 0.04727649688720703, 0.05031776428222656, 0.053359031677246094, 0.056400299072265625, 0.059441566467285156, 0.06248283386230469, 0.06552410125732422, 0.06856536865234375, 0.07160663604736328, 0.07464790344238281, 0.07768917083740234, 0.08073043823242188, 0.0837717056274414, 0.08681297302246094, 0.08985424041748047, 0.0928955078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 6.0, 12.0, 6.0, 9.0, 12.0, 12.0, 26.0, 32.0, 42.0, 67.0, 114.0, 242.0, 868.0, 6484.0, 3175249.0, 1003323.0, 6356.0, 854.0, 264.0, 110.0, 67.0, 34.0, 28.0, 13.0, 9.0, 14.0, 3.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86279296875, -0.8319625854492188, -0.8011322021484375, -0.7703018188476562, -0.739471435546875, -0.7086410522460938, -0.6778106689453125, -0.6469802856445312, -0.61614990234375, -0.5853195190429688, -0.5544891357421875, -0.5236587524414062, -0.492828369140625, -0.46199798583984375, -0.4311676025390625, -0.40033721923828125, -0.3695068359375, -0.33867645263671875, -0.3078460693359375, -0.27701568603515625, -0.246185302734375, -0.21535491943359375, -0.1845245361328125, -0.15369415283203125, -0.12286376953125, -0.09203338623046875, -0.0612030029296875, -0.03037261962890625, 0.000457763671875, 0.03128814697265625, 0.0621185302734375, 0.09294891357421875, 0.123779296875, 0.15460968017578125, 0.1854400634765625, 0.21627044677734375, 0.247100830078125, 0.27793121337890625, 0.3087615966796875, 0.33959197998046875, 0.37042236328125, 0.40125274658203125, 0.4320831298828125, 0.46291351318359375, 0.493743896484375, 0.5245742797851562, 0.5554046630859375, 0.5862350463867188, 0.6170654296875, 0.6478958129882812, 0.6787261962890625, 0.7095565795898438, 0.740386962890625, 0.7712173461914062, 0.8020477294921875, 0.8328781127929688, 0.86370849609375, 0.8945388793945312, 0.9253692626953125, 0.9561996459960938, 0.987030029296875, 1.0178604125976562, 1.0486907958984375, 1.0795211791992188, 1.1103515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 3.0, 4.0, 4.0, 6.0, 11.0, 8.0, 13.0, 17.0, 20.0, 42.0, 55.0, 106.0, 406.0, 2709.0, 279.0, 134.0, 61.0, 50.0, 23.0, 23.0, 28.0, 15.0, 11.0, 7.0, 6.0, 8.0, 9.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.141357421875, -0.1375732421875, -0.1337890625, -0.1300048828125, -0.126220703125, -0.1224365234375, -0.11865234375, -0.1148681640625, -0.111083984375, -0.1072998046875, -0.103515625, -0.0997314453125, -0.095947265625, -0.0921630859375, -0.08837890625, -0.0845947265625, -0.080810546875, -0.0770263671875, -0.0732421875, -0.0694580078125, -0.065673828125, -0.0618896484375, -0.05810546875, -0.0543212890625, -0.050537109375, -0.0467529296875, -0.04296875, -0.0391845703125, -0.035400390625, -0.0316162109375, -0.02783203125, -0.0240478515625, -0.020263671875, -0.0164794921875, -0.0126953125, -0.0089111328125, -0.005126953125, -0.0013427734375, 0.00244140625, 0.0062255859375, 0.010009765625, 0.0137939453125, 0.017578125, 0.0213623046875, 0.025146484375, 0.0289306640625, 0.03271484375, 0.0364990234375, 0.040283203125, 0.0440673828125, 0.0478515625, 0.0516357421875, 0.055419921875, 0.0592041015625, 0.06298828125, 0.0667724609375, 0.070556640625, 0.0743408203125, 0.078125, 0.0819091796875, 0.085693359375, 0.0894775390625, 0.09326171875, 0.0970458984375, 0.100830078125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 665.0, 330.0, 9.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.783815383911133, -6.660317420959473, -6.5368194580078125, -6.413321018218994, -6.289823055267334, -6.166325092315674, -6.042827129364014, -5.919328689575195, -5.795830726623535, -5.672332763671875, -5.548834800720215, -5.4253363609313965, -5.301838397979736, -5.178340435028076, -5.054842472076416, -4.931344032287598, -4.8078460693359375, -4.684348106384277, -4.560850143432617, -4.437351703643799, -4.313853740692139, -4.1903557777404785, -4.066857814788818, -3.943359613418579, -3.819861650466919, -3.696363687515259, -3.5728654861450195, -3.4493675231933594, -3.32586932182312, -3.20237135887146, -3.0788731575012207, -2.9553751945495605, -2.831876754760742, -2.708378791809082, -2.5848805904388428, -2.4613826274871826, -2.3378844261169434, -2.214386463165283, -2.090888261795044, -1.9673902988433838, -1.8438923358917236, -1.720394253730774, -1.5968961715698242, -1.4733980894088745, -1.3499000072479248, -1.2264020442962646, -1.1029038429260254, -0.9794058203697205, -0.855907678604126, -0.7324095964431763, -0.6089115142822266, -0.48541346192359924, -0.36191537976264954, -0.23841732740402222, -0.11491924524307251, 0.008578836917877197, 0.1320769190788269, 0.2555750012397766, 0.3790730834007263, 0.5025711059570312, 0.626069188117981, 0.7495672702789307, 0.8730653524398804, 0.9965634346008301, 1.1200615167617798]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 3.0, 5.0, 8.0, 7.0, 13.0, 31.0, 38.0, 59.0, 60.0, 76.0, 102.0, 86.0, 106.0, 85.0, 72.0, 70.0, 53.0, 35.0, 25.0, 21.0, 13.0, 7.0, 5.0, 5.0, 8.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5499835014343262, -0.5298078060150146, -0.5096321702003479, -0.4894564747810364, -0.46928080916404724, -0.4491051435470581, -0.42892947793006897, -0.40875381231307983, -0.3885781168937683, -0.3684024512767792, -0.34822678565979004, -0.3280510902404785, -0.3078754246234894, -0.28769975900650024, -0.2675240933895111, -0.24734841287136078, -0.22717276215553284, -0.2069970965385437, -0.18682141602039337, -0.16664575040340424, -0.1464700698852539, -0.12629440426826477, -0.10611873865127563, -0.0859430581331253, -0.06576739251613617, -0.04559171944856644, -0.025416050106287003, -0.005240380764007568, 0.014935292303562164, 0.0351109653711319, 0.05528663098812103, 0.07546231150627136, 0.0956379771232605, 0.11581365019083023, 0.13598932325839996, 0.1561649888753891, 0.17634066939353943, 0.19651633501052856, 0.2166920006275177, 0.23686768114566803, 0.25704336166381836, 0.2772190272808075, 0.29739469289779663, 0.31757038831710815, 0.3377460539340973, 0.3579217195510864, 0.37809738516807556, 0.3982730507850647, 0.41844871640205383, 0.43862438201904297, 0.4588000476360321, 0.47897571325302124, 0.49915140867233276, 0.5193270444869995, 0.539502739906311, 0.5596784353256226, 0.5798540711402893, 0.6000297665596008, 0.6202054023742676, 0.6403810977935791, 0.6605567336082458, 0.6807324290275574, 0.7009080648422241, 0.7210837602615356, 0.7412594556808472]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 17.0, 9.0, 19.0, 27.0, 17.0, 24.0, 31.0, 43.0, 60.0, 87.0, 145.0, 194.0, 274.0, 491.0, 930.0, 1892.0, 4380.0, 14350.0, 139988.0, 841478.0, 31321.0, 6917.0, 2784.0, 1217.0, 636.0, 400.0, 233.0, 137.0, 115.0, 89.0, 49.0, 27.0, 38.0, 30.0, 19.0, 18.0, 12.0, 17.0, 8.0, 6.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.45361328125, -0.4390869140625, -0.424560546875, -0.4100341796875, -0.3955078125, -0.3809814453125, -0.366455078125, -0.3519287109375, -0.33740234375, -0.3228759765625, -0.308349609375, -0.2938232421875, -0.279296875, -0.2647705078125, -0.250244140625, -0.2357177734375, -0.22119140625, -0.2066650390625, -0.192138671875, -0.1776123046875, -0.1630859375, -0.1485595703125, -0.134033203125, -0.1195068359375, -0.10498046875, -0.0904541015625, -0.075927734375, -0.0614013671875, -0.046875, -0.0323486328125, -0.017822265625, -0.0032958984375, 0.01123046875, 0.0257568359375, 0.040283203125, 0.0548095703125, 0.0693359375, 0.0838623046875, 0.098388671875, 0.1129150390625, 0.12744140625, 0.1419677734375, 0.156494140625, 0.1710205078125, 0.185546875, 0.2000732421875, 0.214599609375, 0.2291259765625, 0.24365234375, 0.2581787109375, 0.272705078125, 0.2872314453125, 0.3017578125, 0.3162841796875, 0.330810546875, 0.3453369140625, 0.35986328125, 0.3743896484375, 0.388916015625, 0.4034423828125, 0.41796875, 0.4324951171875, 0.447021484375, 0.4615478515625, 0.47607421875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 12.0, 10.0, 14.0, 16.0, 17.0, 116.0, 325.0, 304.0, 104.0, 27.0, 18.0, 9.0, 11.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09869384765625, -0.0956888198852539, -0.09268379211425781, -0.08967876434326172, -0.08667373657226562, -0.08366870880126953, -0.08066368103027344, -0.07765865325927734, -0.07465362548828125, -0.07164859771728516, -0.06864356994628906, -0.06563854217529297, -0.06263351440429688, -0.05962848663330078, -0.05662345886230469, -0.053618431091308594, -0.0506134033203125, -0.047608375549316406, -0.04460334777832031, -0.04159832000732422, -0.038593292236328125, -0.03558826446533203, -0.03258323669433594, -0.029578208923339844, -0.02657318115234375, -0.023568153381347656, -0.020563125610351562, -0.01755809783935547, -0.014553070068359375, -0.011548042297363281, -0.008543014526367188, -0.005537986755371094, -0.002532958984375, 0.00047206878662109375, 0.0034770965576171875, 0.006482124328613281, 0.009487152099609375, 0.012492179870605469, 0.015497207641601562, 0.018502235412597656, 0.02150726318359375, 0.024512290954589844, 0.027517318725585938, 0.03052234649658203, 0.033527374267578125, 0.03653240203857422, 0.03953742980957031, 0.042542457580566406, 0.0455474853515625, 0.048552513122558594, 0.05155754089355469, 0.05456256866455078, 0.057567596435546875, 0.06057262420654297, 0.06357765197753906, 0.06658267974853516, 0.06958770751953125, 0.07259273529052734, 0.07559776306152344, 0.07860279083251953, 0.08160781860351562, 0.08461284637451172, 0.08761787414550781, 0.0906229019165039, 0.0936279296875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 6.0, 13.0, 8.0, 10.0, 7.0, 19.0, 20.0, 19.0, 32.0, 51.0, 59.0, 67.0, 105.0, 130.0, 223.0, 326.0, 582.0, 1009.0, 2020.0, 6162.0, 40531.0, 798150.0, 179255.0, 13120.0, 3282.0, 1399.0, 664.0, 403.0, 275.0, 173.0, 103.0, 90.0, 50.0, 42.0, 33.0, 26.0, 10.0, 18.0, 15.0, 11.0, 9.0, 7.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.420166015625, -0.4073333740234375, -0.394500732421875, -0.3816680908203125, -0.36883544921875, -0.3560028076171875, -0.343170166015625, -0.3303375244140625, -0.3175048828125, -0.3046722412109375, -0.291839599609375, -0.2790069580078125, -0.26617431640625, -0.2533416748046875, -0.240509033203125, -0.2276763916015625, -0.21484375, -0.2020111083984375, -0.189178466796875, -0.1763458251953125, -0.16351318359375, -0.1506805419921875, -0.137847900390625, -0.1250152587890625, -0.1121826171875, -0.0993499755859375, -0.086517333984375, -0.0736846923828125, -0.06085205078125, -0.0480194091796875, -0.035186767578125, -0.0223541259765625, -0.009521484375, 0.0033111572265625, 0.016143798828125, 0.0289764404296875, 0.04180908203125, 0.0546417236328125, 0.067474365234375, 0.0803070068359375, 0.0931396484375, 0.1059722900390625, 0.118804931640625, 0.1316375732421875, 0.14447021484375, 0.1573028564453125, 0.170135498046875, 0.1829681396484375, 0.19580078125, 0.2086334228515625, 0.221466064453125, 0.2342987060546875, 0.24713134765625, 0.2599639892578125, 0.272796630859375, 0.2856292724609375, 0.2984619140625, 0.3112945556640625, 0.324127197265625, 0.3369598388671875, 0.34979248046875, 0.3626251220703125, 0.375457763671875, 0.3882904052734375, 0.401123046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 11.0, 9.0, 10.0, 11.0, 13.0, 15.0, 26.0, 19.0, 26.0, 31.0, 26.0, 41.0, 36.0, 39.0, 43.0, 51.0, 48.0, 41.0, 46.0, 38.0, 44.0, 45.0, 31.0, 39.0, 35.0, 30.0, 31.0, 22.0, 23.0, 14.0, 13.0, 13.0, 17.0, 15.0, 7.0, 6.0, 7.0, 3.0, 1.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1868896484375, -0.18124008178710938, -0.17559051513671875, -0.16994094848632812, -0.1642913818359375, -0.15864181518554688, -0.15299224853515625, -0.14734268188476562, -0.141693115234375, -0.13604354858398438, -0.13039398193359375, -0.12474441528320312, -0.1190948486328125, -0.11344528198242188, -0.10779571533203125, -0.10214614868164062, -0.09649658203125, -0.09084701538085938, -0.08519744873046875, -0.07954788208007812, -0.0738983154296875, -0.06824874877929688, -0.06259918212890625, -0.056949615478515625, -0.051300048828125, -0.045650482177734375, -0.04000091552734375, -0.034351348876953125, -0.0287017822265625, -0.023052215576171875, -0.01740264892578125, -0.011753082275390625, -0.006103515625, -0.000453948974609375, 0.00519561767578125, 0.010845184326171875, 0.0164947509765625, 0.022144317626953125, 0.02779388427734375, 0.033443450927734375, 0.039093017578125, 0.044742584228515625, 0.05039215087890625, 0.056041717529296875, 0.0616912841796875, 0.06734085083007812, 0.07299041748046875, 0.07863998413085938, 0.08428955078125, 0.08993911743164062, 0.09558868408203125, 0.10123825073242188, 0.1068878173828125, 0.11253738403320312, 0.11818695068359375, 0.12383651733398438, 0.129486083984375, 0.13513565063476562, 0.14078521728515625, 0.14643478393554688, 0.1520843505859375, 0.15773391723632812, 0.16338348388671875, 0.16903305053710938, 0.1746826171875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 9.0, 12.0, 9.0, 24.0, 35.0, 54.0, 96.0, 137.0, 280.0, 577.0, 1474.0, 6130.0, 65073.0, 918035.0, 48975.0, 5258.0, 1279.0, 477.0, 224.0, 130.0, 63.0, 49.0, 41.0, 32.0, 17.0, 14.0, 9.0, 7.0, 2.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.25537109375, -0.24795913696289062, -0.24054718017578125, -0.23313522338867188, -0.2257232666015625, -0.21831130981445312, -0.21089935302734375, -0.20348739624023438, -0.196075439453125, -0.18866348266601562, -0.18125152587890625, -0.17383956909179688, -0.1664276123046875, -0.15901565551757812, -0.15160369873046875, -0.14419174194335938, -0.13677978515625, -0.12936782836914062, -0.12195587158203125, -0.11454391479492188, -0.1071319580078125, -0.09972000122070312, -0.09230804443359375, -0.08489608764648438, -0.077484130859375, -0.07007217407226562, -0.06266021728515625, -0.055248260498046875, -0.0478363037109375, -0.040424346923828125, -0.03301239013671875, -0.025600433349609375, -0.0181884765625, -0.010776519775390625, -0.00336456298828125, 0.004047393798828125, 0.0114593505859375, 0.018871307373046875, 0.02628326416015625, 0.033695220947265625, 0.041107177734375, 0.048519134521484375, 0.05593109130859375, 0.06334304809570312, 0.0707550048828125, 0.07816696166992188, 0.08557891845703125, 0.09299087524414062, 0.10040283203125, 0.10781478881835938, 0.11522674560546875, 0.12263870239257812, 0.1300506591796875, 0.13746261596679688, 0.14487457275390625, 0.15228652954101562, 0.159698486328125, 0.16711044311523438, 0.17452239990234375, 0.18193435668945312, 0.1893463134765625, 0.19675827026367188, 0.20417022705078125, 0.21158218383789062, 0.218994140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 10.0, 3.0, 3.0, 13.0, 4.0, 11.0, 13.0, 20.0, 27.0, 39.0, 56.0, 57.0, 108.0, 249.0, 112.0, 66.0, 58.0, 34.0, 31.0, 20.0, 15.0, 16.0, 9.0, 2.0, 2.0, 1.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00022661685943603516, -0.00022023916244506836, -0.00021386146545410156, -0.00020748376846313477, -0.00020110607147216797, -0.00019472837448120117, -0.00018835067749023438, -0.00018197298049926758, -0.00017559528350830078, -0.00016921758651733398, -0.0001628398895263672, -0.0001564621925354004, -0.0001500844955444336, -0.0001437067985534668, -0.0001373291015625, -0.0001309514045715332, -0.0001245737075805664, -0.00011819601058959961, -0.00011181831359863281, -0.00010544061660766602, -9.906291961669922e-05, -9.268522262573242e-05, -8.630752563476562e-05, -7.992982864379883e-05, -7.355213165283203e-05, -6.717443466186523e-05, -6.079673767089844e-05, -5.441904067993164e-05, -4.8041343688964844e-05, -4.166364669799805e-05, -3.528594970703125e-05, -2.8908252716064453e-05, -2.2530555725097656e-05, -1.615285873413086e-05, -9.775161743164062e-06, -3.3974647521972656e-06, 2.9802322387695312e-06, 9.357929229736328e-06, 1.5735626220703125e-05, 2.2113323211669922e-05, 2.849102020263672e-05, 3.4868717193603516e-05, 4.124641418457031e-05, 4.762411117553711e-05, 5.4001808166503906e-05, 6.03795051574707e-05, 6.67572021484375e-05, 7.31348991394043e-05, 7.95125961303711e-05, 8.589029312133789e-05, 9.226799011230469e-05, 9.864568710327148e-05, 0.00010502338409423828, 0.00011140108108520508, 0.00011777877807617188, 0.00012415647506713867, 0.00013053417205810547, 0.00013691186904907227, 0.00014328956604003906, 0.00014966726303100586, 0.00015604496002197266, 0.00016242265701293945, 0.00016880035400390625, 0.00017517805099487305, 0.00018155574798583984]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 0.0, 14.0, 8.0, 11.0, 26.0, 39.0, 55.0, 72.0, 176.0, 385.0, 971.0, 5173.0, 321141.0, 712628.0, 5960.0, 1100.0, 386.0, 167.0, 78.0, 55.0, 29.0, 26.0, 17.0, 7.0, 7.0, 9.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.496826171875, -0.48223114013671875, -0.4676361083984375, -0.45304107666015625, -0.438446044921875, -0.42385101318359375, -0.4092559814453125, -0.39466094970703125, -0.38006591796875, -0.36547088623046875, -0.3508758544921875, -0.33628082275390625, -0.321685791015625, -0.30709075927734375, -0.2924957275390625, -0.27790069580078125, -0.2633056640625, -0.24871063232421875, -0.2341156005859375, -0.21952056884765625, -0.204925537109375, -0.19033050537109375, -0.1757354736328125, -0.16114044189453125, -0.14654541015625, -0.13195037841796875, -0.1173553466796875, -0.10276031494140625, -0.088165283203125, -0.07357025146484375, -0.0589752197265625, -0.04438018798828125, -0.02978515625, -0.01519012451171875, -0.0005950927734375, 0.01399993896484375, 0.028594970703125, 0.04319000244140625, 0.0577850341796875, 0.07238006591796875, 0.08697509765625, 0.10157012939453125, 0.1161651611328125, 0.13076019287109375, 0.145355224609375, 0.15995025634765625, 0.1745452880859375, 0.18914031982421875, 0.2037353515625, 0.21833038330078125, 0.2329254150390625, 0.24752044677734375, 0.262115478515625, 0.27671051025390625, 0.2913055419921875, 0.30590057373046875, 0.32049560546875, 0.33509063720703125, 0.3496856689453125, 0.36428070068359375, 0.378875732421875, 0.39347076416015625, 0.4080657958984375, 0.42266082763671875, 0.437255859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 4.0, 7.0, 5.0, 10.0, 9.0, 15.0, 16.0, 37.0, 49.0, 91.0, 142.0, 184.0, 144.0, 96.0, 51.0, 31.0, 24.0, 17.0, 11.0, 15.0, 8.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2091064453125, -0.2036876678466797, -0.19826889038085938, -0.19285011291503906, -0.18743133544921875, -0.18201255798339844, -0.17659378051757812, -0.1711750030517578, -0.1657562255859375, -0.1603374481201172, -0.15491867065429688, -0.14949989318847656, -0.14408111572265625, -0.13866233825683594, -0.13324356079101562, -0.1278247833251953, -0.122406005859375, -0.11698722839355469, -0.11156845092773438, -0.10614967346191406, -0.10073089599609375, -0.09531211853027344, -0.08989334106445312, -0.08447456359863281, -0.0790557861328125, -0.07363700866699219, -0.06821823120117188, -0.06279945373535156, -0.05738067626953125, -0.05196189880371094, -0.046543121337890625, -0.04112434387207031, -0.03570556640625, -0.030286788940429688, -0.024868011474609375, -0.019449234008789062, -0.01403045654296875, -0.008611679077148438, -0.003192901611328125, 0.0022258758544921875, 0.0076446533203125, 0.013063430786132812, 0.018482208251953125, 0.023900985717773438, 0.02931976318359375, 0.03473854064941406, 0.040157318115234375, 0.04557609558105469, 0.050994873046875, 0.05641365051269531, 0.061832427978515625, 0.06725120544433594, 0.07266998291015625, 0.07808876037597656, 0.08350753784179688, 0.08892631530761719, 0.0943450927734375, 0.09976387023925781, 0.10518264770507812, 0.11060142517089844, 0.11602020263671875, 0.12143898010253906, 0.12685775756835938, 0.1322765350341797, 0.1376953125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 12.0, 24.0, 90.0, 377.0, 401.0, 69.0, 13.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.6290292739868164, -3.5252389907836914, -3.4214487075805664, -3.3176584243774414, -3.2138681411743164, -3.1100778579711914, -3.0062878131866455, -2.9024975299835205, -2.7987072467803955, -2.6949169635772705, -2.5911266803741455, -2.4873363971710205, -2.3835463523864746, -2.2797560691833496, -2.1759657859802246, -2.0721755027770996, -1.9683852195739746, -1.8645949363708496, -1.7608046531677246, -1.6570144891738892, -1.5532242059707642, -1.4494339227676392, -1.3456437587738037, -1.2418534755706787, -1.1380631923675537, -1.0342729091644287, -0.9304826855659485, -0.8266924619674683, -0.7229021787643433, -0.6191118955612183, -0.515321671962738, -0.4115314483642578, -0.3077414035797119, -0.2039511501789093, -0.10016089677810669, 0.003629356622695923, 0.10741961002349854, 0.21120989322662354, 0.31500011682510376, 0.418790340423584, 0.522580623626709, 0.626370906829834, 0.7301611304283142, 0.8339513540267944, 0.9377416372299194, 1.0415319204330444, 1.1453220844268799, 1.2491123676300049, 1.3529026508331299, 1.4566929340362549, 1.5604832172393799, 1.6642733812332153, 1.7680636644363403, 1.8718539476394653, 1.9756441116333008, 2.079434394836426, 2.183224678039551, 2.287014961242676, 2.390805244445801, 2.494595527648926, 2.598385810852051, 2.702176094055176, 2.8059661388397217, 2.9097564220428467, 3.0135467052459717]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 9.0, 5.0, 12.0, 21.0, 20.0, 28.0, 50.0, 40.0, 44.0, 60.0, 54.0, 55.0, 82.0, 66.0, 70.0, 58.0, 70.0, 59.0, 38.0, 38.0, 34.0, 20.0, 23.0, 9.0, 12.0, 4.0, 10.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.2630128860473633, -2.1985321044921875, -2.134051561355591, -2.069571018218994, -2.0050902366638184, -1.9406095743179321, -1.876128911972046, -1.8116482496261597, -1.7471675872802734, -1.6826869249343872, -1.618206262588501, -1.5537256002426147, -1.4892449378967285, -1.4247642755508423, -1.360283613204956, -1.2958029508590698, -1.2313222885131836, -1.1668416261672974, -1.1023609638214111, -1.037880301475525, -0.9733996391296387, -0.9089189767837524, -0.8444383144378662, -0.77995765209198, -0.7154769897460938, -0.6509963274002075, -0.5865156650543213, -0.5220350027084351, -0.45755434036254883, -0.3930736780166626, -0.32859301567077637, -0.26411235332489014, -0.1996316909790039, -0.13515102863311768, -0.07067036628723145, -0.006189703941345215, 0.058290958404541016, 0.12277162075042725, 0.18725228309631348, 0.2517329454421997, 0.31621360778808594, 0.38069427013397217, 0.4451749324798584, 0.5096555948257446, 0.5741362571716309, 0.6386169195175171, 0.7030975818634033, 0.7675782442092896, 0.8320589065551758, 0.896539568901062, 0.9610202312469482, 1.0255008935928345, 1.0899815559387207, 1.154462218284607, 1.2189428806304932, 1.2834235429763794, 1.3479042053222656, 1.4123848676681519, 1.476865530014038, 1.5413461923599243, 1.6058268547058105, 1.6703075170516968, 1.734788179397583, 1.7992688417434692, 1.8637495040893555]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 17.0, 24.0, 55.0, 124.0, 442.0, 5764.0, 4184984.0, 2458.0, 285.0, 65.0, 21.0, 17.0, 18.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.875, -2.7738037109375, -2.672607421875, -2.5714111328125, -2.47021484375, -2.3690185546875, -2.267822265625, -2.1666259765625, -2.0654296875, -1.9642333984375, -1.863037109375, -1.7618408203125, -1.66064453125, -1.5594482421875, -1.458251953125, -1.3570556640625, -1.255859375, -1.1546630859375, -1.053466796875, -0.9522705078125, -0.85107421875, -0.7498779296875, -0.648681640625, -0.5474853515625, -0.4462890625, -0.3450927734375, -0.243896484375, -0.1427001953125, -0.04150390625, 0.0596923828125, 0.160888671875, 0.2620849609375, 0.36328125, 0.4644775390625, 0.565673828125, 0.6668701171875, 0.76806640625, 0.8692626953125, 0.970458984375, 1.0716552734375, 1.1728515625, 1.2740478515625, 1.375244140625, 1.4764404296875, 1.57763671875, 1.6788330078125, 1.780029296875, 1.8812255859375, 1.982421875, 2.0836181640625, 2.184814453125, 2.2860107421875, 2.38720703125, 2.4884033203125, 2.589599609375, 2.6907958984375, 2.7919921875, 2.8931884765625, 2.994384765625, 3.0955810546875, 3.19677734375, 3.2979736328125, 3.399169921875, 3.5003662109375, 3.6015625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 15.0, 9.0, 15.0, 18.0, 42.0, 165.0, 289.0, 275.0, 99.0, 30.0, 16.0, 8.0, 8.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09661865234375, -0.09336280822753906, -0.09010696411132812, -0.08685111999511719, -0.08359527587890625, -0.08033943176269531, -0.07708358764648438, -0.07382774353027344, -0.0705718994140625, -0.06731605529785156, -0.06406021118164062, -0.06080436706542969, -0.05754852294921875, -0.05429267883300781, -0.051036834716796875, -0.04778099060058594, -0.044525146484375, -0.04126930236816406, -0.038013458251953125, -0.03475761413574219, -0.03150177001953125, -0.028245925903320312, -0.024990081787109375, -0.021734237670898438, -0.0184783935546875, -0.015222549438476562, -0.011966705322265625, -0.008710861206054688, -0.00545501708984375, -0.0021991729736328125, 0.001056671142578125, 0.0043125152587890625, 0.007568359375, 0.010824203491210938, 0.014080047607421875, 0.017335891723632812, 0.02059173583984375, 0.023847579956054688, 0.027103424072265625, 0.030359268188476562, 0.0336151123046875, 0.03687095642089844, 0.040126800537109375, 0.04338264465332031, 0.04663848876953125, 0.04989433288574219, 0.053150177001953125, 0.05640602111816406, 0.059661865234375, 0.06291770935058594, 0.06617355346679688, 0.06942939758300781, 0.07268524169921875, 0.07594108581542969, 0.07919692993164062, 0.08245277404785156, 0.0857086181640625, 0.08896446228027344, 0.09222030639648438, 0.09547615051269531, 0.09873199462890625, 0.10198783874511719, 0.10524368286132812, 0.10849952697753906, 0.11175537109375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 8.0, 7.0, 11.0, 13.0, 18.0, 36.0, 56.0, 68.0, 99.0, 208.0, 424.0, 849.0, 2526.0, 13032.0, 3572018.0, 589218.0, 11049.0, 2514.0, 981.0, 418.0, 240.0, 179.0, 105.0, 61.0, 46.0, 32.0, 23.0, 9.0, 8.0, 4.0, 6.0, 5.0, 3.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5830078125, -0.5621414184570312, -0.5412750244140625, -0.5204086303710938, -0.499542236328125, -0.47867584228515625, -0.4578094482421875, -0.43694305419921875, -0.41607666015625, -0.39521026611328125, -0.3743438720703125, -0.35347747802734375, -0.332611083984375, -0.31174468994140625, -0.2908782958984375, -0.27001190185546875, -0.2491455078125, -0.22827911376953125, -0.2074127197265625, -0.18654632568359375, -0.165679931640625, -0.14481353759765625, -0.1239471435546875, -0.10308074951171875, -0.08221435546875, -0.06134796142578125, -0.0404815673828125, -0.01961517333984375, 0.001251220703125, 0.02211761474609375, 0.0429840087890625, 0.06385040283203125, 0.084716796875, 0.10558319091796875, 0.1264495849609375, 0.14731597900390625, 0.168182373046875, 0.18904876708984375, 0.2099151611328125, 0.23078155517578125, 0.25164794921875, 0.27251434326171875, 0.2933807373046875, 0.31424713134765625, 0.335113525390625, 0.35597991943359375, 0.3768463134765625, 0.39771270751953125, 0.4185791015625, 0.43944549560546875, 0.4603118896484375, 0.48117828369140625, 0.502044677734375, 0.5229110717773438, 0.5437774658203125, 0.5646438598632812, 0.58551025390625, 0.6063766479492188, 0.6272430419921875, 0.6481094360351562, 0.668975830078125, 0.6898422241210938, 0.7107086181640625, 0.7315750122070312, 0.75244140625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 7.0, 8.0, 6.0, 19.0, 23.0, 35.0, 74.0, 202.0, 2515.0, 844.0, 150.0, 59.0, 37.0, 24.0, 18.0, 13.0, 5.0, 9.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.080810546875, -0.07672882080078125, -0.0726470947265625, -0.06856536865234375, -0.064483642578125, -0.06040191650390625, -0.0563201904296875, -0.05223846435546875, -0.04815673828125, -0.04407501220703125, -0.0399932861328125, -0.03591156005859375, -0.031829833984375, -0.02774810791015625, -0.0236663818359375, -0.01958465576171875, -0.0155029296875, -0.01142120361328125, -0.0073394775390625, -0.00325775146484375, 0.000823974609375, 0.00490570068359375, 0.0089874267578125, 0.01306915283203125, 0.01715087890625, 0.02123260498046875, 0.0253143310546875, 0.02939605712890625, 0.033477783203125, 0.03755950927734375, 0.0416412353515625, 0.04572296142578125, 0.0498046875, 0.05388641357421875, 0.0579681396484375, 0.06204986572265625, 0.066131591796875, 0.07021331787109375, 0.0742950439453125, 0.07837677001953125, 0.08245849609375, 0.08654022216796875, 0.0906219482421875, 0.09470367431640625, 0.098785400390625, 0.10286712646484375, 0.1069488525390625, 0.11103057861328125, 0.1151123046875, 0.11919403076171875, 0.1232757568359375, 0.12735748291015625, 0.131439208984375, 0.13552093505859375, 0.1396026611328125, 0.14368438720703125, 0.14776611328125, 0.15184783935546875, 0.1559295654296875, 0.16001129150390625, 0.164093017578125, 0.16817474365234375, 0.1722564697265625, 0.17633819580078125, 0.180419921875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 13.0, 162.0, 755.0, 63.0, 13.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.944117307662964, -2.871133327484131, -2.7981491088867188, -2.7251651287078857, -2.6521811485290527, -2.5791969299316406, -2.5062129497528076, -2.4332289695739746, -2.3602447509765625, -2.2872607707977295, -2.2142765522003174, -2.1412925720214844, -2.0683085918426514, -1.9953244924545288, -1.9223403930664062, -1.8493564128875732, -1.7763724327087402, -1.7033883333206177, -1.6304043531417847, -1.557420253753662, -1.484436273574829, -1.4114521741867065, -1.338468074798584, -1.265484094619751, -1.1924999952316284, -1.1195158958435059, -1.0465319156646729, -0.9735478162765503, -0.9005637764930725, -0.8275797367095947, -0.7545956373214722, -0.6816115975379944, -0.6086273193359375, -0.5356432795524597, -0.46265920996665955, -0.3896751403808594, -0.3166911005973816, -0.2437070608139038, -0.17072299122810364, -0.09773892164230347, -0.024754881858825684, 0.04822917282581329, 0.12121322751045227, 0.19419728219509125, 0.2671813368797302, 0.340165376663208, 0.4131494462490082, 0.48613351583480835, 0.5591175556182861, 0.6321015954017639, 0.7050856351852417, 0.7780697345733643, 0.851053774356842, 0.9240378141403198, 0.9970219135284424, 1.0700058937072754, 1.142989993095398, 1.2159740924835205, 1.2889580726623535, 1.361942172050476, 1.4349262714385986, 1.5079102516174316, 1.5808943510055542, 1.6538784503936768, 1.7268624305725098]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 7.0, 2.0, 5.0, 6.0, 9.0, 14.0, 16.0, 15.0, 32.0, 20.0, 40.0, 54.0, 48.0, 42.0, 58.0, 57.0, 59.0, 48.0, 49.0, 66.0, 64.0, 50.0, 45.0, 34.0, 28.0, 42.0, 25.0, 21.0, 9.0, 8.0, 10.0, 5.0, 2.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4465025067329407, -0.4348994791507721, -0.42329642176628113, -0.41169339418411255, -0.4000903367996216, -0.388487309217453, -0.3768842816352844, -0.36528122425079346, -0.3536781668663025, -0.3420751392841339, -0.33047208189964294, -0.31886905431747437, -0.3072659969329834, -0.2956629693508148, -0.28405994176864624, -0.2724568843841553, -0.2608538568019867, -0.24925081431865692, -0.23764777183532715, -0.22604474425315857, -0.2144416868686676, -0.20283865928649902, -0.19123561680316925, -0.17963257431983948, -0.1680295318365097, -0.15642648935317993, -0.14482344686985016, -0.13322040438652039, -0.12161736935377121, -0.11001432687044144, -0.09841129183769226, -0.08680824935436249, -0.07520520687103271, -0.06360216438770294, -0.05199912562966347, -0.04039608687162399, -0.02879304438829422, -0.017190001904964447, -0.005586966872215271, 0.006016075611114502, 0.017619118094444275, 0.0292221587151289, 0.04082519933581352, 0.052428238093853, 0.06403128057718277, 0.07563432306051254, 0.08723735809326172, 0.09884040057659149, 0.11044344305992126, 0.12204648554325104, 0.1336495280265808, 0.1452525556087494, 0.15685561299324036, 0.16845864057540894, 0.1800616830587387, 0.19166472554206848, 0.20326776802539825, 0.21487081050872803, 0.2264738529920578, 0.23807689547538757, 0.24967992305755615, 0.2612829804420471, 0.2728860080242157, 0.2844890356063843, 0.29609209299087524]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 3.0, 8.0, 5.0, 8.0, 8.0, 10.0, 14.0, 13.0, 16.0, 10.0, 23.0, 36.0, 54.0, 65.0, 113.0, 112.0, 166.0, 219.0, 339.0, 420.0, 774.0, 1280.0, 2803.0, 9042.0, 56144.0, 800351.0, 152910.0, 15154.0, 4135.0, 1621.0, 895.0, 534.0, 348.0, 228.0, 178.0, 136.0, 107.0, 68.0, 50.0, 44.0, 29.0, 22.0, 17.0, 11.0, 11.0, 7.0, 3.0, 6.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.291015625, -0.2821083068847656, -0.27320098876953125, -0.2642936706542969, -0.2553863525390625, -0.24647903442382812, -0.23757171630859375, -0.22866439819335938, -0.219757080078125, -0.21084976196289062, -0.20194244384765625, -0.19303512573242188, -0.1841278076171875, -0.17522048950195312, -0.16631317138671875, -0.15740585327148438, -0.14849853515625, -0.13959121704101562, -0.13068389892578125, -0.12177658081054688, -0.1128692626953125, -0.10396194458007812, -0.09505462646484375, -0.08614730834960938, -0.077239990234375, -0.06833267211914062, -0.05942535400390625, -0.050518035888671875, -0.0416107177734375, -0.032703399658203125, -0.02379608154296875, -0.014888763427734375, -0.0059814453125, 0.002925872802734375, 0.01183319091796875, 0.020740509033203125, 0.0296478271484375, 0.038555145263671875, 0.04746246337890625, 0.056369781494140625, 0.065277099609375, 0.07418441772460938, 0.08309173583984375, 0.09199905395507812, 0.1009063720703125, 0.10981369018554688, 0.11872100830078125, 0.12762832641601562, 0.13653564453125, 0.14544296264648438, 0.15435028076171875, 0.16325759887695312, 0.1721649169921875, 0.18107223510742188, 0.18997955322265625, 0.19888687133789062, 0.207794189453125, 0.21670150756835938, 0.22560882568359375, 0.23451614379882812, 0.2434234619140625, 0.2523307800292969, 0.26123809814453125, 0.2701454162597656, 0.279052734375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 11.0, 17.0, 16.0, 22.0, 70.0, 166.0, 290.0, 250.0, 91.0, 35.0, 9.0, 10.0, 7.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1014404296875, -0.09822463989257812, -0.09500885009765625, -0.09179306030273438, -0.0885772705078125, -0.08536148071289062, -0.08214569091796875, -0.07892990112304688, -0.075714111328125, -0.07249832153320312, -0.06928253173828125, -0.06606674194335938, -0.0628509521484375, -0.059635162353515625, -0.05641937255859375, -0.053203582763671875, -0.04998779296875, -0.046772003173828125, -0.04355621337890625, -0.040340423583984375, -0.0371246337890625, -0.033908843994140625, -0.03069305419921875, -0.027477264404296875, -0.024261474609375, -0.021045684814453125, -0.01782989501953125, -0.014614105224609375, -0.0113983154296875, -0.008182525634765625, -0.00496673583984375, -0.001750946044921875, 0.00146484375, 0.004680633544921875, 0.00789642333984375, 0.011112213134765625, 0.0143280029296875, 0.017543792724609375, 0.02075958251953125, 0.023975372314453125, 0.027191162109375, 0.030406951904296875, 0.03362274169921875, 0.036838531494140625, 0.0400543212890625, 0.043270111083984375, 0.04648590087890625, 0.049701690673828125, 0.05291748046875, 0.056133270263671875, 0.05934906005859375, 0.06256484985351562, 0.0657806396484375, 0.06899642944335938, 0.07221221923828125, 0.07542800903320312, 0.078643798828125, 0.08185958862304688, 0.08507537841796875, 0.08829116821289062, 0.0915069580078125, 0.09472274780273438, 0.09793853759765625, 0.10115432739257812, 0.1043701171875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 6.0, 5.0, 12.0, 20.0, 20.0, 35.0, 34.0, 45.0, 84.0, 120.0, 168.0, 250.0, 378.0, 652.0, 1274.0, 2564.0, 7550.0, 50289.0, 684883.0, 270945.0, 20606.0, 4433.0, 1782.0, 913.0, 498.0, 308.0, 214.0, 155.0, 95.0, 51.0, 40.0, 36.0, 26.0, 13.0, 17.0, 8.0, 7.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.33251953125, -0.3232307434082031, -0.31394195556640625, -0.3046531677246094, -0.2953643798828125, -0.2860755920410156, -0.27678680419921875, -0.2674980163574219, -0.258209228515625, -0.24892044067382812, -0.23963165283203125, -0.23034286499023438, -0.2210540771484375, -0.21176528930664062, -0.20247650146484375, -0.19318771362304688, -0.18389892578125, -0.17461013793945312, -0.16532135009765625, -0.15603256225585938, -0.1467437744140625, -0.13745498657226562, -0.12816619873046875, -0.11887741088867188, -0.109588623046875, -0.10029983520507812, -0.09101104736328125, -0.08172225952148438, -0.0724334716796875, -0.06314468383789062, -0.05385589599609375, -0.044567108154296875, -0.0352783203125, -0.025989532470703125, -0.01670074462890625, -0.007411956787109375, 0.0018768310546875, 0.011165618896484375, 0.02045440673828125, 0.029743194580078125, 0.039031982421875, 0.048320770263671875, 0.05760955810546875, 0.06689834594726562, 0.0761871337890625, 0.08547592163085938, 0.09476470947265625, 0.10405349731445312, 0.11334228515625, 0.12263107299804688, 0.13191986083984375, 0.14120864868164062, 0.1504974365234375, 0.15978622436523438, 0.16907501220703125, 0.17836380004882812, 0.187652587890625, 0.19694137573242188, 0.20623016357421875, 0.21551895141601562, 0.2248077392578125, 0.23409652709960938, 0.24338531494140625, 0.2526741027832031, 0.261962890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 1.0, 9.0, 9.0, 9.0, 10.0, 16.0, 12.0, 27.0, 24.0, 35.0, 37.0, 26.0, 41.0, 61.0, 54.0, 46.0, 49.0, 57.0, 43.0, 41.0, 50.0, 44.0, 48.0, 52.0, 33.0, 26.0, 27.0, 24.0, 16.0, 17.0, 14.0, 10.0, 11.0, 9.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.270263671875, -0.2636280059814453, -0.2569923400878906, -0.25035667419433594, -0.24372100830078125, -0.23708534240722656, -0.23044967651367188, -0.2238140106201172, -0.2171783447265625, -0.2105426788330078, -0.20390701293945312, -0.19727134704589844, -0.19063568115234375, -0.18400001525878906, -0.17736434936523438, -0.1707286834716797, -0.164093017578125, -0.1574573516845703, -0.15082168579101562, -0.14418601989746094, -0.13755035400390625, -0.13091468811035156, -0.12427902221679688, -0.11764335632324219, -0.1110076904296875, -0.10437202453613281, -0.09773635864257812, -0.09110069274902344, -0.08446502685546875, -0.07782936096191406, -0.07119369506835938, -0.06455802917480469, -0.05792236328125, -0.05128669738769531, -0.044651031494140625, -0.03801536560058594, -0.03137969970703125, -0.024744033813476562, -0.018108367919921875, -0.011472702026367188, -0.0048370361328125, 0.0017986297607421875, 0.008434295654296875, 0.015069961547851562, 0.02170562744140625, 0.028341293334960938, 0.034976959228515625, 0.04161262512207031, 0.048248291015625, 0.05488395690917969, 0.061519622802734375, 0.06815528869628906, 0.07479095458984375, 0.08142662048339844, 0.08806228637695312, 0.09469795227050781, 0.1013336181640625, 0.10796928405761719, 0.11460494995117188, 0.12124061584472656, 0.12787628173828125, 0.13451194763183594, 0.14114761352539062, 0.1477832794189453, 0.1544189453125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 2.0, 9.0, 15.0, 22.0, 23.0, 33.0, 65.0, 111.0, 219.0, 420.0, 978.0, 2565.0, 10290.0, 153450.0, 830715.0, 40999.0, 5514.0, 1711.0, 667.0, 308.0, 176.0, 86.0, 49.0, 35.0, 20.0, 20.0, 15.0, 8.0, 7.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.174072265625, -0.1686840057373047, -0.16329574584960938, -0.15790748596191406, -0.15251922607421875, -0.14713096618652344, -0.14174270629882812, -0.1363544464111328, -0.1309661865234375, -0.1255779266357422, -0.12018966674804688, -0.11480140686035156, -0.10941314697265625, -0.10402488708496094, -0.09863662719726562, -0.09324836730957031, -0.087860107421875, -0.08247184753417969, -0.07708358764648438, -0.07169532775878906, -0.06630706787109375, -0.06091880798339844, -0.055530548095703125, -0.05014228820800781, -0.0447540283203125, -0.03936576843261719, -0.033977508544921875, -0.028589248657226562, -0.02320098876953125, -0.017812728881835938, -0.012424468994140625, -0.0070362091064453125, -0.00164794921875, 0.0037403106689453125, 0.009128570556640625, 0.014516830444335938, 0.01990509033203125, 0.025293350219726562, 0.030681610107421875, 0.03606986999511719, 0.0414581298828125, 0.04684638977050781, 0.052234649658203125, 0.05762290954589844, 0.06301116943359375, 0.06839942932128906, 0.07378768920898438, 0.07917594909667969, 0.084564208984375, 0.08995246887207031, 0.09534072875976562, 0.10072898864746094, 0.10611724853515625, 0.11150550842285156, 0.11689376831054688, 0.12228202819824219, 0.1276702880859375, 0.1330585479736328, 0.13844680786132812, 0.14383506774902344, 0.14922332763671875, 0.15461158752441406, 0.15999984741210938, 0.1653881072998047, 0.1707763671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 0.0, 5.0, 2.0, 5.0, 9.0, 8.0, 8.0, 9.0, 14.0, 19.0, 31.0, 45.0, 99.0, 212.0, 233.0, 105.0, 57.0, 34.0, 32.0, 19.0, 15.0, 10.0, 6.0, 5.0, 8.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001747608184814453, -0.00016832351684570312, -0.00016188621520996094, -0.00015544891357421875, -0.00014901161193847656, -0.00014257431030273438, -0.0001361370086669922, -0.00012969970703125, -0.0001232624053955078, -0.00011682510375976562, -0.00011038780212402344, -0.00010395050048828125, -9.751319885253906e-05, -9.107589721679688e-05, -8.463859558105469e-05, -7.82012939453125e-05, -7.176399230957031e-05, -6.532669067382812e-05, -5.888938903808594e-05, -5.245208740234375e-05, -4.601478576660156e-05, -3.9577484130859375e-05, -3.314018249511719e-05, -2.6702880859375e-05, -2.0265579223632812e-05, -1.3828277587890625e-05, -7.3909759521484375e-06, -9.5367431640625e-07, 5.4836273193359375e-06, 1.1920928955078125e-05, 1.8358230590820312e-05, 2.47955322265625e-05, 3.123283386230469e-05, 3.7670135498046875e-05, 4.410743713378906e-05, 5.054473876953125e-05, 5.698204040527344e-05, 6.341934204101562e-05, 6.985664367675781e-05, 7.62939453125e-05, 8.273124694824219e-05, 8.916854858398438e-05, 9.560585021972656e-05, 0.00010204315185546875, 0.00010848045349121094, 0.00011491775512695312, 0.00012135505676269531, 0.0001277923583984375, 0.0001342296600341797, 0.00014066696166992188, 0.00014710426330566406, 0.00015354156494140625, 0.00015997886657714844, 0.00016641616821289062, 0.0001728534698486328, 0.000179290771484375, 0.0001857280731201172, 0.00019216537475585938, 0.00019860267639160156, 0.00020503997802734375, 0.00021147727966308594, 0.00021791458129882812, 0.0002243518829345703, 0.0002307891845703125, 0.0002372264862060547]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 5.0, 13.0, 13.0, 24.0, 37.0, 57.0, 72.0, 129.0, 193.0, 391.0, 728.0, 1630.0, 4203.0, 15172.0, 144186.0, 783347.0, 80667.0, 11271.0, 3484.0, 1373.0, 644.0, 363.0, 180.0, 113.0, 61.0, 60.0, 35.0, 20.0, 17.0, 13.0, 17.0, 8.0, 11.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.173828125, -0.1690521240234375, -0.164276123046875, -0.1595001220703125, -0.15472412109375, -0.1499481201171875, -0.145172119140625, -0.1403961181640625, -0.1356201171875, -0.1308441162109375, -0.126068115234375, -0.1212921142578125, -0.11651611328125, -0.1117401123046875, -0.106964111328125, -0.1021881103515625, -0.097412109375, -0.0926361083984375, -0.087860107421875, -0.0830841064453125, -0.07830810546875, -0.0735321044921875, -0.068756103515625, -0.0639801025390625, -0.0592041015625, -0.0544281005859375, -0.049652099609375, -0.0448760986328125, -0.04010009765625, -0.0353240966796875, -0.030548095703125, -0.0257720947265625, -0.02099609375, -0.0162200927734375, -0.011444091796875, -0.0066680908203125, -0.00189208984375, 0.0028839111328125, 0.007659912109375, 0.0124359130859375, 0.0172119140625, 0.0219879150390625, 0.026763916015625, 0.0315399169921875, 0.03631591796875, 0.0410919189453125, 0.045867919921875, 0.0506439208984375, 0.055419921875, 0.0601959228515625, 0.064971923828125, 0.0697479248046875, 0.07452392578125, 0.0792999267578125, 0.084075927734375, 0.0888519287109375, 0.0936279296875, 0.0984039306640625, 0.103179931640625, 0.1079559326171875, 0.11273193359375, 0.1175079345703125, 0.122283935546875, 0.1270599365234375, 0.1318359375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 4.0, 1.0, 3.0, 7.0, 7.0, 17.0, 17.0, 28.0, 51.0, 52.0, 85.0, 91.0, 120.0, 127.0, 86.0, 88.0, 57.0, 36.0, 33.0, 27.0, 13.0, 16.0, 13.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.139892578125, -0.13589859008789062, -0.13190460205078125, -0.12791061401367188, -0.1239166259765625, -0.11992263793945312, -0.11592864990234375, -0.11193466186523438, -0.107940673828125, -0.10394668579101562, -0.09995269775390625, -0.09595870971679688, -0.0919647216796875, -0.08797073364257812, -0.08397674560546875, -0.07998275756835938, -0.07598876953125, -0.07199478149414062, -0.06800079345703125, -0.06400680541992188, -0.0600128173828125, -0.056018829345703125, -0.05202484130859375, -0.048030853271484375, -0.044036865234375, -0.040042877197265625, -0.03604888916015625, -0.032054901123046875, -0.0280609130859375, -0.024066925048828125, -0.02007293701171875, -0.016078948974609375, -0.0120849609375, -0.008090972900390625, -0.00409698486328125, -0.000102996826171875, 0.0038909912109375, 0.007884979248046875, 0.01187896728515625, 0.015872955322265625, 0.019866943359375, 0.023860931396484375, 0.02785491943359375, 0.031848907470703125, 0.0358428955078125, 0.039836883544921875, 0.04383087158203125, 0.047824859619140625, 0.05181884765625, 0.055812835693359375, 0.05980682373046875, 0.06380081176757812, 0.0677947998046875, 0.07178878784179688, 0.07578277587890625, 0.07977676391601562, 0.083770751953125, 0.08776473999023438, 0.09175872802734375, 0.09575271606445312, 0.0997467041015625, 0.10374069213867188, 0.10773468017578125, 0.11172866821289062, 0.11572265625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 25.0, 379.0, 580.0, 18.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.153179168701172, -11.932692527770996, -11.712206840515137, -11.491720199584961, -11.271233558654785, -11.05074691772461, -10.83026123046875, -10.609774589538574, -10.389287948608398, -10.168801307678223, -9.948315620422363, -9.727828979492188, -9.507342338562012, -9.286855697631836, -9.066370010375977, -8.8458833694458, -8.625396728515625, -8.40491008758545, -8.18442440032959, -7.963937759399414, -7.743451118469238, -7.522964954376221, -7.302478313446045, -7.081992149353027, -6.86150598526001, -6.641019821166992, -6.420533180236816, -6.200047016143799, -5.979560375213623, -5.7590742111206055, -5.53858757019043, -5.318101406097412, -5.097614765167236, -4.877128601074219, -4.656641960144043, -4.436155796051025, -4.21566915512085, -3.995182991027832, -3.7746963500976562, -3.5542101860046387, -3.333723545074463, -3.113237142562866, -2.8927507400512695, -2.672264337539673, -2.451777935028076, -2.2312917709350586, -2.010805130004883, -1.7903188467025757, -1.5698325634002686, -1.3493461608886719, -1.1288597583770752, -0.9083734154701233, -0.6878870129585266, -0.4674006700515747, -0.24691426753997803, -0.026427865028381348, 0.19405853748321533, 0.414544939994812, 0.6350313425064087, 0.8555176854133606, 1.0760040283203125, 1.2964904308319092, 1.5169768333435059, 1.7374632358551025, 1.9579496383666992]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 12.0, 12.0, 5.0, 10.0, 21.0, 22.0, 32.0, 44.0, 47.0, 49.0, 55.0, 69.0, 73.0, 63.0, 57.0, 58.0, 55.0, 44.0, 47.0, 41.0, 36.0, 35.0, 21.0, 27.0, 17.0, 17.0, 9.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.251816749572754, -1.1966667175292969, -1.1415166854858398, -1.0863665342330933, -1.0312165021896362, -0.9760664701461792, -0.9209163784980774, -0.8657662868499756, -0.8106162548065186, -0.7554662227630615, -0.7003161311149597, -0.6451660394668579, -0.5900160074234009, -0.5348659753799438, -0.47971588373184204, -0.4245658218860626, -0.3694157600402832, -0.3142656981945038, -0.25911563634872437, -0.20396557450294495, -0.14881551265716553, -0.09366545081138611, -0.03851538896560669, 0.01663467288017273, 0.07178473472595215, 0.12693479657173157, 0.182084858417511, 0.2372349202632904, 0.2923849821090698, 0.34753504395484924, 0.40268510580062866, 0.4578351676464081, 0.5129852294921875, 0.5681352615356445, 0.6232853531837463, 0.6784354448318481, 0.7335854768753052, 0.7887355089187622, 0.843885600566864, 0.8990356922149658, 0.9541857242584229, 1.0093357563018799, 1.064485788345337, 1.1196359395980835, 1.1747859716415405, 1.2299360036849976, 1.2850861549377441, 1.3402361869812012, 1.3953862190246582, 1.4505362510681152, 1.5056862831115723, 1.5608364343643188, 1.6159864664077759, 1.671136498451233, 1.7262866497039795, 1.7814366817474365, 1.8365867137908936, 1.8917367458343506, 1.9468867778778076, 2.0020368099212646, 2.057187080383301, 2.112337112426758, 2.167487144470215, 2.222637176513672, 2.277787208557129]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 8.0, 7.0, 16.0, 16.0, 23.0, 35.0, 71.0, 114.0, 220.0, 527.0, 1580.0, 8503.0, 4056540.0, 121050.0, 3924.0, 929.0, 320.0, 161.0, 75.0, 51.0, 38.0, 19.0, 15.0, 5.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58837890625, -0.5664443969726562, -0.5445098876953125, -0.5225753784179688, -0.500640869140625, -0.47870635986328125, -0.4567718505859375, -0.43483734130859375, -0.41290283203125, -0.39096832275390625, -0.3690338134765625, -0.34709930419921875, -0.325164794921875, -0.30323028564453125, -0.2812957763671875, -0.25936126708984375, -0.2374267578125, -0.21549224853515625, -0.1935577392578125, -0.17162322998046875, -0.149688720703125, -0.12775421142578125, -0.1058197021484375, -0.08388519287109375, -0.06195068359375, -0.04001617431640625, -0.0180816650390625, 0.00385284423828125, 0.025787353515625, 0.04772186279296875, 0.0696563720703125, 0.09159088134765625, 0.113525390625, 0.13545989990234375, 0.1573944091796875, 0.17932891845703125, 0.201263427734375, 0.22319793701171875, 0.2451324462890625, 0.26706695556640625, 0.28900146484375, 0.31093597412109375, 0.3328704833984375, 0.35480499267578125, 0.376739501953125, 0.39867401123046875, 0.4206085205078125, 0.44254302978515625, 0.4644775390625, 0.48641204833984375, 0.5083465576171875, 0.5302810668945312, 0.552215576171875, 0.5741500854492188, 0.5960845947265625, 0.6180191040039062, 0.63995361328125, 0.6618881225585938, 0.6838226318359375, 0.7057571411132812, 0.727691650390625, 0.7496261596679688, 0.7715606689453125, 0.7934951782226562, 0.8154296875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 15.0, 18.0, 17.0, 53.0, 126.0, 219.0, 245.0, 163.0, 81.0, 27.0, 13.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.093017578125, -0.08992671966552734, -0.08683586120605469, -0.08374500274658203, -0.08065414428710938, -0.07756328582763672, -0.07447242736816406, -0.0713815689086914, -0.06829071044921875, -0.0651998519897461, -0.06210899353027344, -0.05901813507080078, -0.055927276611328125, -0.05283641815185547, -0.04974555969238281, -0.046654701232910156, -0.0435638427734375, -0.040472984313964844, -0.03738212585449219, -0.03429126739501953, -0.031200408935546875, -0.02810955047607422, -0.025018692016601562, -0.021927833557128906, -0.01883697509765625, -0.015746116638183594, -0.012655258178710938, -0.009564399719238281, -0.006473541259765625, -0.0033826828002929688, -0.0002918243408203125, 0.0027990341186523438, 0.005889892578125, 0.008980751037597656, 0.012071609497070312, 0.015162467956542969, 0.018253326416015625, 0.02134418487548828, 0.024435043334960938, 0.027525901794433594, 0.03061676025390625, 0.033707618713378906, 0.03679847717285156, 0.03988933563232422, 0.042980194091796875, 0.04607105255126953, 0.04916191101074219, 0.052252769470214844, 0.0553436279296875, 0.058434486389160156, 0.06152534484863281, 0.06461620330810547, 0.06770706176757812, 0.07079792022705078, 0.07388877868652344, 0.0769796371459961, 0.08007049560546875, 0.0831613540649414, 0.08625221252441406, 0.08934307098388672, 0.09243392944335938, 0.09552478790283203, 0.09861564636230469, 0.10170650482177734, 0.10479736328125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 7.0, 3.0, 4.0, 9.0, 16.0, 17.0, 22.0, 34.0, 56.0, 115.0, 222.0, 433.0, 929.0, 2340.0, 9778.0, 192169.0, 3960707.0, 21379.0, 3742.0, 1240.0, 532.0, 222.0, 136.0, 64.0, 33.0, 41.0, 7.0, 8.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48046875, -0.46506500244140625, -0.4496612548828125, -0.43425750732421875, -0.418853759765625, -0.40345001220703125, -0.3880462646484375, -0.37264251708984375, -0.35723876953125, -0.34183502197265625, -0.3264312744140625, -0.31102752685546875, -0.295623779296875, -0.28022003173828125, -0.2648162841796875, -0.24941253662109375, -0.2340087890625, -0.21860504150390625, -0.2032012939453125, -0.18779754638671875, -0.172393798828125, -0.15699005126953125, -0.1415863037109375, -0.12618255615234375, -0.11077880859375, -0.09537506103515625, -0.0799713134765625, -0.06456756591796875, -0.049163818359375, -0.03376007080078125, -0.0183563232421875, -0.00295257568359375, 0.012451171875, 0.02785491943359375, 0.0432586669921875, 0.05866241455078125, 0.074066162109375, 0.08946990966796875, 0.1048736572265625, 0.12027740478515625, 0.13568115234375, 0.15108489990234375, 0.1664886474609375, 0.18189239501953125, 0.197296142578125, 0.21269989013671875, 0.2281036376953125, 0.24350738525390625, 0.2589111328125, 0.27431488037109375, 0.2897186279296875, 0.30512237548828125, 0.320526123046875, 0.33592987060546875, 0.3513336181640625, 0.36673736572265625, 0.38214111328125, 0.39754486083984375, 0.4129486083984375, 0.42835235595703125, 0.443756103515625, 0.45915985107421875, 0.4745635986328125, 0.48996734619140625, 0.50537109375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 11.0, 13.0, 25.0, 51.0, 123.0, 719.0, 2718.0, 239.0, 72.0, 30.0, 19.0, 14.0, 9.0, 6.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1259765625, -0.12194061279296875, -0.1179046630859375, -0.11386871337890625, -0.109832763671875, -0.10579681396484375, -0.1017608642578125, -0.09772491455078125, -0.09368896484375, -0.08965301513671875, -0.0856170654296875, -0.08158111572265625, -0.077545166015625, -0.07350921630859375, -0.0694732666015625, -0.06543731689453125, -0.0614013671875, -0.05736541748046875, -0.0533294677734375, -0.04929351806640625, -0.045257568359375, -0.04122161865234375, -0.0371856689453125, -0.03314971923828125, -0.02911376953125, -0.02507781982421875, -0.0210418701171875, -0.01700592041015625, -0.012969970703125, -0.00893402099609375, -0.0048980712890625, -0.00086212158203125, 0.003173828125, 0.00720977783203125, 0.0112457275390625, 0.01528167724609375, 0.019317626953125, 0.02335357666015625, 0.0273895263671875, 0.03142547607421875, 0.03546142578125, 0.03949737548828125, 0.0435333251953125, 0.04756927490234375, 0.051605224609375, 0.05564117431640625, 0.0596771240234375, 0.06371307373046875, 0.0677490234375, 0.07178497314453125, 0.0758209228515625, 0.07985687255859375, 0.083892822265625, 0.08792877197265625, 0.0919647216796875, 0.09600067138671875, 0.10003662109375, 0.10407257080078125, 0.1081085205078125, 0.11214447021484375, 0.116180419921875, 0.12021636962890625, 0.1242523193359375, 0.12828826904296875, 0.13232421875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 19.0, 194.0, 723.0, 54.0, 13.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.944915771484375, -2.886420726776123, -2.82792592048645, -2.7694308757781982, -2.7109360694885254, -2.6524410247802734, -2.5939462184906006, -2.5354511737823486, -2.476956367492676, -2.418461322784424, -2.359966516494751, -2.301471471786499, -2.242976665496826, -2.184481620788574, -2.1259868144989014, -2.0674917697906494, -2.0089969635009766, -1.9505020380020142, -1.8920071125030518, -1.8335121870040894, -1.775017261505127, -1.7165223360061646, -1.6580274105072021, -1.5995323657989502, -1.5410373210906982, -1.4825423955917358, -1.4240474700927734, -1.365552544593811, -1.3070576190948486, -1.2485626935958862, -1.1900677680969238, -1.1315727233886719, -1.073077917098999, -1.0145829916000366, -0.9560880661010742, -0.8975931406021118, -0.8390982151031494, -0.780603289604187, -0.7221083045005798, -0.6636133790016174, -0.605118453502655, -0.5466235280036926, -0.4881286025047302, -0.42963364720344543, -0.37113872170448303, -0.31264379620552063, -0.25414884090423584, -0.19565391540527344, -0.13715898990631104, -0.07866405695676804, -0.020169124007225037, 0.03832581639289856, 0.09682074189186096, 0.15531566739082336, 0.21381062269210815, 0.27230554819107056, 0.33080047369003296, 0.38929539918899536, 0.44779032468795776, 0.5062853097915649, 0.5647802352905273, 0.6232751607894897, 0.6817700862884521, 0.7402650117874146, 0.798759937286377]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 6.0, 2.0, 10.0, 15.0, 12.0, 12.0, 19.0, 23.0, 26.0, 21.0, 36.0, 42.0, 41.0, 41.0, 38.0, 51.0, 54.0, 54.0, 48.0, 59.0, 58.0, 49.0, 31.0, 31.0, 45.0, 43.0, 15.0, 18.0, 19.0, 15.0, 16.0, 7.0, 12.0, 13.0, 8.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2920803427696228, -0.2838532328605652, -0.27562612295150757, -0.26739904284477234, -0.2591719329357147, -0.2509448230266571, -0.24271772801876068, -0.23449063301086426, -0.22626352310180664, -0.21803641319274902, -0.2098093181848526, -0.20158222317695618, -0.19335511326789856, -0.18512800335884094, -0.17690090835094452, -0.1686738133430481, -0.16044670343399048, -0.15221959352493286, -0.14399249851703644, -0.13576540350914001, -0.1275382936000824, -0.11931119114160538, -0.11108408868312836, -0.10285698622465134, -0.09462988376617432, -0.0864027813076973, -0.07817567884922028, -0.06994857639074326, -0.061721473932266235, -0.053494371473789215, -0.045267269015312195, -0.037040166556835175, -0.028813064098358154, -0.020585961639881134, -0.012358859181404114, -0.0041317567229270935, 0.004095345735549927, 0.012322448194026947, 0.020549550652503967, 0.028776653110980988, 0.03700375556945801, 0.04523085802793503, 0.05345796048641205, 0.06168506294488907, 0.06991216540336609, 0.07813926786184311, 0.08636637032032013, 0.09459347277879715, 0.10282057523727417, 0.11104767769575119, 0.11927478015422821, 0.12750187516212463, 0.13572898507118225, 0.14395609498023987, 0.1521831899881363, 0.16041028499603271, 0.16863739490509033, 0.17686450481414795, 0.18509159982204437, 0.1933186948299408, 0.2015458047389984, 0.20977291464805603, 0.21800000965595245, 0.22622710466384888, 0.2344542145729065]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 4.0, 7.0, 10.0, 19.0, 14.0, 27.0, 38.0, 44.0, 56.0, 90.0, 118.0, 157.0, 241.0, 380.0, 603.0, 990.0, 2230.0, 7859.0, 68327.0, 825119.0, 125418.0, 11039.0, 2683.0, 1185.0, 619.0, 378.0, 275.0, 176.0, 121.0, 92.0, 68.0, 49.0, 34.0, 24.0, 17.0, 14.0, 6.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2607421875, -0.25162506103515625, -0.2425079345703125, -0.23339080810546875, -0.224273681640625, -0.21515655517578125, -0.2060394287109375, -0.19692230224609375, -0.18780517578125, -0.17868804931640625, -0.1695709228515625, -0.16045379638671875, -0.151336669921875, -0.14221954345703125, -0.1331024169921875, -0.12398529052734375, -0.1148681640625, -0.10575103759765625, -0.0966339111328125, -0.08751678466796875, -0.078399658203125, -0.06928253173828125, -0.0601654052734375, -0.05104827880859375, -0.04193115234375, -0.03281402587890625, -0.0236968994140625, -0.01457977294921875, -0.005462646484375, 0.00365447998046875, 0.0127716064453125, 0.02188873291015625, 0.031005859375, 0.04012298583984375, 0.0492401123046875, 0.05835723876953125, 0.067474365234375, 0.07659149169921875, 0.0857086181640625, 0.09482574462890625, 0.10394287109375, 0.11305999755859375, 0.1221771240234375, 0.13129425048828125, 0.140411376953125, 0.14952850341796875, 0.1586456298828125, 0.16776275634765625, 0.1768798828125, 0.18599700927734375, 0.1951141357421875, 0.20423126220703125, 0.213348388671875, 0.22246551513671875, 0.2315826416015625, 0.24069976806640625, 0.24981689453125, 0.25893402099609375, 0.2680511474609375, 0.27716827392578125, 0.286285400390625, 0.29540252685546875, 0.3045196533203125, 0.31363677978515625, 0.32275390625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 6.0, 20.0, 9.0, 26.0, 68.0, 127.0, 222.0, 234.0, 144.0, 82.0, 36.0, 9.0, 9.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09796142578125, -0.09480094909667969, -0.09164047241210938, -0.08847999572753906, -0.08531951904296875, -0.08215904235839844, -0.07899856567382812, -0.07583808898925781, -0.0726776123046875, -0.06951713562011719, -0.06635665893554688, -0.06319618225097656, -0.06003570556640625, -0.05687522888183594, -0.053714752197265625, -0.05055427551269531, -0.047393798828125, -0.04423332214355469, -0.041072845458984375, -0.03791236877441406, -0.03475189208984375, -0.03159141540527344, -0.028430938720703125, -0.025270462036132812, -0.0221099853515625, -0.018949508666992188, -0.015789031982421875, -0.012628555297851562, -0.00946807861328125, -0.0063076019287109375, -0.003147125244140625, 1.33514404296875e-05, 0.003173828125, 0.0063343048095703125, 0.009494781494140625, 0.012655258178710938, 0.01581573486328125, 0.018976211547851562, 0.022136688232421875, 0.025297164916992188, 0.0284576416015625, 0.03161811828613281, 0.034778594970703125, 0.03793907165527344, 0.04109954833984375, 0.04426002502441406, 0.047420501708984375, 0.05058097839355469, 0.053741455078125, 0.05690193176269531, 0.060062408447265625, 0.06322288513183594, 0.06638336181640625, 0.06954383850097656, 0.07270431518554688, 0.07586479187011719, 0.0790252685546875, 0.08218574523925781, 0.08534622192382812, 0.08850669860839844, 0.09166717529296875, 0.09482765197753906, 0.09798812866210938, 0.10114860534667969, 0.10430908203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 3.0, 11.0, 12.0, 16.0, 27.0, 27.0, 39.0, 86.0, 124.0, 264.0, 489.0, 965.0, 2391.0, 7433.0, 43299.0, 760428.0, 209280.0, 16509.0, 4095.0, 1512.0, 694.0, 349.0, 191.0, 95.0, 81.0, 35.0, 32.0, 13.0, 11.0, 15.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35888671875, -0.34722137451171875, -0.3355560302734375, -0.32389068603515625, -0.312225341796875, -0.30055999755859375, -0.2888946533203125, -0.27722930908203125, -0.26556396484375, -0.25389862060546875, -0.2422332763671875, -0.23056793212890625, -0.218902587890625, -0.20723724365234375, -0.1955718994140625, -0.18390655517578125, -0.1722412109375, -0.16057586669921875, -0.1489105224609375, -0.13724517822265625, -0.125579833984375, -0.11391448974609375, -0.1022491455078125, -0.09058380126953125, -0.07891845703125, -0.06725311279296875, -0.0555877685546875, -0.04392242431640625, -0.032257080078125, -0.02059173583984375, -0.0089263916015625, 0.00273895263671875, 0.014404296875, 0.02606964111328125, 0.0377349853515625, 0.04940032958984375, 0.061065673828125, 0.07273101806640625, 0.0843963623046875, 0.09606170654296875, 0.10772705078125, 0.11939239501953125, 0.1310577392578125, 0.14272308349609375, 0.154388427734375, 0.16605377197265625, 0.1777191162109375, 0.18938446044921875, 0.2010498046875, 0.21271514892578125, 0.2243804931640625, 0.23604583740234375, 0.247711181640625, 0.25937652587890625, 0.2710418701171875, 0.28270721435546875, 0.29437255859375, 0.30603790283203125, 0.3177032470703125, 0.32936859130859375, 0.341033935546875, 0.35269927978515625, 0.3643646240234375, 0.37602996826171875, 0.3876953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 11.0, 12.0, 19.0, 18.0, 29.0, 32.0, 33.0, 52.0, 48.0, 54.0, 64.0, 62.0, 72.0, 65.0, 72.0, 52.0, 45.0, 42.0, 37.0, 32.0, 20.0, 27.0, 19.0, 21.0, 12.0, 8.0, 5.0, 12.0, 0.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.29052734375, -0.28219032287597656, -0.2738533020019531, -0.2655162811279297, -0.25717926025390625, -0.2488422393798828, -0.24050521850585938, -0.23216819763183594, -0.2238311767578125, -0.21549415588378906, -0.20715713500976562, -0.1988201141357422, -0.19048309326171875, -0.1821460723876953, -0.17380905151367188, -0.16547203063964844, -0.157135009765625, -0.14879798889160156, -0.14046096801757812, -0.1321239471435547, -0.12378692626953125, -0.11544990539550781, -0.10711288452148438, -0.09877586364746094, -0.0904388427734375, -0.08210182189941406, -0.07376480102539062, -0.06542778015136719, -0.05709075927734375, -0.04875373840332031, -0.040416717529296875, -0.03207969665527344, -0.02374267578125, -0.015405654907226562, -0.007068634033203125, 0.0012683868408203125, 0.00960540771484375, 0.017942428588867188, 0.026279449462890625, 0.03461647033691406, 0.0429534912109375, 0.05129051208496094, 0.059627532958984375, 0.06796455383300781, 0.07630157470703125, 0.08463859558105469, 0.09297561645507812, 0.10131263732910156, 0.109649658203125, 0.11798667907714844, 0.12632369995117188, 0.1346607208251953, 0.14299774169921875, 0.1513347625732422, 0.15967178344726562, 0.16800880432128906, 0.1763458251953125, 0.18468284606933594, 0.19301986694335938, 0.2013568878173828, 0.20969390869140625, 0.2180309295654297, 0.22636795043945312, 0.23470497131347656, 0.2430419921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 12.0, 12.0, 22.0, 26.0, 44.0, 61.0, 79.0, 112.0, 182.0, 236.0, 378.0, 696.0, 1607.0, 4612.0, 52068.0, 974863.0, 8616.0, 2466.0, 1010.0, 499.0, 272.0, 187.0, 126.0, 98.0, 66.0, 55.0, 40.0, 34.0, 15.0, 13.0, 8.0, 7.0, 4.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.394775390625, -0.38126373291015625, -0.3677520751953125, -0.35424041748046875, -0.340728759765625, -0.32721710205078125, -0.3137054443359375, -0.30019378662109375, -0.28668212890625, -0.27317047119140625, -0.2596588134765625, -0.24614715576171875, -0.232635498046875, -0.21912384033203125, -0.2056121826171875, -0.19210052490234375, -0.1785888671875, -0.16507720947265625, -0.1515655517578125, -0.13805389404296875, -0.124542236328125, -0.11103057861328125, -0.0975189208984375, -0.08400726318359375, -0.07049560546875, -0.05698394775390625, -0.0434722900390625, -0.02996063232421875, -0.016448974609375, -0.00293731689453125, 0.0105743408203125, 0.02408599853515625, 0.03759765625, 0.05110931396484375, 0.0646209716796875, 0.07813262939453125, 0.091644287109375, 0.10515594482421875, 0.1186676025390625, 0.13217926025390625, 0.14569091796875, 0.15920257568359375, 0.1727142333984375, 0.18622589111328125, 0.199737548828125, 0.21324920654296875, 0.2267608642578125, 0.24027252197265625, 0.2537841796875, 0.26729583740234375, 0.2808074951171875, 0.29431915283203125, 0.307830810546875, 0.32134246826171875, 0.3348541259765625, 0.34836578369140625, 0.36187744140625, 0.37538909912109375, 0.3889007568359375, 0.40241241455078125, 0.415924072265625, 0.42943572998046875, 0.4429473876953125, 0.45645904541015625, 0.469970703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 6.0, 9.0, 9.0, 6.0, 10.0, 15.0, 9.0, 20.0, 32.0, 33.0, 37.0, 37.0, 43.0, 69.0, 100.0, 92.0, 82.0, 54.0, 62.0, 57.0, 37.0, 32.0, 26.0, 24.0, 18.0, 18.0, 15.0, 8.0, 3.0, 9.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.125471115112305e-05, -8.846446871757507e-05, -8.56742262840271e-05, -8.288398385047913e-05, -8.009374141693115e-05, -7.730349898338318e-05, -7.45132565498352e-05, -7.172301411628723e-05, -6.893277168273926e-05, -6.614252924919128e-05, -6.335228681564331e-05, -6.056204438209534e-05, -5.777180194854736e-05, -5.498155951499939e-05, -5.2191317081451416e-05, -4.940107464790344e-05, -4.661083221435547e-05, -4.3820589780807495e-05, -4.103034734725952e-05, -3.824010491371155e-05, -3.5449862480163574e-05, -3.26596200466156e-05, -2.9869377613067627e-05, -2.7079135179519653e-05, -2.428889274597168e-05, -2.1498650312423706e-05, -1.8708407878875732e-05, -1.591816544532776e-05, -1.3127923011779785e-05, -1.0337680578231812e-05, -7.547438144683838e-06, -4.757195711135864e-06, -1.9669532775878906e-06, 8.23289155960083e-07, 3.6135315895080566e-06, 6.40377402305603e-06, 9.194016456604004e-06, 1.1984258890151978e-05, 1.4774501323699951e-05, 1.7564743757247925e-05, 2.03549861907959e-05, 2.3145228624343872e-05, 2.5935471057891846e-05, 2.872571349143982e-05, 3.151595592498779e-05, 3.4306198358535767e-05, 3.709644079208374e-05, 3.9886683225631714e-05, 4.267692565917969e-05, 4.546716809272766e-05, 4.8257410526275635e-05, 5.104765295982361e-05, 5.383789539337158e-05, 5.6628137826919556e-05, 5.941838026046753e-05, 6.22086226940155e-05, 6.499886512756348e-05, 6.778910756111145e-05, 7.057934999465942e-05, 7.33695924282074e-05, 7.615983486175537e-05, 7.895007729530334e-05, 8.174031972885132e-05, 8.453056216239929e-05, 8.732080459594727e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 6.0, 6.0, 11.0, 10.0, 13.0, 5.0, 23.0, 21.0, 23.0, 30.0, 48.0, 63.0, 111.0, 194.0, 322.0, 695.0, 1476.0, 3702.0, 12068.0, 178932.0, 817142.0, 24037.0, 5429.0, 2139.0, 890.0, 439.0, 247.0, 151.0, 79.0, 66.0, 42.0, 40.0, 27.0, 17.0, 9.0, 12.0, 5.0, 4.0, 8.0, 5.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1595458984375, -0.15367889404296875, -0.1478118896484375, -0.14194488525390625, -0.136077880859375, -0.13021087646484375, -0.1243438720703125, -0.11847686767578125, -0.11260986328125, -0.10674285888671875, -0.1008758544921875, -0.09500885009765625, -0.089141845703125, -0.08327484130859375, -0.0774078369140625, -0.07154083251953125, -0.065673828125, -0.05980682373046875, -0.0539398193359375, -0.04807281494140625, -0.042205810546875, -0.03633880615234375, -0.0304718017578125, -0.02460479736328125, -0.01873779296875, -0.01287078857421875, -0.0070037841796875, -0.00113677978515625, 0.004730224609375, 0.01059722900390625, 0.0164642333984375, 0.02233123779296875, 0.0281982421875, 0.03406524658203125, 0.0399322509765625, 0.04579925537109375, 0.051666259765625, 0.05753326416015625, 0.0634002685546875, 0.06926727294921875, 0.07513427734375, 0.08100128173828125, 0.0868682861328125, 0.09273529052734375, 0.098602294921875, 0.10446929931640625, 0.1103363037109375, 0.11620330810546875, 0.1220703125, 0.12793731689453125, 0.1338043212890625, 0.13967132568359375, 0.145538330078125, 0.15140533447265625, 0.1572723388671875, 0.16313934326171875, 0.16900634765625, 0.17487335205078125, 0.1807403564453125, 0.18660736083984375, 0.192474365234375, 0.19834136962890625, 0.2042083740234375, 0.21007537841796875, 0.2159423828125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 11.0, 27.0, 52.0, 161.0, 264.0, 230.0, 123.0, 55.0, 24.0, 10.0, 5.0, 2.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3115234375, -0.3033027648925781, -0.29508209228515625, -0.2868614196777344, -0.2786407470703125, -0.2704200744628906, -0.26219940185546875, -0.2539787292480469, -0.245758056640625, -0.23753738403320312, -0.22931671142578125, -0.22109603881835938, -0.2128753662109375, -0.20465469360351562, -0.19643402099609375, -0.18821334838867188, -0.17999267578125, -0.17177200317382812, -0.16355133056640625, -0.15533065795898438, -0.1471099853515625, -0.13888931274414062, -0.13066864013671875, -0.12244796752929688, -0.114227294921875, -0.10600662231445312, -0.09778594970703125, -0.08956527709960938, -0.0813446044921875, -0.07312393188476562, -0.06490325927734375, -0.056682586669921875, -0.0484619140625, -0.040241241455078125, -0.03202056884765625, -0.023799896240234375, -0.0155792236328125, -0.007358551025390625, 0.00086212158203125, 0.009082794189453125, 0.017303466796875, 0.025524139404296875, 0.03374481201171875, 0.041965484619140625, 0.0501861572265625, 0.058406829833984375, 0.06662750244140625, 0.07484817504882812, 0.08306884765625, 0.09128952026367188, 0.09951019287109375, 0.10773086547851562, 0.1159515380859375, 0.12417221069335938, 0.13239288330078125, 0.14061355590820312, 0.148834228515625, 0.15705490112304688, 0.16527557373046875, 0.17349624633789062, 0.1817169189453125, 0.18993759155273438, 0.19815826416015625, 0.20637893676757812, 0.214599609375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 8.0, 15.0, 40.0, 111.0, 333.0, 337.0, 108.0, 31.0, 7.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.772488594055176, -4.659119606018066, -4.545750617980957, -4.432381629943848, -4.319012641906738, -4.205643653869629, -4.0922746658325195, -3.97890567779541, -3.865536689758301, -3.7521677017211914, -3.638798713684082, -3.5254297256469727, -3.4120607376098633, -3.298691749572754, -3.1853227615356445, -3.071953773498535, -2.958585023880005, -2.8452160358428955, -2.731847047805786, -2.6184780597686768, -2.5051090717315674, -2.391740083694458, -2.2783713340759277, -2.1650023460388184, -2.051633358001709, -1.9382643699645996, -1.8248953819274902, -1.7115263938903809, -1.5981574058532715, -1.484788417816162, -1.3714195489883423, -1.258050560951233, -1.144681692123413, -1.0313127040863037, -0.9179437160491943, -0.8045747876167297, -0.6912057995796204, -0.577836811542511, -0.4644678831100464, -0.351098895072937, -0.23772990703582764, -0.12436093389987946, -0.010991960763931274, 0.10237699747085571, 0.2157459855079651, 0.32911497354507446, 0.44248390197753906, 0.5558528900146484, 0.6692218780517578, 0.7825908660888672, 0.8959598541259766, 1.009328842163086, 1.1226978302001953, 1.2360668182373047, 1.3494356870651245, 1.4628046751022339, 1.5761736631393433, 1.6895426511764526, 1.802911639213562, 1.9162805080413818, 2.029649496078491, 2.1430184841156006, 2.25638747215271, 2.3697564601898193, 2.4831254482269287]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 7.0, 6.0, 15.0, 18.0, 17.0, 19.0, 28.0, 25.0, 38.0, 36.0, 47.0, 47.0, 57.0, 70.0, 55.0, 52.0, 49.0, 51.0, 39.0, 53.0, 50.0, 47.0, 39.0, 22.0, 20.0, 15.0, 17.0, 11.0, 12.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5680876970291138, -1.5160160064697266, -1.4639441967010498, -1.411872386932373, -1.3598006963729858, -1.3077290058135986, -1.2556571960449219, -1.2035853862762451, -1.151513695716858, -1.0994420051574707, -1.047370195388794, -0.995298445224762, -0.94322669506073, -0.891154944896698, -0.839083194732666, -0.787011444568634, -0.734939694404602, -0.6828679442405701, -0.6307961940765381, -0.5787244439125061, -0.5266526937484741, -0.47458094358444214, -0.42250919342041016, -0.3704374432563782, -0.3183656930923462, -0.2662939429283142, -0.21422219276428223, -0.16215044260025024, -0.11007869243621826, -0.05800694227218628, -0.005935192108154297, 0.046136558055877686, 0.09820842742919922, 0.1502801775932312, 0.20235192775726318, 0.25442367792129517, 0.30649542808532715, 0.35856717824935913, 0.4106389284133911, 0.4627106785774231, 0.5147824287414551, 0.5668541789054871, 0.618925929069519, 0.670997679233551, 0.723069429397583, 0.775141179561615, 0.827212929725647, 0.879284679889679, 0.9313564300537109, 0.9834281802177429, 1.035499930381775, 1.087571620941162, 1.1396434307098389, 1.1917152404785156, 1.2437869310379028, 1.29585862159729, 1.3479304313659668, 1.4000022411346436, 1.4520739316940308, 1.504145622253418, 1.5562174320220947, 1.6082892417907715, 1.6603609323501587, 1.712432622909546, 1.7645044326782227]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 21.0, 23.0, 54.0, 102.0, 258.0, 848.0, 6127.0, 4109695.0, 74126.0, 2219.0, 479.0, 154.0, 60.0, 49.0, 28.0, 7.0, 19.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7734375, -0.7498550415039062, -0.7262725830078125, -0.7026901245117188, -0.679107666015625, -0.6555252075195312, -0.6319427490234375, -0.6083602905273438, -0.58477783203125, -0.5611953735351562, -0.5376129150390625, -0.5140304565429688, -0.490447998046875, -0.46686553955078125, -0.4432830810546875, -0.41970062255859375, -0.3961181640625, -0.37253570556640625, -0.3489532470703125, -0.32537078857421875, -0.301788330078125, -0.27820587158203125, -0.2546234130859375, -0.23104095458984375, -0.20745849609375, -0.18387603759765625, -0.1602935791015625, -0.13671112060546875, -0.113128662109375, -0.08954620361328125, -0.0659637451171875, -0.04238128662109375, -0.018798828125, 0.00478363037109375, 0.0283660888671875, 0.05194854736328125, 0.075531005859375, 0.09911346435546875, 0.1226959228515625, 0.14627838134765625, 0.16986083984375, 0.19344329833984375, 0.2170257568359375, 0.24060821533203125, 0.264190673828125, 0.28777313232421875, 0.3113555908203125, 0.33493804931640625, 0.3585205078125, 0.38210296630859375, 0.4056854248046875, 0.42926788330078125, 0.452850341796875, 0.47643280029296875, 0.5000152587890625, 0.5235977172851562, 0.54718017578125, 0.5707626342773438, 0.5943450927734375, 0.6179275512695312, 0.641510009765625, 0.6650924682617188, 0.6886749267578125, 0.7122573852539062, 0.73583984375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 10.0, 9.0, 26.0, 43.0, 79.0, 129.0, 216.0, 181.0, 150.0, 73.0, 38.0, 21.0, 8.0, 9.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09442138671875, -0.09136486053466797, -0.08830833435058594, -0.0852518081665039, -0.08219528198242188, -0.07913875579833984, -0.07608222961425781, -0.07302570343017578, -0.06996917724609375, -0.06691265106201172, -0.06385612487792969, -0.060799598693847656, -0.057743072509765625, -0.054686546325683594, -0.05163002014160156, -0.04857349395751953, -0.0455169677734375, -0.04246044158935547, -0.03940391540527344, -0.036347389221191406, -0.033290863037109375, -0.030234336853027344, -0.027177810668945312, -0.02412128448486328, -0.02106475830078125, -0.01800823211669922, -0.014951705932617188, -0.011895179748535156, -0.008838653564453125, -0.005782127380371094, -0.0027256011962890625, 0.00033092498779296875, 0.003387451171875, 0.006443977355957031, 0.009500503540039062, 0.012557029724121094, 0.015613555908203125, 0.018670082092285156, 0.021726608276367188, 0.02478313446044922, 0.02783966064453125, 0.03089618682861328, 0.03395271301269531, 0.037009239196777344, 0.040065765380859375, 0.043122291564941406, 0.04617881774902344, 0.04923534393310547, 0.0522918701171875, 0.05534839630126953, 0.05840492248535156, 0.061461448669433594, 0.06451797485351562, 0.06757450103759766, 0.07063102722167969, 0.07368755340576172, 0.07674407958984375, 0.07980060577392578, 0.08285713195800781, 0.08591365814208984, 0.08897018432617188, 0.0920267105102539, 0.09508323669433594, 0.09813976287841797, 0.1011962890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 11.0, 13.0, 23.0, 29.0, 60.0, 89.0, 177.0, 414.0, 1100.0, 4916.0, 153116.0, 4023207.0, 8529.0, 1680.0, 486.0, 221.0, 81.0, 57.0, 37.0, 14.0, 7.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.970703125, -0.9465179443359375, -0.922332763671875, -0.8981475830078125, -0.87396240234375, -0.8497772216796875, -0.825592041015625, -0.8014068603515625, -0.7772216796875, -0.7530364990234375, -0.728851318359375, -0.7046661376953125, -0.68048095703125, -0.6562957763671875, -0.632110595703125, -0.6079254150390625, -0.583740234375, -0.5595550537109375, -0.535369873046875, -0.5111846923828125, -0.48699951171875, -0.4628143310546875, -0.438629150390625, -0.4144439697265625, -0.3902587890625, -0.3660736083984375, -0.341888427734375, -0.3177032470703125, -0.29351806640625, -0.2693328857421875, -0.245147705078125, -0.2209625244140625, -0.19677734375, -0.1725921630859375, -0.148406982421875, -0.1242218017578125, -0.10003662109375, -0.0758514404296875, -0.051666259765625, -0.0274810791015625, -0.0032958984375, 0.0208892822265625, 0.045074462890625, 0.0692596435546875, 0.09344482421875, 0.1176300048828125, 0.141815185546875, 0.1660003662109375, 0.190185546875, 0.2143707275390625, 0.238555908203125, 0.2627410888671875, 0.28692626953125, 0.3111114501953125, 0.335296630859375, 0.3594818115234375, 0.3836669921875, 0.4078521728515625, 0.432037353515625, 0.4562225341796875, 0.48040771484375, 0.5045928955078125, 0.528778076171875, 0.5529632568359375, 0.5771484375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 16.0, 29.0, 69.0, 288.0, 3327.0, 245.0, 46.0, 17.0, 12.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2158203125, -0.21020889282226562, -0.20459747314453125, -0.19898605346679688, -0.1933746337890625, -0.18776321411132812, -0.18215179443359375, -0.17654037475585938, -0.170928955078125, -0.16531753540039062, -0.15970611572265625, -0.15409469604492188, -0.1484832763671875, -0.14287185668945312, -0.13726043701171875, -0.13164901733398438, -0.12603759765625, -0.12042617797851562, -0.11481475830078125, -0.10920333862304688, -0.1035919189453125, -0.09798049926757812, -0.09236907958984375, -0.08675765991210938, -0.081146240234375, -0.07553482055664062, -0.06992340087890625, -0.06431198120117188, -0.0587005615234375, -0.053089141845703125, -0.04747772216796875, -0.041866302490234375, -0.0362548828125, -0.030643463134765625, -0.02503204345703125, -0.019420623779296875, -0.0138092041015625, -0.008197784423828125, -0.00258636474609375, 0.003025054931640625, 0.008636474609375, 0.014247894287109375, 0.01985931396484375, 0.025470733642578125, 0.0310821533203125, 0.036693572998046875, 0.04230499267578125, 0.047916412353515625, 0.05352783203125, 0.059139251708984375, 0.06475067138671875, 0.07036209106445312, 0.0759735107421875, 0.08158493041992188, 0.08719635009765625, 0.09280776977539062, 0.098419189453125, 0.10403060913085938, 0.10964202880859375, 0.11525344848632812, 0.1208648681640625, 0.12647628784179688, 0.13208770751953125, 0.13769912719726562, 0.143310546875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 10.0, 59.0, 351.0, 524.0, 56.0, 10.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.796971321105957, -1.7426871061325073, -1.6884030103683472, -1.6341187953948975, -1.5798345804214478, -1.5255504846572876, -1.471266269683838, -1.4169821739196777, -1.362697958946228, -1.3084137439727783, -1.2541296482086182, -1.1998454332351685, -1.1455612182617188, -1.0912771224975586, -1.0369929075241089, -0.982708752155304, -0.9284245371818542, -0.8741403818130493, -0.8198561668395996, -0.7655720114707947, -0.7112878561019897, -0.65700364112854, -0.6027194857597351, -0.5484353303909302, -0.49415114521980286, -0.43986696004867554, -0.3855828046798706, -0.3312986195087433, -0.27701443433761597, -0.22273027896881104, -0.16844609379768372, -0.11416193842887878, -0.059877753257751465, -0.005593579262495041, 0.04869059473276138, 0.1029747724533081, 0.15725894272327423, 0.21154311299324036, 0.2658272981643677, 0.3201114535331726, 0.3743956387042999, 0.42867982387542725, 0.4829639792442322, 0.5372481346130371, 0.5915323495864868, 0.6458165049552917, 0.7001006603240967, 0.7543848752975464, 0.8086690306663513, 0.8629531860351562, 0.917237401008606, 0.9715215563774109, 1.0258057117462158, 1.0800899267196655, 1.1343741416931152, 1.1886582374572754, 1.242942452430725, 1.2972266674041748, 1.351510763168335, 1.4057949781417847, 1.4600791931152344, 1.5143632888793945, 1.5686475038528442, 1.622931718826294, 1.677215814590454]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 10.0, 9.0, 10.0, 11.0, 14.0, 18.0, 31.0, 30.0, 32.0, 39.0, 36.0, 50.0, 52.0, 65.0, 61.0, 60.0, 59.0, 63.0, 53.0, 56.0, 31.0, 41.0, 34.0, 38.0, 16.0, 17.0, 17.0, 7.0, 5.0, 5.0, 9.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3317965865135193, -0.32152053713798523, -0.31124448776245117, -0.3009684383869171, -0.29069238901138306, -0.2804163098335266, -0.27014029026031494, -0.2598642110824585, -0.24958816170692444, -0.23931211233139038, -0.22903606295585632, -0.21876001358032227, -0.20848394930362701, -0.19820789992809296, -0.1879318505525589, -0.17765578627586365, -0.16737975180149078, -0.15710370242595673, -0.14682765305042267, -0.13655158877372742, -0.12627553939819336, -0.1159994900226593, -0.10572344064712524, -0.09544738382101059, -0.08517133444547653, -0.07489528506994247, -0.06461922824382782, -0.05434317886829376, -0.044067125767469406, -0.03379107266664505, -0.023515023291110992, -0.013238966464996338, -0.0029629170894622803, 0.007313135080039501, 0.017589187249541283, 0.02786523848772049, 0.038141291588544846, 0.0484173446893692, 0.05869339406490326, 0.06896945089101791, 0.07924550026655197, 0.08952154964208603, 0.09979760646820068, 0.11007365584373474, 0.1203497052192688, 0.13062575459480286, 0.14090180397033691, 0.15117786824703217, 0.16145391762256622, 0.17172996699810028, 0.18200601637363434, 0.1922820806503296, 0.20255813002586365, 0.2128341794013977, 0.22311022877693176, 0.23338627815246582, 0.24366232752799988, 0.25393837690353394, 0.264214426279068, 0.27449047565460205, 0.2847665250301361, 0.29504257440567017, 0.3053186535835266, 0.31559470295906067, 0.3258707523345947]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 5.0, 8.0, 9.0, 10.0, 16.0, 17.0, 31.0, 50.0, 73.0, 123.0, 187.0, 303.0, 569.0, 1118.0, 2759.0, 10632.0, 96672.0, 835743.0, 85329.0, 9657.0, 2754.0, 1090.0, 538.0, 325.0, 154.0, 118.0, 75.0, 55.0, 33.0, 27.0, 20.0, 17.0, 8.0, 3.0, 6.0, 1.0, 6.0, 9.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.255126953125, -0.24511337280273438, -0.23509979248046875, -0.22508621215820312, -0.2150726318359375, -0.20505905151367188, -0.19504547119140625, -0.18503189086914062, -0.175018310546875, -0.16500473022460938, -0.15499114990234375, -0.14497756958007812, -0.1349639892578125, -0.12495040893554688, -0.11493682861328125, -0.10492324829101562, -0.09490966796875, -0.08489608764648438, -0.07488250732421875, -0.06486892700195312, -0.0548553466796875, -0.044841766357421875, -0.03482818603515625, -0.024814605712890625, -0.014801025390625, -0.004787445068359375, 0.00522613525390625, 0.015239715576171875, 0.0252532958984375, 0.035266876220703125, 0.04528045654296875, 0.055294036865234375, 0.0653076171875, 0.07532119750976562, 0.08533477783203125, 0.09534835815429688, 0.1053619384765625, 0.11537551879882812, 0.12538909912109375, 0.13540267944335938, 0.145416259765625, 0.15542984008789062, 0.16544342041015625, 0.17545700073242188, 0.1854705810546875, 0.19548416137695312, 0.20549774169921875, 0.21551132202148438, 0.22552490234375, 0.23553848266601562, 0.24555206298828125, 0.2555656433105469, 0.2655792236328125, 0.2755928039550781, 0.28560638427734375, 0.2956199645996094, 0.305633544921875, 0.3156471252441406, 0.32566070556640625, 0.3356742858886719, 0.3456878662109375, 0.3557014465332031, 0.36571502685546875, 0.3757286071777344, 0.3857421875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 10.0, 6.0, 9.0, 22.0, 30.0, 54.0, 90.0, 171.0, 192.0, 160.0, 131.0, 49.0, 40.0, 18.0, 9.0, 8.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0921630859375, -0.08923912048339844, -0.08631515502929688, -0.08339118957519531, -0.08046722412109375, -0.07754325866699219, -0.07461929321289062, -0.07169532775878906, -0.0687713623046875, -0.06584739685058594, -0.06292343139648438, -0.05999946594238281, -0.05707550048828125, -0.05415153503417969, -0.051227569580078125, -0.04830360412597656, -0.045379638671875, -0.04245567321777344, -0.039531707763671875, -0.03660774230957031, -0.03368377685546875, -0.030759811401367188, -0.027835845947265625, -0.024911880493164062, -0.0219879150390625, -0.019063949584960938, -0.016139984130859375, -0.013216018676757812, -0.01029205322265625, -0.0073680877685546875, -0.004444122314453125, -0.0015201568603515625, 0.00140380859375, 0.0043277740478515625, 0.007251739501953125, 0.010175704956054688, 0.01309967041015625, 0.016023635864257812, 0.018947601318359375, 0.021871566772460938, 0.0247955322265625, 0.027719497680664062, 0.030643463134765625, 0.03356742858886719, 0.03649139404296875, 0.03941535949707031, 0.042339324951171875, 0.04526329040527344, 0.048187255859375, 0.05111122131347656, 0.054035186767578125, 0.05695915222167969, 0.05988311767578125, 0.06280708312988281, 0.06573104858398438, 0.06865501403808594, 0.0715789794921875, 0.07450294494628906, 0.07742691040039062, 0.08035087585449219, 0.08327484130859375, 0.08619880676269531, 0.08912277221679688, 0.09204673767089844, 0.094970703125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 7.0, 8.0, 16.0, 10.0, 28.0, 19.0, 35.0, 44.0, 61.0, 92.0, 130.0, 199.0, 271.0, 424.0, 753.0, 1477.0, 3296.0, 8694.0, 30525.0, 176676.0, 656045.0, 131086.0, 24951.0, 7484.0, 2881.0, 1344.0, 698.0, 396.0, 286.0, 200.0, 120.0, 84.0, 50.0, 38.0, 26.0, 22.0, 12.0, 11.0, 10.0, 10.0, 7.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.204345703125, -0.1978435516357422, -0.19134140014648438, -0.18483924865722656, -0.17833709716796875, -0.17183494567871094, -0.16533279418945312, -0.1588306427001953, -0.1523284912109375, -0.1458263397216797, -0.13932418823242188, -0.13282203674316406, -0.12631988525390625, -0.11981773376464844, -0.11331558227539062, -0.10681343078613281, -0.100311279296875, -0.09380912780761719, -0.08730697631835938, -0.08080482482910156, -0.07430267333984375, -0.06780052185058594, -0.061298370361328125, -0.05479621887207031, -0.0482940673828125, -0.04179191589355469, -0.035289764404296875, -0.028787612915039062, -0.02228546142578125, -0.015783309936523438, -0.009281158447265625, -0.0027790069580078125, 0.00372314453125, 0.010225296020507812, 0.016727447509765625, 0.023229598999023438, 0.02973175048828125, 0.03623390197753906, 0.042736053466796875, 0.04923820495605469, 0.0557403564453125, 0.06224250793457031, 0.06874465942382812, 0.07524681091308594, 0.08174896240234375, 0.08825111389160156, 0.09475326538085938, 0.10125541687011719, 0.107757568359375, 0.11425971984863281, 0.12076187133789062, 0.12726402282714844, 0.13376617431640625, 0.14026832580566406, 0.14677047729492188, 0.1532726287841797, 0.1597747802734375, 0.1662769317626953, 0.17277908325195312, 0.17928123474121094, 0.18578338623046875, 0.19228553771972656, 0.19878768920898438, 0.2052898406982422, 0.2117919921875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 6.0, 5.0, 7.0, 16.0, 11.0, 16.0, 17.0, 14.0, 17.0, 22.0, 38.0, 24.0, 18.0, 41.0, 24.0, 38.0, 39.0, 39.0, 39.0, 31.0, 42.0, 44.0, 42.0, 42.0, 43.0, 30.0, 34.0, 41.0, 22.0, 31.0, 22.0, 24.0, 20.0, 11.0, 22.0, 14.0, 9.0, 9.0, 8.0, 6.0, 2.0, 4.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.177490234375, -0.17191123962402344, -0.16633224487304688, -0.1607532501220703, -0.15517425537109375, -0.1495952606201172, -0.14401626586914062, -0.13843727111816406, -0.1328582763671875, -0.12727928161621094, -0.12170028686523438, -0.11612129211425781, -0.11054229736328125, -0.10496330261230469, -0.09938430786132812, -0.09380531311035156, -0.088226318359375, -0.08264732360839844, -0.07706832885742188, -0.07148933410644531, -0.06591033935546875, -0.06033134460449219, -0.054752349853515625, -0.04917335510253906, -0.0435943603515625, -0.03801536560058594, -0.032436370849609375, -0.026857376098632812, -0.02127838134765625, -0.015699386596679688, -0.010120391845703125, -0.0045413970947265625, 0.00103759765625, 0.0066165924072265625, 0.012195587158203125, 0.017774581909179688, 0.02335357666015625, 0.028932571411132812, 0.034511566162109375, 0.04009056091308594, 0.0456695556640625, 0.05124855041503906, 0.056827545166015625, 0.06240653991699219, 0.06798553466796875, 0.07356452941894531, 0.07914352416992188, 0.08472251892089844, 0.090301513671875, 0.09588050842285156, 0.10145950317382812, 0.10703849792480469, 0.11261749267578125, 0.11819648742675781, 0.12377548217773438, 0.12935447692871094, 0.1349334716796875, 0.14051246643066406, 0.14609146118164062, 0.1516704559326172, 0.15724945068359375, 0.1628284454345703, 0.16840744018554688, 0.17398643493652344, 0.1795654296875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 10.0, 11.0, 10.0, 10.0, 31.0, 37.0, 58.0, 86.0, 139.0, 261.0, 537.0, 1189.0, 3098.0, 11869.0, 108733.0, 830764.0, 77292.0, 9568.0, 2643.0, 1074.0, 445.0, 256.0, 140.0, 96.0, 62.0, 41.0, 26.0, 17.0, 9.0, 11.0, 4.0, 11.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11126708984375, -0.10748767852783203, -0.10370826721191406, -0.0999288558959961, -0.09614944458007812, -0.09237003326416016, -0.08859062194824219, -0.08481121063232422, -0.08103179931640625, -0.07725238800048828, -0.07347297668457031, -0.06969356536865234, -0.06591415405273438, -0.062134742736816406, -0.05835533142089844, -0.05457592010498047, -0.0507965087890625, -0.04701709747314453, -0.04323768615722656, -0.039458274841308594, -0.035678863525390625, -0.031899452209472656, -0.028120040893554688, -0.02434062957763672, -0.02056121826171875, -0.01678180694580078, -0.013002395629882812, -0.009222984313964844, -0.005443572998046875, -0.0016641616821289062, 0.0021152496337890625, 0.005894660949707031, 0.009674072265625, 0.013453483581542969, 0.017232894897460938, 0.021012306213378906, 0.024791717529296875, 0.028571128845214844, 0.03235054016113281, 0.03612995147705078, 0.03990936279296875, 0.04368877410888672, 0.04746818542480469, 0.051247596740722656, 0.055027008056640625, 0.058806419372558594, 0.06258583068847656, 0.06636524200439453, 0.0701446533203125, 0.07392406463623047, 0.07770347595214844, 0.0814828872680664, 0.08526229858398438, 0.08904170989990234, 0.09282112121582031, 0.09660053253173828, 0.10037994384765625, 0.10415935516357422, 0.10793876647949219, 0.11171817779541016, 0.11549758911132812, 0.1192770004272461, 0.12305641174316406, 0.12683582305908203, 0.130615234375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 13.0, 10.0, 8.0, 15.0, 18.0, 19.0, 32.0, 34.0, 52.0, 53.0, 69.0, 97.0, 124.0, 95.0, 78.0, 46.0, 33.0, 29.0, 28.0, 25.0, 20.0, 18.0, 5.0, 11.0, 7.0, 5.0, 10.0, 4.0, 8.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.82012939453125e-05, -7.562246173620224e-05, -7.304362952709198e-05, -7.046479731798172e-05, -6.788596510887146e-05, -6.53071328997612e-05, -6.272830069065094e-05, -6.014946848154068e-05, -5.757063627243042e-05, -5.499180406332016e-05, -5.24129718542099e-05, -4.983413964509964e-05, -4.725530743598938e-05, -4.467647522687912e-05, -4.209764301776886e-05, -3.95188108086586e-05, -3.693997859954834e-05, -3.436114639043808e-05, -3.178231418132782e-05, -2.920348197221756e-05, -2.66246497631073e-05, -2.404581755399704e-05, -2.146698534488678e-05, -1.888815313577652e-05, -1.630932092666626e-05, -1.3730488717556e-05, -1.115165650844574e-05, -8.57282429933548e-06, -5.99399209022522e-06, -3.4151598811149597e-06, -8.363276720046997e-07, 1.7425045371055603e-06, 4.32133674621582e-06, 6.90016895532608e-06, 9.47900116443634e-06, 1.20578333735466e-05, 1.463666558265686e-05, 1.721549779176712e-05, 1.979433000087738e-05, 2.237316220998764e-05, 2.49519944190979e-05, 2.753082662820816e-05, 3.010965883731842e-05, 3.268849104642868e-05, 3.526732325553894e-05, 3.78461554646492e-05, 4.042498767375946e-05, 4.300381988286972e-05, 4.558265209197998e-05, 4.816148430109024e-05, 5.07403165102005e-05, 5.331914871931076e-05, 5.589798092842102e-05, 5.847681313753128e-05, 6.105564534664154e-05, 6.36344775557518e-05, 6.621330976486206e-05, 6.879214197397232e-05, 7.137097418308258e-05, 7.394980639219284e-05, 7.65286386013031e-05, 7.910747081041336e-05, 8.168630301952362e-05, 8.426513522863388e-05, 8.684396743774414e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 7.0, 11.0, 17.0, 9.0, 19.0, 22.0, 37.0, 40.0, 75.0, 114.0, 133.0, 220.0, 356.0, 590.0, 1177.0, 2397.0, 5347.0, 16255.0, 84129.0, 701185.0, 195141.0, 26965.0, 7887.0, 3018.0, 1385.0, 766.0, 414.0, 236.0, 170.0, 114.0, 79.0, 61.0, 44.0, 30.0, 23.0, 20.0, 16.0, 4.0, 7.0, 9.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.091552734375, -0.08856868743896484, -0.08558464050292969, -0.08260059356689453, -0.07961654663085938, -0.07663249969482422, -0.07364845275878906, -0.0706644058227539, -0.06768035888671875, -0.0646963119506836, -0.06171226501464844, -0.05872821807861328, -0.055744171142578125, -0.05276012420654297, -0.04977607727050781, -0.046792030334472656, -0.0438079833984375, -0.040823936462402344, -0.03783988952636719, -0.03485584259033203, -0.031871795654296875, -0.02888774871826172, -0.025903701782226562, -0.022919654846191406, -0.01993560791015625, -0.016951560974121094, -0.013967514038085938, -0.010983467102050781, -0.007999420166015625, -0.005015373229980469, -0.0020313262939453125, 0.0009527206420898438, 0.003936767578125, 0.006920814514160156, 0.009904861450195312, 0.012888908386230469, 0.015872955322265625, 0.01885700225830078, 0.021841049194335938, 0.024825096130371094, 0.02780914306640625, 0.030793190002441406, 0.03377723693847656, 0.03676128387451172, 0.039745330810546875, 0.04272937774658203, 0.04571342468261719, 0.048697471618652344, 0.0516815185546875, 0.054665565490722656, 0.05764961242675781, 0.06063365936279297, 0.06361770629882812, 0.06660175323486328, 0.06958580017089844, 0.0725698471069336, 0.07555389404296875, 0.0785379409790039, 0.08152198791503906, 0.08450603485107422, 0.08749008178710938, 0.09047412872314453, 0.09345817565917969, 0.09644222259521484, 0.09942626953125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 0.0, 4.0, 1.0, 4.0, 4.0, 7.0, 3.0, 4.0, 9.0, 11.0, 13.0, 20.0, 24.0, 49.0, 75.0, 115.0, 158.0, 174.0, 107.0, 71.0, 52.0, 27.0, 19.0, 10.0, 12.0, 5.0, 6.0, 8.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.172607421875, -0.16793251037597656, -0.16325759887695312, -0.1585826873779297, -0.15390777587890625, -0.1492328643798828, -0.14455795288085938, -0.13988304138183594, -0.1352081298828125, -0.13053321838378906, -0.12585830688476562, -0.12118339538574219, -0.11650848388671875, -0.11183357238769531, -0.10715866088867188, -0.10248374938964844, -0.097808837890625, -0.09313392639160156, -0.08845901489257812, -0.08378410339355469, -0.07910919189453125, -0.07443428039550781, -0.06975936889648438, -0.06508445739746094, -0.0604095458984375, -0.05573463439941406, -0.051059722900390625, -0.04638481140136719, -0.04170989990234375, -0.03703498840332031, -0.032360076904296875, -0.027685165405273438, -0.02301025390625, -0.018335342407226562, -0.013660430908203125, -0.008985519409179688, -0.00431060791015625, 0.0003643035888671875, 0.005039215087890625, 0.009714126586914062, 0.0143890380859375, 0.019063949584960938, 0.023738861083984375, 0.028413772583007812, 0.03308868408203125, 0.03776359558105469, 0.042438507080078125, 0.04711341857910156, 0.051788330078125, 0.05646324157714844, 0.061138153076171875, 0.06581306457519531, 0.07048797607421875, 0.07516288757324219, 0.07983779907226562, 0.08451271057128906, 0.0891876220703125, 0.09386253356933594, 0.09853744506835938, 0.10321235656738281, 0.10788726806640625, 0.11256217956542969, 0.11723709106445312, 0.12191200256347656, 0.1265869140625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 22.0, 73.0, 365.0, 428.0, 86.0, 18.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.296441078186035, -4.186485767364502, -4.076530456542969, -3.9665749073028564, -3.8566195964813232, -3.74666428565979, -3.6367087364196777, -3.5267534255981445, -3.4167981147766113, -3.306842803955078, -3.196887493133545, -3.0869319438934326, -2.9769766330718994, -2.867021322250366, -2.757065773010254, -2.6471104621887207, -2.5371551513671875, -2.4271998405456543, -2.317244529724121, -2.207288980484009, -2.0973336696624756, -1.9873783588409424, -1.8774229288101196, -1.7674674987792969, -1.6575121879577637, -1.5475568771362305, -1.4376014471054077, -1.327646017074585, -1.2176907062530518, -1.1077353954315186, -0.9977799654006958, -0.8878245949745178, -0.7778692245483398, -0.6679138541221619, -0.5579584836959839, -0.4480031132698059, -0.33804774284362793, -0.22809237241744995, -0.11813700199127197, -0.008181631565093994, 0.10177373886108398, 0.21172910928726196, 0.32168447971343994, 0.4316398501396179, 0.5415952205657959, 0.6515505909919739, 0.7615059614181519, 0.8714613318443298, 0.9814167022705078, 1.091372013092041, 1.2013274431228638, 1.3112828731536865, 1.4212381839752197, 1.531193494796753, 1.6411489248275757, 1.7511043548583984, 1.8610596656799316, 1.9710149765014648, 2.080970287322998, 2.1909258365631104, 2.3008811473846436, 2.4108364582061768, 2.520792007446289, 2.6307473182678223, 2.7407026290893555]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 6.0, 10.0, 19.0, 7.0, 24.0, 27.0, 34.0, 36.0, 23.0, 65.0, 51.0, 39.0, 60.0, 55.0, 65.0, 70.0, 50.0, 48.0, 50.0, 38.0, 39.0, 35.0, 37.0, 19.0, 14.0, 17.0, 17.0, 10.0, 12.0, 10.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.976169228553772, -0.932508111000061, -0.8888469934463501, -0.8451858758926392, -0.8015247583389282, -0.7578636407852173, -0.7142025828361511, -0.6705414652824402, -0.6268803477287292, -0.5832192301750183, -0.5395581126213074, -0.4958970248699188, -0.4522359073162079, -0.40857478976249695, -0.3649137020111084, -0.32125258445739746, -0.2775914669036865, -0.23393034934997559, -0.19026924669742584, -0.1466081440448761, -0.10294702649116516, -0.059285908937454224, -0.015624821186065674, 0.028036296367645264, 0.0716974139213562, 0.11535852402448654, 0.15901963412761688, 0.20268073678016663, 0.24634185433387756, 0.2900029718875885, 0.33366405963897705, 0.377325177192688, 0.4209862947463989, 0.46464741230010986, 0.5083085298538208, 0.5519696474075317, 0.5956307649612427, 0.6392918825149536, 0.6829529404640198, 0.7266140580177307, 0.7702751755714417, 0.8139362931251526, 0.8575974106788635, 0.9012584686279297, 0.9449195861816406, 0.9885807037353516, 1.0322418212890625, 1.0759029388427734, 1.1195640563964844, 1.1632251739501953, 1.2068862915039062, 1.2505474090576172, 1.2942085266113281, 1.337869644165039, 1.38153076171875, 1.425191879272461, 1.4688529968261719, 1.5125141143798828, 1.5561752319335938, 1.5998363494873047, 1.6434974670410156, 1.6871585845947266, 1.7308197021484375, 1.7744808197021484, 1.8181418180465698]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 5.0, 4.0, 3.0, 12.0, 13.0, 12.0, 23.0, 34.0, 59.0, 87.0, 134.0, 282.0, 526.0, 1290.0, 4424.0, 26498.0, 3661290.0, 477847.0, 16311.0, 3333.0, 1082.0, 446.0, 209.0, 122.0, 83.0, 48.0, 27.0, 26.0, 13.0, 11.0, 11.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.399658203125, -0.3885231018066406, -0.37738800048828125, -0.3662528991699219, -0.3551177978515625, -0.3439826965332031, -0.33284759521484375, -0.3217124938964844, -0.310577392578125, -0.2994422912597656, -0.28830718994140625, -0.2771720886230469, -0.2660369873046875, -0.2549018859863281, -0.24376678466796875, -0.23263168334960938, -0.22149658203125, -0.21036148071289062, -0.19922637939453125, -0.18809127807617188, -0.1769561767578125, -0.16582107543945312, -0.15468597412109375, -0.14355087280273438, -0.132415771484375, -0.12128067016601562, -0.11014556884765625, -0.09901046752929688, -0.0878753662109375, -0.07674026489257812, -0.06560516357421875, -0.054470062255859375, -0.0433349609375, -0.032199859619140625, -0.02106475830078125, -0.009929656982421875, 0.0012054443359375, 0.012340545654296875, 0.02347564697265625, 0.034610748291015625, 0.045745849609375, 0.056880950927734375, 0.06801605224609375, 0.07915115356445312, 0.0902862548828125, 0.10142135620117188, 0.11255645751953125, 0.12369155883789062, 0.13482666015625, 0.14596176147460938, 0.15709686279296875, 0.16823196411132812, 0.1793670654296875, 0.19050216674804688, 0.20163726806640625, 0.21277236938476562, 0.223907470703125, 0.23504257202148438, 0.24617767333984375, 0.2573127746582031, 0.2684478759765625, 0.2795829772949219, 0.29071807861328125, 0.3018531799316406, 0.31298828125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 10.0, 13.0, 19.0, 31.0, 68.0, 122.0, 167.0, 200.0, 146.0, 101.0, 52.0, 31.0, 14.0, 13.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0926513671875, -0.08968544006347656, -0.08671951293945312, -0.08375358581542969, -0.08078765869140625, -0.07782173156738281, -0.07485580444335938, -0.07188987731933594, -0.0689239501953125, -0.06595802307128906, -0.06299209594726562, -0.06002616882324219, -0.05706024169921875, -0.05409431457519531, -0.051128387451171875, -0.04816246032714844, -0.045196533203125, -0.04223060607910156, -0.039264678955078125, -0.03629875183105469, -0.03333282470703125, -0.030366897583007812, -0.027400970458984375, -0.024435043334960938, -0.0214691162109375, -0.018503189086914062, -0.015537261962890625, -0.012571334838867188, -0.00960540771484375, -0.0066394805908203125, -0.003673553466796875, -0.0007076263427734375, 0.00225830078125, 0.0052242279052734375, 0.008190155029296875, 0.011156082153320312, 0.01412200927734375, 0.017087936401367188, 0.020053863525390625, 0.023019790649414062, 0.0259857177734375, 0.028951644897460938, 0.031917572021484375, 0.03488349914550781, 0.03784942626953125, 0.04081535339355469, 0.043781280517578125, 0.04674720764160156, 0.049713134765625, 0.05267906188964844, 0.055644989013671875, 0.05861091613769531, 0.06157684326171875, 0.06454277038574219, 0.06750869750976562, 0.07047462463378906, 0.0734405517578125, 0.07640647888183594, 0.07937240600585938, 0.08233833312988281, 0.08530426025390625, 0.08827018737792969, 0.09123611450195312, 0.09420204162597656, 0.09716796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 9.0, 14.0, 18.0, 17.0, 31.0, 42.0, 91.0, 148.0, 243.0, 499.0, 1150.0, 3314.0, 15548.0, 226204.0, 3887875.0, 48825.0, 7042.0, 1813.0, 704.0, 307.0, 146.0, 89.0, 50.0, 34.0, 27.0, 14.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.405517578125, -0.3946342468261719, -0.38375091552734375, -0.3728675842285156, -0.3619842529296875, -0.3511009216308594, -0.34021759033203125, -0.3293342590332031, -0.318450927734375, -0.3075675964355469, -0.29668426513671875, -0.2858009338378906, -0.2749176025390625, -0.2640342712402344, -0.25315093994140625, -0.24226760864257812, -0.23138427734375, -0.22050094604492188, -0.20961761474609375, -0.19873428344726562, -0.1878509521484375, -0.17696762084960938, -0.16608428955078125, -0.15520095825195312, -0.144317626953125, -0.13343429565429688, -0.12255096435546875, -0.11166763305664062, -0.1007843017578125, -0.08990097045898438, -0.07901763916015625, -0.06813430786132812, -0.0572509765625, -0.046367645263671875, -0.03548431396484375, -0.024600982666015625, -0.0137176513671875, -0.002834320068359375, 0.00804901123046875, 0.018932342529296875, 0.029815673828125, 0.040699005126953125, 0.05158233642578125, 0.062465667724609375, 0.0733489990234375, 0.08423233032226562, 0.09511566162109375, 0.10599899291992188, 0.11688232421875, 0.12776565551757812, 0.13864898681640625, 0.14953231811523438, 0.1604156494140625, 0.17129898071289062, 0.18218231201171875, 0.19306564331054688, 0.203948974609375, 0.21483230590820312, 0.22571563720703125, 0.23659896850585938, 0.2474822998046875, 0.2583656311035156, 0.26924896240234375, 0.2801322937011719, 0.291015625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 16.0, 27.0, 52.0, 79.0, 197.0, 816.0, 2258.0, 366.0, 111.0, 57.0, 27.0, 20.0, 11.0, 10.0, 5.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1929931640625, -0.18842697143554688, -0.18386077880859375, -0.17929458618164062, -0.1747283935546875, -0.17016220092773438, -0.16559600830078125, -0.16102981567382812, -0.156463623046875, -0.15189743041992188, -0.14733123779296875, -0.14276504516601562, -0.1381988525390625, -0.13363265991210938, -0.12906646728515625, -0.12450027465820312, -0.11993408203125, -0.11536788940429688, -0.11080169677734375, -0.10623550415039062, -0.1016693115234375, -0.09710311889648438, -0.09253692626953125, -0.08797073364257812, -0.083404541015625, -0.07883834838867188, -0.07427215576171875, -0.06970596313476562, -0.0651397705078125, -0.060573577880859375, -0.05600738525390625, -0.051441192626953125, -0.046875, -0.042308807373046875, -0.03774261474609375, -0.033176422119140625, -0.0286102294921875, -0.024044036865234375, -0.01947784423828125, -0.014911651611328125, -0.010345458984375, -0.005779266357421875, -0.00121307373046875, 0.003353118896484375, 0.0079193115234375, 0.012485504150390625, 0.01705169677734375, 0.021617889404296875, 0.02618408203125, 0.030750274658203125, 0.03531646728515625, 0.039882659912109375, 0.0444488525390625, 0.049015045166015625, 0.05358123779296875, 0.058147430419921875, 0.062713623046875, 0.06727981567382812, 0.07184600830078125, 0.07641220092773438, 0.0809783935546875, 0.08554458618164062, 0.09011077880859375, 0.09467697143554688, 0.0992431640625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 12.0, 28.0, 91.0, 184.0, 347.0, 247.0, 61.0, 23.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.449288010597229, -0.418795108795166, -0.38830217719078064, -0.35780927538871765, -0.3273163437843323, -0.2968234419822693, -0.2663305401802063, -0.23583760857582092, -0.20534469187259674, -0.17485177516937256, -0.14435885846614838, -0.11386594921350479, -0.08337303251028061, -0.052880123257637024, -0.022387206554412842, 0.00810571014881134, 0.03859862685203552, 0.0690915435552597, 0.09958446025848389, 0.13007736206054688, 0.16057029366493225, 0.19106319546699524, 0.22155611217021942, 0.2520490288734436, 0.2825419306755066, 0.3130348324775696, 0.34352776408195496, 0.37402066588401794, 0.4045135974884033, 0.4350064992904663, 0.4654994010925293, 0.4959923326969147, 0.5264852643013, 0.556978166103363, 0.587471067905426, 0.6179640293121338, 0.6484569311141968, 0.6789498329162598, 0.7094427347183228, 0.7399356365203857, 0.7704285979270935, 0.8009214997291565, 0.8314144015312195, 0.8619073629379272, 0.8924002647399902, 0.9228931665420532, 0.9533860683441162, 0.9838789701461792, 1.0143718719482422, 1.0448647737503052, 1.0753576755523682, 1.1058505773544312, 1.1363434791564941, 1.1668365001678467, 1.1973294019699097, 1.2278223037719727, 1.2583152055740356, 1.2888081073760986, 1.3193010091781616, 1.3497939109802246, 1.3802868127822876, 1.4107797145843506, 1.4412727355957031, 1.4717656373977661, 1.502258539199829]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 11.0, 12.0, 28.0, 30.0, 38.0, 47.0, 44.0, 73.0, 59.0, 81.0, 75.0, 60.0, 61.0, 61.0, 58.0, 51.0, 45.0, 44.0, 28.0, 36.0, 23.0, 11.0, 9.0, 11.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5464600324630737, -0.5318363308906555, -0.5172126293182373, -0.5025889277458191, -0.4879651963710785, -0.4733414947986603, -0.4587177634239197, -0.44409406185150146, -0.42947036027908325, -0.41484665870666504, -0.4002229571342468, -0.3855992257595062, -0.370975524187088, -0.3563518226146698, -0.3417280912399292, -0.327104389667511, -0.3124806880950928, -0.29785698652267456, -0.28323328495025635, -0.26860955357551575, -0.25398585200309753, -0.23936215043067932, -0.22473843395709991, -0.2101147174835205, -0.1954910159111023, -0.18086731433868408, -0.16624359786510468, -0.15161988139152527, -0.13699617981910706, -0.12237247079610825, -0.10774876177310944, -0.09312505275011063, -0.07850134372711182, -0.063877634704113, -0.0492539256811142, -0.03463021665811539, -0.020006507635116577, -0.005382798612117767, 0.009240910410881042, 0.023864619433879852, 0.03848832845687866, 0.05311203747987747, 0.06773574650287628, 0.08235945552587509, 0.0969831645488739, 0.11160687357187271, 0.12623058259487152, 0.14085429906845093, 0.15547800064086914, 0.17010170221328735, 0.18472541868686676, 0.19934913516044617, 0.21397283673286438, 0.2285965383052826, 0.243220254778862, 0.2578439712524414, 0.2724676728248596, 0.28709137439727783, 0.30171507596969604, 0.31633880734443665, 0.33096250891685486, 0.34558621048927307, 0.36020994186401367, 0.3748336434364319, 0.3894573450088501]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 3.0, 8.0, 8.0, 17.0, 26.0, 36.0, 40.0, 51.0, 79.0, 120.0, 208.0, 337.0, 547.0, 1137.0, 2931.0, 10573.0, 81968.0, 832629.0, 100043.0, 12005.0, 3159.0, 1174.0, 564.0, 310.0, 176.0, 118.0, 83.0, 56.0, 46.0, 21.0, 29.0, 16.0, 7.0, 4.0, 5.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.369384765625, -0.3589897155761719, -0.34859466552734375, -0.3381996154785156, -0.3278045654296875, -0.3174095153808594, -0.30701446533203125, -0.2966194152832031, -0.286224365234375, -0.2758293151855469, -0.26543426513671875, -0.2550392150878906, -0.2446441650390625, -0.23424911499023438, -0.22385406494140625, -0.21345901489257812, -0.20306396484375, -0.19266891479492188, -0.18227386474609375, -0.17187881469726562, -0.1614837646484375, -0.15108871459960938, -0.14069366455078125, -0.13029861450195312, -0.119903564453125, -0.10950851440429688, -0.09911346435546875, -0.08871841430664062, -0.0783233642578125, -0.06792831420898438, -0.05753326416015625, -0.047138214111328125, -0.0367431640625, -0.026348114013671875, -0.01595306396484375, -0.005558013916015625, 0.0048370361328125, 0.015232086181640625, 0.02562713623046875, 0.036022186279296875, 0.046417236328125, 0.056812286376953125, 0.06720733642578125, 0.07760238647460938, 0.0879974365234375, 0.09839248657226562, 0.10878753662109375, 0.11918258666992188, 0.12957763671875, 0.13997268676757812, 0.15036773681640625, 0.16076278686523438, 0.1711578369140625, 0.18155288696289062, 0.19194793701171875, 0.20234298706054688, 0.212738037109375, 0.22313308715820312, 0.23352813720703125, 0.24392318725585938, 0.2543182373046875, 0.2647132873535156, 0.27510833740234375, 0.2855033874511719, 0.2958984375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 12.0, 8.0, 13.0, 16.0, 34.0, 68.0, 110.0, 169.0, 201.0, 148.0, 88.0, 61.0, 40.0, 13.0, 9.0, 7.0, 6.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09661865234375, -0.0936279296875, -0.09063720703125, -0.087646484375, -0.08465576171875, -0.0816650390625, -0.07867431640625, -0.07568359375, -0.07269287109375, -0.0697021484375, -0.06671142578125, -0.063720703125, -0.06072998046875, -0.0577392578125, -0.05474853515625, -0.0517578125, -0.04876708984375, -0.0457763671875, -0.04278564453125, -0.039794921875, -0.03680419921875, -0.0338134765625, -0.03082275390625, -0.02783203125, -0.02484130859375, -0.0218505859375, -0.01885986328125, -0.015869140625, -0.01287841796875, -0.0098876953125, -0.00689697265625, -0.00390625, -0.00091552734375, 0.0020751953125, 0.00506591796875, 0.008056640625, 0.01104736328125, 0.0140380859375, 0.01702880859375, 0.02001953125, 0.02301025390625, 0.0260009765625, 0.02899169921875, 0.031982421875, 0.03497314453125, 0.0379638671875, 0.04095458984375, 0.0439453125, 0.04693603515625, 0.0499267578125, 0.05291748046875, 0.055908203125, 0.05889892578125, 0.0618896484375, 0.06488037109375, 0.06787109375, 0.07086181640625, 0.0738525390625, 0.07684326171875, 0.079833984375, 0.08282470703125, 0.0858154296875, 0.08880615234375, 0.091796875, 0.09478759765625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 16.0, 12.0, 15.0, 15.0, 27.0, 34.0, 60.0, 67.0, 111.0, 170.0, 217.0, 399.0, 631.0, 1133.0, 2114.0, 4385.0, 11041.0, 33562.0, 159299.0, 641184.0, 142587.0, 31508.0, 10584.0, 4347.0, 2164.0, 1084.0, 652.0, 370.0, 225.0, 153.0, 120.0, 75.0, 58.0, 36.0, 31.0, 16.0, 13.0, 14.0, 4.0, 7.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.211181640625, -0.20554542541503906, -0.19990921020507812, -0.1942729949951172, -0.18863677978515625, -0.1830005645751953, -0.17736434936523438, -0.17172813415527344, -0.1660919189453125, -0.16045570373535156, -0.15481948852539062, -0.1491832733154297, -0.14354705810546875, -0.1379108428955078, -0.13227462768554688, -0.12663841247558594, -0.121002197265625, -0.11536598205566406, -0.10972976684570312, -0.10409355163574219, -0.09845733642578125, -0.09282112121582031, -0.08718490600585938, -0.08154869079589844, -0.0759124755859375, -0.07027626037597656, -0.06464004516601562, -0.05900382995605469, -0.05336761474609375, -0.04773139953613281, -0.042095184326171875, -0.03645896911621094, -0.03082275390625, -0.025186538696289062, -0.019550323486328125, -0.013914108276367188, -0.00827789306640625, -0.0026416778564453125, 0.002994537353515625, 0.008630752563476562, 0.0142669677734375, 0.019903182983398438, 0.025539398193359375, 0.031175613403320312, 0.03681182861328125, 0.04244804382324219, 0.048084259033203125, 0.05372047424316406, 0.059356689453125, 0.06499290466308594, 0.07062911987304688, 0.07626533508300781, 0.08190155029296875, 0.08753776550292969, 0.09317398071289062, 0.09881019592285156, 0.1044464111328125, 0.11008262634277344, 0.11571884155273438, 0.12135505676269531, 0.12699127197265625, 0.1326274871826172, 0.13826370239257812, 0.14389991760253906, 0.1495361328125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 9.0, 11.0, 9.0, 15.0, 23.0, 25.0, 35.0, 28.0, 41.0, 37.0, 59.0, 50.0, 51.0, 61.0, 63.0, 74.0, 54.0, 53.0, 52.0, 40.0, 34.0, 31.0, 30.0, 25.0, 26.0, 9.0, 11.0, 3.0, 9.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.274658203125, -0.2673473358154297, -0.2600364685058594, -0.25272560119628906, -0.24541473388671875, -0.23810386657714844, -0.23079299926757812, -0.2234821319580078, -0.2161712646484375, -0.2088603973388672, -0.20154953002929688, -0.19423866271972656, -0.18692779541015625, -0.17961692810058594, -0.17230606079101562, -0.1649951934814453, -0.157684326171875, -0.1503734588623047, -0.14306259155273438, -0.13575172424316406, -0.12844085693359375, -0.12112998962402344, -0.11381912231445312, -0.10650825500488281, -0.0991973876953125, -0.09188652038574219, -0.08457565307617188, -0.07726478576660156, -0.06995391845703125, -0.06264305114746094, -0.055332183837890625, -0.04802131652832031, -0.04071044921875, -0.03339958190917969, -0.026088714599609375, -0.018777847290039062, -0.01146697998046875, -0.0041561126708984375, 0.003154754638671875, 0.010465621948242188, 0.0177764892578125, 0.025087356567382812, 0.032398223876953125, 0.03970909118652344, 0.04701995849609375, 0.05433082580566406, 0.061641693115234375, 0.06895256042480469, 0.076263427734375, 0.08357429504394531, 0.09088516235351562, 0.09819602966308594, 0.10550689697265625, 0.11281776428222656, 0.12012863159179688, 0.1274394989013672, 0.1347503662109375, 0.1420612335205078, 0.14937210083007812, 0.15668296813964844, 0.16399383544921875, 0.17130470275878906, 0.17861557006835938, 0.1859264373779297, 0.1932373046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 2.0, 1.0, 5.0, 7.0, 7.0, 13.0, 15.0, 28.0, 37.0, 47.0, 89.0, 143.0, 303.0, 741.0, 2285.0, 8319.0, 45936.0, 873661.0, 99405.0, 12416.0, 3132.0, 1052.0, 406.0, 180.0, 107.0, 60.0, 52.0, 24.0, 18.0, 13.0, 17.0, 4.0, 2.0, 2.0, 5.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16552734375, -0.15974807739257812, -0.15396881103515625, -0.14818954467773438, -0.1424102783203125, -0.13663101196289062, -0.13085174560546875, -0.12507247924804688, -0.119293212890625, -0.11351394653320312, -0.10773468017578125, -0.10195541381835938, -0.0961761474609375, -0.09039688110351562, -0.08461761474609375, -0.07883834838867188, -0.07305908203125, -0.06727981567382812, -0.06150054931640625, -0.055721282958984375, -0.0499420166015625, -0.044162750244140625, -0.03838348388671875, -0.032604217529296875, -0.026824951171875, -0.021045684814453125, -0.01526641845703125, -0.009487152099609375, -0.0037078857421875, 0.002071380615234375, 0.00785064697265625, 0.013629913330078125, 0.0194091796875, 0.025188446044921875, 0.03096771240234375, 0.036746978759765625, 0.0425262451171875, 0.048305511474609375, 0.05408477783203125, 0.059864044189453125, 0.065643310546875, 0.07142257690429688, 0.07720184326171875, 0.08298110961914062, 0.0887603759765625, 0.09453964233398438, 0.10031890869140625, 0.10609817504882812, 0.11187744140625, 0.11765670776367188, 0.12343597412109375, 0.12921524047851562, 0.1349945068359375, 0.14077377319335938, 0.14655303955078125, 0.15233230590820312, 0.158111572265625, 0.16389083862304688, 0.16967010498046875, 0.17544937133789062, 0.1812286376953125, 0.18700790405273438, 0.19278717041015625, 0.19856643676757812, 0.204345703125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 4.0, 7.0, 8.0, 5.0, 3.0, 7.0, 8.0, 14.0, 20.0, 20.0, 16.0, 25.0, 32.0, 42.0, 67.0, 72.0, 107.0, 97.0, 104.0, 81.0, 53.0, 32.0, 25.0, 21.0, 20.0, 18.0, 16.0, 14.0, 6.0, 10.0, 8.0, 7.0, 10.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.153915405273438e-05, -7.901154458522797e-05, -7.648393511772156e-05, -7.395632565021515e-05, -7.142871618270874e-05, -6.890110671520233e-05, -6.637349724769592e-05, -6.384588778018951e-05, -6.13182783126831e-05, -5.87906688451767e-05, -5.626305937767029e-05, -5.373544991016388e-05, -5.120784044265747e-05, -4.868023097515106e-05, -4.615262150764465e-05, -4.3625012040138245e-05, -4.1097402572631836e-05, -3.856979310512543e-05, -3.604218363761902e-05, -3.351457417011261e-05, -3.09869647026062e-05, -2.8459355235099792e-05, -2.5931745767593384e-05, -2.3404136300086975e-05, -2.0876526832580566e-05, -1.8348917365074158e-05, -1.582130789756775e-05, -1.329369843006134e-05, -1.0766088962554932e-05, -8.238479495048523e-06, -5.710870027542114e-06, -3.1832605600357056e-06, -6.556510925292969e-07, 1.8719583749771118e-06, 4.3995678424835205e-06, 6.927177309989929e-06, 9.454786777496338e-06, 1.1982396245002747e-05, 1.4510005712509155e-05, 1.7037615180015564e-05, 1.9565224647521973e-05, 2.209283411502838e-05, 2.462044358253479e-05, 2.71480530500412e-05, 2.9675662517547607e-05, 3.2203271985054016e-05, 3.4730881452560425e-05, 3.7258490920066833e-05, 3.978610038757324e-05, 4.231370985507965e-05, 4.484131932258606e-05, 4.736892879009247e-05, 4.989653825759888e-05, 5.2424147725105286e-05, 5.4951757192611694e-05, 5.74793666601181e-05, 6.000697612762451e-05, 6.253458559513092e-05, 6.506219506263733e-05, 6.758980453014374e-05, 7.011741399765015e-05, 7.264502346515656e-05, 7.517263293266296e-05, 7.770024240016937e-05, 8.022785186767578e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 11.0, 11.0, 16.0, 28.0, 31.0, 50.0, 73.0, 88.0, 184.0, 205.0, 397.0, 664.0, 1299.0, 2639.0, 5931.0, 15977.0, 75319.0, 795829.0, 116039.0, 19827.0, 7246.0, 3161.0, 1538.0, 793.0, 444.0, 278.0, 158.0, 91.0, 59.0, 48.0, 26.0, 21.0, 13.0, 10.0, 12.0, 9.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10601806640625, -0.10203075408935547, -0.09804344177246094, -0.0940561294555664, -0.09006881713867188, -0.08608150482177734, -0.08209419250488281, -0.07810688018798828, -0.07411956787109375, -0.07013225555419922, -0.06614494323730469, -0.062157630920410156, -0.058170318603515625, -0.054183006286621094, -0.05019569396972656, -0.04620838165283203, -0.0422210693359375, -0.03823375701904297, -0.03424644470214844, -0.030259132385253906, -0.026271820068359375, -0.022284507751464844, -0.018297195434570312, -0.014309883117675781, -0.01032257080078125, -0.006335258483886719, -0.0023479461669921875, 0.0016393661499023438, 0.005626678466796875, 0.009613990783691406, 0.013601303100585938, 0.01758861541748047, 0.021575927734375, 0.02556324005126953, 0.029550552368164062, 0.033537864685058594, 0.037525177001953125, 0.041512489318847656, 0.04549980163574219, 0.04948711395263672, 0.05347442626953125, 0.05746173858642578, 0.06144905090332031, 0.06543636322021484, 0.06942367553710938, 0.0734109878540039, 0.07739830017089844, 0.08138561248779297, 0.0853729248046875, 0.08936023712158203, 0.09334754943847656, 0.0973348617553711, 0.10132217407226562, 0.10530948638916016, 0.10929679870605469, 0.11328411102294922, 0.11727142333984375, 0.12125873565673828, 0.1252460479736328, 0.12923336029052734, 0.13322067260742188, 0.1372079849243164, 0.14119529724121094, 0.14518260955810547, 0.149169921875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 10.0, 8.0, 13.0, 14.0, 20.0, 50.0, 74.0, 194.0, 330.0, 109.0, 49.0, 30.0, 17.0, 21.0, 8.0, 7.0, 3.0, 8.0, 4.0, 1.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2073974609375, -0.1998004913330078, -0.19220352172851562, -0.18460655212402344, -0.17700958251953125, -0.16941261291503906, -0.16181564331054688, -0.1542186737060547, -0.1466217041015625, -0.1390247344970703, -0.13142776489257812, -0.12383079528808594, -0.11623382568359375, -0.10863685607910156, -0.10103988647460938, -0.09344291687011719, -0.085845947265625, -0.07824897766113281, -0.07065200805664062, -0.06305503845214844, -0.05545806884765625, -0.04786109924316406, -0.040264129638671875, -0.03266716003417969, -0.0250701904296875, -0.017473220825195312, -0.009876251220703125, -0.0022792816162109375, 0.00531768798828125, 0.012914657592773438, 0.020511627197265625, 0.028108596801757812, 0.03570556640625, 0.04330253601074219, 0.050899505615234375, 0.05849647521972656, 0.06609344482421875, 0.07369041442871094, 0.08128738403320312, 0.08888435363769531, 0.0964813232421875, 0.10407829284667969, 0.11167526245117188, 0.11927223205566406, 0.12686920166015625, 0.13446617126464844, 0.14206314086914062, 0.1496601104736328, 0.157257080078125, 0.1648540496826172, 0.17245101928710938, 0.18004798889160156, 0.18764495849609375, 0.19524192810058594, 0.20283889770507812, 0.2104358673095703, 0.2180328369140625, 0.2256298065185547, 0.23322677612304688, 0.24082374572753906, 0.24842071533203125, 0.25601768493652344, 0.2636146545410156, 0.2712116241455078, 0.27880859375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 21.0, 11.0, 19.0, 68.0, 176.0, 328.0, 269.0, 73.0, 25.0, 2.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.7482235431671143, -3.662583827972412, -3.576944351196289, -3.491304636001587, -3.4056649208068848, -3.3200254440307617, -3.2343857288360596, -3.1487460136413574, -3.0631065368652344, -2.9774668216705322, -2.891827344894409, -2.806187629699707, -2.720547914505005, -2.6349081993103027, -2.5492687225341797, -2.4636290073394775, -2.3779892921447754, -2.2923495769500732, -2.20671010017395, -2.121070384979248, -2.035430669784546, -1.9497910737991333, -1.8641514778137207, -1.7785117626190186, -1.692872166633606, -1.6072325706481934, -1.5215928554534912, -1.4359532594680786, -1.350313663482666, -1.2646739482879639, -1.1790343523025513, -1.0933947563171387, -1.0077552795410156, -0.9221156239509583, -0.8364759683609009, -0.7508363723754883, -0.6651967167854309, -0.5795570611953735, -0.49391746520996094, -0.40827780961990356, -0.3226381540298462, -0.23699851334095, -0.15135887265205383, -0.06571924686431885, 0.019920408725738525, 0.1055600643157959, 0.1911996603012085, 0.27683931589126587, 0.36247897148132324, 0.4481186270713806, 0.533758282661438, 0.6193978786468506, 0.705037534236908, 0.7906771898269653, 0.8763167858123779, 0.9619564414024353, 1.0475960969924927, 1.1332356929779053, 1.2188754081726074, 1.30451500415802, 1.3901546001434326, 1.4757943153381348, 1.5614339113235474, 1.64707350730896, 1.732713222503662]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 7.0, 2.0, 11.0, 11.0, 8.0, 13.0, 12.0, 14.0, 28.0, 22.0, 32.0, 35.0, 36.0, 29.0, 42.0, 44.0, 42.0, 44.0, 51.0, 53.0, 56.0, 42.0, 36.0, 27.0, 35.0, 33.0, 40.0, 30.0, 23.0, 22.0, 16.0, 17.0, 21.0, 20.0, 8.0, 8.0, 4.0, 4.0, 5.0, 6.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0845484733581543, -1.0480408668518066, -1.0115331411361694, -0.9750255346298218, -0.9385178685188293, -0.9020102024078369, -0.8655025959014893, -0.8289949297904968, -0.7924872636795044, -0.755979597568512, -0.7194719910621643, -0.6829643249511719, -0.6464566588401794, -0.609948992729187, -0.5734413862228394, -0.5369337201118469, -0.5004261136054993, -0.4639184772968292, -0.4274108111858368, -0.39090317487716675, -0.3543955087661743, -0.3178878724575043, -0.28138023614883423, -0.2448725700378418, -0.20836493372917175, -0.17185728251934052, -0.13534963130950928, -0.09884199500083923, -0.062334343791007996, -0.025826692581176758, 0.010680943727493286, 0.04718860983848572, 0.08369624614715576, 0.120203897356987, 0.15671154856681824, 0.19321918487548828, 0.22972683608531952, 0.26623448729515076, 0.3027421236038208, 0.33924978971481323, 0.3757574260234833, 0.4122650623321533, 0.44877272844314575, 0.4852803647518158, 0.5217880010604858, 0.5582956671714783, 0.5948033332824707, 0.6313109397888184, 0.6678186058998108, 0.7043262720108032, 0.7408338785171509, 0.7773415446281433, 0.8138492107391357, 0.8503568172454834, 0.8868644833564758, 0.9233721494674683, 0.9598797559738159, 0.9963874220848083, 1.0328950881958008, 1.0694026947021484, 1.105910301208496, 1.1424180269241333, 1.178925633430481, 1.2154333591461182, 1.2519409656524658]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 2.0, 13.0, 15.0, 19.0, 42.0, 69.0, 136.0, 283.0, 609.0, 1920.0, 12701.0, 3996934.0, 173006.0, 6254.0, 1314.0, 471.0, 215.0, 111.0, 58.0, 42.0, 18.0, 15.0, 10.0, 0.0, 6.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.467529296875, -0.4518623352050781, -0.43619537353515625, -0.4205284118652344, -0.4048614501953125, -0.3891944885253906, -0.37352752685546875, -0.3578605651855469, -0.342193603515625, -0.3265266418457031, -0.31085968017578125, -0.2951927185058594, -0.2795257568359375, -0.2638587951660156, -0.24819183349609375, -0.23252487182617188, -0.21685791015625, -0.20119094848632812, -0.18552398681640625, -0.16985702514648438, -0.1541900634765625, -0.13852310180664062, -0.12285614013671875, -0.10718917846679688, -0.091522216796875, -0.07585525512695312, -0.06018829345703125, -0.044521331787109375, -0.0288543701171875, -0.013187408447265625, 0.00247955322265625, 0.018146514892578125, 0.0338134765625, 0.049480438232421875, 0.06514739990234375, 0.08081436157226562, 0.0964813232421875, 0.11214828491210938, 0.12781524658203125, 0.14348220825195312, 0.159149169921875, 0.17481613159179688, 0.19048309326171875, 0.20615005493164062, 0.2218170166015625, 0.23748397827148438, 0.25315093994140625, 0.2688179016113281, 0.28448486328125, 0.3001518249511719, 0.31581878662109375, 0.3314857482910156, 0.3471527099609375, 0.3628196716308594, 0.37848663330078125, 0.3941535949707031, 0.409820556640625, 0.4254875183105469, 0.44115447998046875, 0.4568214416503906, 0.4724884033203125, 0.4881553649902344, 0.5038223266601562, 0.5194892883300781, 0.53515625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 9.0, 12.0, 22.0, 32.0, 65.0, 115.0, 155.0, 180.0, 127.0, 113.0, 67.0, 42.0, 25.0, 12.0, 10.0, 8.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0966796875, -0.09369945526123047, -0.09071922302246094, -0.0877389907836914, -0.08475875854492188, -0.08177852630615234, -0.07879829406738281, -0.07581806182861328, -0.07283782958984375, -0.06985759735107422, -0.06687736511230469, -0.06389713287353516, -0.060916900634765625, -0.057936668395996094, -0.05495643615722656, -0.05197620391845703, -0.0489959716796875, -0.04601573944091797, -0.04303550720214844, -0.040055274963378906, -0.037075042724609375, -0.034094810485839844, -0.031114578247070312, -0.02813434600830078, -0.02515411376953125, -0.02217388153076172, -0.019193649291992188, -0.016213417053222656, -0.013233184814453125, -0.010252952575683594, -0.0072727203369140625, -0.004292488098144531, -0.001312255859375, 0.0016679763793945312, 0.0046482086181640625, 0.007628440856933594, 0.010608673095703125, 0.013588905334472656, 0.016569137573242188, 0.01954936981201172, 0.02252960205078125, 0.02550983428955078, 0.028490066528320312, 0.031470298767089844, 0.034450531005859375, 0.037430763244628906, 0.04041099548339844, 0.04339122772216797, 0.0463714599609375, 0.04935169219970703, 0.05233192443847656, 0.055312156677246094, 0.058292388916015625, 0.061272621154785156, 0.06425285339355469, 0.06723308563232422, 0.07021331787109375, 0.07319355010986328, 0.07617378234863281, 0.07915401458740234, 0.08213424682617188, 0.0851144790649414, 0.08809471130371094, 0.09107494354248047, 0.09405517578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 9.0, 12.0, 22.0, 27.0, 46.0, 54.0, 56.0, 99.0, 134.0, 175.0, 247.0, 321.0, 473.0, 667.0, 1106.0, 2260.0, 7380.0, 48461.0, 3934971.0, 176400.0, 13965.0, 3456.0, 1401.0, 781.0, 543.0, 346.0, 265.0, 168.0, 135.0, 103.0, 45.0, 45.0, 27.0, 26.0, 20.0, 13.0, 6.0, 1.0, 7.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.368408203125, -0.3591289520263672, -0.3498497009277344, -0.34057044982910156, -0.33129119873046875, -0.32201194763183594, -0.3127326965332031, -0.3034534454345703, -0.2941741943359375, -0.2848949432373047, -0.2756156921386719, -0.26633644104003906, -0.25705718994140625, -0.24777793884277344, -0.23849868774414062, -0.2292194366455078, -0.219940185546875, -0.2106609344482422, -0.20138168334960938, -0.19210243225097656, -0.18282318115234375, -0.17354393005371094, -0.16426467895507812, -0.1549854278564453, -0.1457061767578125, -0.1364269256591797, -0.12714767456054688, -0.11786842346191406, -0.10858917236328125, -0.09930992126464844, -0.09003067016601562, -0.08075141906738281, -0.07147216796875, -0.06219291687011719, -0.052913665771484375, -0.04363441467285156, -0.03435516357421875, -0.025075912475585938, -0.015796661376953125, -0.0065174102783203125, 0.0027618408203125, 0.012041091918945312, 0.021320343017578125, 0.030599594116210938, 0.03987884521484375, 0.04915809631347656, 0.058437347412109375, 0.06771659851074219, 0.076995849609375, 0.08627510070800781, 0.09555435180664062, 0.10483360290527344, 0.11411285400390625, 0.12339210510253906, 0.13267135620117188, 0.1419506072998047, 0.1512298583984375, 0.1605091094970703, 0.16978836059570312, 0.17906761169433594, 0.18834686279296875, 0.19762611389160156, 0.20690536499023438, 0.2161846160888672, 0.2254638671875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 1.0, 10.0, 19.0, 40.0, 94.0, 415.0, 3033.0, 334.0, 64.0, 28.0, 14.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2269287109375, -0.2214508056640625, -0.215972900390625, -0.2104949951171875, -0.20501708984375, -0.1995391845703125, -0.194061279296875, -0.1885833740234375, -0.18310546875, -0.1776275634765625, -0.172149658203125, -0.1666717529296875, -0.16119384765625, -0.1557159423828125, -0.150238037109375, -0.1447601318359375, -0.1392822265625, -0.1338043212890625, -0.128326416015625, -0.1228485107421875, -0.11737060546875, -0.1118927001953125, -0.106414794921875, -0.1009368896484375, -0.095458984375, -0.0899810791015625, -0.084503173828125, -0.0790252685546875, -0.07354736328125, -0.0680694580078125, -0.062591552734375, -0.0571136474609375, -0.0516357421875, -0.0461578369140625, -0.040679931640625, -0.0352020263671875, -0.02972412109375, -0.0242462158203125, -0.018768310546875, -0.0132904052734375, -0.0078125, -0.0023345947265625, 0.003143310546875, 0.0086212158203125, 0.01409912109375, 0.0195770263671875, 0.025054931640625, 0.0305328369140625, 0.0360107421875, 0.0414886474609375, 0.046966552734375, 0.0524444580078125, 0.05792236328125, 0.0634002685546875, 0.068878173828125, 0.0743560791015625, 0.079833984375, 0.0853118896484375, 0.090789794921875, 0.0962677001953125, 0.10174560546875, 0.1072235107421875, 0.112701416015625, 0.1181793212890625, 0.1236572265625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 9.0, 13.0, 46.0, 109.0, 384.0, 340.0, 88.0, 14.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1068203449249268, -2.0655229091644287, -2.0242257118225098, -1.9829282760620117, -1.9416308403015137, -1.9003335237503052, -1.8590360879898071, -1.8177387714385986, -1.7764413356781006, -1.735144019126892, -1.693846583366394, -1.6525492668151855, -1.6112518310546875, -1.569954514503479, -1.528657078742981, -1.4873597621917725, -1.4460623264312744, -1.404765009880066, -1.3634675741195679, -1.3221702575683594, -1.2808728218078613, -1.2395755052566528, -1.1982780694961548, -1.1569807529449463, -1.1156834363937378, -1.0743861198425293, -1.0330886840820312, -0.991791307926178, -0.9504939317703247, -0.9091965556144714, -0.8678991794586182, -0.8266018629074097, -0.7853043675422668, -0.7440069913864136, -0.7027096152305603, -0.661412239074707, -0.6201148629188538, -0.5788174867630005, -0.537520170211792, -0.49622276425361633, -0.45492538809776306, -0.4136280119419098, -0.3723306357860565, -0.33103328943252563, -0.28973591327667236, -0.2484385222196579, -0.20714116096496582, -0.16584378480911255, -0.12454640865325928, -0.083249032497406, -0.04195166379213333, -0.0006542950868606567, 0.040643081068992615, 0.08194045722484589, 0.12323781847953796, 0.16453519463539124, 0.2058325707912445, 0.24712994694709778, 0.28842732310295105, 0.32972466945648193, 0.3710220456123352, 0.4123194217681885, 0.45361679792404175, 0.494914174079895, 0.5362115502357483]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 1.0, 4.0, 2.0, 11.0, 7.0, 14.0, 14.0, 15.0, 14.0, 20.0, 36.0, 26.0, 45.0, 35.0, 47.0, 46.0, 52.0, 48.0, 43.0, 55.0, 54.0, 43.0, 48.0, 47.0, 43.0, 41.0, 29.0, 30.0, 23.0, 23.0, 18.0, 18.0, 19.0, 12.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2975556254386902, -0.2845814824104309, -0.27160730957984924, -0.25863316655158997, -0.2456590086221695, -0.23268485069274902, -0.21971070766448975, -0.20673654973506927, -0.1937623918056488, -0.18078823387622833, -0.16781407594680786, -0.15483993291854858, -0.1418657749891281, -0.12889161705970764, -0.11591746658086777, -0.1029433161020279, -0.08996915817260742, -0.07699500024318695, -0.06402084976434708, -0.051046695560216904, -0.03807254135608673, -0.02509838342666626, -0.012124232947826385, 0.0008499175310134888, 0.01382407546043396, 0.026798229664564133, 0.039772383868694305, 0.05274653807282448, 0.06572069227695465, 0.07869485020637512, 0.091669000685215, 0.10464315116405487, 0.11761730909347534, 0.1305914670228958, 0.14356562495231628, 0.15653976798057556, 0.16951392590999603, 0.1824880838394165, 0.19546222686767578, 0.20843638479709625, 0.22141054272651672, 0.2343847006559372, 0.24735885858535767, 0.26033300161361694, 0.2733071446418762, 0.2862813174724579, 0.29925546050071716, 0.31222963333129883, 0.3252037763595581, 0.3381779193878174, 0.35115209221839905, 0.3641262352466583, 0.37710040807724, 0.39007455110549927, 0.40304869413375854, 0.4160228371620178, 0.4289970099925995, 0.44197115302085876, 0.45494532585144043, 0.4679194688796997, 0.480893611907959, 0.49386778473854065, 0.5068419575691223, 0.5198161005973816, 0.5327902436256409]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 5.0, 1.0, 4.0, 4.0, 11.0, 11.0, 16.0, 31.0, 28.0, 47.0, 83.0, 95.0, 150.0, 227.0, 344.0, 605.0, 1210.0, 2542.0, 7392.0, 30398.0, 226056.0, 673792.0, 82208.0, 14841.0, 4352.0, 1856.0, 872.0, 475.0, 289.0, 199.0, 131.0, 75.0, 62.0, 32.0, 25.0, 24.0, 11.0, 14.0, 7.0, 7.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.262451171875, -0.2543182373046875, -0.246185302734375, -0.2380523681640625, -0.22991943359375, -0.2217864990234375, -0.213653564453125, -0.2055206298828125, -0.1973876953125, -0.1892547607421875, -0.181121826171875, -0.1729888916015625, -0.16485595703125, -0.1567230224609375, -0.148590087890625, -0.1404571533203125, -0.13232421875, -0.1241912841796875, -0.116058349609375, -0.1079254150390625, -0.09979248046875, -0.0916595458984375, -0.083526611328125, -0.0753936767578125, -0.0672607421875, -0.0591278076171875, -0.050994873046875, -0.0428619384765625, -0.03472900390625, -0.0265960693359375, -0.018463134765625, -0.0103302001953125, -0.002197265625, 0.0059356689453125, 0.014068603515625, 0.0222015380859375, 0.03033447265625, 0.0384674072265625, 0.046600341796875, 0.0547332763671875, 0.0628662109375, 0.0709991455078125, 0.079132080078125, 0.0872650146484375, 0.09539794921875, 0.1035308837890625, 0.111663818359375, 0.1197967529296875, 0.1279296875, 0.1360626220703125, 0.144195556640625, 0.1523284912109375, 0.16046142578125, 0.1685943603515625, 0.176727294921875, 0.1848602294921875, 0.1929931640625, 0.2011260986328125, 0.209259033203125, 0.2173919677734375, 0.22552490234375, 0.2336578369140625, 0.241790771484375, 0.2499237060546875, 0.258056640625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 13.0, 11.0, 31.0, 44.0, 73.0, 110.0, 156.0, 156.0, 121.0, 98.0, 66.0, 43.0, 29.0, 15.0, 13.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.097412109375, -0.09440135955810547, -0.09139060974121094, -0.0883798599243164, -0.08536911010742188, -0.08235836029052734, -0.07934761047363281, -0.07633686065673828, -0.07332611083984375, -0.07031536102294922, -0.06730461120605469, -0.06429386138916016, -0.061283111572265625, -0.058272361755371094, -0.05526161193847656, -0.05225086212158203, -0.0492401123046875, -0.04622936248779297, -0.04321861267089844, -0.040207862854003906, -0.037197113037109375, -0.034186363220214844, -0.031175613403320312, -0.02816486358642578, -0.02515411376953125, -0.02214336395263672, -0.019132614135742188, -0.016121864318847656, -0.013111114501953125, -0.010100364685058594, -0.0070896148681640625, -0.004078865051269531, -0.001068115234375, 0.0019426345825195312, 0.0049533843994140625, 0.007964134216308594, 0.010974884033203125, 0.013985633850097656, 0.016996383666992188, 0.02000713348388672, 0.02301788330078125, 0.02602863311767578, 0.029039382934570312, 0.032050132751464844, 0.035060882568359375, 0.038071632385253906, 0.04108238220214844, 0.04409313201904297, 0.0471038818359375, 0.05011463165283203, 0.05312538146972656, 0.056136131286621094, 0.059146881103515625, 0.062157630920410156, 0.06516838073730469, 0.06817913055419922, 0.07118988037109375, 0.07420063018798828, 0.07721138000488281, 0.08022212982177734, 0.08323287963867188, 0.0862436294555664, 0.08925437927246094, 0.09226512908935547, 0.09527587890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 8.0, 7.0, 14.0, 16.0, 16.0, 38.0, 55.0, 113.0, 121.0, 247.0, 455.0, 1027.0, 2399.0, 7356.0, 33275.0, 365486.0, 578564.0, 44925.0, 9191.0, 2880.0, 1091.0, 553.0, 281.0, 145.0, 98.0, 54.0, 39.0, 22.0, 18.0, 16.0, 15.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294189453125, -0.2844085693359375, -0.274627685546875, -0.2648468017578125, -0.25506591796875, -0.2452850341796875, -0.235504150390625, -0.2257232666015625, -0.2159423828125, -0.2061614990234375, -0.196380615234375, -0.1865997314453125, -0.17681884765625, -0.1670379638671875, -0.157257080078125, -0.1474761962890625, -0.1376953125, -0.1279144287109375, -0.118133544921875, -0.1083526611328125, -0.09857177734375, -0.0887908935546875, -0.079010009765625, -0.0692291259765625, -0.0594482421875, -0.0496673583984375, -0.039886474609375, -0.0301055908203125, -0.02032470703125, -0.0105438232421875, -0.000762939453125, 0.0090179443359375, 0.018798828125, 0.0285797119140625, 0.038360595703125, 0.0481414794921875, 0.05792236328125, 0.0677032470703125, 0.077484130859375, 0.0872650146484375, 0.0970458984375, 0.1068267822265625, 0.116607666015625, 0.1263885498046875, 0.13616943359375, 0.1459503173828125, 0.155731201171875, 0.1655120849609375, 0.17529296875, 0.1850738525390625, 0.194854736328125, 0.2046356201171875, 0.21441650390625, 0.2241973876953125, 0.233978271484375, 0.2437591552734375, 0.2535400390625, 0.2633209228515625, 0.273101806640625, 0.2828826904296875, 0.29266357421875, 0.3024444580078125, 0.312225341796875, 0.3220062255859375, 0.331787109375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 11.0, 14.0, 8.0, 13.0, 16.0, 17.0, 16.0, 24.0, 30.0, 35.0, 34.0, 42.0, 44.0, 33.0, 51.0, 54.0, 44.0, 60.0, 42.0, 46.0, 37.0, 49.0, 39.0, 40.0, 35.0, 25.0, 21.0, 15.0, 17.0, 15.0, 7.0, 7.0, 12.0, 2.0, 4.0, 5.0, 2.0, 4.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.2412109375, -0.2338104248046875, -0.226409912109375, -0.2190093994140625, -0.21160888671875, -0.2042083740234375, -0.196807861328125, -0.1894073486328125, -0.1820068359375, -0.1746063232421875, -0.167205810546875, -0.1598052978515625, -0.15240478515625, -0.1450042724609375, -0.137603759765625, -0.1302032470703125, -0.122802734375, -0.1154022216796875, -0.108001708984375, -0.1006011962890625, -0.09320068359375, -0.0858001708984375, -0.078399658203125, -0.0709991455078125, -0.0635986328125, -0.0561981201171875, -0.048797607421875, -0.0413970947265625, -0.03399658203125, -0.0265960693359375, -0.019195556640625, -0.0117950439453125, -0.00439453125, 0.0030059814453125, 0.010406494140625, 0.0178070068359375, 0.02520751953125, 0.0326080322265625, 0.040008544921875, 0.0474090576171875, 0.0548095703125, 0.0622100830078125, 0.069610595703125, 0.0770111083984375, 0.08441162109375, 0.0918121337890625, 0.099212646484375, 0.1066131591796875, 0.114013671875, 0.1214141845703125, 0.128814697265625, 0.1362152099609375, 0.14361572265625, 0.1510162353515625, 0.158416748046875, 0.1658172607421875, 0.1732177734375, 0.1806182861328125, 0.188018798828125, 0.1954193115234375, 0.20281982421875, 0.2102203369140625, 0.217620849609375, 0.2250213623046875, 0.232421875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 13.0, 16.0, 24.0, 25.0, 66.0, 147.0, 318.0, 698.0, 2742.0, 85185.0, 951640.0, 5862.0, 1042.0, 369.0, 191.0, 75.0, 47.0, 25.0, 24.0, 9.0, 6.0, 11.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60107421875, -0.583984375, -0.56689453125, -0.5498046875, -0.53271484375, -0.515625, -0.49853515625, -0.4814453125, -0.46435546875, -0.447265625, -0.43017578125, -0.4130859375, -0.39599609375, -0.37890625, -0.36181640625, -0.3447265625, -0.32763671875, -0.310546875, -0.29345703125, -0.2763671875, -0.25927734375, -0.2421875, -0.22509765625, -0.2080078125, -0.19091796875, -0.173828125, -0.15673828125, -0.1396484375, -0.12255859375, -0.10546875, -0.08837890625, -0.0712890625, -0.05419921875, -0.037109375, -0.02001953125, -0.0029296875, 0.01416015625, 0.03125, 0.04833984375, 0.0654296875, 0.08251953125, 0.099609375, 0.11669921875, 0.1337890625, 0.15087890625, 0.16796875, 0.18505859375, 0.2021484375, 0.21923828125, 0.236328125, 0.25341796875, 0.2705078125, 0.28759765625, 0.3046875, 0.32177734375, 0.3388671875, 0.35595703125, 0.373046875, 0.39013671875, 0.4072265625, 0.42431640625, 0.44140625, 0.45849609375, 0.4755859375, 0.49267578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 13.0, 12.0, 18.0, 14.0, 20.0, 27.0, 22.0, 33.0, 45.0, 60.0, 90.0, 113.0, 99.0, 91.0, 63.0, 47.0, 39.0, 27.0, 26.0, 26.0, 21.0, 11.0, 14.0, 9.0, 9.0, 12.0, 3.0, 9.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.655952453613281e-05, -9.356345981359482e-05, -9.056739509105682e-05, -8.757133036851883e-05, -8.457526564598083e-05, -8.157920092344284e-05, -7.858313620090485e-05, -7.558707147836685e-05, -7.259100675582886e-05, -6.959494203329086e-05, -6.659887731075287e-05, -6.360281258821487e-05, -6.060674786567688e-05, -5.7610683143138885e-05, -5.461461842060089e-05, -5.16185536980629e-05, -4.86224889755249e-05, -4.562642425298691e-05, -4.2630359530448914e-05, -3.963429480791092e-05, -3.6638230085372925e-05, -3.364216536283493e-05, -3.0646100640296936e-05, -2.765003591775894e-05, -2.4653971195220947e-05, -2.1657906472682953e-05, -1.866184175014496e-05, -1.5665777027606964e-05, -1.266971230506897e-05, -9.673647582530975e-06, -6.677582859992981e-06, -3.6815181374549866e-06, -6.854534149169922e-07, 2.310611307621002e-06, 5.306676030158997e-06, 8.302740752696991e-06, 1.1298805475234985e-05, 1.429487019777298e-05, 1.7290934920310974e-05, 2.028699964284897e-05, 2.3283064365386963e-05, 2.6279129087924957e-05, 2.927519381046295e-05, 3.2271258533000946e-05, 3.526732325553894e-05, 3.8263387978076935e-05, 4.125945270061493e-05, 4.4255517423152924e-05, 4.725158214569092e-05, 5.024764686822891e-05, 5.324371159076691e-05, 5.62397763133049e-05, 5.9235841035842896e-05, 6.223190575838089e-05, 6.522797048091888e-05, 6.822403520345688e-05, 7.122009992599487e-05, 7.421616464853287e-05, 7.721222937107086e-05, 8.020829409360886e-05, 8.320435881614685e-05, 8.620042353868484e-05, 8.919648826122284e-05, 9.219255298376083e-05, 9.518861770629883e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 5.0, 5.0, 8.0, 6.0, 12.0, 16.0, 22.0, 24.0, 29.0, 56.0, 90.0, 192.0, 319.0, 761.0, 1987.0, 6923.0, 47078.0, 895140.0, 81873.0, 9492.0, 2610.0, 965.0, 409.0, 203.0, 111.0, 75.0, 56.0, 30.0, 16.0, 6.0, 7.0, 0.0, 14.0, 9.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.248046875, -0.2406635284423828, -0.23328018188476562, -0.22589683532714844, -0.21851348876953125, -0.21113014221191406, -0.20374679565429688, -0.1963634490966797, -0.1889801025390625, -0.1815967559814453, -0.17421340942382812, -0.16683006286621094, -0.15944671630859375, -0.15206336975097656, -0.14468002319335938, -0.1372966766357422, -0.129913330078125, -0.12252998352050781, -0.11514663696289062, -0.10776329040527344, -0.10037994384765625, -0.09299659729003906, -0.08561325073242188, -0.07822990417480469, -0.0708465576171875, -0.06346321105957031, -0.056079864501953125, -0.04869651794433594, -0.04131317138671875, -0.03392982482910156, -0.026546478271484375, -0.019163131713867188, -0.01177978515625, -0.0043964385986328125, 0.002986907958984375, 0.010370254516601562, 0.01775360107421875, 0.025136947631835938, 0.032520294189453125, 0.03990364074707031, 0.0472869873046875, 0.05467033386230469, 0.062053680419921875, 0.06943702697753906, 0.07682037353515625, 0.08420372009277344, 0.09158706665039062, 0.09897041320800781, 0.106353759765625, 0.11373710632324219, 0.12112045288085938, 0.12850379943847656, 0.13588714599609375, 0.14327049255371094, 0.15065383911132812, 0.1580371856689453, 0.1654205322265625, 0.1728038787841797, 0.18018722534179688, 0.18757057189941406, 0.19495391845703125, 0.20233726501464844, 0.20972061157226562, 0.2171039581298828, 0.2244873046875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 5.0, 4.0, 3.0, 1.0, 5.0, 7.0, 5.0, 7.0, 8.0, 13.0, 14.0, 24.0, 50.0, 67.0, 119.0, 275.0, 159.0, 102.0, 44.0, 30.0, 16.0, 11.0, 10.0, 7.0, 9.0, 4.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.312744140625, -0.3042259216308594, -0.29570770263671875, -0.2871894836425781, -0.2786712646484375, -0.2701530456542969, -0.26163482666015625, -0.2531166076660156, -0.244598388671875, -0.23608016967773438, -0.22756195068359375, -0.21904373168945312, -0.2105255126953125, -0.20200729370117188, -0.19348907470703125, -0.18497085571289062, -0.17645263671875, -0.16793441772460938, -0.15941619873046875, -0.15089797973632812, -0.1423797607421875, -0.13386154174804688, -0.12534332275390625, -0.11682510375976562, -0.108306884765625, -0.09978866577148438, -0.09127044677734375, -0.08275222778320312, -0.0742340087890625, -0.06571578979492188, -0.05719757080078125, -0.048679351806640625, -0.0401611328125, -0.031642913818359375, -0.02312469482421875, -0.014606475830078125, -0.0060882568359375, 0.002429962158203125, 0.01094818115234375, 0.019466400146484375, 0.027984619140625, 0.036502838134765625, 0.04502105712890625, 0.053539276123046875, 0.0620574951171875, 0.07057571411132812, 0.07909393310546875, 0.08761215209960938, 0.09613037109375, 0.10464859008789062, 0.11316680908203125, 0.12168502807617188, 0.1302032470703125, 0.13872146606445312, 0.14723968505859375, 0.15575790405273438, 0.164276123046875, 0.17279434204101562, 0.18131256103515625, 0.18983078002929688, 0.1983489990234375, 0.20686721801757812, 0.21538543701171875, 0.22390365600585938, 0.232421875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 12.0, 41.0, 322.0, 580.0, 40.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.710500717163086, -11.44558334350586, -11.180665016174316, -10.91574764251709, -10.650829315185547, -10.38591194152832, -10.120994567871094, -9.85607624053955, -9.591158866882324, -9.326241493225098, -9.061323165893555, -8.796405792236328, -8.531487464904785, -8.266570091247559, -8.001651763916016, -7.736734390258789, -7.471816539764404, -7.2068986892700195, -6.941980838775635, -6.67706298828125, -6.412145614624023, -6.147227764129639, -5.882309913635254, -5.617392063140869, -5.352474212646484, -5.0875563621521, -4.822638511657715, -4.557721138000488, -4.2928032875061035, -4.027885437011719, -3.762967586517334, -3.498049736022949, -3.233132839202881, -2.968214988708496, -2.7032973766326904, -2.4383795261383057, -2.1734619140625, -1.9085440635681152, -1.6436262130737305, -1.3787084817886353, -1.11379075050354, -0.8488730192184448, -0.5839552283287048, -0.31903743743896484, -0.05411970615386963, 0.21079802513122559, 0.47571587562561035, 0.7406336069107056, 1.0055513381958008, 1.270469069480896, 1.5353868007659912, 1.800304651260376, 2.0652222633361816, 2.3301401138305664, 2.595057964324951, 2.859975814819336, 3.1248934268951416, 3.3898112773895264, 3.654728889465332, 3.919646739959717, 4.184564590454102, 4.449481964111328, 4.714400291442871, 4.979317665100098, 5.244235515594482]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 12.0, 10.0, 8.0, 15.0, 22.0, 27.0, 20.0, 30.0, 33.0, 62.0, 35.0, 55.0, 42.0, 56.0, 61.0, 67.0, 46.0, 54.0, 55.0, 37.0, 33.0, 47.0, 37.0, 23.0, 26.0, 19.0, 13.0, 11.0, 11.0, 14.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4613746404647827, -1.4001802206039429, -1.3389859199523926, -1.2777915000915527, -1.216597080230713, -1.155402660369873, -1.0942083597183228, -1.033013939857483, -0.9718195796012878, -0.9106252193450928, -0.8494307994842529, -0.7882364392280579, -0.7270420789718628, -0.665847659111023, -0.6046532988548279, -0.5434589385986328, -0.48226451873779297, -0.4210701286792755, -0.35987573862075806, -0.298681378364563, -0.23748698830604553, -0.17629259824752808, -0.11509823799133301, -0.05390384793281555, 0.007290542125701904, 0.06848492473363876, 0.12967930734157562, 0.19087368249893188, 0.25206807255744934, 0.3132624626159668, 0.37445682287216187, 0.4356512129306793, 0.4968454837799072, 0.5580398440361023, 0.6192342638969421, 0.6804286241531372, 0.741623044013977, 0.8028174042701721, 0.8640117645263672, 0.925206184387207, 0.9864005446434021, 1.0475949048995972, 1.108789324760437, 1.1699836254119873, 1.2311780452728271, 1.292372465133667, 1.3535668849945068, 1.4147611856460571, 1.475955605506897, 1.5371500253677368, 1.598344326019287, 1.659538745880127, 1.7207331657409668, 1.7819275856018066, 1.843121886253357, 1.9043163061141968, 1.965510606765747, 2.026705026626587, 2.0878994464874268, 2.1490936279296875, 2.2102880477905273, 2.271482467651367, 2.332676887512207, 2.393871307373047, 2.4550657272338867]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 7.0, 8.0, 10.0, 13.0, 17.0, 41.0, 57.0, 80.0, 150.0, 280.0, 521.0, 1160.0, 2835.0, 9257.0, 48158.0, 3859858.0, 242071.0, 20550.0, 5454.0, 1947.0, 844.0, 418.0, 201.0, 127.0, 82.0, 41.0, 27.0, 22.0, 12.0, 8.0, 7.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.268310546875, -0.26012420654296875, -0.2519378662109375, -0.24375152587890625, -0.235565185546875, -0.22737884521484375, -0.2191925048828125, -0.21100616455078125, -0.20281982421875, -0.19463348388671875, -0.1864471435546875, -0.17826080322265625, -0.170074462890625, -0.16188812255859375, -0.1537017822265625, -0.14551544189453125, -0.1373291015625, -0.12914276123046875, -0.1209564208984375, -0.11277008056640625, -0.104583740234375, -0.09639739990234375, -0.0882110595703125, -0.08002471923828125, -0.07183837890625, -0.06365203857421875, -0.0554656982421875, -0.04727935791015625, -0.039093017578125, -0.03090667724609375, -0.0227203369140625, -0.01453399658203125, -0.00634765625, 0.00183868408203125, 0.0100250244140625, 0.01821136474609375, 0.026397705078125, 0.03458404541015625, 0.0427703857421875, 0.05095672607421875, 0.05914306640625, 0.06732940673828125, 0.0755157470703125, 0.08370208740234375, 0.091888427734375, 0.10007476806640625, 0.1082611083984375, 0.11644744873046875, 0.1246337890625, 0.13282012939453125, 0.1410064697265625, 0.14919281005859375, 0.157379150390625, 0.16556549072265625, 0.1737518310546875, 0.18193817138671875, 0.19012451171875, 0.19831085205078125, 0.2064971923828125, 0.21468353271484375, 0.222869873046875, 0.23105621337890625, 0.2392425537109375, 0.24742889404296875, 0.255615234375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 11.0, 8.0, 12.0, 20.0, 34.0, 47.0, 71.0, 98.0, 109.0, 138.0, 120.0, 109.0, 70.0, 46.0, 41.0, 23.0, 17.0, 10.0, 11.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09686279296875, -0.09388446807861328, -0.09090614318847656, -0.08792781829833984, -0.08494949340820312, -0.0819711685180664, -0.07899284362792969, -0.07601451873779297, -0.07303619384765625, -0.07005786895751953, -0.06707954406738281, -0.0641012191772461, -0.061122894287109375, -0.058144569396972656, -0.05516624450683594, -0.05218791961669922, -0.0492095947265625, -0.04623126983642578, -0.04325294494628906, -0.040274620056152344, -0.037296295166015625, -0.034317970275878906, -0.03133964538574219, -0.02836132049560547, -0.02538299560546875, -0.02240467071533203, -0.019426345825195312, -0.016448020935058594, -0.013469696044921875, -0.010491371154785156, -0.0075130462646484375, -0.004534721374511719, -0.001556396484375, 0.0014219284057617188, 0.0044002532958984375, 0.007378578186035156, 0.010356903076171875, 0.013335227966308594, 0.016313552856445312, 0.01929187774658203, 0.02227020263671875, 0.02524852752685547, 0.028226852416992188, 0.031205177307128906, 0.034183502197265625, 0.037161827087402344, 0.04014015197753906, 0.04311847686767578, 0.0460968017578125, 0.04907512664794922, 0.05205345153808594, 0.055031776428222656, 0.058010101318359375, 0.060988426208496094, 0.06396675109863281, 0.06694507598876953, 0.06992340087890625, 0.07290172576904297, 0.07588005065917969, 0.0788583755493164, 0.08183670043945312, 0.08481502532958984, 0.08779335021972656, 0.09077167510986328, 0.09375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 8.0, 10.0, 23.0, 29.0, 36.0, 65.0, 92.0, 113.0, 233.0, 440.0, 744.0, 1259.0, 2808.0, 8921.0, 74956.0, 4025171.0, 64996.0, 8380.0, 2918.0, 1324.0, 718.0, 388.0, 223.0, 139.0, 120.0, 64.0, 44.0, 18.0, 19.0, 7.0, 8.0, 5.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.40478515625, -0.3933753967285156, -0.38196563720703125, -0.3705558776855469, -0.3591461181640625, -0.3477363586425781, -0.33632659912109375, -0.3249168395996094, -0.313507080078125, -0.3020973205566406, -0.29068756103515625, -0.2792778015136719, -0.2678680419921875, -0.2564582824707031, -0.24504852294921875, -0.23363876342773438, -0.22222900390625, -0.21081924438476562, -0.19940948486328125, -0.18799972534179688, -0.1765899658203125, -0.16518020629882812, -0.15377044677734375, -0.14236068725585938, -0.130950927734375, -0.11954116821289062, -0.10813140869140625, -0.09672164916992188, -0.0853118896484375, -0.07390213012695312, -0.06249237060546875, -0.051082611083984375, -0.0396728515625, -0.028263092041015625, -0.01685333251953125, -0.005443572998046875, 0.0059661865234375, 0.017375946044921875, 0.02878570556640625, 0.040195465087890625, 0.051605224609375, 0.06301498413085938, 0.07442474365234375, 0.08583450317382812, 0.0972442626953125, 0.10865402221679688, 0.12006378173828125, 0.13147354125976562, 0.14288330078125, 0.15429306030273438, 0.16570281982421875, 0.17711257934570312, 0.1885223388671875, 0.19993209838867188, 0.21134185791015625, 0.22275161743164062, 0.234161376953125, 0.24557113647460938, 0.25698089599609375, 0.2683906555175781, 0.2798004150390625, 0.2912101745605469, 0.30261993408203125, 0.3140296936035156, 0.325439453125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 9.0, 14.0, 34.0, 89.0, 501.0, 3077.0, 221.0, 55.0, 29.0, 18.0, 3.0, 6.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.27099609375, -0.2633190155029297, -0.2556419372558594, -0.24796485900878906, -0.24028778076171875, -0.23261070251464844, -0.22493362426757812, -0.2172565460205078, -0.2095794677734375, -0.2019023895263672, -0.19422531127929688, -0.18654823303222656, -0.17887115478515625, -0.17119407653808594, -0.16351699829101562, -0.1558399200439453, -0.148162841796875, -0.1404857635498047, -0.13280868530273438, -0.12513160705566406, -0.11745452880859375, -0.10977745056152344, -0.10210037231445312, -0.09442329406738281, -0.0867462158203125, -0.07906913757324219, -0.07139205932617188, -0.06371498107910156, -0.05603790283203125, -0.04836082458496094, -0.040683746337890625, -0.03300666809082031, -0.02532958984375, -0.017652511596679688, -0.009975433349609375, -0.0022983551025390625, 0.00537872314453125, 0.013055801391601562, 0.020732879638671875, 0.028409957885742188, 0.0360870361328125, 0.04376411437988281, 0.051441192626953125, 0.05911827087402344, 0.06679534912109375, 0.07447242736816406, 0.08214950561523438, 0.08982658386230469, 0.097503662109375, 0.10518074035644531, 0.11285781860351562, 0.12053489685058594, 0.12821197509765625, 0.13588905334472656, 0.14356613159179688, 0.1512432098388672, 0.1589202880859375, 0.1665973663330078, 0.17427444458007812, 0.18195152282714844, 0.18962860107421875, 0.19730567932128906, 0.20498275756835938, 0.2126598358154297, 0.2203369140625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 15.0, 41.0, 72.0, 199.0, 283.0, 214.0, 85.0, 50.0, 20.0, 5.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7644767761230469, -0.7356289625167847, -0.7067811489105225, -0.6779333353042603, -0.649085521697998, -0.6202377080917358, -0.5913898944854736, -0.5625420808792114, -0.5336942672729492, -0.504846453666687, -0.4759986400604248, -0.4471508264541626, -0.4183030128479004, -0.3894551992416382, -0.360607385635376, -0.33175957202911377, -0.30291175842285156, -0.27406394481658936, -0.24521613121032715, -0.21636831760406494, -0.18752050399780273, -0.15867269039154053, -0.12982487678527832, -0.10097706317901611, -0.0721292495727539, -0.0432814359664917, -0.014433622360229492, 0.014414191246032715, 0.04326200485229492, 0.07210981845855713, 0.10095763206481934, 0.12980544567108154, 0.15865325927734375, 0.18750107288360596, 0.21634888648986816, 0.24519670009613037, 0.2740445137023926, 0.3028923273086548, 0.331740140914917, 0.3605879545211792, 0.3894357681274414, 0.4182835817337036, 0.4471313953399658, 0.475979208946228, 0.5048270225524902, 0.5336748361587524, 0.5625226497650146, 0.5913704633712769, 0.6202182769775391, 0.6490660905838013, 0.6779139041900635, 0.7067617177963257, 0.7356095314025879, 0.7644573450088501, 0.7933051586151123, 0.8221529722213745, 0.8510007858276367, 0.8798485994338989, 0.9086964130401611, 0.9375442266464233, 0.9663920402526855, 0.9952398538589478, 1.02408766746521, 1.0529354810714722, 1.0817832946777344]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 10.0, 7.0, 5.0, 5.0, 12.0, 9.0, 23.0, 18.0, 22.0, 19.0, 21.0, 36.0, 27.0, 28.0, 30.0, 38.0, 40.0, 38.0, 46.0, 44.0, 47.0, 32.0, 39.0, 35.0, 29.0, 45.0, 40.0, 34.0, 35.0, 35.0, 31.0, 16.0, 20.0, 13.0, 21.0, 10.0, 6.0, 7.0, 9.0, 5.0, 6.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3800247311592102, -0.3687201142311096, -0.35741546750068665, -0.34611085057258606, -0.3348062038421631, -0.3235015869140625, -0.3121969699859619, -0.30089232325553894, -0.28958767652511597, -0.2782830595970154, -0.2669784128665924, -0.2556737959384918, -0.24436914920806885, -0.23306453227996826, -0.22175990045070648, -0.2104552686214447, -0.19915065169334412, -0.18784601986408234, -0.17654138803482056, -0.16523677110671997, -0.153932124376297, -0.1426275074481964, -0.13132287561893463, -0.12001824378967285, -0.10871361196041107, -0.09740898013114929, -0.08610434830188751, -0.07479972392320633, -0.06349509209394455, -0.05219046026468277, -0.04088583588600159, -0.029581204056739807, -0.018276572227478027, -0.006971942260861397, 0.004332687705755234, 0.015637315809726715, 0.026941947638988495, 0.038246579468250275, 0.04955120384693146, 0.06085583567619324, 0.07216046750545502, 0.0834650993347168, 0.09476973116397858, 0.10607435554265976, 0.11737898737192154, 0.12868362665176392, 0.1399882435798645, 0.15129287540912628, 0.16259750723838806, 0.17390213906764984, 0.18520677089691162, 0.1965113878250122, 0.20781603455543518, 0.21912065148353577, 0.23042528331279755, 0.24172991514205933, 0.2530345320701599, 0.2643391489982605, 0.27564379572868347, 0.28694841265678406, 0.29825305938720703, 0.3095576763153076, 0.3208622932434082, 0.3321669399738312, 0.34347158670425415]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 8.0, 9.0, 15.0, 16.0, 40.0, 44.0, 97.0, 131.0, 288.0, 611.0, 1787.0, 6866.0, 50388.0, 910813.0, 65977.0, 7944.0, 2024.0, 764.0, 352.0, 156.0, 74.0, 47.0, 38.0, 21.0, 21.0, 9.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41943359375, -0.4061393737792969, -0.39284515380859375, -0.3795509338378906, -0.3662567138671875, -0.3529624938964844, -0.33966827392578125, -0.3263740539550781, -0.313079833984375, -0.2997856140136719, -0.28649139404296875, -0.2731971740722656, -0.2599029541015625, -0.24660873413085938, -0.23331451416015625, -0.22002029418945312, -0.20672607421875, -0.19343185424804688, -0.18013763427734375, -0.16684341430664062, -0.1535491943359375, -0.14025497436523438, -0.12696075439453125, -0.11366653442382812, -0.100372314453125, -0.08707809448242188, -0.07378387451171875, -0.060489654541015625, -0.0471954345703125, -0.033901214599609375, -0.02060699462890625, -0.007312774658203125, 0.0059814453125, 0.019275665283203125, 0.03256988525390625, 0.045864105224609375, 0.0591583251953125, 0.07245254516601562, 0.08574676513671875, 0.09904098510742188, 0.112335205078125, 0.12562942504882812, 0.13892364501953125, 0.15221786499023438, 0.1655120849609375, 0.17880630493164062, 0.19210052490234375, 0.20539474487304688, 0.21868896484375, 0.23198318481445312, 0.24527740478515625, 0.2585716247558594, 0.2718658447265625, 0.2851600646972656, 0.29845428466796875, 0.3117485046386719, 0.325042724609375, 0.3383369445800781, 0.35163116455078125, 0.3649253845214844, 0.3782196044921875, 0.3915138244628906, 0.40480804443359375, 0.4181022644042969, 0.431396484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 9.0, 7.0, 13.0, 20.0, 25.0, 55.0, 90.0, 89.0, 121.0, 116.0, 118.0, 97.0, 76.0, 58.0, 36.0, 20.0, 21.0, 17.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09857177734375, -0.09554195404052734, -0.09251213073730469, -0.08948230743408203, -0.08645248413085938, -0.08342266082763672, -0.08039283752441406, -0.0773630142211914, -0.07433319091796875, -0.0713033676147461, -0.06827354431152344, -0.06524372100830078, -0.062213897705078125, -0.05918407440185547, -0.05615425109863281, -0.053124427795410156, -0.0500946044921875, -0.047064781188964844, -0.04403495788574219, -0.04100513458251953, -0.037975311279296875, -0.03494548797607422, -0.03191566467285156, -0.028885841369628906, -0.02585601806640625, -0.022826194763183594, -0.019796371459960938, -0.01676654815673828, -0.013736724853515625, -0.010706901550292969, -0.0076770782470703125, -0.004647254943847656, -0.001617431640625, 0.0014123916625976562, 0.0044422149658203125, 0.007472038269042969, 0.010501861572265625, 0.013531684875488281, 0.016561508178710938, 0.019591331481933594, 0.02262115478515625, 0.025650978088378906, 0.028680801391601562, 0.03171062469482422, 0.034740447998046875, 0.03777027130126953, 0.04080009460449219, 0.043829917907714844, 0.0468597412109375, 0.049889564514160156, 0.05291938781738281, 0.05594921112060547, 0.058979034423828125, 0.06200885772705078, 0.06503868103027344, 0.0680685043334961, 0.07109832763671875, 0.0741281509399414, 0.07715797424316406, 0.08018779754638672, 0.08321762084960938, 0.08624744415283203, 0.08927726745605469, 0.09230709075927734, 0.0953369140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 7.0, 7.0, 12.0, 10.0, 29.0, 27.0, 35.0, 62.0, 73.0, 119.0, 162.0, 336.0, 663.0, 1460.0, 3972.0, 14290.0, 109056.0, 856077.0, 48096.0, 8905.0, 2773.0, 1139.0, 498.0, 283.0, 155.0, 93.0, 66.0, 36.0, 23.0, 32.0, 14.0, 7.0, 8.0, 11.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.33251953125, -0.3225440979003906, -0.31256866455078125, -0.3025932312011719, -0.2926177978515625, -0.2826423645019531, -0.27266693115234375, -0.2626914978027344, -0.252716064453125, -0.24274063110351562, -0.23276519775390625, -0.22278976440429688, -0.2128143310546875, -0.20283889770507812, -0.19286346435546875, -0.18288803100585938, -0.17291259765625, -0.16293716430664062, -0.15296173095703125, -0.14298629760742188, -0.1330108642578125, -0.12303543090820312, -0.11305999755859375, -0.10308456420898438, -0.093109130859375, -0.08313369750976562, -0.07315826416015625, -0.06318283081054688, -0.0532073974609375, -0.043231964111328125, -0.03325653076171875, -0.023281097412109375, -0.0133056640625, -0.003330230712890625, 0.00664520263671875, 0.016620635986328125, 0.0265960693359375, 0.036571502685546875, 0.04654693603515625, 0.056522369384765625, 0.066497802734375, 0.07647323608398438, 0.08644866943359375, 0.09642410278320312, 0.1063995361328125, 0.11637496948242188, 0.12635040283203125, 0.13632583618164062, 0.14630126953125, 0.15627670288085938, 0.16625213623046875, 0.17622756958007812, 0.1862030029296875, 0.19617843627929688, 0.20615386962890625, 0.21612930297851562, 0.226104736328125, 0.23608016967773438, 0.24605560302734375, 0.2560310363769531, 0.2660064697265625, 0.2759819030761719, 0.28595733642578125, 0.2959327697753906, 0.305908203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 0.0, 3.0, 11.0, 6.0, 13.0, 16.0, 22.0, 29.0, 35.0, 40.0, 31.0, 50.0, 80.0, 82.0, 82.0, 72.0, 66.0, 63.0, 48.0, 65.0, 50.0, 39.0, 23.0, 15.0, 14.0, 8.0, 14.0, 5.0, 5.0, 5.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.393798828125, -0.3832244873046875, -0.372650146484375, -0.3620758056640625, -0.35150146484375, -0.3409271240234375, -0.330352783203125, -0.3197784423828125, -0.3092041015625, -0.2986297607421875, -0.288055419921875, -0.2774810791015625, -0.26690673828125, -0.2563323974609375, -0.245758056640625, -0.2351837158203125, -0.224609375, -0.2140350341796875, -0.203460693359375, -0.1928863525390625, -0.18231201171875, -0.1717376708984375, -0.161163330078125, -0.1505889892578125, -0.1400146484375, -0.1294403076171875, -0.118865966796875, -0.1082916259765625, -0.09771728515625, -0.0871429443359375, -0.076568603515625, -0.0659942626953125, -0.055419921875, -0.0448455810546875, -0.034271240234375, -0.0236968994140625, -0.01312255859375, -0.0025482177734375, 0.008026123046875, 0.0186004638671875, 0.0291748046875, 0.0397491455078125, 0.050323486328125, 0.0608978271484375, 0.07147216796875, 0.0820465087890625, 0.092620849609375, 0.1031951904296875, 0.11376953125, 0.1243438720703125, 0.134918212890625, 0.1454925537109375, 0.15606689453125, 0.1666412353515625, 0.177215576171875, 0.1877899169921875, 0.1983642578125, 0.2089385986328125, 0.219512939453125, 0.2300872802734375, 0.24066162109375, 0.2512359619140625, 0.261810302734375, 0.2723846435546875, 0.282958984375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 6.0, 13.0, 17.0, 23.0, 25.0, 58.0, 108.0, 157.0, 407.0, 1029.0, 5020.0, 65001.0, 927842.0, 43109.0, 4058.0, 933.0, 354.0, 175.0, 68.0, 43.0, 44.0, 19.0, 5.0, 9.0, 14.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2034912109375, -0.19758224487304688, -0.19167327880859375, -0.18576431274414062, -0.1798553466796875, -0.17394638061523438, -0.16803741455078125, -0.16212844848632812, -0.156219482421875, -0.15031051635742188, -0.14440155029296875, -0.13849258422851562, -0.1325836181640625, -0.12667465209960938, -0.12076568603515625, -0.11485671997070312, -0.10894775390625, -0.10303878784179688, -0.09712982177734375, -0.09122085571289062, -0.0853118896484375, -0.07940292358398438, -0.07349395751953125, -0.06758499145507812, -0.061676025390625, -0.055767059326171875, -0.04985809326171875, -0.043949127197265625, -0.0380401611328125, -0.032131195068359375, -0.02622222900390625, -0.020313262939453125, -0.014404296875, -0.008495330810546875, -0.00258636474609375, 0.003322601318359375, 0.0092315673828125, 0.015140533447265625, 0.02104949951171875, 0.026958465576171875, 0.032867431640625, 0.038776397705078125, 0.04468536376953125, 0.050594329833984375, 0.0565032958984375, 0.062412261962890625, 0.06832122802734375, 0.07423019409179688, 0.08013916015625, 0.08604812622070312, 0.09195709228515625, 0.09786605834960938, 0.1037750244140625, 0.10968399047851562, 0.11559295654296875, 0.12150192260742188, 0.127410888671875, 0.13331985473632812, 0.13922882080078125, 0.14513778686523438, 0.1510467529296875, 0.15695571899414062, 0.16286468505859375, 0.16877365112304688, 0.1746826171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 6.0, 9.0, 9.0, 18.0, 24.0, 36.0, 45.0, 76.0, 115.0, 151.0, 145.0, 113.0, 70.0, 43.0, 32.0, 18.0, 19.0, 15.0, 8.0, 10.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.435415267944336e-05, -9.129848331212997e-05, -8.824281394481659e-05, -8.51871445775032e-05, -8.213147521018982e-05, -7.907580584287643e-05, -7.602013647556305e-05, -7.296446710824966e-05, -6.990879774093628e-05, -6.68531283736229e-05, -6.379745900630951e-05, -6.0741789638996124e-05, -5.768612027168274e-05, -5.4630450904369354e-05, -5.157478153705597e-05, -4.8519112169742584e-05, -4.54634428024292e-05, -4.2407773435115814e-05, -3.935210406780243e-05, -3.6296434700489044e-05, -3.324076533317566e-05, -3.0185095965862274e-05, -2.712942659854889e-05, -2.4073757231235504e-05, -2.101808786392212e-05, -1.7962418496608734e-05, -1.4906749129295349e-05, -1.1851079761981964e-05, -8.795410394668579e-06, -5.739741027355194e-06, -2.684071660041809e-06, 3.7159770727157593e-07, 3.427267074584961e-06, 6.482936441898346e-06, 9.538605809211731e-06, 1.2594275176525116e-05, 1.56499445438385e-05, 1.8705613911151886e-05, 2.176128327846527e-05, 2.4816952645778656e-05, 2.787262201309204e-05, 3.0928291380405426e-05, 3.398396074771881e-05, 3.7039630115032196e-05, 4.009529948234558e-05, 4.3150968849658966e-05, 4.620663821697235e-05, 4.9262307584285736e-05, 5.231797695159912e-05, 5.5373646318912506e-05, 5.842931568622589e-05, 6.148498505353928e-05, 6.454065442085266e-05, 6.759632378816605e-05, 7.065199315547943e-05, 7.370766252279282e-05, 7.67633318901062e-05, 7.981900125741959e-05, 8.287467062473297e-05, 8.593033999204636e-05, 8.898600935935974e-05, 9.204167872667313e-05, 9.509734809398651e-05, 9.81530174612999e-05, 0.00010120868682861328]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 15.0, 11.0, 17.0, 16.0, 33.0, 57.0, 88.0, 140.0, 257.0, 442.0, 935.0, 2887.0, 15500.0, 216035.0, 780499.0, 25326.0, 3824.0, 1227.0, 520.0, 278.0, 146.0, 98.0, 66.0, 45.0, 28.0, 16.0, 10.0, 9.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2137451171875, -0.20841598510742188, -0.20308685302734375, -0.19775772094726562, -0.1924285888671875, -0.18709945678710938, -0.18177032470703125, -0.17644119262695312, -0.171112060546875, -0.16578292846679688, -0.16045379638671875, -0.15512466430664062, -0.1497955322265625, -0.14446640014648438, -0.13913726806640625, -0.13380813598632812, -0.12847900390625, -0.12314987182617188, -0.11782073974609375, -0.11249160766601562, -0.1071624755859375, -0.10183334350585938, -0.09650421142578125, -0.09117507934570312, -0.085845947265625, -0.08051681518554688, -0.07518768310546875, -0.06985855102539062, -0.0645294189453125, -0.059200286865234375, -0.05387115478515625, -0.048542022705078125, -0.043212890625, -0.037883758544921875, -0.03255462646484375, -0.027225494384765625, -0.0218963623046875, -0.016567230224609375, -0.01123809814453125, -0.005908966064453125, -0.000579833984375, 0.004749298095703125, 0.01007843017578125, 0.015407562255859375, 0.0207366943359375, 0.026065826416015625, 0.03139495849609375, 0.036724090576171875, 0.04205322265625, 0.047382354736328125, 0.05271148681640625, 0.058040618896484375, 0.0633697509765625, 0.06869888305664062, 0.07402801513671875, 0.07935714721679688, 0.084686279296875, 0.09001541137695312, 0.09534454345703125, 0.10067367553710938, 0.1060028076171875, 0.11133193969726562, 0.11666107177734375, 0.12199020385742188, 0.1273193359375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 6.0, 5.0, 11.0, 12.0, 15.0, 22.0, 20.0, 23.0, 25.0, 43.0, 58.0, 218.0, 266.0, 52.0, 33.0, 25.0, 34.0, 25.0, 10.0, 15.0, 11.0, 12.0, 8.0, 5.0, 5.0, 5.0, 2.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1099853515625, -0.10632896423339844, -0.10267257690429688, -0.09901618957519531, -0.09535980224609375, -0.09170341491699219, -0.08804702758789062, -0.08439064025878906, -0.0807342529296875, -0.07707786560058594, -0.07342147827148438, -0.06976509094238281, -0.06610870361328125, -0.06245231628417969, -0.058795928955078125, -0.05513954162597656, -0.051483154296875, -0.04782676696777344, -0.044170379638671875, -0.04051399230957031, -0.03685760498046875, -0.03320121765136719, -0.029544830322265625, -0.025888442993164062, -0.0222320556640625, -0.018575668334960938, -0.014919281005859375, -0.011262893676757812, -0.00760650634765625, -0.0039501190185546875, -0.000293731689453125, 0.0033626556396484375, 0.00701904296875, 0.010675430297851562, 0.014331817626953125, 0.017988204956054688, 0.02164459228515625, 0.025300979614257812, 0.028957366943359375, 0.03261375427246094, 0.0362701416015625, 0.03992652893066406, 0.043582916259765625, 0.04723930358886719, 0.05089569091796875, 0.05455207824707031, 0.058208465576171875, 0.06186485290527344, 0.065521240234375, 0.06917762756347656, 0.07283401489257812, 0.07649040222167969, 0.08014678955078125, 0.08380317687988281, 0.08745956420898438, 0.09111595153808594, 0.0947723388671875, 0.09842872619628906, 0.10208511352539062, 0.10574150085449219, 0.10939788818359375, 0.11305427551269531, 0.11671066284179688, 0.12036705017089844, 0.1240234375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 859.0, 146.0, 6.0], "bins": [-34.48314666748047, -33.9256477355957, -33.36814880371094, -32.810646057128906, -32.25314712524414, -31.695648193359375, -31.13814926147461, -30.58064842224121, -30.023149490356445, -29.46565055847168, -28.90814971923828, -28.350650787353516, -27.79315185546875, -27.23565101623535, -26.678152084350586, -26.120651245117188, -25.563152313232422, -25.005653381347656, -24.448152542114258, -23.890653610229492, -23.333152770996094, -22.775653839111328, -22.218154907226562, -21.660654067993164, -21.1031551361084, -20.545656204223633, -19.988155364990234, -19.43065643310547, -18.873157501220703, -18.315656661987305, -17.75815773010254, -17.20065689086914, -16.643157958984375, -16.08565902709961, -15.528158187866211, -14.970659255981445, -14.413159370422363, -13.855659484863281, -13.298160552978516, -12.740660667419434, -12.183160781860352, -11.62566089630127, -11.068161010742188, -10.510662078857422, -9.95316219329834, -9.395662307739258, -8.838163375854492, -8.28066349029541, -7.72316312789917, -7.165663719177246, -6.608163833618164, -6.050663948059082, -5.493164539337158, -4.935665130615234, -4.378165245056152, -3.8206655979156494, -3.2631659507751465, -2.7056663036346436, -2.1481666564941406, -1.5906670093536377, -1.0331673622131348, -0.47566771507263184, 0.0818319320678711, 0.639331579208374, 1.1968311071395874]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 3.0, 6.0, 9.0, 9.0, 8.0, 16.0, 13.0, 25.0, 20.0, 29.0, 27.0, 39.0, 21.0, 32.0, 40.0, 48.0, 44.0, 61.0, 50.0, 47.0, 53.0, 32.0, 54.0, 41.0, 32.0, 39.0, 33.0, 22.0, 21.0, 22.0, 14.0, 20.0, 8.0, 12.0, 15.0, 11.0, 6.0, 6.0, 6.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2465689182281494, -1.2084039449691772, -1.1702390909194946, -1.1320741176605225, -1.0939092636108398, -1.0557442903518677, -1.0175793170928955, -0.9794144630432129, -0.9412494897842407, -0.9030845761299133, -0.8649196624755859, -0.8267546892166138, -0.7885897755622864, -0.750424861907959, -0.7122599482536316, -0.6740950345993042, -0.6359301209449768, -0.5977652072906494, -0.559600293636322, -0.5214353799819946, -0.48327040672302246, -0.44510549306869507, -0.4069405794143677, -0.3687756359577179, -0.3306107223033905, -0.2924458086490631, -0.25428086519241333, -0.21611595153808594, -0.17795102298259735, -0.13978609442710876, -0.10162118077278137, -0.06345623731613159, -0.0252913236618042, 0.012873601168394089, 0.05103852599859238, 0.08920344710350037, 0.12736837565898895, 0.16553330421447754, 0.20369821786880493, 0.2418631613254547, 0.2800280749797821, 0.3181929886341095, 0.3563579320907593, 0.39452284574508667, 0.43268775939941406, 0.47085270285606384, 0.5090175867080688, 0.547182559967041, 0.5853474736213684, 0.6235123872756958, 0.6616773009300232, 0.6998422145843506, 0.7380071878433228, 0.7761721014976501, 0.8143370151519775, 0.8525019884109497, 0.8906668424606323, 0.9288317561149597, 0.9669966697692871, 1.0051616430282593, 1.043326497077942, 1.081491470336914, 1.1196563243865967, 1.1578212976455688, 1.195986270904541]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 11.0, 24.0, 28.0, 32.0, 93.0, 244.0, 753.0, 3201.0, 33354.0, 4099736.0, 51174.0, 4197.0, 873.0, 295.0, 114.0, 54.0, 35.0, 24.0, 11.0, 8.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.498291015625, -0.4825019836425781, -0.46671295166015625, -0.4509239196777344, -0.4351348876953125, -0.4193458557128906, -0.40355682373046875, -0.3877677917480469, -0.371978759765625, -0.3561897277832031, -0.34040069580078125, -0.3246116638183594, -0.3088226318359375, -0.2930335998535156, -0.27724456787109375, -0.2614555358886719, -0.24566650390625, -0.22987747192382812, -0.21408843994140625, -0.19829940795898438, -0.1825103759765625, -0.16672134399414062, -0.15093231201171875, -0.13514328002929688, -0.119354248046875, -0.10356521606445312, -0.08777618408203125, -0.07198715209960938, -0.0561981201171875, -0.040409088134765625, -0.02462005615234375, -0.008831024169921875, 0.0069580078125, 0.022747039794921875, 0.03853607177734375, 0.054325103759765625, 0.0701141357421875, 0.08590316772460938, 0.10169219970703125, 0.11748123168945312, 0.133270263671875, 0.14905929565429688, 0.16484832763671875, 0.18063735961914062, 0.1964263916015625, 0.21221542358398438, 0.22800445556640625, 0.24379348754882812, 0.25958251953125, 0.2753715515136719, 0.29116058349609375, 0.3069496154785156, 0.3227386474609375, 0.3385276794433594, 0.35431671142578125, 0.3701057434082031, 0.385894775390625, 0.4016838073730469, 0.41747283935546875, 0.4332618713378906, 0.4490509033203125, 0.4648399353027344, 0.48062896728515625, 0.4964179992675781, 0.51220703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 10.0, 9.0, 9.0, 20.0, 33.0, 43.0, 70.0, 82.0, 102.0, 119.0, 107.0, 105.0, 78.0, 68.0, 50.0, 23.0, 19.0, 25.0, 14.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1007080078125, -0.09765243530273438, -0.09459686279296875, -0.09154129028320312, -0.0884857177734375, -0.08543014526367188, -0.08237457275390625, -0.07931900024414062, -0.076263427734375, -0.07320785522460938, -0.07015228271484375, -0.06709671020507812, -0.0640411376953125, -0.060985565185546875, -0.05792999267578125, -0.054874420166015625, -0.05181884765625, -0.048763275146484375, -0.04570770263671875, -0.042652130126953125, -0.0395965576171875, -0.036540985107421875, -0.03348541259765625, -0.030429840087890625, -0.027374267578125, -0.024318695068359375, -0.02126312255859375, -0.018207550048828125, -0.0151519775390625, -0.012096405029296875, -0.00904083251953125, -0.005985260009765625, -0.0029296875, 0.000125885009765625, 0.00318145751953125, 0.006237030029296875, 0.0092926025390625, 0.012348175048828125, 0.01540374755859375, 0.018459320068359375, 0.021514892578125, 0.024570465087890625, 0.02762603759765625, 0.030681610107421875, 0.0337371826171875, 0.036792755126953125, 0.03984832763671875, 0.042903900146484375, 0.04595947265625, 0.049015045166015625, 0.05207061767578125, 0.055126190185546875, 0.0581817626953125, 0.061237335205078125, 0.06429290771484375, 0.06734848022460938, 0.070404052734375, 0.07345962524414062, 0.07651519775390625, 0.07957077026367188, 0.0826263427734375, 0.08568191528320312, 0.08873748779296875, 0.09179306030273438, 0.0948486328125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 18.0, 22.0, 33.0, 68.0, 89.0, 177.0, 294.0, 496.0, 904.0, 2091.0, 7983.0, 83395.0, 4032252.0, 56045.0, 6706.0, 1786.0, 823.0, 461.0, 276.0, 139.0, 93.0, 57.0, 31.0, 17.0, 9.0, 4.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.390380859375, -0.3779640197753906, -0.36554718017578125, -0.3531303405761719, -0.3407135009765625, -0.3282966613769531, -0.31587982177734375, -0.3034629821777344, -0.291046142578125, -0.2786293029785156, -0.26621246337890625, -0.2537956237792969, -0.2413787841796875, -0.22896194458007812, -0.21654510498046875, -0.20412826538085938, -0.19171142578125, -0.17929458618164062, -0.16687774658203125, -0.15446090698242188, -0.1420440673828125, -0.12962722778320312, -0.11721038818359375, -0.10479354858398438, -0.092376708984375, -0.07995986938476562, -0.06754302978515625, -0.055126190185546875, -0.0427093505859375, -0.030292510986328125, -0.01787567138671875, -0.005458831787109375, 0.0069580078125, 0.019374847412109375, 0.03179168701171875, 0.044208526611328125, 0.0566253662109375, 0.06904220581054688, 0.08145904541015625, 0.09387588500976562, 0.106292724609375, 0.11870956420898438, 0.13112640380859375, 0.14354324340820312, 0.1559600830078125, 0.16837692260742188, 0.18079376220703125, 0.19321060180664062, 0.20562744140625, 0.21804428100585938, 0.23046112060546875, 0.24287796020507812, 0.2552947998046875, 0.2677116394042969, 0.28012847900390625, 0.2925453186035156, 0.304962158203125, 0.3173789978027344, 0.32979583740234375, 0.3422126770019531, 0.3546295166015625, 0.3670463562011719, 0.37946319580078125, 0.3918800354003906, 0.404296875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 11.0, 13.0, 28.0, 56.0, 225.0, 2719.0, 819.0, 102.0, 45.0, 21.0, 12.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2066650390625, -0.20037269592285156, -0.19408035278320312, -0.1877880096435547, -0.18149566650390625, -0.1752033233642578, -0.16891098022460938, -0.16261863708496094, -0.1563262939453125, -0.15003395080566406, -0.14374160766601562, -0.1374492645263672, -0.13115692138671875, -0.12486457824707031, -0.11857223510742188, -0.11227989196777344, -0.105987548828125, -0.09969520568847656, -0.09340286254882812, -0.08711051940917969, -0.08081817626953125, -0.07452583312988281, -0.06823348999023438, -0.06194114685058594, -0.0556488037109375, -0.04935646057128906, -0.043064117431640625, -0.03677177429199219, -0.03047943115234375, -0.024187088012695312, -0.017894744873046875, -0.011602401733398438, -0.00531005859375, 0.0009822845458984375, 0.007274627685546875, 0.013566970825195312, 0.01985931396484375, 0.026151657104492188, 0.032444000244140625, 0.03873634338378906, 0.0450286865234375, 0.05132102966308594, 0.057613372802734375, 0.06390571594238281, 0.07019805908203125, 0.07649040222167969, 0.08278274536132812, 0.08907508850097656, 0.095367431640625, 0.10165977478027344, 0.10795211791992188, 0.11424446105957031, 0.12053680419921875, 0.1268291473388672, 0.13312149047851562, 0.13941383361816406, 0.1457061767578125, 0.15199851989746094, 0.15829086303710938, 0.1645832061767578, 0.17087554931640625, 0.1771678924560547, 0.18346023559570312, 0.18975257873535156, 0.196044921875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 12.0, 15.0, 47.0, 65.0, 174.0, 297.0, 212.0, 93.0, 51.0, 14.0, 10.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49684569239616394, -0.4729893207550049, -0.4491329491138458, -0.42527657747268677, -0.4014201760292053, -0.37756383419036865, -0.3537074327468872, -0.32985106110572815, -0.3059946894645691, -0.28213831782341003, -0.258281946182251, -0.23442555963993073, -0.21056918799877167, -0.1867128163576126, -0.16285642981529236, -0.1390000581741333, -0.11514368653297424, -0.09128731489181519, -0.06743093580007553, -0.043574556708335876, -0.01971818506717682, 0.004138186573982239, 0.02799457311630249, 0.05185094475746155, 0.0757073163986206, 0.09956368803977966, 0.12342006713151932, 0.14727644622325897, 0.17113281786441803, 0.1949891895055771, 0.21884557604789734, 0.2427019476890564, 0.26655828952789307, 0.2904146611690521, 0.3142710328102112, 0.3381274342536926, 0.3619837760925293, 0.38584017753601074, 0.4096965491771698, 0.43355292081832886, 0.4574092924594879, 0.481265664100647, 0.5051220655441284, 0.5289784073829651, 0.5528348088264465, 0.5766911506652832, 0.6005475521087646, 0.6244039535522461, 0.6482602953910828, 0.6721166968345642, 0.6959730386734009, 0.7198294401168823, 0.743685781955719, 0.7675421833992004, 0.7913985252380371, 0.8152549266815186, 0.839111328125, 0.8629677295684814, 0.8868240714073181, 0.9106804728507996, 0.9345368146896362, 0.9583932161331177, 0.9822496175765991, 1.006105899810791, 1.0299623012542725]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 6.0, 14.0, 19.0, 12.0, 13.0, 28.0, 31.0, 28.0, 36.0, 46.0, 48.0, 47.0, 61.0, 70.0, 70.0, 66.0, 61.0, 49.0, 55.0, 53.0, 50.0, 36.0, 29.0, 19.0, 17.0, 13.0, 9.0, 3.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36349231004714966, -0.34973224997520447, -0.3359721899032593, -0.3222121298313141, -0.3084520697593689, -0.2946920096874237, -0.2809319496154785, -0.2671718895435333, -0.25341182947158813, -0.23965176939964294, -0.22589170932769775, -0.21213164925575256, -0.19837158918380737, -0.18461152911186218, -0.170851469039917, -0.1570914089679718, -0.1433313637971878, -0.12957130372524261, -0.11581124365329742, -0.10205118358135223, -0.08829112350940704, -0.07453107088804245, -0.06077101081609726, -0.04701095074415207, -0.03325089067220688, -0.019490830600261688, -0.005730772390961647, 0.008029285818338394, 0.021789345890283585, 0.03554940223693848, 0.04930946230888367, 0.06306952238082886, 0.07682958245277405, 0.09058964252471924, 0.10434970259666443, 0.11810976266860962, 0.1318698227405548, 0.1456298828125, 0.1593899428844452, 0.17315000295639038, 0.18691006302833557, 0.20067012310028076, 0.21443018317222595, 0.22819024324417114, 0.24195030331611633, 0.2557103633880615, 0.2694704234600067, 0.2832304835319519, 0.2969905138015747, 0.3107505738735199, 0.3245106339454651, 0.3382706940174103, 0.35203075408935547, 0.36579081416130066, 0.37955087423324585, 0.39331093430519104, 0.40707099437713623, 0.4208310544490814, 0.4345911145210266, 0.4483511745929718, 0.462111234664917, 0.4758712947368622, 0.4896313548088074, 0.5033913850784302, 0.5171514749526978]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 9.0, 14.0, 22.0, 30.0, 45.0, 79.0, 109.0, 179.0, 299.0, 529.0, 1141.0, 2583.0, 7776.0, 29681.0, 264451.0, 675588.0, 48622.0, 10878.0, 3557.0, 1382.0, 642.0, 338.0, 215.0, 118.0, 73.0, 41.0, 33.0, 27.0, 25.0, 19.0, 15.0, 5.0, 2.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.217529296875, -0.2109661102294922, -0.20440292358398438, -0.19783973693847656, -0.19127655029296875, -0.18471336364746094, -0.17815017700195312, -0.1715869903564453, -0.1650238037109375, -0.1584606170654297, -0.15189743041992188, -0.14533424377441406, -0.13877105712890625, -0.13220787048339844, -0.12564468383789062, -0.11908149719238281, -0.112518310546875, -0.10595512390136719, -0.09939193725585938, -0.09282875061035156, -0.08626556396484375, -0.07970237731933594, -0.07313919067382812, -0.06657600402832031, -0.0600128173828125, -0.05344963073730469, -0.046886444091796875, -0.04032325744628906, -0.03376007080078125, -0.027196884155273438, -0.020633697509765625, -0.014070510864257812, -0.00750732421875, -0.0009441375732421875, 0.005619049072265625, 0.012182235717773438, 0.01874542236328125, 0.025308609008789062, 0.031871795654296875, 0.03843498229980469, 0.0449981689453125, 0.05156135559082031, 0.058124542236328125, 0.06468772888183594, 0.07125091552734375, 0.07781410217285156, 0.08437728881835938, 0.09094047546386719, 0.097503662109375, 0.10406684875488281, 0.11063003540039062, 0.11719322204589844, 0.12375640869140625, 0.13031959533691406, 0.13688278198242188, 0.1434459686279297, 0.1500091552734375, 0.1565723419189453, 0.16313552856445312, 0.16969871520996094, 0.17626190185546875, 0.18282508850097656, 0.18938827514648438, 0.1959514617919922, 0.2025146484375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 3.0, 13.0, 12.0, 18.0, 36.0, 36.0, 61.0, 99.0, 101.0, 105.0, 108.0, 98.0, 88.0, 67.0, 43.0, 33.0, 20.0, 20.0, 14.0, 14.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.103515625, -0.10038471221923828, -0.09725379943847656, -0.09412288665771484, -0.09099197387695312, -0.0878610610961914, -0.08473014831542969, -0.08159923553466797, -0.07846832275390625, -0.07533740997314453, -0.07220649719238281, -0.0690755844116211, -0.06594467163085938, -0.06281375885009766, -0.05968284606933594, -0.05655193328857422, -0.0534210205078125, -0.05029010772705078, -0.04715919494628906, -0.044028282165527344, -0.040897369384765625, -0.037766456604003906, -0.03463554382324219, -0.03150463104248047, -0.02837371826171875, -0.02524280548095703, -0.022111892700195312, -0.018980979919433594, -0.015850067138671875, -0.012719154357910156, -0.009588241577148438, -0.006457328796386719, -0.003326416015625, -0.00019550323486328125, 0.0029354095458984375, 0.006066322326660156, 0.009197235107421875, 0.012328147888183594, 0.015459060668945312, 0.01858997344970703, 0.02172088623046875, 0.02485179901123047, 0.027982711791992188, 0.031113624572753906, 0.034244537353515625, 0.037375450134277344, 0.04050636291503906, 0.04363727569580078, 0.0467681884765625, 0.04989910125732422, 0.05303001403808594, 0.056160926818847656, 0.059291839599609375, 0.062422752380371094, 0.06555366516113281, 0.06868457794189453, 0.07181549072265625, 0.07494640350341797, 0.07807731628417969, 0.0812082290649414, 0.08433914184570312, 0.08747005462646484, 0.09060096740722656, 0.09373188018798828, 0.09686279296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 7.0, 6.0, 11.0, 22.0, 25.0, 35.0, 50.0, 73.0, 132.0, 228.0, 400.0, 867.0, 2081.0, 6551.0, 26575.0, 186767.0, 742393.0, 62874.0, 12956.0, 3651.0, 1428.0, 630.0, 300.0, 170.0, 106.0, 80.0, 37.0, 23.0, 18.0, 18.0, 17.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2271728515625, -0.22072982788085938, -0.21428680419921875, -0.20784378051757812, -0.2014007568359375, -0.19495773315429688, -0.18851470947265625, -0.18207168579101562, -0.175628662109375, -0.16918563842773438, -0.16274261474609375, -0.15629959106445312, -0.1498565673828125, -0.14341354370117188, -0.13697052001953125, -0.13052749633789062, -0.12408447265625, -0.11764144897460938, -0.11119842529296875, -0.10475540161132812, -0.0983123779296875, -0.09186935424804688, -0.08542633056640625, -0.07898330688476562, -0.072540283203125, -0.06609725952148438, -0.05965423583984375, -0.053211212158203125, -0.0467681884765625, -0.040325164794921875, -0.03388214111328125, -0.027439117431640625, -0.02099609375, -0.014553070068359375, -0.00811004638671875, -0.001667022705078125, 0.0047760009765625, 0.011219024658203125, 0.01766204833984375, 0.024105072021484375, 0.030548095703125, 0.036991119384765625, 0.04343414306640625, 0.049877166748046875, 0.0563201904296875, 0.06276321411132812, 0.06920623779296875, 0.07564926147460938, 0.08209228515625, 0.08853530883789062, 0.09497833251953125, 0.10142135620117188, 0.1078643798828125, 0.11430740356445312, 0.12075042724609375, 0.12719345092773438, 0.133636474609375, 0.14007949829101562, 0.14652252197265625, 0.15296554565429688, 0.1594085693359375, 0.16585159301757812, 0.17229461669921875, 0.17873764038085938, 0.1851806640625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 6.0, 7.0, 11.0, 13.0, 15.0, 13.0, 22.0, 26.0, 32.0, 48.0, 44.0, 41.0, 43.0, 60.0, 59.0, 49.0, 54.0, 45.0, 44.0, 35.0, 37.0, 36.0, 34.0, 39.0, 43.0, 24.0, 18.0, 17.0, 17.0, 10.0, 13.0, 4.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27587890625, -0.2677764892578125, -0.259674072265625, -0.2515716552734375, -0.24346923828125, -0.2353668212890625, -0.227264404296875, -0.2191619873046875, -0.2110595703125, -0.2029571533203125, -0.194854736328125, -0.1867523193359375, -0.17864990234375, -0.1705474853515625, -0.162445068359375, -0.1543426513671875, -0.146240234375, -0.1381378173828125, -0.130035400390625, -0.1219329833984375, -0.11383056640625, -0.1057281494140625, -0.097625732421875, -0.0895233154296875, -0.0814208984375, -0.0733184814453125, -0.065216064453125, -0.0571136474609375, -0.04901123046875, -0.0409088134765625, -0.032806396484375, -0.0247039794921875, -0.0166015625, -0.0084991455078125, -0.000396728515625, 0.0077056884765625, 0.01580810546875, 0.0239105224609375, 0.032012939453125, 0.0401153564453125, 0.0482177734375, 0.0563201904296875, 0.064422607421875, 0.0725250244140625, 0.08062744140625, 0.0887298583984375, 0.096832275390625, 0.1049346923828125, 0.113037109375, 0.1211395263671875, 0.129241943359375, 0.1373443603515625, 0.14544677734375, 0.1535491943359375, 0.161651611328125, 0.1697540283203125, 0.1778564453125, 0.1859588623046875, 0.194061279296875, 0.2021636962890625, 0.21026611328125, 0.2183685302734375, 0.226470947265625, 0.2345733642578125, 0.24267578125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 5.0, 5.0, 3.0, 10.0, 12.0, 13.0, 21.0, 28.0, 66.0, 100.0, 232.0, 541.0, 1723.0, 9890.0, 188998.0, 820126.0, 22581.0, 2848.0, 731.0, 287.0, 124.0, 59.0, 45.0, 28.0, 21.0, 12.0, 8.0, 9.0, 5.0, 5.0, 8.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1407470703125, -0.1365032196044922, -0.13225936889648438, -0.12801551818847656, -0.12377166748046875, -0.11952781677246094, -0.11528396606445312, -0.11104011535644531, -0.1067962646484375, -0.10255241394042969, -0.09830856323242188, -0.09406471252441406, -0.08982086181640625, -0.08557701110839844, -0.08133316040039062, -0.07708930969238281, -0.072845458984375, -0.06860160827636719, -0.06435775756835938, -0.06011390686035156, -0.05587005615234375, -0.05162620544433594, -0.047382354736328125, -0.04313850402832031, -0.0388946533203125, -0.03465080261230469, -0.030406951904296875, -0.026163101196289062, -0.02191925048828125, -0.017675399780273438, -0.013431549072265625, -0.009187698364257812, -0.00494384765625, -0.0006999969482421875, 0.003543853759765625, 0.0077877044677734375, 0.01203155517578125, 0.016275405883789062, 0.020519256591796875, 0.024763107299804688, 0.0290069580078125, 0.03325080871582031, 0.037494659423828125, 0.04173851013183594, 0.04598236083984375, 0.05022621154785156, 0.054470062255859375, 0.05871391296386719, 0.062957763671875, 0.06720161437988281, 0.07144546508789062, 0.07568931579589844, 0.07993316650390625, 0.08417701721191406, 0.08842086791992188, 0.09266471862792969, 0.0969085693359375, 0.10115242004394531, 0.10539627075195312, 0.10964012145996094, 0.11388397216796875, 0.11812782287597656, 0.12237167358398438, 0.1266155242919922, 0.130859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 5.0, 1.0, 10.0, 15.0, 20.0, 30.0, 25.0, 61.0, 71.0, 88.0, 134.0, 135.0, 123.0, 81.0, 51.0, 37.0, 24.0, 19.0, 13.0, 9.0, 4.0, 8.0, 1.0, 5.0, 12.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.18235969543457e-05, -6.908830255270004e-05, -6.635300815105438e-05, -6.361771374940872e-05, -6.088241934776306e-05, -5.81471249461174e-05, -5.541183054447174e-05, -5.267653614282608e-05, -4.994124174118042e-05, -4.720594733953476e-05, -4.44706529378891e-05, -4.173535853624344e-05, -3.900006413459778e-05, -3.626476973295212e-05, -3.352947533130646e-05, -3.07941809296608e-05, -2.8058886528015137e-05, -2.5323592126369476e-05, -2.2588297724723816e-05, -1.9853003323078156e-05, -1.7117708921432495e-05, -1.4382414519786835e-05, -1.1647120118141174e-05, -8.911825716495514e-06, -6.1765313148498535e-06, -3.441236913204193e-06, -7.059425115585327e-07, 2.0293518900871277e-06, 4.764646291732788e-06, 7.4999406933784485e-06, 1.0235235095024109e-05, 1.297052949666977e-05, 1.570582389831543e-05, 1.844111829996109e-05, 2.117641270160675e-05, 2.391170710325241e-05, 2.664700150489807e-05, 2.938229590654373e-05, 3.211759030818939e-05, 3.485288470983505e-05, 3.758817911148071e-05, 4.032347351312637e-05, 4.3058767914772034e-05, 4.5794062316417694e-05, 4.8529356718063354e-05, 5.1264651119709015e-05, 5.3999945521354675e-05, 5.6735239923000336e-05, 5.9470534324645996e-05, 6.220582872629166e-05, 6.494112312793732e-05, 6.767641752958298e-05, 7.041171193122864e-05, 7.31470063328743e-05, 7.588230073451996e-05, 7.861759513616562e-05, 8.135288953781128e-05, 8.408818393945694e-05, 8.68234783411026e-05, 8.955877274274826e-05, 9.229406714439392e-05, 9.502936154603958e-05, 9.776465594768524e-05, 0.0001004999503493309, 0.00010323524475097656]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 4.0, 4.0, 7.0, 17.0, 32.0, 60.0, 95.0, 227.0, 551.0, 2060.0, 15387.0, 770148.0, 247639.0, 9890.0, 1552.0, 493.0, 170.0, 93.0, 50.0, 21.0, 22.0, 11.0, 12.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.103271484375, -0.09833335876464844, -0.09339523315429688, -0.08845710754394531, -0.08351898193359375, -0.07858085632324219, -0.07364273071289062, -0.06870460510253906, -0.0637664794921875, -0.05882835388183594, -0.053890228271484375, -0.04895210266113281, -0.04401397705078125, -0.03907585144042969, -0.034137725830078125, -0.029199600219726562, -0.024261474609375, -0.019323348999023438, -0.014385223388671875, -0.009447097778320312, -0.00450897216796875, 0.0004291534423828125, 0.005367279052734375, 0.010305404663085938, 0.0152435302734375, 0.020181655883789062, 0.025119781494140625, 0.030057907104492188, 0.03499603271484375, 0.03993415832519531, 0.044872283935546875, 0.04981040954589844, 0.05474853515625, 0.05968666076660156, 0.06462478637695312, 0.06956291198730469, 0.07450103759765625, 0.07943916320800781, 0.08437728881835938, 0.08931541442871094, 0.0942535400390625, 0.09919166564941406, 0.10412979125976562, 0.10906791687011719, 0.11400604248046875, 0.11894416809082031, 0.12388229370117188, 0.12882041931152344, 0.133758544921875, 0.13869667053222656, 0.14363479614257812, 0.1485729217529297, 0.15351104736328125, 0.1584491729736328, 0.16338729858398438, 0.16832542419433594, 0.1732635498046875, 0.17820167541503906, 0.18313980102539062, 0.1880779266357422, 0.19301605224609375, 0.1979541778564453, 0.20289230346679688, 0.20783042907714844, 0.2127685546875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 7.0, 9.0, 7.0, 8.0, 20.0, 33.0, 50.0, 51.0, 88.0, 274.0, 183.0, 74.0, 50.0, 39.0, 29.0, 13.0, 15.0, 10.0, 7.0, 10.0, 6.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08233642578125, -0.0787210464477539, -0.07510566711425781, -0.07149028778076172, -0.06787490844726562, -0.06425952911376953, -0.06064414978027344, -0.057028770446777344, -0.05341339111328125, -0.049798011779785156, -0.04618263244628906, -0.04256725311279297, -0.038951873779296875, -0.03533649444580078, -0.03172111511230469, -0.028105735778808594, -0.0244903564453125, -0.020874977111816406, -0.017259597778320312, -0.013644218444824219, -0.010028839111328125, -0.006413459777832031, -0.0027980804443359375, 0.0008172988891601562, 0.00443267822265625, 0.008048057556152344, 0.011663436889648438, 0.015278816223144531, 0.018894195556640625, 0.02250957489013672, 0.026124954223632812, 0.029740333557128906, 0.033355712890625, 0.036971092224121094, 0.04058647155761719, 0.04420185089111328, 0.047817230224609375, 0.05143260955810547, 0.05504798889160156, 0.058663368225097656, 0.06227874755859375, 0.06589412689208984, 0.06950950622558594, 0.07312488555908203, 0.07674026489257812, 0.08035564422607422, 0.08397102355957031, 0.0875864028930664, 0.0912017822265625, 0.0948171615600586, 0.09843254089355469, 0.10204792022705078, 0.10566329956054688, 0.10927867889404297, 0.11289405822753906, 0.11650943756103516, 0.12012481689453125, 0.12374019622802734, 0.12735557556152344, 0.13097095489501953, 0.13458633422851562, 0.13820171356201172, 0.1418170928955078, 0.1454324722290039, 0.1490478515625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 573.0, 421.0, 12.0, 4.0], "bins": [-16.600149154663086, -16.327838897705078, -16.055530548095703, -15.783220291137695, -15.510910987854004, -15.238601684570312, -14.966291427612305, -14.693982124328613, -14.421672821044922, -14.14936351776123, -13.877053260803223, -13.604743957519531, -13.33243465423584, -13.060125350952148, -12.78781509399414, -12.51550579071045, -12.243196487426758, -11.970887184143066, -11.698576927185059, -11.426267623901367, -11.153958320617676, -10.881649017333984, -10.609338760375977, -10.337029457092285, -10.064719200134277, -9.792409896850586, -9.520099639892578, -9.247790336608887, -8.975481033325195, -8.703171730041504, -8.430861473083496, -8.158552169799805, -7.8862433433532715, -7.613933563232422, -7.3416242599487305, -7.069314479827881, -6.7970051765441895, -6.52469539642334, -6.252386093139648, -5.980076313018799, -5.707766532897949, -5.4354567527771, -5.163147449493408, -4.890837669372559, -4.618528366088867, -4.346218585968018, -4.073908805847168, -3.8015995025634766, -3.529290199279785, -3.2569806575775146, -2.984671115875244, -2.7123613357543945, -2.440052032470703, -2.1677422523498535, -1.895432710647583, -1.6231231689453125, -1.350813627243042, -1.0785040855407715, -0.8061944842338562, -0.5338848829269409, -0.2615753412246704, 0.010734200477600098, 0.28304386138916016, 0.5553534030914307, 0.827663004398346]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 6.0, 1.0, 5.0, 5.0, 3.0, 8.0, 11.0, 7.0, 14.0, 9.0, 12.0, 13.0, 20.0, 18.0, 24.0, 28.0, 33.0, 21.0, 30.0, 32.0, 32.0, 31.0, 28.0, 42.0, 39.0, 38.0, 45.0, 38.0, 46.0, 38.0, 30.0, 40.0, 32.0, 23.0, 23.0, 18.0, 26.0, 27.0, 13.0, 26.0, 18.0, 10.0, 8.0, 10.0, 6.0, 10.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9027281999588013, -0.8719969391822815, -0.8412656188011169, -0.8105343580245972, -0.7798030376434326, -0.7490717768669128, -0.7183405160903931, -0.6876091957092285, -0.6568779349327087, -0.626146674156189, -0.5954153537750244, -0.5646840929985046, -0.5339527726173401, -0.5032215118408203, -0.47249022126197815, -0.441758930683136, -0.4110276401042938, -0.38029634952545166, -0.3495650589466095, -0.31883376836776733, -0.28810250759124756, -0.2573712170124054, -0.22663992643356323, -0.19590865075588226, -0.1651773601770401, -0.13444606959819794, -0.10371479392051697, -0.0729835033416748, -0.04225222021341324, -0.011520937085151672, 0.01921035349369049, 0.04994162917137146, 0.08067291975021362, 0.11140420287847519, 0.14213548600673676, 0.17286677658557892, 0.2035980522632599, 0.23432934284210205, 0.2650606334209442, 0.2957919239997864, 0.32652318477630615, 0.3572544753551483, 0.3879857659339905, 0.41871702671051025, 0.4494483172893524, 0.4801796078681946, 0.5109108686447144, 0.5416421890258789, 0.5723735094070435, 0.6031047701835632, 0.6338360905647278, 0.6645673513412476, 0.6952986717224121, 0.7260299324989319, 0.7567611932754517, 0.7874925136566162, 0.818223774433136, 0.8489550352096558, 0.8796863555908203, 0.9104176163673401, 0.9411489367485046, 0.9718801975250244, 1.002611517906189, 1.033342719078064, 1.0640740394592285]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 15.0, 10.0, 15.0, 27.0, 102.0, 254.0, 931.0, 7670.0, 4042339.0, 138076.0, 3841.0, 650.0, 189.0, 71.0, 34.0, 22.0, 9.0, 11.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -1.0216293334960938, -0.9905242919921875, -0.9594192504882812, -0.928314208984375, -0.8972091674804688, -0.8661041259765625, -0.8349990844726562, -0.80389404296875, -0.7727890014648438, -0.7416839599609375, -0.7105789184570312, -0.679473876953125, -0.6483688354492188, -0.6172637939453125, -0.5861587524414062, -0.5550537109375, -0.5239486694335938, -0.4928436279296875, -0.46173858642578125, -0.430633544921875, -0.39952850341796875, -0.3684234619140625, -0.33731842041015625, -0.30621337890625, -0.27510833740234375, -0.2440032958984375, -0.21289825439453125, -0.181793212890625, -0.15068817138671875, -0.1195831298828125, -0.08847808837890625, -0.057373046875, -0.02626800537109375, 0.0048370361328125, 0.03594207763671875, 0.067047119140625, 0.09815216064453125, 0.1292572021484375, 0.16036224365234375, 0.19146728515625, 0.22257232666015625, 0.2536773681640625, 0.28478240966796875, 0.315887451171875, 0.34699249267578125, 0.3780975341796875, 0.40920257568359375, 0.4403076171875, 0.47141265869140625, 0.5025177001953125, 0.5336227416992188, 0.564727783203125, 0.5958328247070312, 0.6269378662109375, 0.6580429077148438, 0.68914794921875, 0.7202529907226562, 0.7513580322265625, 0.7824630737304688, 0.813568115234375, 0.8446731567382812, 0.8757781982421875, 0.9068832397460938, 0.93798828125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 11.0, 8.0, 15.0, 29.0, 31.0, 63.0, 67.0, 105.0, 108.0, 115.0, 109.0, 90.0, 70.0, 51.0, 43.0, 23.0, 21.0, 16.0, 9.0, 9.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10394287109375, -0.10083866119384766, -0.09773445129394531, -0.09463024139404297, -0.09152603149414062, -0.08842182159423828, -0.08531761169433594, -0.0822134017944336, -0.07910919189453125, -0.0760049819946289, -0.07290077209472656, -0.06979656219482422, -0.06669235229492188, -0.06358814239501953, -0.06048393249511719, -0.057379722595214844, -0.0542755126953125, -0.051171302795410156, -0.04806709289550781, -0.04496288299560547, -0.041858673095703125, -0.03875446319580078, -0.03565025329589844, -0.032546043395996094, -0.02944183349609375, -0.026337623596191406, -0.023233413696289062, -0.02012920379638672, -0.017024993896484375, -0.013920783996582031, -0.010816574096679688, -0.007712364196777344, -0.004608154296875, -0.0015039443969726562, 0.0016002655029296875, 0.004704475402832031, 0.007808685302734375, 0.010912895202636719, 0.014017105102539062, 0.017121315002441406, 0.02022552490234375, 0.023329734802246094, 0.026433944702148438, 0.02953815460205078, 0.032642364501953125, 0.03574657440185547, 0.03885078430175781, 0.041954994201660156, 0.0450592041015625, 0.048163414001464844, 0.05126762390136719, 0.05437183380126953, 0.057476043701171875, 0.06058025360107422, 0.06368446350097656, 0.0667886734008789, 0.06989288330078125, 0.0729970932006836, 0.07610130310058594, 0.07920551300048828, 0.08230972290039062, 0.08541393280029297, 0.08851814270019531, 0.09162235260009766, 0.0947265625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 4.0, 6.0, 16.0, 20.0, 30.0, 30.0, 47.0, 71.0, 73.0, 105.0, 162.0, 269.0, 387.0, 693.0, 1213.0, 2525.0, 7550.0, 44504.0, 3855720.0, 255311.0, 16880.0, 4449.0, 1724.0, 903.0, 563.0, 314.0, 219.0, 124.0, 110.0, 69.0, 46.0, 40.0, 34.0, 21.0, 11.0, 12.0, 8.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.388916015625, -0.375396728515625, -0.36187744140625, -0.348358154296875, -0.3348388671875, -0.321319580078125, -0.30780029296875, -0.294281005859375, -0.28076171875, -0.267242431640625, -0.25372314453125, -0.240203857421875, -0.2266845703125, -0.213165283203125, -0.19964599609375, -0.186126708984375, -0.172607421875, -0.159088134765625, -0.14556884765625, -0.132049560546875, -0.1185302734375, -0.105010986328125, -0.09149169921875, -0.077972412109375, -0.064453125, -0.050933837890625, -0.03741455078125, -0.023895263671875, -0.0103759765625, 0.003143310546875, 0.01666259765625, 0.030181884765625, 0.043701171875, 0.057220458984375, 0.07073974609375, 0.084259033203125, 0.0977783203125, 0.111297607421875, 0.12481689453125, 0.138336181640625, 0.15185546875, 0.165374755859375, 0.17889404296875, 0.192413330078125, 0.2059326171875, 0.219451904296875, 0.23297119140625, 0.246490478515625, 0.260009765625, 0.273529052734375, 0.28704833984375, 0.300567626953125, 0.3140869140625, 0.327606201171875, 0.34112548828125, 0.354644775390625, 0.3681640625, 0.381683349609375, 0.39520263671875, 0.408721923828125, 0.4222412109375, 0.435760498046875, 0.44927978515625, 0.462799072265625, 0.476318359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 7.0, 7.0, 21.0, 37.0, 173.0, 3066.0, 615.0, 80.0, 27.0, 16.0, 11.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322265625, -0.31180572509765625, -0.3013458251953125, -0.29088592529296875, -0.280426025390625, -0.26996612548828125, -0.2595062255859375, -0.24904632568359375, -0.23858642578125, -0.22812652587890625, -0.2176666259765625, -0.20720672607421875, -0.196746826171875, -0.18628692626953125, -0.1758270263671875, -0.16536712646484375, -0.1549072265625, -0.14444732666015625, -0.1339874267578125, -0.12352752685546875, -0.113067626953125, -0.10260772705078125, -0.0921478271484375, -0.08168792724609375, -0.07122802734375, -0.06076812744140625, -0.0503082275390625, -0.03984832763671875, -0.029388427734375, -0.01892852783203125, -0.0084686279296875, 0.00199127197265625, 0.012451171875, 0.02291107177734375, 0.0333709716796875, 0.04383087158203125, 0.054290771484375, 0.06475067138671875, 0.0752105712890625, 0.08567047119140625, 0.09613037109375, 0.10659027099609375, 0.1170501708984375, 0.12751007080078125, 0.137969970703125, 0.14842987060546875, 0.1588897705078125, 0.16934967041015625, 0.1798095703125, 0.19026947021484375, 0.2007293701171875, 0.21118927001953125, 0.221649169921875, 0.23210906982421875, 0.2425689697265625, 0.25302886962890625, 0.26348876953125, 0.27394866943359375, 0.2844085693359375, 0.29486846923828125, 0.305328369140625, 0.31578826904296875, 0.3262481689453125, 0.33670806884765625, 0.34716796875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 10.0, 7.0, 19.0, 25.0, 39.0, 52.0, 99.0, 143.0, 172.0, 144.0, 123.0, 68.0, 36.0, 17.0, 11.0, 12.0, 3.0, 3.0, 3.0, 0.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.7999388575553894, -0.7821212410926819, -0.7643036246299744, -0.7464860081672668, -0.7286684513092041, -0.7108508348464966, -0.6930332183837891, -0.6752156019210815, -0.657397985458374, -0.6395803689956665, -0.621762752532959, -0.6039451360702515, -0.586127519607544, -0.5683099627494812, -0.5504923462867737, -0.5326747298240662, -0.5148571133613586, -0.4970394968986511, -0.4792218804359436, -0.46140429377555847, -0.44358667731285095, -0.42576906085014343, -0.4079514741897583, -0.3901338577270508, -0.37231624126434326, -0.35449862480163574, -0.3366810083389282, -0.3188634216785431, -0.30104580521583557, -0.28322818875312805, -0.2654106020927429, -0.2475929856300354, -0.2297753095626831, -0.21195769309997559, -0.19414009153842926, -0.17632248997688293, -0.15850487351417542, -0.1406872570514679, -0.12286965548992157, -0.10505204647779465, -0.08723443746566772, -0.0694168284535408, -0.05159921944141388, -0.03378161042928696, -0.015964001417160034, 0.0018536075949668884, 0.01967121660709381, 0.037488825619220734, 0.055306434631347656, 0.07312404364347458, 0.0909416526556015, 0.10875926166772842, 0.12657687067985535, 0.14439448714256287, 0.1622120887041092, 0.18002969026565552, 0.19784730672836304, 0.21566492319107056, 0.23348252475261688, 0.2513001263141632, 0.2691177427768707, 0.28693535923957825, 0.3047529458999634, 0.3225705623626709, 0.3403881788253784]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 9.0, 7.0, 17.0, 17.0, 27.0, 20.0, 39.0, 35.0, 53.0, 51.0, 65.0, 59.0, 57.0, 57.0, 77.0, 67.0, 53.0, 46.0, 40.0, 34.0, 35.0, 24.0, 24.0, 20.0, 21.0, 14.0, 16.0, 2.0, 6.0, 3.0, 3.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4931862950325012, -0.4745917022228241, -0.45599713921546936, -0.43740254640579224, -0.4188079833984375, -0.4002133905887604, -0.38161879777908325, -0.3630242347717285, -0.3444296419620514, -0.32583504915237427, -0.30724048614501953, -0.2886458933353424, -0.2700513005256653, -0.25145673751831055, -0.23286214470863342, -0.2142675668001175, -0.19567298889160156, -0.17707841098308563, -0.1584838330745697, -0.13988924026489258, -0.12129466235637665, -0.10270008444786072, -0.08410549908876419, -0.06551091372966766, -0.04691633582115173, -0.028321754187345505, -0.009727172553539276, 0.008867409080266953, 0.02746199071407318, 0.04605656862258911, 0.06465115398168564, 0.08324573934078217, 0.1018403172492981, 0.12043489515781403, 0.13902947306632996, 0.15762406587600708, 0.176218643784523, 0.19481322169303894, 0.21340781450271606, 0.232002392411232, 0.2505969703197479, 0.26919156312942505, 0.2877861261367798, 0.3063807189464569, 0.32497531175613403, 0.34356987476348877, 0.3621644675731659, 0.380759060382843, 0.39935362339019775, 0.4179482161998749, 0.4365427792072296, 0.45513737201690674, 0.4737319350242615, 0.4923265278339386, 0.5109211206436157, 0.5295156836509705, 0.5481102466583252, 0.5667048096656799, 0.5852994322776794, 0.6038939952850342, 0.6224885582923889, 0.6410831212997437, 0.6596777439117432, 0.6782723069190979, 0.6968669295310974]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 6.0, 6.0, 12.0, 20.0, 27.0, 54.0, 66.0, 124.0, 219.0, 470.0, 1084.0, 3153.0, 15151.0, 150078.0, 780443.0, 83253.0, 10291.0, 2371.0, 873.0, 364.0, 213.0, 102.0, 70.0, 36.0, 22.0, 14.0, 13.0, 7.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4668159484863281, -0.45145416259765625, -0.4360923767089844, -0.4207305908203125, -0.4053688049316406, -0.39000701904296875, -0.3746452331542969, -0.359283447265625, -0.3439216613769531, -0.32855987548828125, -0.3131980895996094, -0.2978363037109375, -0.2824745178222656, -0.26711273193359375, -0.2517509460449219, -0.23638916015625, -0.22102737426757812, -0.20566558837890625, -0.19030380249023438, -0.1749420166015625, -0.15958023071289062, -0.14421844482421875, -0.12885665893554688, -0.113494873046875, -0.09813308715820312, -0.08277130126953125, -0.06740951538085938, -0.0520477294921875, -0.036685943603515625, -0.02132415771484375, -0.005962371826171875, 0.0093994140625, 0.024761199951171875, 0.04012298583984375, 0.055484771728515625, 0.0708465576171875, 0.08620834350585938, 0.10157012939453125, 0.11693191528320312, 0.132293701171875, 0.14765548706054688, 0.16301727294921875, 0.17837905883789062, 0.1937408447265625, 0.20910263061523438, 0.22446441650390625, 0.23982620239257812, 0.25518798828125, 0.2705497741699219, 0.28591156005859375, 0.3012733459472656, 0.3166351318359375, 0.3319969177246094, 0.34735870361328125, 0.3627204895019531, 0.378082275390625, 0.3934440612792969, 0.40880584716796875, 0.4241676330566406, 0.4395294189453125, 0.4548912048339844, 0.47025299072265625, 0.4856147766113281, 0.5009765625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 13.0, 16.0, 21.0, 41.0, 58.0, 73.0, 108.0, 99.0, 112.0, 97.0, 80.0, 68.0, 56.0, 45.0, 36.0, 30.0, 17.0, 11.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1090087890625, -0.10567378997802734, -0.10233879089355469, -0.09900379180908203, -0.09566879272460938, -0.09233379364013672, -0.08899879455566406, -0.0856637954711914, -0.08232879638671875, -0.0789937973022461, -0.07565879821777344, -0.07232379913330078, -0.06898880004882812, -0.06565380096435547, -0.06231880187988281, -0.058983802795410156, -0.0556488037109375, -0.052313804626464844, -0.04897880554199219, -0.04564380645751953, -0.042308807373046875, -0.03897380828857422, -0.03563880920410156, -0.032303810119628906, -0.02896881103515625, -0.025633811950683594, -0.022298812866210938, -0.01896381378173828, -0.015628814697265625, -0.012293815612792969, -0.008958816528320312, -0.005623817443847656, -0.002288818359375, 0.0010461807250976562, 0.0043811798095703125, 0.007716178894042969, 0.011051177978515625, 0.014386177062988281, 0.017721176147460938, 0.021056175231933594, 0.02439117431640625, 0.027726173400878906, 0.031061172485351562, 0.03439617156982422, 0.037731170654296875, 0.04106616973876953, 0.04440116882324219, 0.047736167907714844, 0.0510711669921875, 0.054406166076660156, 0.05774116516113281, 0.06107616424560547, 0.06441116333007812, 0.06774616241455078, 0.07108116149902344, 0.0744161605834961, 0.07775115966796875, 0.0810861587524414, 0.08442115783691406, 0.08775615692138672, 0.09109115600585938, 0.09442615509033203, 0.09776115417480469, 0.10109615325927734, 0.10443115234375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 5.0, 11.0, 5.0, 13.0, 21.0, 17.0, 25.0, 40.0, 48.0, 97.0, 146.0, 199.0, 373.0, 705.0, 1532.0, 3224.0, 9062.0, 39620.0, 451851.0, 484211.0, 41631.0, 9288.0, 3253.0, 1441.0, 717.0, 367.0, 220.0, 132.0, 100.0, 49.0, 40.0, 32.0, 22.0, 13.0, 8.0, 8.0, 9.0, 4.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.423095703125, -0.4110107421875, -0.39892578125, -0.3868408203125, -0.374755859375, -0.3626708984375, -0.3505859375, -0.3385009765625, -0.326416015625, -0.3143310546875, -0.30224609375, -0.2901611328125, -0.278076171875, -0.2659912109375, -0.25390625, -0.2418212890625, -0.229736328125, -0.2176513671875, -0.20556640625, -0.1934814453125, -0.181396484375, -0.1693115234375, -0.1572265625, -0.1451416015625, -0.133056640625, -0.1209716796875, -0.10888671875, -0.0968017578125, -0.084716796875, -0.0726318359375, -0.060546875, -0.0484619140625, -0.036376953125, -0.0242919921875, -0.01220703125, -0.0001220703125, 0.011962890625, 0.0240478515625, 0.0361328125, 0.0482177734375, 0.060302734375, 0.0723876953125, 0.08447265625, 0.0965576171875, 0.108642578125, 0.1207275390625, 0.1328125, 0.1448974609375, 0.156982421875, 0.1690673828125, 0.18115234375, 0.1932373046875, 0.205322265625, 0.2174072265625, 0.2294921875, 0.2415771484375, 0.253662109375, 0.2657470703125, 0.27783203125, 0.2899169921875, 0.302001953125, 0.3140869140625, 0.326171875, 0.3382568359375, 0.350341796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 4.0, 1.0, 9.0, 15.0, 6.0, 17.0, 16.0, 24.0, 22.0, 41.0, 36.0, 44.0, 80.0, 55.0, 56.0, 61.0, 67.0, 63.0, 65.0, 54.0, 46.0, 40.0, 35.0, 32.0, 26.0, 14.0, 18.0, 12.0, 7.0, 2.0, 3.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.384521484375, -0.372802734375, -0.361083984375, -0.349365234375, -0.337646484375, -0.325927734375, -0.314208984375, -0.302490234375, -0.290771484375, -0.279052734375, -0.267333984375, -0.255615234375, -0.243896484375, -0.232177734375, -0.220458984375, -0.208740234375, -0.197021484375, -0.185302734375, -0.173583984375, -0.161865234375, -0.150146484375, -0.138427734375, -0.126708984375, -0.114990234375, -0.103271484375, -0.091552734375, -0.079833984375, -0.068115234375, -0.056396484375, -0.044677734375, -0.032958984375, -0.021240234375, -0.009521484375, 0.002197265625, 0.013916015625, 0.025634765625, 0.037353515625, 0.049072265625, 0.060791015625, 0.072509765625, 0.084228515625, 0.095947265625, 0.107666015625, 0.119384765625, 0.131103515625, 0.142822265625, 0.154541015625, 0.166259765625, 0.177978515625, 0.189697265625, 0.201416015625, 0.213134765625, 0.224853515625, 0.236572265625, 0.248291015625, 0.260009765625, 0.271728515625, 0.283447265625, 0.295166015625, 0.306884765625, 0.318603515625, 0.330322265625, 0.342041015625, 0.353759765625, 0.365478515625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 4.0, 3.0, 10.0, 11.0, 13.0, 22.0, 29.0, 52.0, 53.0, 84.0, 135.0, 211.0, 337.0, 673.0, 1321.0, 3301.0, 13476.0, 752050.0, 261560.0, 9687.0, 2841.0, 1217.0, 585.0, 306.0, 178.0, 129.0, 78.0, 44.0, 49.0, 38.0, 21.0, 15.0, 15.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.441650390625, -0.42862701416015625, -0.4156036376953125, -0.40258026123046875, -0.389556884765625, -0.37653350830078125, -0.3635101318359375, -0.35048675537109375, -0.33746337890625, -0.32444000244140625, -0.3114166259765625, -0.29839324951171875, -0.285369873046875, -0.27234649658203125, -0.2593231201171875, -0.24629974365234375, -0.2332763671875, -0.22025299072265625, -0.2072296142578125, -0.19420623779296875, -0.181182861328125, -0.16815948486328125, -0.1551361083984375, -0.14211273193359375, -0.12908935546875, -0.11606597900390625, -0.1030426025390625, -0.09001922607421875, -0.076995849609375, -0.06397247314453125, -0.0509490966796875, -0.03792572021484375, -0.02490234375, -0.01187896728515625, 0.0011444091796875, 0.01416778564453125, 0.027191162109375, 0.04021453857421875, 0.0532379150390625, 0.06626129150390625, 0.07928466796875, 0.09230804443359375, 0.1053314208984375, 0.11835479736328125, 0.131378173828125, 0.14440155029296875, 0.1574249267578125, 0.17044830322265625, 0.1834716796875, 0.19649505615234375, 0.2095184326171875, 0.22254180908203125, 0.235565185546875, 0.24858856201171875, 0.2616119384765625, 0.27463531494140625, 0.28765869140625, 0.30068206787109375, 0.3137054443359375, 0.32672882080078125, 0.339752197265625, 0.35277557373046875, 0.3657989501953125, 0.37882232666015625, 0.391845703125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 5.0, 10.0, 16.0, 17.0, 36.0, 48.0, 55.0, 70.0, 131.0, 137.0, 125.0, 101.0, 64.0, 42.0, 39.0, 30.0, 19.0, 18.0, 6.0, 5.0, 6.0, 9.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015151500701904297, -0.00014660321176052094, -0.0001416914165019989, -0.00013677962124347687, -0.00013186782598495483, -0.0001269560307264328, -0.00012204423546791077, -0.00011713244020938873, -0.0001122206449508667, -0.00010730884969234467, -0.00010239705443382263, -9.74852591753006e-05, -9.257346391677856e-05, -8.766166865825653e-05, -8.27498733997345e-05, -7.783807814121246e-05, -7.292628288269043e-05, -6.80144876241684e-05, -6.310269236564636e-05, -5.819089710712433e-05, -5.3279101848602295e-05, -4.836730659008026e-05, -4.345551133155823e-05, -3.8543716073036194e-05, -3.363192081451416e-05, -2.8720125555992126e-05, -2.3808330297470093e-05, -1.889653503894806e-05, -1.3984739780426025e-05, -9.072944521903992e-06, -4.161149263381958e-06, 7.506459951400757e-07, 5.662441253662109e-06, 1.0574236512184143e-05, 1.5486031770706177e-05, 2.039782702922821e-05, 2.5309622287750244e-05, 3.0221417546272278e-05, 3.513321280479431e-05, 4.0045008063316345e-05, 4.495680332183838e-05, 4.986859858036041e-05, 5.4780393838882446e-05, 5.969218909740448e-05, 6.460398435592651e-05, 6.951577961444855e-05, 7.442757487297058e-05, 7.933937013149261e-05, 8.425116539001465e-05, 8.916296064853668e-05, 9.407475590705872e-05, 9.898655116558075e-05, 0.00010389834642410278, 0.00010881014168262482, 0.00011372193694114685, 0.00011863373219966888, 0.00012354552745819092, 0.00012845732271671295, 0.00013336911797523499, 0.00013828091323375702, 0.00014319270849227905, 0.00014810450375080109, 0.00015301629900932312, 0.00015792809426784515, 0.0001628398895263672]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 11.0, 22.0, 23.0, 73.0, 154.0, 411.0, 1543.0, 22925.0, 1011717.0, 9942.0, 1105.0, 352.0, 137.0, 64.0, 25.0, 11.0, 6.0, 4.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7578125, -0.7344207763671875, -0.711029052734375, -0.6876373291015625, -0.66424560546875, -0.6408538818359375, -0.617462158203125, -0.5940704345703125, -0.5706787109375, -0.5472869873046875, -0.523895263671875, -0.5005035400390625, -0.47711181640625, -0.4537200927734375, -0.430328369140625, -0.4069366455078125, -0.383544921875, -0.3601531982421875, -0.336761474609375, -0.3133697509765625, -0.28997802734375, -0.2665863037109375, -0.243194580078125, -0.2198028564453125, -0.1964111328125, -0.1730194091796875, -0.149627685546875, -0.1262359619140625, -0.10284423828125, -0.0794525146484375, -0.056060791015625, -0.0326690673828125, -0.00927734375, 0.0141143798828125, 0.037506103515625, 0.0608978271484375, 0.08428955078125, 0.1076812744140625, 0.131072998046875, 0.1544647216796875, 0.1778564453125, 0.2012481689453125, 0.224639892578125, 0.2480316162109375, 0.27142333984375, 0.2948150634765625, 0.318206787109375, 0.3415985107421875, 0.364990234375, 0.3883819580078125, 0.411773681640625, 0.4351654052734375, 0.45855712890625, 0.4819488525390625, 0.505340576171875, 0.5287322998046875, 0.5521240234375, 0.5755157470703125, 0.598907470703125, 0.6222991943359375, 0.64569091796875, 0.6690826416015625, 0.692474365234375, 0.7158660888671875, 0.7392578125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 10.0, 10.0, 15.0, 46.0, 141.0, 512.0, 169.0, 45.0, 23.0, 9.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.5220947265625, -0.495361328125, -0.4686279296875, -0.44189453125, -0.4151611328125, -0.388427734375, -0.3616943359375, -0.3349609375, -0.3082275390625, -0.281494140625, -0.2547607421875, -0.22802734375, -0.2012939453125, -0.174560546875, -0.1478271484375, -0.12109375, -0.0943603515625, -0.067626953125, -0.0408935546875, -0.01416015625, 0.0125732421875, 0.039306640625, 0.0660400390625, 0.0927734375, 0.1195068359375, 0.146240234375, 0.1729736328125, 0.19970703125, 0.2264404296875, 0.253173828125, 0.2799072265625, 0.306640625, 0.3333740234375, 0.360107421875, 0.3868408203125, 0.41357421875, 0.4403076171875, 0.467041015625, 0.4937744140625, 0.5205078125, 0.5472412109375, 0.573974609375, 0.6007080078125, 0.62744140625, 0.6541748046875, 0.680908203125, 0.7076416015625, 0.734375, 0.7611083984375, 0.787841796875, 0.8145751953125, 0.84130859375, 0.8680419921875, 0.894775390625, 0.9215087890625, 0.9482421875, 0.9749755859375, 1.001708984375, 1.0284423828125, 1.05517578125, 1.0819091796875, 1.108642578125, 1.1353759765625, 1.162109375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 5.0, 9.0, 17.0, 29.0, 59.0, 118.0, 194.0, 235.0, 176.0, 83.0, 36.0, 15.0, 8.0, 9.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.157985687255859, -4.037571430206299, -3.917156934738159, -3.7967426776885986, -3.676328182220459, -3.5559139251708984, -3.435499429702759, -3.3150851726531982, -3.1946706771850586, -3.074256420135498, -2.9538419246673584, -2.833427667617798, -2.713013172149658, -2.5925989151000977, -2.472184419631958, -2.3517701625823975, -2.231355667114258, -2.1109414100646973, -1.9905269145965576, -1.8701125383377075, -1.7496981620788574, -1.6292839050292969, -1.5088694095611572, -1.3884551525115967, -1.2680408954620361, -1.147626519203186, -1.027212142944336, -0.9067977666854858, -0.7863833904266357, -0.6659690737724304, -0.5455546975135803, -0.4251403212547302, -0.30472588539123535, -0.18431150913238525, -0.06389714777469635, 0.056517213582992554, 0.17693158984184265, 0.29734593629837036, 0.41776031255722046, 0.5381746888160706, 0.6585890650749207, 0.7790034413337708, 0.8994178175926208, 1.0198321342468262, 1.1402465105056763, 1.2606608867645264, 1.3810752630233765, 1.5014896392822266, 1.6219040155410767, 1.7423183917999268, 1.8627327680587769, 1.983147144317627, 2.1035614013671875, 2.223975896835327, 2.3443901538848877, 2.4648046493530273, 2.585218906402588, 2.7056331634521484, 2.826047658920288, 2.9464619159698486, 3.0668764114379883, 3.187290668487549, 3.3077051639556885, 3.428119421005249, 3.5485339164733887]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 1.0, 6.0, 9.0, 6.0, 4.0, 8.0, 13.0, 17.0, 20.0, 18.0, 28.0, 34.0, 45.0, 45.0, 41.0, 59.0, 45.0, 53.0, 53.0, 53.0, 44.0, 48.0, 41.0, 54.0, 43.0, 32.0, 27.0, 34.0, 24.0, 23.0, 20.0, 18.0, 13.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.561328887939453, -2.4870734214782715, -2.41281795501709, -2.338562488555908, -2.2643070220947266, -2.190051555633545, -2.1157960891723633, -2.0415403842926025, -1.967284917831421, -1.8930294513702393, -1.8187739849090576, -1.744518518447876, -1.6702629327774048, -1.5960074663162231, -1.5217519998550415, -1.4474964141845703, -1.3732410669326782, -1.2989856004714966, -1.224730134010315, -1.1504745483398438, -1.076219081878662, -1.0019636154174805, -0.9277081489562988, -0.8534526228904724, -0.7791971564292908, -0.7049416899681091, -0.6306861639022827, -0.5564306974411011, -0.48217520117759705, -0.407919704914093, -0.3336642384529114, -0.25940871238708496, -0.18515324592590332, -0.11089775711297989, -0.03664226830005646, 0.03761321306228638, 0.1118687093257904, 0.18612420558929443, 0.2603796720504761, 0.3346351981163025, 0.40889066457748413, 0.48314616084098816, 0.5574016571044922, 0.6316571235656738, 0.7059125900268555, 0.7801681160926819, 0.8544235825538635, 0.9286791086196899, 1.0029345750808716, 1.0771900415420532, 1.1514455080032349, 1.225701093673706, 1.2999565601348877, 1.3742120265960693, 1.448467493057251, 1.5227229595184326, 1.5969784259796143, 1.671233892440796, 1.7454893589019775, 1.8197448253631592, 1.8940004110336304, 1.968255877494812, 2.042511463165283, 2.116766929626465, 2.1910223960876465]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 13.0, 11.0, 22.0, 17.0, 38.0, 58.0, 104.0, 185.0, 234.0, 486.0, 909.0, 1835.0, 4201.0, 11720.0, 50951.0, 2982629.0, 1078251.0, 43814.0, 10908.0, 4004.0, 1767.0, 919.0, 490.0, 280.0, 170.0, 85.0, 53.0, 37.0, 24.0, 19.0, 8.0, 7.0, 11.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.269287109375, -0.2596549987792969, -0.25002288818359375, -0.24039077758789062, -0.2307586669921875, -0.22112655639648438, -0.21149444580078125, -0.20186233520507812, -0.192230224609375, -0.18259811401367188, -0.17296600341796875, -0.16333389282226562, -0.1537017822265625, -0.14406967163085938, -0.13443756103515625, -0.12480545043945312, -0.11517333984375, -0.10554122924804688, -0.09590911865234375, -0.08627700805664062, -0.0766448974609375, -0.06701278686523438, -0.05738067626953125, -0.047748565673828125, -0.038116455078125, -0.028484344482421875, -0.01885223388671875, -0.009220123291015625, 0.0004119873046875, 0.010044097900390625, 0.01967620849609375, 0.029308319091796875, 0.0389404296875, 0.048572540283203125, 0.05820465087890625, 0.06783676147460938, 0.0774688720703125, 0.08710098266601562, 0.09673309326171875, 0.10636520385742188, 0.115997314453125, 0.12562942504882812, 0.13526153564453125, 0.14489364624023438, 0.1545257568359375, 0.16415786743164062, 0.17378997802734375, 0.18342208862304688, 0.19305419921875, 0.20268630981445312, 0.21231842041015625, 0.22195053100585938, 0.2315826416015625, 0.24121475219726562, 0.25084686279296875, 0.2604789733886719, 0.270111083984375, 0.2797431945800781, 0.28937530517578125, 0.2990074157714844, 0.3086395263671875, 0.3182716369628906, 0.32790374755859375, 0.3375358581542969, 0.34716796875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 15.0, 7.0, 11.0, 16.0, 20.0, 30.0, 42.0, 50.0, 67.0, 72.0, 72.0, 79.0, 84.0, 74.0, 87.0, 53.0, 49.0, 40.0, 30.0, 26.0, 27.0, 18.0, 13.0, 10.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10955810546875, -0.10634708404541016, -0.10313606262207031, -0.09992504119873047, -0.09671401977539062, -0.09350299835205078, -0.09029197692871094, -0.0870809555053711, -0.08386993408203125, -0.0806589126586914, -0.07744789123535156, -0.07423686981201172, -0.07102584838867188, -0.06781482696533203, -0.06460380554199219, -0.061392784118652344, -0.0581817626953125, -0.054970741271972656, -0.05175971984863281, -0.04854869842529297, -0.045337677001953125, -0.04212665557861328, -0.03891563415527344, -0.035704612731933594, -0.03249359130859375, -0.029282569885253906, -0.026071548461914062, -0.02286052703857422, -0.019649505615234375, -0.01643848419189453, -0.013227462768554688, -0.010016441345214844, -0.006805419921875, -0.0035943984985351562, -0.0003833770751953125, 0.0028276443481445312, 0.006038665771484375, 0.009249687194824219, 0.012460708618164062, 0.015671730041503906, 0.01888275146484375, 0.022093772888183594, 0.025304794311523438, 0.02851581573486328, 0.031726837158203125, 0.03493785858154297, 0.03814888000488281, 0.041359901428222656, 0.0445709228515625, 0.047781944274902344, 0.05099296569824219, 0.05420398712158203, 0.057415008544921875, 0.06062602996826172, 0.06383705139160156, 0.0670480728149414, 0.07025909423828125, 0.0734701156616211, 0.07668113708496094, 0.07989215850830078, 0.08310317993164062, 0.08631420135498047, 0.08952522277832031, 0.09273624420166016, 0.095947265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 10.0, 10.0, 7.0, 22.0, 25.0, 27.0, 68.0, 107.0, 172.0, 297.0, 460.0, 884.0, 1654.0, 3581.0, 11512.0, 94162.0, 3877589.0, 179242.0, 15842.0, 4316.0, 1891.0, 1049.0, 549.0, 319.0, 165.0, 101.0, 73.0, 33.0, 47.0, 18.0, 10.0, 15.0, 9.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.476318359375, -0.4625511169433594, -0.44878387451171875, -0.4350166320800781, -0.4212493896484375, -0.4074821472167969, -0.39371490478515625, -0.3799476623535156, -0.366180419921875, -0.3524131774902344, -0.33864593505859375, -0.3248786926269531, -0.3111114501953125, -0.2973442077636719, -0.28357696533203125, -0.2698097229003906, -0.25604248046875, -0.24227523803710938, -0.22850799560546875, -0.21474075317382812, -0.2009735107421875, -0.18720626831054688, -0.17343902587890625, -0.15967178344726562, -0.145904541015625, -0.13213729858398438, -0.11837005615234375, -0.10460281372070312, -0.0908355712890625, -0.07706832885742188, -0.06330108642578125, -0.049533843994140625, -0.0357666015625, -0.021999359130859375, -0.00823211669921875, 0.005535125732421875, 0.0193023681640625, 0.033069610595703125, 0.04683685302734375, 0.060604095458984375, 0.074371337890625, 0.08813858032226562, 0.10190582275390625, 0.11567306518554688, 0.1294403076171875, 0.14320755004882812, 0.15697479248046875, 0.17074203491210938, 0.18450927734375, 0.19827651977539062, 0.21204376220703125, 0.22581100463867188, 0.2395782470703125, 0.2533454895019531, 0.26711273193359375, 0.2808799743652344, 0.294647216796875, 0.3084144592285156, 0.32218170166015625, 0.3359489440917969, 0.3497161865234375, 0.3634834289550781, 0.37725067138671875, 0.3910179138183594, 0.40478515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 15.0, 14.0, 42.0, 130.0, 510.0, 2775.0, 397.0, 108.0, 24.0, 18.0, 6.0, 5.0, 8.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.431640625, -0.42170143127441406, -0.4117622375488281, -0.4018230438232422, -0.39188385009765625, -0.3819446563720703, -0.3720054626464844, -0.36206626892089844, -0.3521270751953125, -0.34218788146972656, -0.3322486877441406, -0.3223094940185547, -0.31237030029296875, -0.3024311065673828, -0.2924919128417969, -0.28255271911621094, -0.272613525390625, -0.26267433166503906, -0.2527351379394531, -0.2427959442138672, -0.23285675048828125, -0.2229175567626953, -0.21297836303710938, -0.20303916931152344, -0.1930999755859375, -0.18316078186035156, -0.17322158813476562, -0.1632823944091797, -0.15334320068359375, -0.1434040069580078, -0.13346481323242188, -0.12352561950683594, -0.11358642578125, -0.10364723205566406, -0.09370803833007812, -0.08376884460449219, -0.07382965087890625, -0.06389045715332031, -0.053951263427734375, -0.04401206970214844, -0.0340728759765625, -0.024133682250976562, -0.014194488525390625, -0.0042552947998046875, 0.00568389892578125, 0.015623092651367188, 0.025562286376953125, 0.03550148010253906, 0.045440673828125, 0.05537986755371094, 0.06531906127929688, 0.07525825500488281, 0.08519744873046875, 0.09513664245605469, 0.10507583618164062, 0.11501502990722656, 0.1249542236328125, 0.13489341735839844, 0.14483261108398438, 0.1547718048095703, 0.16471099853515625, 0.1746501922607422, 0.18458938598632812, 0.19452857971191406, 0.2044677734375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 16.0, 100.0, 348.0, 442.0, 79.0, 14.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.101809024810791, -4.994061470031738, -4.8863139152526855, -4.778566360473633, -4.670818328857422, -4.563070774078369, -4.455323219299316, -4.347575664520264, -4.239828109741211, -4.132080554962158, -4.0243330001831055, -3.9165852069854736, -3.808837652206421, -3.701089859008789, -3.5933423042297363, -3.4855947494506836, -3.3778469562530518, -3.270099401473999, -3.162351608276367, -3.0546040534973145, -2.9468564987182617, -2.839108943939209, -2.731361150741577, -2.6236135959625244, -2.5158658027648926, -2.40811824798584, -2.300370454788208, -2.1926229000091553, -2.0848753452301025, -1.9771276712417603, -1.869379997253418, -1.7616324424743652, -1.6538846492767334, -1.5461369752883911, -1.4383894205093384, -1.330641746520996, -1.2228941917419434, -1.115146517753601, -1.0073988437652588, -0.8996512293815613, -0.7919036149978638, -0.6841560006141663, -0.5764083862304688, -0.46866071224212646, -0.36091309785842896, -0.25316548347473145, -0.14541780948638916, -0.03767019510269165, 0.07007741928100586, 0.17782504856586456, 0.28557267785072327, 0.39332032203674316, 0.5010679364204407, 0.6088155508041382, 0.7165632247924805, 0.824310839176178, 0.9320584535598755, 1.0398061275482178, 1.1475536823272705, 1.2553013563156128, 1.363049030303955, 1.4707965850830078, 1.57854425907135, 1.6862919330596924, 1.7940394878387451]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 8.0, 10.0, 7.0, 11.0, 11.0, 13.0, 13.0, 18.0, 21.0, 18.0, 20.0, 28.0, 32.0, 44.0, 49.0, 45.0, 50.0, 43.0, 39.0, 46.0, 41.0, 46.0, 51.0, 43.0, 35.0, 27.0, 34.0, 31.0, 29.0, 23.0, 26.0, 13.0, 24.0, 12.0, 11.0, 5.0, 7.0, 8.0, 6.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0], "bins": [-0.8993347883224487, -0.8758382797241211, -0.8523417711257935, -0.8288452625274658, -0.8053486943244934, -0.7818521857261658, -0.7583556771278381, -0.7348591685295105, -0.7113626003265381, -0.6878660917282104, -0.6643695831298828, -0.6408730745315552, -0.6173765063285828, -0.5938799977302551, -0.5703834891319275, -0.5468869805335999, -0.5233904719352722, -0.4998939633369446, -0.47639742493629456, -0.4529009163379669, -0.4294043779373169, -0.40590786933898926, -0.3824113607406616, -0.358914852142334, -0.33541831374168396, -0.3119218051433563, -0.2884252667427063, -0.26492875814437866, -0.24143223464488983, -0.217935711145401, -0.19443920254707336, -0.17094267904758453, -0.14744609594345093, -0.1239495724439621, -0.10045305639505386, -0.07695654034614563, -0.0534600168466568, -0.02996349334716797, -0.006466984748840332, 0.0170295387506485, 0.04052606225013733, 0.06402258574962616, 0.0875191017985344, 0.11101561784744263, 0.13451214134693146, 0.1580086648464203, 0.18150517344474792, 0.20500169694423676, 0.22849822044372559, 0.2519947290420532, 0.27549126744270325, 0.2989877760410309, 0.3224843144416809, 0.34598082304000854, 0.3694773316383362, 0.3929738402366638, 0.41647037863731384, 0.4399668872356415, 0.4634634256362915, 0.48695993423461914, 0.5104564428329468, 0.5339529514312744, 0.557449460029602, 0.5809460282325745, 0.6044425368309021]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 4.0, 12.0, 19.0, 36.0, 43.0, 90.0, 137.0, 247.0, 442.0, 954.0, 2180.0, 6229.0, 23835.0, 146770.0, 653325.0, 175509.0, 27232.0, 6954.0, 2392.0, 1017.0, 494.0, 266.0, 145.0, 74.0, 48.0, 27.0, 20.0, 12.0, 9.0, 10.0, 7.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37890625, -0.365631103515625, -0.35235595703125, -0.339080810546875, -0.3258056640625, -0.312530517578125, -0.29925537109375, -0.285980224609375, -0.272705078125, -0.259429931640625, -0.24615478515625, -0.232879638671875, -0.2196044921875, -0.206329345703125, -0.19305419921875, -0.179779052734375, -0.16650390625, -0.153228759765625, -0.13995361328125, -0.126678466796875, -0.1134033203125, -0.100128173828125, -0.08685302734375, -0.073577880859375, -0.060302734375, -0.047027587890625, -0.03375244140625, -0.020477294921875, -0.0072021484375, 0.006072998046875, 0.01934814453125, 0.032623291015625, 0.0458984375, 0.059173583984375, 0.07244873046875, 0.085723876953125, 0.0989990234375, 0.112274169921875, 0.12554931640625, 0.138824462890625, 0.152099609375, 0.165374755859375, 0.17864990234375, 0.191925048828125, 0.2052001953125, 0.218475341796875, 0.23175048828125, 0.245025634765625, 0.25830078125, 0.271575927734375, 0.28485107421875, 0.298126220703125, 0.3114013671875, 0.324676513671875, 0.33795166015625, 0.351226806640625, 0.364501953125, 0.377777099609375, 0.39105224609375, 0.404327392578125, 0.4176025390625, 0.430877685546875, 0.44415283203125, 0.457427978515625, 0.470703125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 7.0, 8.0, 10.0, 13.0, 11.0, 20.0, 32.0, 34.0, 40.0, 51.0, 47.0, 69.0, 78.0, 56.0, 77.0, 69.0, 59.0, 54.0, 53.0, 46.0, 43.0, 24.0, 25.0, 16.0, 21.0, 10.0, 8.0, 13.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11181640625, -0.10854911804199219, -0.10528182983398438, -0.10201454162597656, -0.09874725341796875, -0.09547996520996094, -0.09221267700195312, -0.08894538879394531, -0.0856781005859375, -0.08241081237792969, -0.07914352416992188, -0.07587623596191406, -0.07260894775390625, -0.06934165954589844, -0.06607437133789062, -0.06280708312988281, -0.059539794921875, -0.05627250671386719, -0.053005218505859375, -0.04973793029785156, -0.04647064208984375, -0.04320335388183594, -0.039936065673828125, -0.03666877746582031, -0.0334014892578125, -0.030134201049804688, -0.026866912841796875, -0.023599624633789062, -0.02033233642578125, -0.017065048217773438, -0.013797760009765625, -0.010530471801757812, -0.00726318359375, -0.0039958953857421875, -0.000728607177734375, 0.0025386810302734375, 0.00580596923828125, 0.009073257446289062, 0.012340545654296875, 0.015607833862304688, 0.0188751220703125, 0.022142410278320312, 0.025409698486328125, 0.028676986694335938, 0.03194427490234375, 0.03521156311035156, 0.038478851318359375, 0.04174613952636719, 0.045013427734375, 0.04828071594238281, 0.051548004150390625, 0.05481529235839844, 0.05808258056640625, 0.06134986877441406, 0.06461715698242188, 0.06788444519042969, 0.0711517333984375, 0.07441902160644531, 0.07768630981445312, 0.08095359802246094, 0.08422088623046875, 0.08748817443847656, 0.09075546264648438, 0.09402275085449219, 0.0972900390625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 9.0, 7.0, 6.0, 7.0, 12.0, 15.0, 22.0, 47.0, 70.0, 87.0, 159.0, 247.0, 421.0, 787.0, 1874.0, 4854.0, 17872.0, 117831.0, 752276.0, 124993.0, 18097.0, 4956.0, 1930.0, 883.0, 435.0, 233.0, 133.0, 82.0, 58.0, 44.0, 37.0, 21.0, 17.0, 11.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 4.0, 2.0], "bins": [-0.66552734375, -0.6477851867675781, -0.6300430297851562, -0.6123008728027344, -0.5945587158203125, -0.5768165588378906, -0.5590744018554688, -0.5413322448730469, -0.523590087890625, -0.5058479309082031, -0.48810577392578125, -0.4703636169433594, -0.4526214599609375, -0.4348793029785156, -0.41713714599609375, -0.3993949890136719, -0.38165283203125, -0.3639106750488281, -0.34616851806640625, -0.3284263610839844, -0.3106842041015625, -0.2929420471191406, -0.27519989013671875, -0.2574577331542969, -0.239715576171875, -0.22197341918945312, -0.20423126220703125, -0.18648910522460938, -0.1687469482421875, -0.15100479125976562, -0.13326263427734375, -0.11552047729492188, -0.0977783203125, -0.08003616333007812, -0.06229400634765625, -0.044551849365234375, -0.0268096923828125, -0.009067535400390625, 0.00867462158203125, 0.026416778564453125, 0.044158935546875, 0.061901092529296875, 0.07964324951171875, 0.09738540649414062, 0.1151275634765625, 0.13286972045898438, 0.15061187744140625, 0.16835403442382812, 0.18609619140625, 0.20383834838867188, 0.22158050537109375, 0.23932266235351562, 0.2570648193359375, 0.2748069763183594, 0.29254913330078125, 0.3102912902832031, 0.328033447265625, 0.3457756042480469, 0.36351776123046875, 0.3812599182128906, 0.3990020751953125, 0.4167442321777344, 0.43448638916015625, 0.4522285461425781, 0.469970703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 10.0, 13.0, 16.0, 18.0, 29.0, 32.0, 44.0, 53.0, 47.0, 41.0, 53.0, 63.0, 55.0, 72.0, 46.0, 41.0, 56.0, 60.0, 43.0, 33.0, 36.0, 29.0, 26.0, 11.0, 7.0, 7.0, 7.0, 10.0, 10.0, 8.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6171875, -0.5978469848632812, -0.5785064697265625, -0.5591659545898438, -0.539825439453125, -0.5204849243164062, -0.5011444091796875, -0.48180389404296875, -0.46246337890625, -0.44312286376953125, -0.4237823486328125, -0.40444183349609375, -0.385101318359375, -0.36576080322265625, -0.3464202880859375, -0.32707977294921875, -0.3077392578125, -0.28839874267578125, -0.2690582275390625, -0.24971771240234375, -0.230377197265625, -0.21103668212890625, -0.1916961669921875, -0.17235565185546875, -0.15301513671875, -0.13367462158203125, -0.1143341064453125, -0.09499359130859375, -0.075653076171875, -0.05631256103515625, -0.0369720458984375, -0.01763153076171875, 0.001708984375, 0.02104949951171875, 0.0403900146484375, 0.05973052978515625, 0.079071044921875, 0.09841156005859375, 0.1177520751953125, 0.13709259033203125, 0.15643310546875, 0.17577362060546875, 0.1951141357421875, 0.21445465087890625, 0.233795166015625, 0.25313568115234375, 0.2724761962890625, 0.29181671142578125, 0.3111572265625, 0.33049774169921875, 0.3498382568359375, 0.36917877197265625, 0.388519287109375, 0.40785980224609375, 0.4272003173828125, 0.44654083251953125, 0.46588134765625, 0.48522186279296875, 0.5045623779296875, 0.5239028930664062, 0.543243408203125, 0.5625839233398438, 0.5819244384765625, 0.6012649536132812, 0.62060546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 4.0, 13.0, 13.0, 26.0, 33.0, 58.0, 117.0, 150.0, 313.0, 667.0, 1720.0, 6164.0, 49868.0, 813363.0, 159395.0, 12210.0, 2583.0, 888.0, 441.0, 205.0, 121.0, 65.0, 36.0, 48.0, 11.0, 13.0, 9.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.384765625, -0.37334442138671875, -0.3619232177734375, -0.35050201416015625, -0.339080810546875, -0.32765960693359375, -0.3162384033203125, -0.30481719970703125, -0.29339599609375, -0.28197479248046875, -0.2705535888671875, -0.25913238525390625, -0.247711181640625, -0.23628997802734375, -0.2248687744140625, -0.21344757080078125, -0.2020263671875, -0.19060516357421875, -0.1791839599609375, -0.16776275634765625, -0.156341552734375, -0.14492034912109375, -0.1334991455078125, -0.12207794189453125, -0.11065673828125, -0.09923553466796875, -0.0878143310546875, -0.07639312744140625, -0.064971923828125, -0.05355072021484375, -0.0421295166015625, -0.03070831298828125, -0.019287109375, -0.00786590576171875, 0.0035552978515625, 0.01497650146484375, 0.026397705078125, 0.03781890869140625, 0.0492401123046875, 0.06066131591796875, 0.07208251953125, 0.08350372314453125, 0.0949249267578125, 0.10634613037109375, 0.117767333984375, 0.12918853759765625, 0.1406097412109375, 0.15203094482421875, 0.1634521484375, 0.17487335205078125, 0.1862945556640625, 0.19771575927734375, 0.209136962890625, 0.22055816650390625, 0.2319793701171875, 0.24340057373046875, 0.25482177734375, 0.26624298095703125, 0.2776641845703125, 0.28908538818359375, 0.300506591796875, 0.31192779541015625, 0.3233489990234375, 0.33477020263671875, 0.34619140625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 11.0, 12.0, 19.0, 28.0, 24.0, 45.0, 59.0, 72.0, 87.0, 115.0, 92.0, 88.0, 88.0, 59.0, 56.0, 33.0, 28.0, 20.0, 15.0, 13.0, 5.0, 8.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.952617645263672e-05, -8.549727499485016e-05, -8.14683735370636e-05, -7.743947207927704e-05, -7.341057062149048e-05, -6.938166916370392e-05, -6.535276770591736e-05, -6.13238662481308e-05, -5.729496479034424e-05, -5.326606333255768e-05, -4.923716187477112e-05, -4.520826041698456e-05, -4.1179358959198e-05, -3.715045750141144e-05, -3.312155604362488e-05, -2.9092654585838318e-05, -2.5063753128051758e-05, -2.1034851670265198e-05, -1.7005950212478638e-05, -1.2977048754692078e-05, -8.948147296905518e-06, -4.9192458391189575e-06, -8.903443813323975e-07, 3.1385570764541626e-06, 7.167458534240723e-06, 1.1196359992027283e-05, 1.5225261449813843e-05, 1.9254162907600403e-05, 2.3283064365386963e-05, 2.7311965823173523e-05, 3.134086728096008e-05, 3.536976873874664e-05, 3.93986701965332e-05, 4.342757165431976e-05, 4.745647311210632e-05, 5.148537456989288e-05, 5.551427602767944e-05, 5.9543177485466003e-05, 6.357207894325256e-05, 6.760098040103912e-05, 7.162988185882568e-05, 7.565878331661224e-05, 7.96876847743988e-05, 8.371658623218536e-05, 8.774548768997192e-05, 9.177438914775848e-05, 9.580329060554504e-05, 9.98321920633316e-05, 0.00010386109352111816, 0.00010788999497890472, 0.00011191889643669128, 0.00011594779789447784, 0.0001199766993522644, 0.00012400560081005096, 0.00012803450226783752, 0.00013206340372562408, 0.00013609230518341064, 0.0001401212066411972, 0.00014415010809898376, 0.00014817900955677032, 0.00015220791101455688, 0.00015623681247234344, 0.00016026571393013, 0.00016429461538791656, 0.00016832351684570312]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 9.0, 11.0, 15.0, 23.0, 46.0, 81.0, 143.0, 262.0, 415.0, 872.0, 2362.0, 10599.0, 100646.0, 821192.0, 97352.0, 10352.0, 2293.0, 860.0, 414.0, 218.0, 156.0, 89.0, 52.0, 33.0, 13.0, 13.0, 5.0, 7.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31103515625, -0.3011589050292969, -0.29128265380859375, -0.2814064025878906, -0.2715301513671875, -0.2616539001464844, -0.25177764892578125, -0.24190139770507812, -0.232025146484375, -0.22214889526367188, -0.21227264404296875, -0.20239639282226562, -0.1925201416015625, -0.18264389038085938, -0.17276763916015625, -0.16289138793945312, -0.15301513671875, -0.14313888549804688, -0.13326263427734375, -0.12338638305664062, -0.1135101318359375, -0.10363388061523438, -0.09375762939453125, -0.08388137817382812, -0.074005126953125, -0.06412887573242188, -0.05425262451171875, -0.044376373291015625, -0.0345001220703125, -0.024623870849609375, -0.01474761962890625, -0.004871368408203125, 0.0050048828125, 0.014881134033203125, 0.02475738525390625, 0.034633636474609375, 0.0445098876953125, 0.054386138916015625, 0.06426239013671875, 0.07413864135742188, 0.084014892578125, 0.09389114379882812, 0.10376739501953125, 0.11364364624023438, 0.1235198974609375, 0.13339614868164062, 0.14327239990234375, 0.15314865112304688, 0.16302490234375, 0.17290115356445312, 0.18277740478515625, 0.19265365600585938, 0.2025299072265625, 0.21240615844726562, 0.22228240966796875, 0.23215866088867188, 0.242034912109375, 0.2519111633300781, 0.26178741455078125, 0.2716636657714844, 0.2815399169921875, 0.2914161682128906, 0.30129241943359375, 0.3111686706542969, 0.321044921875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 9.0, 6.0, 12.0, 22.0, 25.0, 34.0, 56.0, 87.0, 146.0, 206.0, 147.0, 88.0, 51.0, 45.0, 21.0, 14.0, 11.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4208984375, -0.4070167541503906, -0.39313507080078125, -0.3792533874511719, -0.3653717041015625, -0.3514900207519531, -0.33760833740234375, -0.3237266540527344, -0.309844970703125, -0.2959632873535156, -0.28208160400390625, -0.2681999206542969, -0.2543182373046875, -0.24043655395507812, -0.22655487060546875, -0.21267318725585938, -0.19879150390625, -0.18490982055664062, -0.17102813720703125, -0.15714645385742188, -0.1432647705078125, -0.12938308715820312, -0.11550140380859375, -0.10161972045898438, -0.087738037109375, -0.07385635375976562, -0.05997467041015625, -0.046092987060546875, -0.0322113037109375, -0.018329620361328125, -0.00444793701171875, 0.009433746337890625, 0.0233154296875, 0.037197113037109375, 0.05107879638671875, 0.06496047973632812, 0.0788421630859375, 0.09272384643554688, 0.10660552978515625, 0.12048721313476562, 0.134368896484375, 0.14825057983398438, 0.16213226318359375, 0.17601394653320312, 0.1898956298828125, 0.20377731323242188, 0.21765899658203125, 0.23154067993164062, 0.24542236328125, 0.2593040466308594, 0.27318572998046875, 0.2870674133300781, 0.3009490966796875, 0.3148307800292969, 0.32871246337890625, 0.3425941467285156, 0.356475830078125, 0.3703575134277344, 0.38423919677734375, 0.3981208801269531, 0.4120025634765625, 0.4258842468261719, 0.43976593017578125, 0.4536476135253906, 0.467529296875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 29.0, 114.0, 413.0, 360.0, 66.0, 14.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0], "bins": [-18.472187042236328, -18.136234283447266, -17.800283432006836, -17.464330673217773, -17.128379821777344, -16.79242706298828, -16.45647621154785, -16.12052345275879, -15.784571647644043, -15.448619842529297, -15.11266803741455, -14.776716232299805, -14.440764427185059, -14.104812622070312, -13.76885986328125, -13.432908058166504, -13.096956253051758, -12.761004447937012, -12.425052642822266, -12.08910083770752, -11.753149032592773, -11.417196273803711, -11.081245422363281, -10.745292663574219, -10.409341812133789, -10.073390007019043, -9.737438201904297, -9.40148639678955, -9.065534591674805, -8.729581832885742, -8.393630981445312, -8.05767822265625, -7.721726417541504, -7.385774612426758, -7.049822807312012, -6.713871002197266, -6.377918720245361, -6.041966915130615, -5.706015110015869, -5.370062828063965, -5.034111022949219, -4.698159217834473, -4.362207412719727, -4.0262556076049805, -3.690303325653076, -3.35435152053833, -3.018399715423584, -2.682447671890259, -2.346496105194092, -2.0105443000793457, -1.6745922565460205, -1.3386404514312744, -1.0026885271072388, -0.6667366027832031, -0.33078479766845703, 0.005167245864868164, 0.34111905097961426, 0.6770709753036499, 1.0130228996276855, 1.3489747047424316, 1.6849266290664673, 2.020878553390503, 2.356830358505249, 2.692782402038574, 3.0287342071533203]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 3.0, 4.0, 4.0, 5.0, 9.0, 11.0, 15.0, 32.0, 20.0, 30.0, 23.0, 28.0, 32.0, 51.0, 41.0, 30.0, 47.0, 60.0, 41.0, 41.0, 42.0, 47.0, 41.0, 35.0, 57.0, 43.0, 31.0, 29.0, 28.0, 15.0, 30.0, 14.0, 12.0, 13.0, 7.0, 10.0, 4.0, 5.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.1834774017333984, -3.0944883823394775, -3.0054993629455566, -2.916510581970215, -2.827521562576294, -2.738532543182373, -2.649543523788452, -2.5605545043945312, -2.4715657234191895, -2.3825767040252686, -2.2935876846313477, -2.204598903656006, -2.115609884262085, -2.026620864868164, -1.9376318454742432, -1.8486428260803223, -1.7596538066864014, -1.6706647872924805, -1.5816758871078491, -1.4926868677139282, -1.4036979675292969, -1.314708948135376, -1.225719928741455, -1.1367309093475342, -1.0477420091629028, -0.9587530493736267, -0.8697640895843506, -0.7807750701904297, -0.6917861104011536, -0.6027971506118774, -0.5138081312179565, -0.4248191714286804, -0.3358302116394043, -0.24684123694896698, -0.15785226225852966, -0.06886327266693115, 0.02012568712234497, 0.1091146469116211, 0.198103666305542, 0.2870926260948181, 0.37608158588409424, 0.46507054567337036, 0.5540595054626465, 0.6430485248565674, 0.7320374846458435, 0.8210264444351196, 0.9100154638290405, 0.9990044236183167, 1.0879933834075928, 1.1769824028015137, 1.265971302986145, 1.354960322380066, 1.4439492225646973, 1.5329382419586182, 1.621927261352539, 1.71091628074646, 1.7999051809310913, 1.8888942003250122, 1.9778831005096436, 2.0668721199035645, 2.1558611392974854, 2.2448501586914062, 2.333838939666748, 2.422827959060669, 2.51181697845459]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 6.0, 5.0, 8.0, 17.0, 18.0, 37.0, 60.0, 89.0, 143.0, 230.0, 358.0, 714.0, 1549.0, 4371.0, 21955.0, 3997562.0, 151801.0, 10216.0, 2729.0, 1069.0, 533.0, 300.0, 202.0, 106.0, 80.0, 47.0, 26.0, 18.0, 14.0, 11.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.64111328125, -0.6250038146972656, -0.6088943481445312, -0.5927848815917969, -0.5766754150390625, -0.5605659484863281, -0.5444564819335938, -0.5283470153808594, -0.512237548828125, -0.4961280822753906, -0.48001861572265625, -0.4639091491699219, -0.4477996826171875, -0.4316902160644531, -0.41558074951171875, -0.3994712829589844, -0.38336181640625, -0.3672523498535156, -0.35114288330078125, -0.3350334167480469, -0.3189239501953125, -0.3028144836425781, -0.28670501708984375, -0.2705955505371094, -0.254486083984375, -0.23837661743164062, -0.22226715087890625, -0.20615768432617188, -0.1900482177734375, -0.17393875122070312, -0.15782928466796875, -0.14171981811523438, -0.1256103515625, -0.10950088500976562, -0.09339141845703125, -0.07728195190429688, -0.0611724853515625, -0.045063018798828125, -0.02895355224609375, -0.012844085693359375, 0.003265380859375, 0.019374847412109375, 0.03548431396484375, 0.051593780517578125, 0.0677032470703125, 0.08381271362304688, 0.09992218017578125, 0.11603164672851562, 0.13214111328125, 0.14825057983398438, 0.16436004638671875, 0.18046951293945312, 0.1965789794921875, 0.21268844604492188, 0.22879791259765625, 0.24490737915039062, 0.261016845703125, 0.2771263122558594, 0.29323577880859375, 0.3093452453613281, 0.3254547119140625, 0.3415641784667969, 0.35767364501953125, 0.3737831115722656, 0.389892578125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 10.0, 6.0, 15.0, 20.0, 22.0, 29.0, 25.0, 39.0, 65.0, 58.0, 79.0, 79.0, 72.0, 65.0, 63.0, 71.0, 54.0, 46.0, 45.0, 37.0, 28.0, 27.0, 16.0, 8.0, 8.0, 5.0, 10.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1572265625, -0.15317344665527344, -0.14912033081054688, -0.1450672149658203, -0.14101409912109375, -0.1369609832763672, -0.13290786743164062, -0.12885475158691406, -0.1248016357421875, -0.12074851989746094, -0.11669540405273438, -0.11264228820800781, -0.10858917236328125, -0.10453605651855469, -0.10048294067382812, -0.09642982482910156, -0.092376708984375, -0.08832359313964844, -0.08427047729492188, -0.08021736145019531, -0.07616424560546875, -0.07211112976074219, -0.06805801391601562, -0.06400489807128906, -0.0599517822265625, -0.05589866638183594, -0.051845550537109375, -0.04779243469238281, -0.04373931884765625, -0.03968620300292969, -0.035633087158203125, -0.03157997131347656, -0.02752685546875, -0.023473739624023438, -0.019420623779296875, -0.015367507934570312, -0.01131439208984375, -0.0072612762451171875, -0.003208160400390625, 0.0008449554443359375, 0.0048980712890625, 0.008951187133789062, 0.013004302978515625, 0.017057418823242188, 0.02111053466796875, 0.025163650512695312, 0.029216766357421875, 0.03326988220214844, 0.037322998046875, 0.04137611389160156, 0.045429229736328125, 0.04948234558105469, 0.05353546142578125, 0.05758857727050781, 0.061641693115234375, 0.06569480895996094, 0.0697479248046875, 0.07380104064941406, 0.07785415649414062, 0.08190727233886719, 0.08596038818359375, 0.09001350402832031, 0.09406661987304688, 0.09811973571777344, 0.1021728515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 8.0, 12.0, 12.0, 28.0, 35.0, 24.0, 54.0, 66.0, 107.0, 148.0, 180.0, 249.0, 359.0, 508.0, 764.0, 1123.0, 2091.0, 4964.0, 15430.0, 110436.0, 3958032.0, 76783.0, 13005.0, 4427.0, 1967.0, 1111.0, 700.0, 458.0, 309.0, 216.0, 170.0, 149.0, 98.0, 48.0, 53.0, 49.0, 19.0, 24.0, 23.0, 6.0, 14.0, 1.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4658203125, -0.4510002136230469, -0.43618011474609375, -0.4213600158691406, -0.4065399169921875, -0.3917198181152344, -0.37689971923828125, -0.3620796203613281, -0.347259521484375, -0.3324394226074219, -0.31761932373046875, -0.3027992248535156, -0.2879791259765625, -0.2731590270996094, -0.25833892822265625, -0.24351882934570312, -0.22869873046875, -0.21387863159179688, -0.19905853271484375, -0.18423843383789062, -0.1694183349609375, -0.15459823608398438, -0.13977813720703125, -0.12495803833007812, -0.110137939453125, -0.09531784057617188, -0.08049774169921875, -0.06567764282226562, -0.0508575439453125, -0.036037445068359375, -0.02121734619140625, -0.006397247314453125, 0.0084228515625, 0.023242950439453125, 0.03806304931640625, 0.052883148193359375, 0.0677032470703125, 0.08252334594726562, 0.09734344482421875, 0.11216354370117188, 0.126983642578125, 0.14180374145507812, 0.15662384033203125, 0.17144393920898438, 0.1862640380859375, 0.20108413696289062, 0.21590423583984375, 0.23072433471679688, 0.24554443359375, 0.2603645324707031, 0.27518463134765625, 0.2900047302246094, 0.3048248291015625, 0.3196449279785156, 0.33446502685546875, 0.3492851257324219, 0.364105224609375, 0.3789253234863281, 0.39374542236328125, 0.4085655212402344, 0.4233856201171875, 0.4382057189941406, 0.45302581787109375, 0.4678459167480469, 0.482666015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 8.0, 7.0, 19.0, 72.0, 445.0, 3269.0, 149.0, 62.0, 15.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1943359375, -0.18881607055664062, -0.18329620361328125, -0.17777633666992188, -0.1722564697265625, -0.16673660278320312, -0.16121673583984375, -0.15569686889648438, -0.150177001953125, -0.14465713500976562, -0.13913726806640625, -0.13361740112304688, -0.1280975341796875, -0.12257766723632812, -0.11705780029296875, -0.11153793334960938, -0.10601806640625, -0.10049819946289062, -0.09497833251953125, -0.08945846557617188, -0.0839385986328125, -0.07841873168945312, -0.07289886474609375, -0.06737899780273438, -0.061859130859375, -0.056339263916015625, -0.05081939697265625, -0.045299530029296875, -0.0397796630859375, -0.034259796142578125, -0.02873992919921875, -0.023220062255859375, -0.0177001953125, -0.012180328369140625, -0.00666046142578125, -0.001140594482421875, 0.0043792724609375, 0.009899139404296875, 0.01541900634765625, 0.020938873291015625, 0.026458740234375, 0.031978607177734375, 0.03749847412109375, 0.043018341064453125, 0.0485382080078125, 0.054058074951171875, 0.05957794189453125, 0.06509780883789062, 0.07061767578125, 0.07613754272460938, 0.08165740966796875, 0.08717727661132812, 0.0926971435546875, 0.09821701049804688, 0.10373687744140625, 0.10925674438476562, 0.114776611328125, 0.12029647827148438, 0.12581634521484375, 0.13133621215820312, 0.1368560791015625, 0.14237594604492188, 0.14789581298828125, 0.15341567993164062, 0.158935546875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 17.0, 14.0, 24.0, 55.0, 107.0, 140.0, 157.0, 149.0, 136.0, 72.0, 53.0, 28.0, 12.0, 12.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6229955554008484, -0.6078831553459167, -0.5927706956863403, -0.5776582956314087, -0.562545895576477, -0.5474334359169006, -0.532321035861969, -0.5172086358070374, -0.5020961761474609, -0.4869837462902069, -0.47187134623527527, -0.45675891637802124, -0.4416464865207672, -0.42653408646583557, -0.41142165660858154, -0.3963092565536499, -0.38119685649871826, -0.36608442664146423, -0.3509720265865326, -0.33585959672927856, -0.32074716687202454, -0.3056347668170929, -0.29052233695983887, -0.2754099369049072, -0.2602974772453308, -0.24518506228923798, -0.23007263243198395, -0.2149602174758911, -0.19984780251979828, -0.18473538756370544, -0.16962295770645142, -0.15451054275035858, -0.13939812779426575, -0.12428570538759232, -0.10917329043149948, -0.09406086802482605, -0.07894845306873322, -0.06383603066205978, -0.04872360825538635, -0.03361119329929352, -0.018498770892620087, -0.003386351279914379, 0.011726068332791328, 0.02683848887681961, 0.041950907558202744, 0.057063326239585876, 0.07217574864625931, 0.08728816360235214, 0.10240058600902557, 0.117513008415699, 0.13262543082237244, 0.14773784577846527, 0.1628502607345581, 0.17796269059181213, 0.19307510554790497, 0.2081875205039978, 0.22329995036125183, 0.23841236531734467, 0.2535247802734375, 0.26863721013069153, 0.28374963998794556, 0.2988620400428772, 0.3139744699001312, 0.32908689975738525, 0.3441992998123169]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 4.0, 15.0, 7.0, 13.0, 11.0, 15.0, 29.0, 20.0, 29.0, 28.0, 35.0, 38.0, 39.0, 36.0, 48.0, 40.0, 43.0, 45.0, 42.0, 42.0, 42.0, 40.0, 34.0, 34.0, 44.0, 30.0, 34.0, 25.0, 18.0, 26.0, 20.0, 12.0, 14.0, 8.0, 8.0, 5.0, 1.0, 10.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25805431604385376, -0.24963845312595367, -0.2412225902080536, -0.2328067272901535, -0.22439086437225342, -0.21597498655319214, -0.20755912363529205, -0.19914326071739197, -0.19072739779949188, -0.1823115348815918, -0.1738956719636917, -0.16547980904579163, -0.15706393122673035, -0.14864808320999146, -0.14023220539093018, -0.1318163424730301, -0.12340047955513, -0.11498461663722992, -0.10656875371932983, -0.09815288335084915, -0.08973702043294907, -0.08132115751504898, -0.0729052871465683, -0.06448942422866821, -0.05607356131076813, -0.04765769839286804, -0.03924183174967766, -0.030825966969132423, -0.02241010218858719, -0.013994239270687103, -0.005578372627496719, 0.0028374940156936646, 0.01125335693359375, 0.019669221714138985, 0.02808508649468422, 0.0365009531378746, 0.04491681605577469, 0.053332678973674774, 0.06174854561686516, 0.07016441226005554, 0.07858027517795563, 0.08699613809585571, 0.0954120010137558, 0.10382787138223648, 0.11224373430013657, 0.12065959721803665, 0.12907546758651733, 0.13749133050441742, 0.1459071934223175, 0.1543230563402176, 0.16273891925811768, 0.17115478217601776, 0.17957064509391785, 0.18798652291297913, 0.1964023858308792, 0.2048182487487793, 0.21323411166667938, 0.22164997458457947, 0.23006583750247955, 0.23848170042037964, 0.24689757823944092, 0.2553134262561798, 0.2637293040752411, 0.27214515209198, 0.28056102991104126]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 8.0, 9.0, 13.0, 30.0, 31.0, 70.0, 126.0, 190.0, 368.0, 784.0, 1656.0, 3779.0, 10519.0, 35390.0, 188160.0, 602514.0, 157818.0, 30978.0, 9590.0, 3486.0, 1497.0, 695.0, 378.0, 183.0, 114.0, 66.0, 31.0, 17.0, 17.0, 9.0, 10.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.422119140625, -0.4077873229980469, -0.39345550537109375, -0.3791236877441406, -0.3647918701171875, -0.3504600524902344, -0.33612823486328125, -0.3217964172363281, -0.307464599609375, -0.2931327819824219, -0.27880096435546875, -0.2644691467285156, -0.2501373291015625, -0.23580551147460938, -0.22147369384765625, -0.20714187622070312, -0.19281005859375, -0.17847824096679688, -0.16414642333984375, -0.14981460571289062, -0.1354827880859375, -0.12115097045898438, -0.10681915283203125, -0.09248733520507812, -0.078155517578125, -0.06382369995117188, -0.04949188232421875, -0.035160064697265625, -0.0208282470703125, -0.006496429443359375, 0.00783538818359375, 0.022167205810546875, 0.0364990234375, 0.050830841064453125, 0.06516265869140625, 0.07949447631835938, 0.0938262939453125, 0.10815811157226562, 0.12248992919921875, 0.13682174682617188, 0.151153564453125, 0.16548538208007812, 0.17981719970703125, 0.19414901733398438, 0.2084808349609375, 0.22281265258789062, 0.23714447021484375, 0.2514762878417969, 0.26580810546875, 0.2801399230957031, 0.29447174072265625, 0.3088035583496094, 0.3231353759765625, 0.3374671936035156, 0.35179901123046875, 0.3661308288574219, 0.380462646484375, 0.3947944641113281, 0.40912628173828125, 0.4234580993652344, 0.4377899169921875, 0.4521217346191406, 0.46645355224609375, 0.4807853698730469, 0.4951171875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 10.0, 19.0, 18.0, 23.0, 29.0, 23.0, 27.0, 41.0, 63.0, 53.0, 81.0, 64.0, 86.0, 70.0, 62.0, 53.0, 56.0, 48.0, 38.0, 40.0, 27.0, 17.0, 11.0, 14.0, 12.0, 7.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1629638671875, -0.15884017944335938, -0.15471649169921875, -0.15059280395507812, -0.1464691162109375, -0.14234542846679688, -0.13822174072265625, -0.13409805297851562, -0.129974365234375, -0.12585067749023438, -0.12172698974609375, -0.11760330200195312, -0.1134796142578125, -0.10935592651367188, -0.10523223876953125, -0.10110855102539062, -0.09698486328125, -0.09286117553710938, -0.08873748779296875, -0.08461380004882812, -0.0804901123046875, -0.07636642456054688, -0.07224273681640625, -0.06811904907226562, -0.063995361328125, -0.059871673583984375, -0.05574798583984375, -0.051624298095703125, -0.0475006103515625, -0.043376922607421875, -0.03925323486328125, -0.035129547119140625, -0.031005859375, -0.026882171630859375, -0.02275848388671875, -0.018634796142578125, -0.0145111083984375, -0.010387420654296875, -0.00626373291015625, -0.002140045166015625, 0.001983642578125, 0.006107330322265625, 0.01023101806640625, 0.014354705810546875, 0.0184783935546875, 0.022602081298828125, 0.02672576904296875, 0.030849456787109375, 0.03497314453125, 0.039096832275390625, 0.04322052001953125, 0.047344207763671875, 0.0514678955078125, 0.055591583251953125, 0.05971527099609375, 0.06383895874023438, 0.067962646484375, 0.07208633422851562, 0.07621002197265625, 0.08033370971679688, 0.0844573974609375, 0.08858108520507812, 0.09270477294921875, 0.09682846069335938, 0.1009521484375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 7.0, 4.0, 12.0, 10.0, 23.0, 20.0, 26.0, 35.0, 55.0, 99.0, 134.0, 230.0, 333.0, 556.0, 921.0, 1707.0, 3545.0, 8304.0, 27038.0, 147167.0, 654281.0, 159162.0, 28331.0, 8665.0, 3636.0, 1730.0, 959.0, 575.0, 357.0, 195.0, 134.0, 97.0, 51.0, 53.0, 20.0, 20.0, 12.0, 9.0, 13.0, 8.0, 7.0, 2.0, 1.0, 6.0, 8.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4716796875, -0.4567146301269531, -0.44174957275390625, -0.4267845153808594, -0.4118194580078125, -0.3968544006347656, -0.38188934326171875, -0.3669242858886719, -0.351959228515625, -0.3369941711425781, -0.32202911376953125, -0.3070640563964844, -0.2920989990234375, -0.2771339416503906, -0.26216888427734375, -0.24720382690429688, -0.23223876953125, -0.21727371215820312, -0.20230865478515625, -0.18734359741210938, -0.1723785400390625, -0.15741348266601562, -0.14244842529296875, -0.12748336791992188, -0.112518310546875, -0.09755325317382812, -0.08258819580078125, -0.06762313842773438, -0.0526580810546875, -0.037693023681640625, -0.02272796630859375, -0.007762908935546875, 0.0072021484375, 0.022167205810546875, 0.03713226318359375, 0.052097320556640625, 0.0670623779296875, 0.08202743530273438, 0.09699249267578125, 0.11195755004882812, 0.126922607421875, 0.14188766479492188, 0.15685272216796875, 0.17181777954101562, 0.1867828369140625, 0.20174789428710938, 0.21671295166015625, 0.23167800903320312, 0.24664306640625, 0.2616081237792969, 0.27657318115234375, 0.2915382385253906, 0.3065032958984375, 0.3214683532714844, 0.33643341064453125, 0.3513984680175781, 0.366363525390625, 0.3813285827636719, 0.39629364013671875, 0.4112586975097656, 0.4262237548828125, 0.4411888122558594, 0.45615386962890625, 0.4711189270019531, 0.486083984375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 2.0, 6.0, 10.0, 15.0, 13.0, 37.0, 34.0, 35.0, 48.0, 48.0, 54.0, 69.0, 72.0, 59.0, 74.0, 65.0, 65.0, 49.0, 49.0, 42.0, 30.0, 28.0, 25.0, 19.0, 14.0, 10.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68994140625, -0.6648635864257812, -0.6397857666015625, -0.6147079467773438, -0.589630126953125, -0.5645523071289062, -0.5394744873046875, -0.5143966674804688, -0.48931884765625, -0.46424102783203125, -0.4391632080078125, -0.41408538818359375, -0.389007568359375, -0.36392974853515625, -0.3388519287109375, -0.31377410888671875, -0.2886962890625, -0.26361846923828125, -0.2385406494140625, -0.21346282958984375, -0.188385009765625, -0.16330718994140625, -0.1382293701171875, -0.11315155029296875, -0.08807373046875, -0.06299591064453125, -0.0379180908203125, -0.01284027099609375, 0.012237548828125, 0.03731536865234375, 0.0623931884765625, 0.08747100830078125, 0.112548828125, 0.13762664794921875, 0.1627044677734375, 0.18778228759765625, 0.212860107421875, 0.23793792724609375, 0.2630157470703125, 0.28809356689453125, 0.31317138671875, 0.33824920654296875, 0.3633270263671875, 0.38840484619140625, 0.413482666015625, 0.43856048583984375, 0.4636383056640625, 0.48871612548828125, 0.5137939453125, 0.5388717651367188, 0.5639495849609375, 0.5890274047851562, 0.614105224609375, 0.6391830444335938, 0.6642608642578125, 0.6893386840820312, 0.71441650390625, 0.7394943237304688, 0.7645721435546875, 0.7896499633789062, 0.814727783203125, 0.8398056030273438, 0.8648834228515625, 0.8899612426757812, 0.9150390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 21.0, 21.0, 30.0, 68.0, 132.0, 243.0, 736.0, 2845.0, 32082.0, 969000.0, 39054.0, 3006.0, 755.0, 283.0, 113.0, 72.0, 33.0, 24.0, 11.0, 9.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4345703125, -0.41339874267578125, -0.3922271728515625, -0.37105560302734375, -0.349884033203125, -0.32871246337890625, -0.3075408935546875, -0.28636932373046875, -0.26519775390625, -0.24402618408203125, -0.2228546142578125, -0.20168304443359375, -0.180511474609375, -0.15933990478515625, -0.1381683349609375, -0.11699676513671875, -0.0958251953125, -0.07465362548828125, -0.0534820556640625, -0.03231048583984375, -0.011138916015625, 0.01003265380859375, 0.0312042236328125, 0.05237579345703125, 0.07354736328125, 0.09471893310546875, 0.1158905029296875, 0.13706207275390625, 0.158233642578125, 0.17940521240234375, 0.2005767822265625, 0.22174835205078125, 0.242919921875, 0.26409149169921875, 0.2852630615234375, 0.30643463134765625, 0.327606201171875, 0.34877777099609375, 0.3699493408203125, 0.39112091064453125, 0.41229248046875, 0.43346405029296875, 0.4546356201171875, 0.47580718994140625, 0.496978759765625, 0.5181503295898438, 0.5393218994140625, 0.5604934692382812, 0.5816650390625, 0.6028366088867188, 0.6240081787109375, 0.6451797485351562, 0.666351318359375, 0.6875228881835938, 0.7086944580078125, 0.7298660278320312, 0.75103759765625, 0.7722091674804688, 0.7933807373046875, 0.8145523071289062, 0.835723876953125, 0.8568954467773438, 0.8780670166015625, 0.8992385864257812, 0.92041015625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 14.0, 10.0, 29.0, 53.0, 62.0, 102.0, 146.0, 186.0, 144.0, 108.0, 62.0, 29.0, 18.0, 17.0, 5.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020694732666015625, -0.00020056962966918945, -0.00019419193267822266, -0.00018781423568725586, -0.00018143653869628906, -0.00017505884170532227, -0.00016868114471435547, -0.00016230344772338867, -0.00015592575073242188, -0.00014954805374145508, -0.00014317035675048828, -0.00013679265975952148, -0.0001304149627685547, -0.0001240372657775879, -0.0001176595687866211, -0.0001112818717956543, -0.0001049041748046875, -9.85264778137207e-05, -9.21487808227539e-05, -8.577108383178711e-05, -7.939338684082031e-05, -7.301568984985352e-05, -6.663799285888672e-05, -6.026029586791992e-05, -5.3882598876953125e-05, -4.750490188598633e-05, -4.112720489501953e-05, -3.4749507904052734e-05, -2.8371810913085938e-05, -2.199411392211914e-05, -1.5616416931152344e-05, -9.238719940185547e-06, -2.86102294921875e-06, 3.516674041748047e-06, 9.894371032714844e-06, 1.627206802368164e-05, 2.2649765014648438e-05, 2.9027462005615234e-05, 3.540515899658203e-05, 4.178285598754883e-05, 4.8160552978515625e-05, 5.453824996948242e-05, 6.091594696044922e-05, 6.729364395141602e-05, 7.367134094238281e-05, 8.004903793334961e-05, 8.64267349243164e-05, 9.28044319152832e-05, 9.918212890625e-05, 0.0001055598258972168, 0.0001119375228881836, 0.00011831521987915039, 0.0001246929168701172, 0.00013107061386108398, 0.00013744831085205078, 0.00014382600784301758, 0.00015020370483398438, 0.00015658140182495117, 0.00016295909881591797, 0.00016933679580688477, 0.00017571449279785156, 0.00018209218978881836, 0.00018846988677978516, 0.00019484758377075195, 0.00020122528076171875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 5.0, 6.0, 2.0, 8.0, 9.0, 19.0, 20.0, 33.0, 49.0, 83.0, 164.0, 280.0, 564.0, 1280.0, 3651.0, 16292.0, 219629.0, 750166.0, 45604.0, 6929.0, 2033.0, 833.0, 398.0, 185.0, 114.0, 69.0, 46.0, 21.0, 16.0, 12.0, 10.0, 12.0, 9.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.334716796875, -0.32464599609375, -0.3145751953125, -0.30450439453125, -0.29443359375, -0.28436279296875, -0.2742919921875, -0.26422119140625, -0.254150390625, -0.24407958984375, -0.2340087890625, -0.22393798828125, -0.2138671875, -0.20379638671875, -0.1937255859375, -0.18365478515625, -0.173583984375, -0.16351318359375, -0.1534423828125, -0.14337158203125, -0.13330078125, -0.12322998046875, -0.1131591796875, -0.10308837890625, -0.093017578125, -0.08294677734375, -0.0728759765625, -0.06280517578125, -0.052734375, -0.04266357421875, -0.0325927734375, -0.02252197265625, -0.012451171875, -0.00238037109375, 0.0076904296875, 0.01776123046875, 0.02783203125, 0.03790283203125, 0.0479736328125, 0.05804443359375, 0.068115234375, 0.07818603515625, 0.0882568359375, 0.09832763671875, 0.1083984375, 0.11846923828125, 0.1285400390625, 0.13861083984375, 0.148681640625, 0.15875244140625, 0.1688232421875, 0.17889404296875, 0.18896484375, 0.19903564453125, 0.2091064453125, 0.21917724609375, 0.229248046875, 0.23931884765625, 0.2493896484375, 0.25946044921875, 0.26953125, 0.27960205078125, 0.2896728515625, 0.29974365234375, 0.309814453125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 11.0, 9.0, 15.0, 23.0, 22.0, 25.0, 36.0, 56.0, 88.0, 128.0, 130.0, 133.0, 81.0, 57.0, 45.0, 34.0, 29.0, 21.0, 10.0, 10.0, 5.0, 2.0, 11.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37158203125, -0.3608589172363281, -0.35013580322265625, -0.3394126892089844, -0.3286895751953125, -0.3179664611816406, -0.30724334716796875, -0.2965202331542969, -0.285797119140625, -0.2750740051269531, -0.26435089111328125, -0.2536277770996094, -0.2429046630859375, -0.23218154907226562, -0.22145843505859375, -0.21073532104492188, -0.20001220703125, -0.18928909301757812, -0.17856597900390625, -0.16784286499023438, -0.1571197509765625, -0.14639663696289062, -0.13567352294921875, -0.12495040893554688, -0.114227294921875, -0.10350418090820312, -0.09278106689453125, -0.08205795288085938, -0.0713348388671875, -0.060611724853515625, -0.04988861083984375, -0.039165496826171875, -0.0284423828125, -0.017719268798828125, -0.00699615478515625, 0.003726959228515625, 0.0144500732421875, 0.025173187255859375, 0.03589630126953125, 0.046619415283203125, 0.057342529296875, 0.06806564331054688, 0.07878875732421875, 0.08951187133789062, 0.1002349853515625, 0.11095809936523438, 0.12168121337890625, 0.13240432739257812, 0.14312744140625, 0.15385055541992188, 0.16457366943359375, 0.17529678344726562, 0.1860198974609375, 0.19674301147460938, 0.20746612548828125, 0.21818923950195312, 0.228912353515625, 0.23963546752929688, 0.25035858154296875, 0.2610816955566406, 0.2718048095703125, 0.2825279235839844, 0.29325103759765625, 0.3039741516113281, 0.314697265625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 7.0, 4.0, 20.0, 53.0, 119.0, 222.0, 278.0, 177.0, 75.0, 28.0, 13.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.642379760742188, -9.41045093536377, -9.178521156311035, -8.946592330932617, -8.714662551879883, -8.482733726501465, -8.25080394744873, -8.018875122070312, -7.786945343017578, -7.555016040802002, -7.323086738586426, -7.09115743637085, -6.859228134155273, -6.627298831939697, -6.395369529724121, -6.163440704345703, -5.931511402130127, -5.699582099914551, -5.467652797698975, -5.235723495483398, -5.003794193267822, -4.771864891052246, -4.539936065673828, -4.308006286621094, -4.076077461242676, -3.8441481590270996, -3.6122188568115234, -3.3802895545959473, -3.148360252380371, -2.916430950164795, -2.684501886367798, -2.4525725841522217, -2.2206435203552246, -1.9887142181396484, -1.7567849159240723, -1.5248557329177856, -1.2929264307022095, -1.0609971284866333, -0.8290679454803467, -0.5971386432647705, -0.36520934104919434, -0.13328006863594055, 0.09864920377731323, 0.33057844638824463, 0.5625077486038208, 0.794437050819397, 1.0263662338256836, 1.2582955360412598, 1.490224838256836, 1.722154140472412, 1.9540834426879883, 2.1860127449035645, 2.4179420471191406, 2.649871349334717, 2.881800413131714, 3.11372971534729, 3.345659017562866, 3.5775883197784424, 3.8095176219940186, 4.041446685791016, 4.273375988006592, 4.505305290222168, 4.737234592437744, 4.96916389465332, 5.2010931968688965]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 6.0, 4.0, 3.0, 12.0, 12.0, 12.0, 6.0, 17.0, 19.0, 21.0, 30.0, 30.0, 28.0, 44.0, 42.0, 46.0, 48.0, 44.0, 46.0, 49.0, 61.0, 47.0, 59.0, 42.0, 46.0, 44.0, 28.0, 23.0, 20.0, 21.0, 18.0, 14.0, 13.0, 10.0, 7.0, 5.0, 6.0, 6.0, 2.0, 4.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1959125995635986, -3.0993895530700684, -3.002866268157959, -2.9063432216644287, -2.8098199367523193, -2.713296890258789, -2.6167736053466797, -2.5202505588531494, -2.423727512359619, -2.327204465866089, -2.2306811809539795, -2.134158134460449, -2.03763484954834, -1.9411118030548096, -1.8445886373519897, -1.74806547164917, -1.6515421867370605, -1.5550190210342407, -1.458495855331421, -1.3619728088378906, -1.2654495239257812, -1.168926477432251, -1.0724033117294312, -0.9758801460266113, -0.8793569803237915, -0.7828338146209717, -0.6863106489181519, -0.5897875428199768, -0.493264377117157, -0.39674121141433716, -0.3002181053161621, -0.20369493961334229, -0.10717201232910156, -0.010648861527442932, 0.0858742892742157, 0.18239742517471313, 0.27892059087753296, 0.3754437565803528, 0.47196686267852783, 0.5684900283813477, 0.6650131940841675, 0.7615363597869873, 0.8580595254898071, 0.9545826315879822, 1.0511057376861572, 1.1476290225982666, 1.2441520690917969, 1.3406752347946167, 1.4371984004974365, 1.5337215662002563, 1.6302447319030762, 1.7267677783966064, 1.8232910633087158, 1.919814109802246, 2.0163373947143555, 2.1128604412078857, 2.209383487701416, 2.3059065341949463, 2.4024298191070557, 2.498952865600586, 2.5954761505126953, 2.6919991970062256, 2.788522243499756, 2.8850455284118652, 2.9815688133239746]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 6.0, 7.0, 8.0, 14.0, 14.0, 23.0, 33.0, 61.0, 80.0, 110.0, 220.0, 332.0, 611.0, 1188.0, 2708.0, 7137.0, 31063.0, 3952858.0, 173193.0, 15834.0, 4709.0, 1974.0, 922.0, 467.0, 287.0, 142.0, 92.0, 74.0, 35.0, 21.0, 17.0, 12.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.7001953125, -0.6830329895019531, -0.6658706665039062, -0.6487083435058594, -0.6315460205078125, -0.6143836975097656, -0.5972213745117188, -0.5800590515136719, -0.562896728515625, -0.5457344055175781, -0.5285720825195312, -0.5114097595214844, -0.4942474365234375, -0.4770851135253906, -0.45992279052734375, -0.4427604675292969, -0.42559814453125, -0.4084358215332031, -0.39127349853515625, -0.3741111755371094, -0.3569488525390625, -0.3397865295410156, -0.32262420654296875, -0.3054618835449219, -0.288299560546875, -0.2711372375488281, -0.25397491455078125, -0.23681259155273438, -0.2196502685546875, -0.20248794555664062, -0.18532562255859375, -0.16816329956054688, -0.1510009765625, -0.13383865356445312, -0.11667633056640625, -0.09951400756835938, -0.0823516845703125, -0.06518936157226562, -0.04802703857421875, -0.030864715576171875, -0.013702392578125, 0.003459930419921875, 0.02062225341796875, 0.037784576416015625, 0.0549468994140625, 0.07210922241210938, 0.08927154541015625, 0.10643386840820312, 0.12359619140625, 0.14075851440429688, 0.15792083740234375, 0.17508316040039062, 0.1922454833984375, 0.20940780639648438, 0.22657012939453125, 0.24373245239257812, 0.260894775390625, 0.2780570983886719, 0.29521942138671875, 0.3123817443847656, 0.3295440673828125, 0.3467063903808594, 0.36386871337890625, 0.3810310363769531, 0.398193359375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 7.0, 13.0, 17.0, 23.0, 31.0, 35.0, 46.0, 49.0, 70.0, 74.0, 84.0, 83.0, 63.0, 75.0, 71.0, 59.0, 46.0, 42.0, 24.0, 27.0, 19.0, 11.0, 12.0, 8.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.212158203125, -0.20728492736816406, -0.20241165161132812, -0.1975383758544922, -0.19266510009765625, -0.1877918243408203, -0.18291854858398438, -0.17804527282714844, -0.1731719970703125, -0.16829872131347656, -0.16342544555664062, -0.1585521697998047, -0.15367889404296875, -0.1488056182861328, -0.14393234252929688, -0.13905906677246094, -0.134185791015625, -0.12931251525878906, -0.12443923950195312, -0.11956596374511719, -0.11469268798828125, -0.10981941223144531, -0.10494613647460938, -0.10007286071777344, -0.0951995849609375, -0.09032630920410156, -0.08545303344726562, -0.08057975769042969, -0.07570648193359375, -0.07083320617675781, -0.06595993041992188, -0.06108665466308594, -0.05621337890625, -0.05134010314941406, -0.046466827392578125, -0.04159355163574219, -0.03672027587890625, -0.03184700012207031, -0.026973724365234375, -0.022100448608398438, -0.0172271728515625, -0.012353897094726562, -0.007480621337890625, -0.0026073455810546875, 0.00226593017578125, 0.0071392059326171875, 0.012012481689453125, 0.016885757446289062, 0.021759033203125, 0.026632308959960938, 0.031505584716796875, 0.03637886047363281, 0.04125213623046875, 0.04612541198730469, 0.050998687744140625, 0.05587196350097656, 0.0607452392578125, 0.06561851501464844, 0.07049179077148438, 0.07536506652832031, 0.08023834228515625, 0.08511161804199219, 0.08998489379882812, 0.09485816955566406, 0.0997314453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 6.0, 12.0, 7.0, 25.0, 21.0, 46.0, 51.0, 68.0, 100.0, 145.0, 187.0, 250.0, 434.0, 606.0, 966.0, 1687.0, 3049.0, 6478.0, 19508.0, 124772.0, 3913656.0, 92330.0, 16845.0, 5885.0, 2788.0, 1518.0, 886.0, 605.0, 413.0, 242.0, 205.0, 101.0, 107.0, 79.0, 60.0, 35.0, 30.0, 19.0, 19.0, 14.0, 6.0, 2.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.57470703125, -0.5569915771484375, -0.539276123046875, -0.5215606689453125, -0.50384521484375, -0.4861297607421875, -0.468414306640625, -0.4506988525390625, -0.4329833984375, -0.4152679443359375, -0.397552490234375, -0.3798370361328125, -0.36212158203125, -0.3444061279296875, -0.326690673828125, -0.3089752197265625, -0.291259765625, -0.2735443115234375, -0.255828857421875, -0.2381134033203125, -0.22039794921875, -0.2026824951171875, -0.184967041015625, -0.1672515869140625, -0.1495361328125, -0.1318206787109375, -0.114105224609375, -0.0963897705078125, -0.07867431640625, -0.0609588623046875, -0.043243408203125, -0.0255279541015625, -0.0078125, 0.0099029541015625, 0.027618408203125, 0.0453338623046875, 0.06304931640625, 0.0807647705078125, 0.098480224609375, 0.1161956787109375, 0.1339111328125, 0.1516265869140625, 0.169342041015625, 0.1870574951171875, 0.20477294921875, 0.2224884033203125, 0.240203857421875, 0.2579193115234375, 0.275634765625, 0.2933502197265625, 0.311065673828125, 0.3287811279296875, 0.34649658203125, 0.3642120361328125, 0.381927490234375, 0.3996429443359375, 0.4173583984375, 0.4350738525390625, 0.452789306640625, 0.4705047607421875, 0.48822021484375, 0.5059356689453125, 0.523651123046875, 0.5413665771484375, 0.55908203125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 11.0, 28.0, 70.0, 208.0, 3332.0, 278.0, 66.0, 31.0, 10.0, 11.0, 7.0, 6.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3115234375, -0.3038444519042969, -0.29616546630859375, -0.2884864807128906, -0.2808074951171875, -0.2731285095214844, -0.26544952392578125, -0.2577705383300781, -0.250091552734375, -0.24241256713867188, -0.23473358154296875, -0.22705459594726562, -0.2193756103515625, -0.21169662475585938, -0.20401763916015625, -0.19633865356445312, -0.18865966796875, -0.18098068237304688, -0.17330169677734375, -0.16562271118164062, -0.1579437255859375, -0.15026473999023438, -0.14258575439453125, -0.13490676879882812, -0.127227783203125, -0.11954879760742188, -0.11186981201171875, -0.10419082641601562, -0.0965118408203125, -0.08883285522460938, -0.08115386962890625, -0.07347488403320312, -0.0657958984375, -0.058116912841796875, -0.05043792724609375, -0.042758941650390625, -0.0350799560546875, -0.027400970458984375, -0.01972198486328125, -0.012042999267578125, -0.004364013671875, 0.003314971923828125, 0.01099395751953125, 0.018672943115234375, 0.0263519287109375, 0.034030914306640625, 0.04170989990234375, 0.049388885498046875, 0.05706787109375, 0.06474685668945312, 0.07242584228515625, 0.08010482788085938, 0.0877838134765625, 0.09546279907226562, 0.10314178466796875, 0.11082077026367188, 0.118499755859375, 0.12617874145507812, 0.13385772705078125, 0.14153671264648438, 0.1492156982421875, 0.15689468383789062, 0.16457366943359375, 0.17225265502929688, 0.179931640625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 9.0, 18.0, 44.0, 51.0, 153.0, 167.0, 219.0, 167.0, 80.0, 50.0, 29.0, 12.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7165275812149048, -1.682455062866211, -1.6483824253082275, -1.6143099069595337, -1.5802373886108398, -1.5461647510528564, -1.5120922327041626, -1.4780197143554688, -1.4439470767974854, -1.4098745584487915, -1.375801920890808, -1.3417294025421143, -1.3076568841934204, -1.2735843658447266, -1.2395117282867432, -1.2054392099380493, -1.1713666915893555, -1.1372941732406616, -1.1032215356826782, -1.0691490173339844, -1.0350764989852905, -1.0010039806365967, -0.9669313430786133, -0.9328588247299194, -0.8987862467765808, -0.8647136688232422, -0.8306411504745483, -0.7965685725212097, -0.7624959945678711, -0.7284234762191772, -0.6943508982658386, -0.6602783203125, -0.6262056827545166, -0.592133104801178, -0.5580605864524841, -0.5239880084991455, -0.4899154603481293, -0.45584291219711304, -0.4217703342437744, -0.3876977860927582, -0.35362523794174194, -0.3195526897907257, -0.2854801416397095, -0.25140756368637085, -0.21733501553535461, -0.18326246738433838, -0.14918990433216095, -0.11511734127998352, -0.08104479312896729, -0.04697223752737045, -0.01289968192577362, 0.02117287367582321, 0.055245429277420044, 0.08931797742843628, 0.12339054048061371, 0.15746310353279114, 0.19153565168380737, 0.2256081998348236, 0.25968074798583984, 0.29375332593917847, 0.3278258740901947, 0.36189842224121094, 0.39597100019454956, 0.4300435483455658, 0.46411609649658203]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 6.0, 9.0, 6.0, 12.0, 21.0, 21.0, 21.0, 21.0, 23.0, 26.0, 22.0, 26.0, 47.0, 53.0, 45.0, 39.0, 39.0, 45.0, 44.0, 55.0, 55.0, 35.0, 40.0, 32.0, 45.0, 34.0, 31.0, 20.0, 27.0, 21.0, 16.0, 12.0, 12.0, 9.0, 11.0, 6.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.45489203929901123, -0.4417952001094818, -0.4286983609199524, -0.41560155153274536, -0.40250471234321594, -0.3894078731536865, -0.3763110339641571, -0.3632141947746277, -0.35011738538742065, -0.33702054619789124, -0.3239237070083618, -0.3108268976211548, -0.29773005843162537, -0.28463321924209595, -0.27153638005256653, -0.2584395408630371, -0.24534271657466888, -0.23224587738513947, -0.21914905309677124, -0.20605221390724182, -0.1929553896188736, -0.17985855042934418, -0.16676172614097595, -0.15366488695144653, -0.14056804776191711, -0.1274712085723877, -0.11437438428401947, -0.10127754509449005, -0.08818072080612183, -0.07508388161659241, -0.061987049877643585, -0.04889021813869476, -0.03579339385032654, -0.022696562111377716, -0.009599728509783745, 0.0034971050918102264, 0.01659393683075905, 0.02969077229499817, 0.04278760403394699, 0.05588443577289581, 0.06898126751184464, 0.08207809925079346, 0.09517493098974228, 0.1082717627286911, 0.12136860191822052, 0.13446542620658875, 0.14756226539611816, 0.16065910458564758, 0.1737559288740158, 0.18685276806354523, 0.19994959235191345, 0.21304643154144287, 0.2261432558298111, 0.23924009501934052, 0.25233691930770874, 0.26543375849723816, 0.2785305976867676, 0.291627436876297, 0.3047242760658264, 0.31782108545303345, 0.33091792464256287, 0.3440147638320923, 0.3571116030216217, 0.3702084422111511, 0.38330525159835815]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 11.0, 9.0, 10.0, 16.0, 22.0, 49.0, 88.0, 152.0, 299.0, 522.0, 1137.0, 2294.0, 5345.0, 14581.0, 54679.0, 318271.0, 516207.0, 99080.0, 22287.0, 7444.0, 3089.0, 1390.0, 751.0, 380.0, 201.0, 97.0, 58.0, 33.0, 14.0, 3.0, 14.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.484375, -0.4697761535644531, -0.45517730712890625, -0.4405784606933594, -0.4259796142578125, -0.4113807678222656, -0.39678192138671875, -0.3821830749511719, -0.367584228515625, -0.3529853820800781, -0.33838653564453125, -0.3237876892089844, -0.3091888427734375, -0.2945899963378906, -0.27999114990234375, -0.2653923034667969, -0.25079345703125, -0.23619461059570312, -0.22159576416015625, -0.20699691772460938, -0.1923980712890625, -0.17779922485351562, -0.16320037841796875, -0.14860153198242188, -0.134002685546875, -0.11940383911132812, -0.10480499267578125, -0.09020614624023438, -0.0756072998046875, -0.061008453369140625, -0.04640960693359375, -0.031810760498046875, -0.0172119140625, -0.002613067626953125, 0.01198577880859375, 0.026584625244140625, 0.0411834716796875, 0.055782318115234375, 0.07038116455078125, 0.08498001098632812, 0.099578857421875, 0.11417770385742188, 0.12877655029296875, 0.14337539672851562, 0.1579742431640625, 0.17257308959960938, 0.18717193603515625, 0.20177078247070312, 0.21636962890625, 0.23096847534179688, 0.24556732177734375, 0.2601661682128906, 0.2747650146484375, 0.2893638610839844, 0.30396270751953125, 0.3185615539550781, 0.333160400390625, 0.3477592468261719, 0.36235809326171875, 0.3769569396972656, 0.3915557861328125, 0.4061546325683594, 0.42075347900390625, 0.4353523254394531, 0.449951171875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 9.0, 9.0, 8.0, 19.0, 25.0, 21.0, 28.0, 38.0, 43.0, 46.0, 62.0, 60.0, 52.0, 75.0, 71.0, 62.0, 63.0, 55.0, 57.0, 44.0, 34.0, 20.0, 24.0, 17.0, 15.0, 15.0, 13.0, 8.0, 6.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.189208984375, -0.1845846176147461, -0.1799602508544922, -0.17533588409423828, -0.17071151733398438, -0.16608715057373047, -0.16146278381347656, -0.15683841705322266, -0.15221405029296875, -0.14758968353271484, -0.14296531677246094, -0.13834095001220703, -0.13371658325195312, -0.12909221649169922, -0.12446784973144531, -0.1198434829711914, -0.1152191162109375, -0.1105947494506836, -0.10597038269042969, -0.10134601593017578, -0.09672164916992188, -0.09209728240966797, -0.08747291564941406, -0.08284854888916016, -0.07822418212890625, -0.07359981536865234, -0.06897544860839844, -0.06435108184814453, -0.059726715087890625, -0.05510234832763672, -0.05047798156738281, -0.045853614807128906, -0.041229248046875, -0.036604881286621094, -0.03198051452636719, -0.02735614776611328, -0.022731781005859375, -0.01810741424560547, -0.013483047485351562, -0.008858680725097656, -0.00423431396484375, 0.00039005279541015625, 0.0050144195556640625, 0.009638786315917969, 0.014263153076171875, 0.01888751983642578, 0.023511886596679688, 0.028136253356933594, 0.0327606201171875, 0.037384986877441406, 0.04200935363769531, 0.04663372039794922, 0.051258087158203125, 0.05588245391845703, 0.06050682067871094, 0.06513118743896484, 0.06975555419921875, 0.07437992095947266, 0.07900428771972656, 0.08362865447998047, 0.08825302124023438, 0.09287738800048828, 0.09750175476074219, 0.1021261215209961, 0.10675048828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 6.0, 6.0, 13.0, 18.0, 23.0, 37.0, 59.0, 107.0, 208.0, 350.0, 800.0, 2434.0, 12181.0, 402013.0, 611154.0, 14658.0, 2747.0, 878.0, 356.0, 203.0, 106.0, 68.0, 50.0, 21.0, 14.0, 16.0, 8.0, 4.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99169921875, -0.9536209106445312, -0.9155426025390625, -0.8774642944335938, -0.839385986328125, -0.8013076782226562, -0.7632293701171875, -0.7251510620117188, -0.68707275390625, -0.6489944458007812, -0.6109161376953125, -0.5728378295898438, -0.534759521484375, -0.49668121337890625, -0.4586029052734375, -0.42052459716796875, -0.3824462890625, -0.34436798095703125, -0.3062896728515625, -0.26821136474609375, -0.230133056640625, -0.19205474853515625, -0.1539764404296875, -0.11589813232421875, -0.07781982421875, -0.03974151611328125, -0.0016632080078125, 0.03641510009765625, 0.074493408203125, 0.11257171630859375, 0.1506500244140625, 0.18872833251953125, 0.226806640625, 0.26488494873046875, 0.3029632568359375, 0.34104156494140625, 0.379119873046875, 0.41719818115234375, 0.4552764892578125, 0.49335479736328125, 0.53143310546875, 0.5695114135742188, 0.6075897216796875, 0.6456680297851562, 0.683746337890625, 0.7218246459960938, 0.7599029541015625, 0.7979812622070312, 0.8360595703125, 0.8741378784179688, 0.9122161865234375, 0.9502944946289062, 0.988372802734375, 1.0264511108398438, 1.0645294189453125, 1.1026077270507812, 1.14068603515625, 1.1787643432617188, 1.2168426513671875, 1.2549209594726562, 1.292999267578125, 1.3310775756835938, 1.3691558837890625, 1.4072341918945312, 1.4453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 2.0, 4.0, 8.0, 7.0, 10.0, 17.0, 10.0, 25.0, 28.0, 33.0, 35.0, 46.0, 61.0, 50.0, 57.0, 72.0, 67.0, 65.0, 69.0, 55.0, 45.0, 59.0, 50.0, 30.0, 21.0, 18.0, 18.0, 11.0, 7.0, 8.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80615234375, -0.7767257690429688, -0.7472991943359375, -0.7178726196289062, -0.688446044921875, -0.6590194702148438, -0.6295928955078125, -0.6001663208007812, -0.57073974609375, -0.5413131713867188, -0.5118865966796875, -0.48246002197265625, -0.453033447265625, -0.42360687255859375, -0.3941802978515625, -0.36475372314453125, -0.3353271484375, -0.30590057373046875, -0.2764739990234375, -0.24704742431640625, -0.217620849609375, -0.18819427490234375, -0.1587677001953125, -0.12934112548828125, -0.09991455078125, -0.07048797607421875, -0.0410614013671875, -0.01163482666015625, 0.017791748046875, 0.04721832275390625, 0.0766448974609375, 0.10607147216796875, 0.135498046875, 0.16492462158203125, 0.1943511962890625, 0.22377777099609375, 0.253204345703125, 0.28263092041015625, 0.3120574951171875, 0.34148406982421875, 0.37091064453125, 0.40033721923828125, 0.4297637939453125, 0.45919036865234375, 0.488616943359375, 0.5180435180664062, 0.5474700927734375, 0.5768966674804688, 0.6063232421875, 0.6357498168945312, 0.6651763916015625, 0.6946029663085938, 0.724029541015625, 0.7534561157226562, 0.7828826904296875, 0.8123092651367188, 0.84173583984375, 0.8711624145507812, 0.9005889892578125, 0.9300155639648438, 0.959442138671875, 0.9888687133789062, 1.0182952880859375, 1.0477218627929688, 1.0771484375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 7.0, 10.0, 13.0, 31.0, 65.0, 144.0, 393.0, 1447.0, 18329.0, 1016425.0, 10015.0, 1084.0, 298.0, 143.0, 78.0, 23.0, 17.0, 10.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.380859375, -1.3265380859375, -1.272216796875, -1.2178955078125, -1.16357421875, -1.1092529296875, -1.054931640625, -1.0006103515625, -0.9462890625, -0.8919677734375, -0.837646484375, -0.7833251953125, -0.72900390625, -0.6746826171875, -0.620361328125, -0.5660400390625, -0.51171875, -0.4573974609375, -0.403076171875, -0.3487548828125, -0.29443359375, -0.2401123046875, -0.185791015625, -0.1314697265625, -0.0771484375, -0.0228271484375, 0.031494140625, 0.0858154296875, 0.14013671875, 0.1944580078125, 0.248779296875, 0.3031005859375, 0.357421875, 0.4117431640625, 0.466064453125, 0.5203857421875, 0.57470703125, 0.6290283203125, 0.683349609375, 0.7376708984375, 0.7919921875, 0.8463134765625, 0.900634765625, 0.9549560546875, 1.00927734375, 1.0635986328125, 1.117919921875, 1.1722412109375, 1.2265625, 1.2808837890625, 1.335205078125, 1.3895263671875, 1.44384765625, 1.4981689453125, 1.552490234375, 1.6068115234375, 1.6611328125, 1.7154541015625, 1.769775390625, 1.8240966796875, 1.87841796875, 1.9327392578125, 1.987060546875, 2.0413818359375, 2.095703125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 14.0, 17.0, 19.0, 27.0, 35.0, 51.0, 41.0, 75.0, 67.0, 76.0, 114.0, 93.0, 68.0, 64.0, 51.0, 42.0, 25.0, 28.0, 15.0, 16.0, 12.0, 11.0, 8.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.08970832824707e-05, -8.780695497989655e-05, -8.471682667732239e-05, -8.162669837474823e-05, -7.853657007217407e-05, -7.544644176959991e-05, -7.235631346702576e-05, -6.92661851644516e-05, -6.617605686187744e-05, -6.308592855930328e-05, -5.9995800256729126e-05, -5.690567195415497e-05, -5.381554365158081e-05, -5.072541534900665e-05, -4.7635287046432495e-05, -4.454515874385834e-05, -4.145503044128418e-05, -3.836490213871002e-05, -3.5274773836135864e-05, -3.2184645533561707e-05, -2.909451723098755e-05, -2.600438892841339e-05, -2.2914260625839233e-05, -1.9824132323265076e-05, -1.6734004020690918e-05, -1.364387571811676e-05, -1.0553747415542603e-05, -7.463619112968445e-06, -4.373490810394287e-06, -1.2833625078201294e-06, 1.8067657947540283e-06, 4.896894097328186e-06, 7.987022399902344e-06, 1.1077150702476501e-05, 1.416727900505066e-05, 1.7257407307624817e-05, 2.0347535610198975e-05, 2.3437663912773132e-05, 2.652779221534729e-05, 2.9617920517921448e-05, 3.2708048820495605e-05, 3.579817712306976e-05, 3.888830542564392e-05, 4.197843372821808e-05, 4.5068562030792236e-05, 4.8158690333366394e-05, 5.124881863594055e-05, 5.433894693851471e-05, 5.742907524108887e-05, 6.0519203543663025e-05, 6.360933184623718e-05, 6.669946014881134e-05, 6.97895884513855e-05, 7.287971675395966e-05, 7.596984505653381e-05, 7.905997335910797e-05, 8.215010166168213e-05, 8.524022996425629e-05, 8.833035826683044e-05, 9.14204865694046e-05, 9.451061487197876e-05, 9.760074317455292e-05, 0.00010069087147712708, 0.00010378099977970123, 0.00010687112808227539]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 9.0, 15.0, 15.0, 33.0, 73.0, 138.0, 305.0, 762.0, 2849.0, 40938.0, 978501.0, 21482.0, 2274.0, 630.0, 246.0, 118.0, 63.0, 31.0, 17.0, 12.0, 3.0, 6.0, 6.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9033203125, -0.8691253662109375, -0.834930419921875, -0.8007354736328125, -0.76654052734375, -0.7323455810546875, -0.698150634765625, -0.6639556884765625, -0.6297607421875, -0.5955657958984375, -0.561370849609375, -0.5271759033203125, -0.49298095703125, -0.4587860107421875, -0.424591064453125, -0.3903961181640625, -0.356201171875, -0.3220062255859375, -0.287811279296875, -0.2536163330078125, -0.21942138671875, -0.1852264404296875, -0.151031494140625, -0.1168365478515625, -0.0826416015625, -0.0484466552734375, -0.014251708984375, 0.0199432373046875, 0.05413818359375, 0.0883331298828125, 0.122528076171875, 0.1567230224609375, 0.19091796875, 0.2251129150390625, 0.259307861328125, 0.2935028076171875, 0.32769775390625, 0.3618927001953125, 0.396087646484375, 0.4302825927734375, 0.4644775390625, 0.4986724853515625, 0.532867431640625, 0.5670623779296875, 0.60125732421875, 0.6354522705078125, 0.669647216796875, 0.7038421630859375, 0.738037109375, 0.7722320556640625, 0.806427001953125, 0.8406219482421875, 0.87481689453125, 0.9090118408203125, 0.943206787109375, 0.9774017333984375, 1.0115966796875, 1.0457916259765625, 1.079986572265625, 1.1141815185546875, 1.14837646484375, 1.1825714111328125, 1.216766357421875, 1.2509613037109375, 1.28515625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 20.0, 21.0, 21.0, 65.0, 111.0, 299.0, 248.0, 86.0, 47.0, 28.0, 22.0, 8.0, 6.0, 6.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.21875, -1.1816558837890625, -1.144561767578125, -1.1074676513671875, -1.07037353515625, -1.0332794189453125, -0.996185302734375, -0.9590911865234375, -0.9219970703125, -0.8849029541015625, -0.847808837890625, -0.8107147216796875, -0.77362060546875, -0.7365264892578125, -0.699432373046875, -0.6623382568359375, -0.625244140625, -0.5881500244140625, -0.551055908203125, -0.5139617919921875, -0.47686767578125, -0.4397735595703125, -0.402679443359375, -0.3655853271484375, -0.3284912109375, -0.2913970947265625, -0.254302978515625, -0.2172088623046875, -0.18011474609375, -0.1430206298828125, -0.105926513671875, -0.0688323974609375, -0.03173828125, 0.0053558349609375, 0.042449951171875, 0.0795440673828125, 0.11663818359375, 0.1537322998046875, 0.190826416015625, 0.2279205322265625, 0.2650146484375, 0.3021087646484375, 0.339202880859375, 0.3762969970703125, 0.41339111328125, 0.4504852294921875, 0.487579345703125, 0.5246734619140625, 0.561767578125, 0.5988616943359375, 0.635955810546875, 0.6730499267578125, 0.71014404296875, 0.7472381591796875, 0.784332275390625, 0.8214263916015625, 0.8585205078125, 0.8956146240234375, 0.932708740234375, 0.9698028564453125, 1.00689697265625, 1.0439910888671875, 1.081085205078125, 1.1181793212890625, 1.1552734375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 34.0, 179.0, 582.0, 188.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.54459762573242, -31.744001388549805, -30.943405151367188, -30.14280891418457, -29.342212677001953, -28.54161834716797, -27.74102210998535, -26.940425872802734, -26.139829635620117, -25.3392333984375, -24.538637161254883, -23.738040924072266, -22.93744659423828, -22.13684844970703, -21.336254119873047, -20.53565788269043, -19.735061645507812, -18.934465408325195, -18.133869171142578, -17.33327293395996, -16.532676696777344, -15.732081413269043, -14.931486129760742, -14.130889892578125, -13.330293655395508, -12.52969741821289, -11.729101181030273, -10.928505897521973, -10.127909660339355, -9.327313423156738, -8.526718139648438, -7.72612190246582, -6.925527572631836, -6.124931335449219, -5.32433557510376, -4.523739814758301, -3.7231435775756836, -2.9225473403930664, -2.1219515800476074, -1.3213558197021484, -0.5207595825195312, 0.27983641624450684, 1.080432415008545, 1.881028413772583, 2.681624412536621, 3.4822206497192383, 4.282816410064697, 5.083412170410156, 5.884008407592773, 6.684604644775391, 7.48520040512085, 8.285796165466309, 9.086392402648926, 9.886988639831543, 10.687583923339844, 11.488180160522461, 12.288776397705078, 13.089372634887695, 13.889968872070312, 14.690564155578613, 15.49116039276123, 16.29175567626953, 17.09235191345215, 17.892948150634766, 18.693544387817383]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0, 5.0, 2.0, 8.0, 6.0, 14.0, 14.0, 16.0, 25.0, 20.0, 31.0, 38.0, 31.0, 45.0, 52.0, 50.0, 56.0, 65.0, 63.0, 52.0, 59.0, 50.0, 47.0, 37.0, 38.0, 23.0, 29.0, 32.0, 19.0, 7.0, 17.0, 12.0, 3.0, 10.0, 6.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.801705360412598, -4.664665222167969, -4.527624607086182, -4.390584468841553, -4.253543853759766, -4.116503715515137, -3.979463577270508, -3.8424232006073, -3.705382823944092, -3.568342447280884, -3.431302070617676, -3.294261932373047, -3.157221555709839, -3.020181179046631, -2.883141040802002, -2.746100664138794, -2.609060287475586, -2.472019910812378, -2.33497953414917, -2.197939395904541, -2.060899019241333, -1.923858642578125, -1.7868183851242065, -1.649778127670288, -1.51273775100708, -1.375697374343872, -1.2386571168899536, -1.1016168594360352, -0.9645764827728271, -0.8275361657142639, -0.6904958486557007, -0.5534555315971375, -0.4164149761199951, -0.2793746590614319, -0.14233434200286865, -0.00529402494430542, 0.1317462921142578, 0.26878660917282104, 0.4058269262313843, 0.5428672432899475, 0.6799075603485107, 0.816947877407074, 0.9539881944656372, 1.0910284519195557, 1.2280688285827637, 1.3651092052459717, 1.5021494626998901, 1.6391897201538086, 1.7762300968170166, 1.9132704734802246, 2.0503106117248535, 2.1873509883880615, 2.3243913650512695, 2.4614317417144775, 2.5984721183776855, 2.7355122566223145, 2.8725526332855225, 3.0095930099487305, 3.1466331481933594, 3.2836735248565674, 3.4207139015197754, 3.5577542781829834, 3.6947946548461914, 3.8318347930908203, 3.9688751697540283]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 9.0, 9.0, 22.0, 34.0, 74.0, 125.0, 283.0, 555.0, 2165.0, 18343.0, 4149482.0, 19641.0, 2367.0, 646.0, 250.0, 111.0, 62.0, 34.0, 14.0, 21.0, 9.0, 9.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.131591796875, -2.07763671875, -2.023681640625, -1.9697265625, -1.915771484375, -1.86181640625, -1.807861328125, -1.75390625, -1.699951171875, -1.64599609375, -1.592041015625, -1.5380859375, -1.484130859375, -1.43017578125, -1.376220703125, -1.322265625, -1.268310546875, -1.21435546875, -1.160400390625, -1.1064453125, -1.052490234375, -0.99853515625, -0.944580078125, -0.890625, -0.836669921875, -0.78271484375, -0.728759765625, -0.6748046875, -0.620849609375, -0.56689453125, -0.512939453125, -0.458984375, -0.405029296875, -0.35107421875, -0.297119140625, -0.2431640625, -0.189208984375, -0.13525390625, -0.081298828125, -0.02734375, 0.026611328125, 0.08056640625, 0.134521484375, 0.1884765625, 0.242431640625, 0.29638671875, 0.350341796875, 0.404296875, 0.458251953125, 0.51220703125, 0.566162109375, 0.6201171875, 0.674072265625, 0.72802734375, 0.781982421875, 0.8359375, 0.889892578125, 0.94384765625, 0.997802734375, 1.0517578125, 1.105712890625, 1.15966796875, 1.213623046875, 1.267578125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 10.0, 5.0, 11.0, 16.0, 17.0, 22.0, 25.0, 29.0, 35.0, 50.0, 52.0, 51.0, 54.0, 61.0, 59.0, 59.0, 58.0, 59.0, 44.0, 57.0, 46.0, 30.0, 37.0, 20.0, 22.0, 14.0, 16.0, 10.0, 10.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1588134765625, -0.15386199951171875, -0.1489105224609375, -0.14395904541015625, -0.139007568359375, -0.13405609130859375, -0.1291046142578125, -0.12415313720703125, -0.11920166015625, -0.11425018310546875, -0.1092987060546875, -0.10434722900390625, -0.099395751953125, -0.09444427490234375, -0.0894927978515625, -0.08454132080078125, -0.07958984375, -0.07463836669921875, -0.0696868896484375, -0.06473541259765625, -0.059783935546875, -0.05483245849609375, -0.0498809814453125, -0.04492950439453125, -0.03997802734375, -0.03502655029296875, -0.0300750732421875, -0.02512359619140625, -0.020172119140625, -0.01522064208984375, -0.0102691650390625, -0.00531768798828125, -0.0003662109375, 0.00458526611328125, 0.0095367431640625, 0.01448822021484375, 0.019439697265625, 0.02439117431640625, 0.0293426513671875, 0.03429412841796875, 0.03924560546875, 0.04419708251953125, 0.0491485595703125, 0.05410003662109375, 0.059051513671875, 0.06400299072265625, 0.0689544677734375, 0.07390594482421875, 0.078857421875, 0.08380889892578125, 0.0887603759765625, 0.09371185302734375, 0.098663330078125, 0.10361480712890625, 0.1085662841796875, 0.11351776123046875, 0.11846923828125, 0.12342071533203125, 0.1283721923828125, 0.13332366943359375, 0.138275146484375, 0.14322662353515625, 0.1481781005859375, 0.15312957763671875, 0.1580810546875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 9.0, 8.0, 9.0, 6.0, 23.0, 20.0, 34.0, 61.0, 70.0, 115.0, 206.0, 351.0, 644.0, 1355.0, 3387.0, 13231.0, 3602592.0, 554068.0, 12094.0, 3139.0, 1295.0, 622.0, 362.0, 211.0, 125.0, 74.0, 49.0, 41.0, 21.0, 19.0, 12.0, 7.0, 11.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.7158203125, -1.6706390380859375, -1.625457763671875, -1.5802764892578125, -1.53509521484375, -1.4899139404296875, -1.444732666015625, -1.3995513916015625, -1.3543701171875, -1.3091888427734375, -1.264007568359375, -1.2188262939453125, -1.17364501953125, -1.1284637451171875, -1.083282470703125, -1.0381011962890625, -0.992919921875, -0.9477386474609375, -0.902557373046875, -0.8573760986328125, -0.81219482421875, -0.7670135498046875, -0.721832275390625, -0.6766510009765625, -0.6314697265625, -0.5862884521484375, -0.541107177734375, -0.4959259033203125, -0.45074462890625, -0.4055633544921875, -0.360382080078125, -0.3152008056640625, -0.27001953125, -0.2248382568359375, -0.179656982421875, -0.1344757080078125, -0.08929443359375, -0.0441131591796875, 0.001068115234375, 0.0462493896484375, 0.0914306640625, 0.1366119384765625, 0.181793212890625, 0.2269744873046875, 0.27215576171875, 0.3173370361328125, 0.362518310546875, 0.4076995849609375, 0.452880859375, 0.4980621337890625, 0.543243408203125, 0.5884246826171875, 0.63360595703125, 0.6787872314453125, 0.723968505859375, 0.7691497802734375, 0.8143310546875, 0.8595123291015625, 0.904693603515625, 0.9498748779296875, 0.99505615234375, 1.0402374267578125, 1.085418701171875, 1.1305999755859375, 1.17578125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 7.0, 4.0, 4.0, 7.0, 12.0, 26.0, 36.0, 92.0, 450.0, 3201.0, 140.0, 46.0, 21.0, 9.0, 7.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33203125, -0.3241539001464844, -0.31627655029296875, -0.3083992004394531, -0.3005218505859375, -0.2926445007324219, -0.28476715087890625, -0.2768898010253906, -0.269012451171875, -0.2611351013183594, -0.25325775146484375, -0.24538040161132812, -0.2375030517578125, -0.22962570190429688, -0.22174835205078125, -0.21387100219726562, -0.20599365234375, -0.19811630249023438, -0.19023895263671875, -0.18236160278320312, -0.1744842529296875, -0.16660690307617188, -0.15872955322265625, -0.15085220336914062, -0.142974853515625, -0.13509750366210938, -0.12722015380859375, -0.11934280395507812, -0.1114654541015625, -0.10358810424804688, -0.09571075439453125, -0.08783340454101562, -0.0799560546875, -0.07207870483398438, -0.06420135498046875, -0.056324005126953125, -0.0484466552734375, -0.040569305419921875, -0.03269195556640625, -0.024814605712890625, -0.016937255859375, -0.009059906005859375, -0.00118255615234375, 0.006694793701171875, 0.0145721435546875, 0.022449493408203125, 0.03032684326171875, 0.038204193115234375, 0.04608154296875, 0.053958892822265625, 0.06183624267578125, 0.06971359252929688, 0.0775909423828125, 0.08546829223632812, 0.09334564208984375, 0.10122299194335938, 0.109100341796875, 0.11697769165039062, 0.12485504150390625, 0.13273239135742188, 0.1406097412109375, 0.14848709106445312, 0.15636444091796875, 0.16424179077148438, 0.172119140625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 8.0, 16.0, 24.0, 52.0, 95.0, 143.0, 205.0, 184.0, 135.0, 69.0, 38.0, 17.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3066192865371704, -1.2592202425003052, -1.2118213176727295, -1.1644222736358643, -1.117023229598999, -1.0696241855621338, -1.022225260734558, -0.9748262166976929, -0.9274272322654724, -0.880028247833252, -0.8326292037963867, -0.7852302193641663, -0.7378312349319458, -0.6904321908950806, -0.6430332064628601, -0.5956342220306396, -0.5482351779937744, -0.500836193561554, -0.4534371495246887, -0.40603816509246826, -0.3586391508579254, -0.31124013662338257, -0.2638411521911621, -0.21644213795661926, -0.16904312372207642, -0.12164411693811417, -0.07424511015415192, -0.026846110820770264, 0.020552903413772583, 0.06795191764831543, 0.11535090208053589, 0.16274991631507874, 0.21014904975891113, 0.257548063993454, 0.3049470782279968, 0.3523460626602173, 0.39974507689476013, 0.447144091129303, 0.49454307556152344, 0.5419421195983887, 0.5893411040306091, 0.6367400884628296, 0.6841391324996948, 0.7315381169319153, 0.7789371013641357, 0.826336145401001, 0.8737351298332214, 0.9211341142654419, 0.9685331583023071, 1.0159322023391724, 1.063331127166748, 1.1107301712036133, 1.1581292152404785, 1.2055282592773438, 1.2529271841049194, 1.3003262281417847, 1.3477251529693604, 1.3951241970062256, 1.4425231218338013, 1.4899221658706665, 1.5373212099075317, 1.5847201347351074, 1.6321191787719727, 1.679518222808838, 1.7269172668457031]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 12.0, 13.0, 13.0, 7.0, 10.0, 15.0, 23.0, 24.0, 25.0, 29.0, 31.0, 35.0, 31.0, 24.0, 43.0, 40.0, 40.0, 39.0, 49.0, 46.0, 44.0, 39.0, 38.0, 28.0, 45.0, 26.0, 35.0, 26.0, 25.0, 25.0, 27.0, 13.0, 20.0, 14.0, 14.0, 7.0, 9.0, 7.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6180504560470581, -0.5989565849304199, -0.5798627138137817, -0.5607688426971436, -0.5416749715805054, -0.5225811004638672, -0.503487229347229, -0.48439332842826843, -0.46529945731163025, -0.44620558619499207, -0.4271117150783539, -0.4080178439617157, -0.3889239430427551, -0.36983007192611694, -0.35073620080947876, -0.3316423296928406, -0.3125484585762024, -0.2934545874595642, -0.274360716342926, -0.25526684522628784, -0.23617295920848846, -0.21707908809185028, -0.1979852020740509, -0.17889133095741272, -0.15979745984077454, -0.14070358872413635, -0.12160971015691757, -0.10251583158969879, -0.08342196047306061, -0.06432808935642242, -0.045234210789203644, -0.026140332221984863, -0.007046401500701904, 0.012047473341226578, 0.03114134818315506, 0.05023522302508354, 0.06932909786701202, 0.08842296898365021, 0.10751684755086899, 0.12661072611808777, 0.14570459723472595, 0.16479846835136414, 0.18389233946800232, 0.2029862254858017, 0.22208009660243988, 0.24117396771907806, 0.26026785373687744, 0.2793617248535156, 0.2984555959701538, 0.317549467086792, 0.3366433382034302, 0.35573720932006836, 0.37483108043670654, 0.3939249515533447, 0.4130188524723053, 0.4321127235889435, 0.45120659470558167, 0.47030046582221985, 0.48939433693885803, 0.5084882378578186, 0.5275821089744568, 0.546675980091095, 0.5657698512077332, 0.5848637223243713, 0.6039575934410095]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 18.0, 13.0, 19.0, 41.0, 56.0, 80.0, 161.0, 360.0, 629.0, 1598.0, 5181.0, 27970.0, 337749.0, 614470.0, 48735.0, 7682.0, 2183.0, 779.0, 385.0, 171.0, 115.0, 54.0, 43.0, 13.0, 16.0, 6.0, 8.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8076171875, -0.7852630615234375, -0.762908935546875, -0.7405548095703125, -0.71820068359375, -0.6958465576171875, -0.673492431640625, -0.6511383056640625, -0.6287841796875, -0.6064300537109375, -0.584075927734375, -0.5617218017578125, -0.53936767578125, -0.5170135498046875, -0.494659423828125, -0.4723052978515625, -0.449951171875, -0.4275970458984375, -0.405242919921875, -0.3828887939453125, -0.36053466796875, -0.3381805419921875, -0.315826416015625, -0.2934722900390625, -0.2711181640625, -0.2487640380859375, -0.226409912109375, -0.2040557861328125, -0.18170166015625, -0.1593475341796875, -0.136993408203125, -0.1146392822265625, -0.09228515625, -0.0699310302734375, -0.047576904296875, -0.0252227783203125, -0.00286865234375, 0.0194854736328125, 0.041839599609375, 0.0641937255859375, 0.0865478515625, 0.1089019775390625, 0.131256103515625, 0.1536102294921875, 0.17596435546875, 0.1983184814453125, 0.220672607421875, 0.2430267333984375, 0.265380859375, 0.2877349853515625, 0.310089111328125, 0.3324432373046875, 0.35479736328125, 0.3771514892578125, 0.399505615234375, 0.4218597412109375, 0.4442138671875, 0.4665679931640625, 0.488922119140625, 0.5112762451171875, 0.53363037109375, 0.5559844970703125, 0.578338623046875, 0.6006927490234375, 0.623046875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 8.0, 7.0, 11.0, 16.0, 22.0, 22.0, 20.0, 33.0, 41.0, 39.0, 62.0, 48.0, 58.0, 58.0, 62.0, 57.0, 57.0, 52.0, 45.0, 45.0, 46.0, 36.0, 31.0, 27.0, 17.0, 17.0, 12.0, 11.0, 4.0, 9.0, 5.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169921875, -0.16457176208496094, -0.15922164916992188, -0.1538715362548828, -0.14852142333984375, -0.1431713104248047, -0.13782119750976562, -0.13247108459472656, -0.1271209716796875, -0.12177085876464844, -0.11642074584960938, -0.11107063293457031, -0.10572052001953125, -0.10037040710449219, -0.09502029418945312, -0.08967018127441406, -0.084320068359375, -0.07896995544433594, -0.07361984252929688, -0.06826972961425781, -0.06291961669921875, -0.05756950378417969, -0.052219390869140625, -0.04686927795410156, -0.0415191650390625, -0.03616905212402344, -0.030818939208984375, -0.025468826293945312, -0.02011871337890625, -0.014768600463867188, -0.009418487548828125, -0.0040683746337890625, 0.00128173828125, 0.0066318511962890625, 0.011981964111328125, 0.017332077026367188, 0.02268218994140625, 0.028032302856445312, 0.033382415771484375, 0.03873252868652344, 0.0440826416015625, 0.04943275451660156, 0.054782867431640625, 0.06013298034667969, 0.06548309326171875, 0.07083320617675781, 0.07618331909179688, 0.08153343200683594, 0.086883544921875, 0.09223365783691406, 0.09758377075195312, 0.10293388366699219, 0.10828399658203125, 0.11363410949707031, 0.11898422241210938, 0.12433433532714844, 0.1296844482421875, 0.13503456115722656, 0.14038467407226562, 0.1457347869873047, 0.15108489990234375, 0.1564350128173828, 0.16178512573242188, 0.16713523864746094, 0.1724853515625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 6.0, 9.0, 9.0, 23.0, 32.0, 30.0, 67.0, 86.0, 150.0, 283.0, 695.0, 2126.0, 10374.0, 305979.0, 707410.0, 16910.0, 2726.0, 857.0, 332.0, 174.0, 105.0, 58.0, 37.0, 16.0, 17.0, 7.0, 8.0, 10.0, 6.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.416015625, -1.3831634521484375, -1.350311279296875, -1.3174591064453125, -1.28460693359375, -1.2517547607421875, -1.218902587890625, -1.1860504150390625, -1.1531982421875, -1.1203460693359375, -1.087493896484375, -1.0546417236328125, -1.02178955078125, -0.9889373779296875, -0.956085205078125, -0.9232330322265625, -0.890380859375, -0.8575286865234375, -0.824676513671875, -0.7918243408203125, -0.75897216796875, -0.7261199951171875, -0.693267822265625, -0.6604156494140625, -0.6275634765625, -0.5947113037109375, -0.561859130859375, -0.5290069580078125, -0.49615478515625, -0.4633026123046875, -0.430450439453125, -0.3975982666015625, -0.36474609375, -0.3318939208984375, -0.299041748046875, -0.2661895751953125, -0.23333740234375, -0.2004852294921875, -0.167633056640625, -0.1347808837890625, -0.1019287109375, -0.0690765380859375, -0.036224365234375, -0.0033721923828125, 0.02947998046875, 0.0623321533203125, 0.095184326171875, 0.1280364990234375, 0.160888671875, 0.1937408447265625, 0.226593017578125, 0.2594451904296875, 0.29229736328125, 0.3251495361328125, 0.358001708984375, 0.3908538818359375, 0.4237060546875, 0.4565582275390625, 0.489410400390625, 0.5222625732421875, 0.55511474609375, 0.5879669189453125, 0.620819091796875, 0.6536712646484375, 0.6865234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 17.0, 13.0, 13.0, 30.0, 29.0, 27.0, 35.0, 58.0, 57.0, 68.0, 65.0, 66.0, 77.0, 65.0, 62.0, 44.0, 40.0, 51.0, 36.0, 27.0, 30.0, 20.0, 23.0, 13.0, 7.0, 8.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94384765625, -0.9093399047851562, -0.8748321533203125, -0.8403244018554688, -0.805816650390625, -0.7713088989257812, -0.7368011474609375, -0.7022933959960938, -0.66778564453125, -0.6332778930664062, -0.5987701416015625, -0.5642623901367188, -0.529754638671875, -0.49524688720703125, -0.4607391357421875, -0.42623138427734375, -0.3917236328125, -0.35721588134765625, -0.3227081298828125, -0.28820037841796875, -0.253692626953125, -0.21918487548828125, -0.1846771240234375, -0.15016937255859375, -0.11566162109375, -0.08115386962890625, -0.0466461181640625, -0.01213836669921875, 0.022369384765625, 0.05687713623046875, 0.0913848876953125, 0.12589263916015625, 0.160400390625, 0.19490814208984375, 0.2294158935546875, 0.26392364501953125, 0.298431396484375, 0.33293914794921875, 0.3674468994140625, 0.40195465087890625, 0.43646240234375, 0.47097015380859375, 0.5054779052734375, 0.5399856567382812, 0.574493408203125, 0.6090011596679688, 0.6435089111328125, 0.6780166625976562, 0.7125244140625, 0.7470321655273438, 0.7815399169921875, 0.8160476684570312, 0.850555419921875, 0.8850631713867188, 0.9195709228515625, 0.9540786743164062, 0.98858642578125, 1.0230941772460938, 1.0576019287109375, 1.0921096801757812, 1.126617431640625, 1.1611251831054688, 1.1956329345703125, 1.2301406860351562, 1.2646484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 10.0, 16.0, 28.0, 100.0, 223.0, 785.0, 5090.0, 918788.0, 120327.0, 2382.0, 503.0, 152.0, 73.0, 35.0, 11.0, 15.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.08203125, -1.041717529296875, -1.00140380859375, -0.961090087890625, -0.9207763671875, -0.880462646484375, -0.84014892578125, -0.799835205078125, -0.759521484375, -0.719207763671875, -0.67889404296875, -0.638580322265625, -0.5982666015625, -0.557952880859375, -0.51763916015625, -0.477325439453125, -0.43701171875, -0.396697998046875, -0.35638427734375, -0.316070556640625, -0.2757568359375, -0.235443115234375, -0.19512939453125, -0.154815673828125, -0.114501953125, -0.074188232421875, -0.03387451171875, 0.006439208984375, 0.0467529296875, 0.087066650390625, 0.12738037109375, 0.167694091796875, 0.2080078125, 0.248321533203125, 0.28863525390625, 0.328948974609375, 0.3692626953125, 0.409576416015625, 0.44989013671875, 0.490203857421875, 0.530517578125, 0.570831298828125, 0.61114501953125, 0.651458740234375, 0.6917724609375, 0.732086181640625, 0.77239990234375, 0.812713623046875, 0.85302734375, 0.893341064453125, 0.93365478515625, 0.973968505859375, 1.0142822265625, 1.054595947265625, 1.09490966796875, 1.135223388671875, 1.175537109375, 1.215850830078125, 1.25616455078125, 1.296478271484375, 1.3367919921875, 1.377105712890625, 1.41741943359375, 1.457733154296875, 1.498046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 10.0, 15.0, 15.0, 19.0, 30.0, 30.0, 45.0, 63.0, 81.0, 111.0, 119.0, 104.0, 75.0, 81.0, 53.0, 38.0, 32.0, 24.0, 14.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00012874603271484375, -0.00012563727796077728, -0.00012252852320671082, -0.00011941976845264435, -0.00011631101369857788, -0.00011320225894451141, -0.00011009350419044495, -0.00010698474943637848, -0.00010387599468231201, -0.00010076723992824554, -9.765848517417908e-05, -9.454973042011261e-05, -9.144097566604614e-05, -8.833222091197968e-05, -8.522346615791321e-05, -8.211471140384674e-05, -7.900595664978027e-05, -7.58972018957138e-05, -7.278844714164734e-05, -6.967969238758087e-05, -6.65709376335144e-05, -6.346218287944794e-05, -6.035342812538147e-05, -5.7244673371315e-05, -5.4135918617248535e-05, -5.102716386318207e-05, -4.79184091091156e-05, -4.480965435504913e-05, -4.1700899600982666e-05, -3.85921448469162e-05, -3.548339009284973e-05, -3.2374635338783264e-05, -2.9265880584716797e-05, -2.615712583065033e-05, -2.3048371076583862e-05, -1.9939616322517395e-05, -1.6830861568450928e-05, -1.372210681438446e-05, -1.0613352060317993e-05, -7.504597306251526e-06, -4.395842552185059e-06, -1.2870877981185913e-06, 1.821666955947876e-06, 4.930421710014343e-06, 8.03917646408081e-06, 1.1147931218147278e-05, 1.4256685972213745e-05, 1.7365440726280212e-05, 2.047419548034668e-05, 2.3582950234413147e-05, 2.6691704988479614e-05, 2.980045974254608e-05, 3.290921449661255e-05, 3.6017969250679016e-05, 3.9126724004745483e-05, 4.223547875881195e-05, 4.534423351287842e-05, 4.8452988266944885e-05, 5.156174302101135e-05, 5.467049777507782e-05, 5.777925252914429e-05, 6.0888007283210754e-05, 6.399676203727722e-05, 6.710551679134369e-05, 7.021427154541016e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 10.0, 4.0, 4.0, 13.0, 22.0, 47.0, 95.0, 174.0, 470.0, 1713.0, 14816.0, 907970.0, 117352.0, 4384.0, 877.0, 331.0, 116.0, 78.0, 38.0, 21.0, 9.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1337890625, -1.1059722900390625, -1.078155517578125, -1.0503387451171875, -1.02252197265625, -0.9947052001953125, -0.966888427734375, -0.9390716552734375, -0.9112548828125, -0.8834381103515625, -0.855621337890625, -0.8278045654296875, -0.79998779296875, -0.7721710205078125, -0.744354248046875, -0.7165374755859375, -0.688720703125, -0.6609039306640625, -0.633087158203125, -0.6052703857421875, -0.57745361328125, -0.5496368408203125, -0.521820068359375, -0.4940032958984375, -0.4661865234375, -0.4383697509765625, -0.410552978515625, -0.3827362060546875, -0.35491943359375, -0.3271026611328125, -0.299285888671875, -0.2714691162109375, -0.24365234375, -0.2158355712890625, -0.188018798828125, -0.1602020263671875, -0.13238525390625, -0.1045684814453125, -0.076751708984375, -0.0489349365234375, -0.0211181640625, 0.0066986083984375, 0.034515380859375, 0.0623321533203125, 0.09014892578125, 0.1179656982421875, 0.145782470703125, 0.1735992431640625, 0.201416015625, 0.2292327880859375, 0.257049560546875, 0.2848663330078125, 0.31268310546875, 0.3404998779296875, 0.368316650390625, 0.3961334228515625, 0.4239501953125, 0.4517669677734375, 0.479583740234375, 0.5074005126953125, 0.53521728515625, 0.5630340576171875, 0.590850830078125, 0.6186676025390625, 0.646484375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 5.0, 8.0, 19.0, 29.0, 28.0, 48.0, 90.0, 132.0, 156.0, 169.0, 102.0, 71.0, 41.0, 44.0, 21.0, 16.0, 8.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7177734375, -0.6992645263671875, -0.680755615234375, -0.6622467041015625, -0.64373779296875, -0.6252288818359375, -0.606719970703125, -0.5882110595703125, -0.5697021484375, -0.5511932373046875, -0.532684326171875, -0.5141754150390625, -0.49566650390625, -0.4771575927734375, -0.458648681640625, -0.4401397705078125, -0.421630859375, -0.4031219482421875, -0.384613037109375, -0.3661041259765625, -0.34759521484375, -0.3290863037109375, -0.310577392578125, -0.2920684814453125, -0.2735595703125, -0.2550506591796875, -0.236541748046875, -0.2180328369140625, -0.19952392578125, -0.1810150146484375, -0.162506103515625, -0.1439971923828125, -0.12548828125, -0.1069793701171875, -0.088470458984375, -0.0699615478515625, -0.05145263671875, -0.0329437255859375, -0.014434814453125, 0.0040740966796875, 0.0225830078125, 0.0410919189453125, 0.059600830078125, 0.0781097412109375, 0.09661865234375, 0.1151275634765625, 0.133636474609375, 0.1521453857421875, 0.170654296875, 0.1891632080078125, 0.207672119140625, 0.2261810302734375, 0.24468994140625, 0.2631988525390625, 0.281707763671875, 0.3002166748046875, 0.3187255859375, 0.3372344970703125, 0.355743408203125, 0.3742523193359375, 0.39276123046875, 0.4112701416015625, 0.429779052734375, 0.4482879638671875, 0.466796875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 9.0, 11.0, 63.0, 296.0, 433.0, 162.0, 26.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.198760986328125, -26.678014755249023, -26.157270431518555, -25.636524200439453, -25.115779876708984, -24.595033645629883, -24.07428741455078, -23.553543090820312, -23.03279685974121, -22.51205062866211, -21.99130630493164, -21.47056007385254, -20.94981575012207, -20.42906951904297, -19.9083251953125, -19.3875789642334, -18.866832733154297, -18.346086502075195, -17.825342178344727, -17.304595947265625, -16.783851623535156, -16.263105392456055, -15.74236011505127, -15.221614837646484, -14.700870513916016, -14.18012523651123, -13.659379959106445, -13.138633728027344, -12.617888450622559, -12.097143173217773, -11.576397895812988, -11.055652618408203, -10.534905433654785, -10.01416015625, -9.493414878845215, -8.97266960144043, -8.451923370361328, -7.931178092956543, -7.410432815551758, -6.889687538146973, -6.368941783905029, -5.848196506500244, -5.327450752258301, -4.806705474853516, -4.2859601974487305, -3.765214443206787, -3.244469165802002, -2.7237236499786377, -2.2029781341552734, -1.6822326183319092, -1.1614872217178345, -0.6407418251037598, -0.11999630928039551, 0.40074920654296875, 0.9214944839477539, 1.4422399997711182, 1.9629855155944824, 2.4837310314178467, 3.004476547241211, 3.525221824645996, 4.045967102050781, 4.566712856292725, 5.08745813369751, 5.608203887939453, 6.128949165344238]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 2.0, 12.0, 6.0, 10.0, 2.0, 13.0, 11.0, 14.0, 17.0, 17.0, 17.0, 27.0, 35.0, 27.0, 31.0, 24.0, 50.0, 32.0, 42.0, 49.0, 40.0, 46.0, 55.0, 37.0, 39.0, 54.0, 41.0, 30.0, 28.0, 28.0, 32.0, 20.0, 21.0, 17.0, 12.0, 17.0, 8.0, 9.0, 5.0, 6.0, 3.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.625253915786743, -3.512847900390625, -3.400442123413086, -3.288036346435547, -3.1756303310394287, -3.0632243156433105, -2.9508185386657715, -2.8384127616882324, -2.7260067462921143, -2.613600730895996, -2.501194953918457, -2.388789176940918, -2.2763831615448, -2.1639771461486816, -2.0515713691711426, -1.939165472984314, -1.8267595767974854, -1.7143536806106567, -1.6019477844238281, -1.4895418882369995, -1.377135992050171, -1.2647300958633423, -1.1523241996765137, -1.039918303489685, -0.9275124073028564, -0.8151065111160278, -0.7027006149291992, -0.5902947187423706, -0.477888822555542, -0.3654829263687134, -0.25307703018188477, -0.14067113399505615, -0.02826523780822754, 0.08414065837860107, 0.1965465545654297, 0.3089524507522583, 0.4213583469390869, 0.5337642431259155, 0.6461701393127441, 0.7585760354995728, 0.8709819316864014, 0.98338782787323, 1.0957937240600586, 1.2081996202468872, 1.3206055164337158, 1.4330114126205444, 1.545417308807373, 1.6578232049942017, 1.7702291011810303, 1.8826349973678589, 1.9950408935546875, 2.1074466705322266, 2.2198526859283447, 2.332258701324463, 2.444664478302002, 2.557070255279541, 2.669476270675659, 2.7818822860717773, 2.8942880630493164, 3.0066938400268555, 3.1190998554229736, 3.231505870819092, 3.343911647796631, 3.45631742477417, 3.568723440170288]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 5.0, 2.0, 11.0, 4.0, 8.0, 15.0, 18.0, 34.0, 45.0, 77.0, 106.0, 193.0, 324.0, 561.0, 1241.0, 3367.0, 15033.0, 318368.0, 3823686.0, 23414.0, 4701.0, 1561.0, 662.0, 323.0, 186.0, 117.0, 78.0, 49.0, 33.0, 22.0, 16.0, 13.0, 2.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.1328125, -1.105255126953125, -1.07769775390625, -1.050140380859375, -1.0225830078125, -0.995025634765625, -0.96746826171875, -0.939910888671875, -0.912353515625, -0.884796142578125, -0.85723876953125, -0.829681396484375, -0.8021240234375, -0.774566650390625, -0.74700927734375, -0.719451904296875, -0.69189453125, -0.664337158203125, -0.63677978515625, -0.609222412109375, -0.5816650390625, -0.554107666015625, -0.52655029296875, -0.498992919921875, -0.471435546875, -0.443878173828125, -0.41632080078125, -0.388763427734375, -0.3612060546875, -0.333648681640625, -0.30609130859375, -0.278533935546875, -0.2509765625, -0.223419189453125, -0.19586181640625, -0.168304443359375, -0.1407470703125, -0.113189697265625, -0.08563232421875, -0.058074951171875, -0.030517578125, -0.002960205078125, 0.02459716796875, 0.052154541015625, 0.0797119140625, 0.107269287109375, 0.13482666015625, 0.162384033203125, 0.18994140625, 0.217498779296875, 0.24505615234375, 0.272613525390625, 0.3001708984375, 0.327728271484375, 0.35528564453125, 0.382843017578125, 0.410400390625, 0.437957763671875, 0.46551513671875, 0.493072509765625, 0.5206298828125, 0.548187255859375, 0.57574462890625, 0.603302001953125, 0.630859375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 4.0, 3.0, 8.0, 8.0, 12.0, 9.0, 19.0, 14.0, 35.0, 24.0, 31.0, 46.0, 62.0, 35.0, 56.0, 61.0, 66.0, 76.0, 64.0, 78.0, 40.0, 35.0, 50.0, 37.0, 29.0, 30.0, 18.0, 12.0, 9.0, 5.0, 4.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.20751953125, -0.2017230987548828, -0.19592666625976562, -0.19013023376464844, -0.18433380126953125, -0.17853736877441406, -0.17274093627929688, -0.1669445037841797, -0.1611480712890625, -0.1553516387939453, -0.14955520629882812, -0.14375877380371094, -0.13796234130859375, -0.13216590881347656, -0.12636947631835938, -0.12057304382324219, -0.114776611328125, -0.10898017883300781, -0.10318374633789062, -0.09738731384277344, -0.09159088134765625, -0.08579444885253906, -0.07999801635742188, -0.07420158386230469, -0.0684051513671875, -0.06260871887207031, -0.056812286376953125, -0.05101585388183594, -0.04521942138671875, -0.03942298889160156, -0.033626556396484375, -0.027830123901367188, -0.02203369140625, -0.016237258911132812, -0.010440826416015625, -0.0046443939208984375, 0.00115203857421875, 0.0069484710693359375, 0.012744903564453125, 0.018541336059570312, 0.0243377685546875, 0.030134201049804688, 0.035930633544921875, 0.04172706604003906, 0.04752349853515625, 0.05331993103027344, 0.059116363525390625, 0.06491279602050781, 0.070709228515625, 0.07650566101074219, 0.08230209350585938, 0.08809852600097656, 0.09389495849609375, 0.09969139099121094, 0.10548782348632812, 0.11128425598144531, 0.1170806884765625, 0.12287712097167969, 0.12867355346679688, 0.13446998596191406, 0.14026641845703125, 0.14606285095214844, 0.15185928344726562, 0.1576557159423828, 0.1634521484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 10.0, 18.0, 8.0, 15.0, 34.0, 41.0, 79.0, 114.0, 250.0, 657.0, 2326.0, 10367.0, 173912.0, 3974481.0, 25913.0, 4043.0, 1109.0, 422.0, 171.0, 94.0, 59.0, 45.0, 36.0, 15.0, 13.0, 11.0, 11.0, 2.0, 9.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.634765625, -1.589630126953125, -1.54449462890625, -1.499359130859375, -1.4542236328125, -1.409088134765625, -1.36395263671875, -1.318817138671875, -1.273681640625, -1.228546142578125, -1.18341064453125, -1.138275146484375, -1.0931396484375, -1.048004150390625, -1.00286865234375, -0.957733154296875, -0.91259765625, -0.867462158203125, -0.82232666015625, -0.777191162109375, -0.7320556640625, -0.686920166015625, -0.64178466796875, -0.596649169921875, -0.551513671875, -0.506378173828125, -0.46124267578125, -0.416107177734375, -0.3709716796875, -0.325836181640625, -0.28070068359375, -0.235565185546875, -0.1904296875, -0.145294189453125, -0.10015869140625, -0.055023193359375, -0.0098876953125, 0.035247802734375, 0.08038330078125, 0.125518798828125, 0.170654296875, 0.215789794921875, 0.26092529296875, 0.306060791015625, 0.3511962890625, 0.396331787109375, 0.44146728515625, 0.486602783203125, 0.53173828125, 0.576873779296875, 0.62200927734375, 0.667144775390625, 0.7122802734375, 0.757415771484375, 0.80255126953125, 0.847686767578125, 0.892822265625, 0.937957763671875, 0.98309326171875, 1.028228759765625, 1.0733642578125, 1.118499755859375, 1.16363525390625, 1.208770751953125, 1.25390625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 7.0, 8.0, 25.0, 34.0, 46.0, 115.0, 353.0, 2960.0, 282.0, 93.0, 61.0, 30.0, 14.0, 17.0, 7.0, 2.0, 5.0, 4.0, 1.0, 3.0, 3.0, 3.0], "bins": [-0.638671875, -0.6257495880126953, -0.6128273010253906, -0.5999050140380859, -0.5869827270507812, -0.5740604400634766, -0.5611381530761719, -0.5482158660888672, -0.5352935791015625, -0.5223712921142578, -0.5094490051269531, -0.49652671813964844, -0.48360443115234375, -0.47068214416503906, -0.4577598571777344, -0.4448375701904297, -0.431915283203125, -0.4189929962158203, -0.4060707092285156, -0.39314842224121094, -0.38022613525390625, -0.36730384826660156, -0.3543815612792969, -0.3414592742919922, -0.3285369873046875, -0.3156147003173828, -0.3026924133300781, -0.28977012634277344, -0.27684783935546875, -0.26392555236816406, -0.2510032653808594, -0.2380809783935547, -0.22515869140625, -0.2122364044189453, -0.19931411743164062, -0.18639183044433594, -0.17346954345703125, -0.16054725646972656, -0.14762496948242188, -0.1347026824951172, -0.1217803955078125, -0.10885810852050781, -0.09593582153320312, -0.08301353454589844, -0.07009124755859375, -0.05716896057128906, -0.044246673583984375, -0.03132438659667969, -0.018402099609375, -0.0054798126220703125, 0.007442474365234375, 0.020364761352539062, 0.03328704833984375, 0.04620933532714844, 0.059131622314453125, 0.07205390930175781, 0.0849761962890625, 0.09789848327636719, 0.11082077026367188, 0.12374305725097656, 0.13666534423828125, 0.14958763122558594, 0.16250991821289062, 0.1754322052001953, 0.1883544921875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 6.0, 7.0, 13.0, 12.0, 16.0, 37.0, 45.0, 85.0, 147.0, 169.0, 155.0, 128.0, 76.0, 46.0, 26.0, 15.0, 10.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.813605785369873, -1.7510530948638916, -1.6885004043579102, -1.6259477138519287, -1.5633951425552368, -1.5008424520492554, -1.438289761543274, -1.3757370710372925, -1.3131844997406006, -1.2506318092346191, -1.1880791187286377, -1.1255264282226562, -1.0629738569259644, -1.000421166419983, -0.9378684759140015, -0.87531578540802, -0.8127630949020386, -0.7502104043960571, -0.6876577734947205, -0.625105082988739, -0.5625524520874023, -0.4999997615814209, -0.43744707107543945, -0.3748944103717804, -0.31234174966812134, -0.24978908896446228, -0.18723641335964203, -0.12468373775482178, -0.06213107705116272, 0.0004215836524963379, 0.06297427415847778, 0.12552693486213684, 0.1880795955657959, 0.25063225626945496, 0.313184916973114, 0.37573760747909546, 0.4382902681827545, 0.5008429288864136, 0.563395619392395, 0.6259483098983765, 0.6885009407997131, 0.7510536313056946, 0.8136062622070312, 0.8761589527130127, 0.9387116432189941, 1.0012643337249756, 1.063817024230957, 1.126369595527649, 1.1889222860336304, 1.2514749765396118, 1.3140276670455933, 1.3765802383422852, 1.4391329288482666, 1.501685619354248, 1.5642383098602295, 1.626791000366211, 1.6893436908721924, 1.7518963813781738, 1.8144490718841553, 1.8770017623901367, 1.9395543336868286, 2.0021071434020996, 2.064659595489502, 2.1272122859954834, 2.189764976501465]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 5.0, 2.0, 11.0, 5.0, 8.0, 13.0, 17.0, 17.0, 17.0, 30.0, 24.0, 28.0, 37.0, 45.0, 48.0, 49.0, 69.0, 62.0, 52.0, 57.0, 54.0, 46.0, 57.0, 34.0, 38.0, 34.0, 26.0, 25.0, 21.0, 22.0, 11.0, 12.0, 8.0, 8.0, 2.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9570510983467102, -0.918036162853241, -0.8790212273597717, -0.8400062918663025, -0.8009912967681885, -0.7619763612747192, -0.72296142578125, -0.6839464902877808, -0.6449315547943115, -0.6059166193008423, -0.566901683807373, -0.5278867483139038, -0.4888717830181122, -0.44985684752464294, -0.4108418822288513, -0.3718269467353821, -0.33281201124191284, -0.2937970757484436, -0.25478214025497437, -0.21576717495918274, -0.1767522394657135, -0.13773730397224426, -0.09872235357761383, -0.0597074031829834, -0.02069246768951416, 0.018322475254535675, 0.05733741819858551, 0.09635236114263535, 0.13536730408668518, 0.17438223958015442, 0.21339718997478485, 0.2524121403694153, 0.2914271354675293, 0.33044207096099854, 0.3694570064544678, 0.4084719717502594, 0.44748690724372864, 0.4865018427371979, 0.5255168080329895, 0.5645317435264587, 0.603546679019928, 0.6425616145133972, 0.6815765500068665, 0.7205914855003357, 0.7596064805984497, 0.798621416091919, 0.8376363515853882, 0.8766512870788574, 0.9156662225723267, 0.9546811580657959, 0.9936960935592651, 1.0327110290527344, 1.0717259645462036, 1.1107409000396729, 1.149755835533142, 1.1887707710266113, 1.2277858257293701, 1.2668007612228394, 1.3058156967163086, 1.3448306322097778, 1.383845567703247, 1.4228605031967163, 1.4618754386901855, 1.5008904933929443, 1.539905309677124]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 9.0, 7.0, 13.0, 20.0, 33.0, 78.0, 109.0, 276.0, 518.0, 1302.0, 3795.0, 14472.0, 75954.0, 488421.0, 388131.0, 58453.0, 11688.0, 3278.0, 1041.0, 470.0, 224.0, 118.0, 53.0, 35.0, 14.0, 17.0, 6.0, 8.0, 7.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53369140625, -0.5131072998046875, -0.492523193359375, -0.4719390869140625, -0.45135498046875, -0.4307708740234375, -0.410186767578125, -0.3896026611328125, -0.3690185546875, -0.3484344482421875, -0.327850341796875, -0.3072662353515625, -0.28668212890625, -0.2660980224609375, -0.245513916015625, -0.2249298095703125, -0.204345703125, -0.1837615966796875, -0.163177490234375, -0.1425933837890625, -0.12200927734375, -0.1014251708984375, -0.080841064453125, -0.0602569580078125, -0.0396728515625, -0.0190887451171875, 0.001495361328125, 0.0220794677734375, 0.04266357421875, 0.0632476806640625, 0.083831787109375, 0.1044158935546875, 0.125, 0.1455841064453125, 0.166168212890625, 0.1867523193359375, 0.20733642578125, 0.2279205322265625, 0.248504638671875, 0.2690887451171875, 0.2896728515625, 0.3102569580078125, 0.330841064453125, 0.3514251708984375, 0.37200927734375, 0.3925933837890625, 0.413177490234375, 0.4337615966796875, 0.454345703125, 0.4749298095703125, 0.495513916015625, 0.5160980224609375, 0.53668212890625, 0.5572662353515625, 0.577850341796875, 0.5984344482421875, 0.6190185546875, 0.6396026611328125, 0.660186767578125, 0.6807708740234375, 0.70135498046875, 0.7219390869140625, 0.742523193359375, 0.7631072998046875, 0.78369140625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 10.0, 5.0, 6.0, 9.0, 12.0, 14.0, 23.0, 20.0, 23.0, 34.0, 48.0, 47.0, 53.0, 65.0, 60.0, 60.0, 66.0, 79.0, 54.0, 42.0, 38.0, 40.0, 25.0, 40.0, 35.0, 32.0, 16.0, 12.0, 12.0, 5.0, 5.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.231201171875, -0.2251148223876953, -0.21902847290039062, -0.21294212341308594, -0.20685577392578125, -0.20076942443847656, -0.19468307495117188, -0.1885967254638672, -0.1825103759765625, -0.1764240264892578, -0.17033767700195312, -0.16425132751464844, -0.15816497802734375, -0.15207862854003906, -0.14599227905273438, -0.1399059295654297, -0.133819580078125, -0.1277332305908203, -0.12164688110351562, -0.11556053161621094, -0.10947418212890625, -0.10338783264160156, -0.09730148315429688, -0.09121513366699219, -0.0851287841796875, -0.07904243469238281, -0.07295608520507812, -0.06686973571777344, -0.06078338623046875, -0.05469703674316406, -0.048610687255859375, -0.04252433776855469, -0.03643798828125, -0.030351638793945312, -0.024265289306640625, -0.018178939819335938, -0.01209259033203125, -0.0060062408447265625, 8.0108642578125e-05, 0.0061664581298828125, 0.0122528076171875, 0.018339157104492188, 0.024425506591796875, 0.030511856079101562, 0.03659820556640625, 0.04268455505371094, 0.048770904541015625, 0.05485725402832031, 0.060943603515625, 0.06702995300292969, 0.07311630249023438, 0.07920265197753906, 0.08528900146484375, 0.09137535095214844, 0.09746170043945312, 0.10354804992675781, 0.1096343994140625, 0.11572074890136719, 0.12180709838867188, 0.12789344787597656, 0.13397979736328125, 0.14006614685058594, 0.14615249633789062, 0.1522388458251953, 0.1583251953125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 5.0, 11.0, 14.0, 18.0, 18.0, 25.0, 43.0, 38.0, 72.0, 107.0, 155.0, 217.0, 392.0, 678.0, 1470.0, 4229.0, 22178.0, 301824.0, 663196.0, 43415.0, 6399.0, 1936.0, 863.0, 429.0, 267.0, 160.0, 126.0, 81.0, 41.0, 39.0, 24.0, 18.0, 22.0, 6.0, 10.0, 6.0, 8.0, 2.0, 4.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.96484375, -0.9365921020507812, -0.9083404541015625, -0.8800888061523438, -0.851837158203125, -0.8235855102539062, -0.7953338623046875, -0.7670822143554688, -0.73883056640625, -0.7105789184570312, -0.6823272705078125, -0.6540756225585938, -0.625823974609375, -0.5975723266601562, -0.5693206787109375, -0.5410690307617188, -0.5128173828125, -0.48456573486328125, -0.4563140869140625, -0.42806243896484375, -0.399810791015625, -0.37155914306640625, -0.3433074951171875, -0.31505584716796875, -0.28680419921875, -0.25855255126953125, -0.2303009033203125, -0.20204925537109375, -0.173797607421875, -0.14554595947265625, -0.1172943115234375, -0.08904266357421875, -0.060791015625, -0.03253936767578125, -0.0042877197265625, 0.02396392822265625, 0.052215576171875, 0.08046722412109375, 0.1087188720703125, 0.13697052001953125, 0.16522216796875, 0.19347381591796875, 0.2217254638671875, 0.24997711181640625, 0.278228759765625, 0.30648040771484375, 0.3347320556640625, 0.36298370361328125, 0.3912353515625, 0.41948699951171875, 0.4477386474609375, 0.47599029541015625, 0.504241943359375, 0.5324935913085938, 0.5607452392578125, 0.5889968872070312, 0.61724853515625, 0.6455001831054688, 0.6737518310546875, 0.7020034790039062, 0.730255126953125, 0.7585067749023438, 0.7867584228515625, 0.8150100708007812, 0.84326171875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 5.0, 4.0, 4.0, 9.0, 6.0, 12.0, 8.0, 20.0, 17.0, 17.0, 28.0, 30.0, 29.0, 40.0, 42.0, 35.0, 60.0, 60.0, 60.0, 67.0, 56.0, 61.0, 60.0, 42.0, 35.0, 19.0, 42.0, 28.0, 25.0, 17.0, 8.0, 12.0, 9.0, 10.0, 6.0, 11.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.1005859375, -1.0703506469726562, -1.0401153564453125, -1.0098800659179688, -0.979644775390625, -0.9494094848632812, -0.9191741943359375, -0.8889389038085938, -0.85870361328125, -0.8284683227539062, -0.7982330322265625, -0.7679977416992188, -0.737762451171875, -0.7075271606445312, -0.6772918701171875, -0.6470565795898438, -0.6168212890625, -0.5865859985351562, -0.5563507080078125, -0.5261154174804688, -0.495880126953125, -0.46564483642578125, -0.4354095458984375, -0.40517425537109375, -0.37493896484375, -0.34470367431640625, -0.3144683837890625, -0.28423309326171875, -0.253997802734375, -0.22376251220703125, -0.1935272216796875, -0.16329193115234375, -0.133056640625, -0.10282135009765625, -0.0725860595703125, -0.04235076904296875, -0.012115478515625, 0.01811981201171875, 0.0483551025390625, 0.07859039306640625, 0.10882568359375, 0.13906097412109375, 0.1692962646484375, 0.19953155517578125, 0.229766845703125, 0.26000213623046875, 0.2902374267578125, 0.32047271728515625, 0.3507080078125, 0.38094329833984375, 0.4111785888671875, 0.44141387939453125, 0.471649169921875, 0.5018844604492188, 0.5321197509765625, 0.5623550415039062, 0.59259033203125, 0.6228256225585938, 0.6530609130859375, 0.6832962036132812, 0.713531494140625, 0.7437667846679688, 0.7740020751953125, 0.8042373657226562, 0.83447265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 6.0, 5.0, 14.0, 20.0, 39.0, 61.0, 143.0, 235.0, 701.0, 2586.0, 32533.0, 972247.0, 35882.0, 2757.0, 727.0, 278.0, 148.0, 66.0, 40.0, 24.0, 12.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.88330078125, -0.858428955078125, -0.83355712890625, -0.808685302734375, -0.7838134765625, -0.758941650390625, -0.73406982421875, -0.709197998046875, -0.684326171875, -0.659454345703125, -0.63458251953125, -0.609710693359375, -0.5848388671875, -0.559967041015625, -0.53509521484375, -0.510223388671875, -0.4853515625, -0.460479736328125, -0.43560791015625, -0.410736083984375, -0.3858642578125, -0.360992431640625, -0.33612060546875, -0.311248779296875, -0.286376953125, -0.261505126953125, -0.23663330078125, -0.211761474609375, -0.1868896484375, -0.162017822265625, -0.13714599609375, -0.112274169921875, -0.08740234375, -0.062530517578125, -0.03765869140625, -0.012786865234375, 0.0120849609375, 0.036956787109375, 0.06182861328125, 0.086700439453125, 0.111572265625, 0.136444091796875, 0.16131591796875, 0.186187744140625, 0.2110595703125, 0.235931396484375, 0.26080322265625, 0.285675048828125, 0.310546875, 0.335418701171875, 0.36029052734375, 0.385162353515625, 0.4100341796875, 0.434906005859375, 0.45977783203125, 0.484649658203125, 0.509521484375, 0.534393310546875, 0.55926513671875, 0.584136962890625, 0.6090087890625, 0.633880615234375, 0.65875244140625, 0.683624267578125, 0.70849609375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 10.0, 10.0, 21.0, 16.0, 37.0, 33.0, 51.0, 50.0, 69.0, 114.0, 149.0, 106.0, 78.0, 57.0, 51.0, 40.0, 26.0, 23.0, 11.0, 13.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012046098709106445, -0.00011662300676107407, -0.00011278502643108368, -0.00010894704610109329, -0.0001051090657711029, -0.00010127108544111252, -9.743310511112213e-05, -9.359512478113174e-05, -8.975714445114136e-05, -8.591916412115097e-05, -8.208118379116058e-05, -7.82432034611702e-05, -7.440522313117981e-05, -7.056724280118942e-05, -6.672926247119904e-05, -6.289128214120865e-05, -5.905330181121826e-05, -5.5215321481227875e-05, -5.137734115123749e-05, -4.75393608212471e-05, -4.3701380491256714e-05, -3.986340016126633e-05, -3.602541983127594e-05, -3.218743950128555e-05, -2.8349459171295166e-05, -2.451147884130478e-05, -2.0673498511314392e-05, -1.6835518181324005e-05, -1.2997537851333618e-05, -9.159557521343231e-06, -5.321577191352844e-06, -1.4835968613624573e-06, 2.3543834686279297e-06, 6.192363798618317e-06, 1.0030344128608704e-05, 1.386832445859909e-05, 1.7706304788589478e-05, 2.1544285118579865e-05, 2.538226544857025e-05, 2.922024577856064e-05, 3.3058226108551025e-05, 3.689620643854141e-05, 4.07341867685318e-05, 4.4572167098522186e-05, 4.841014742851257e-05, 5.224812775850296e-05, 5.608610808849335e-05, 5.9924088418483734e-05, 6.376206874847412e-05, 6.760004907846451e-05, 7.14380294084549e-05, 7.527600973844528e-05, 7.911399006843567e-05, 8.295197039842606e-05, 8.678995072841644e-05, 9.062793105840683e-05, 9.446591138839722e-05, 9.83038917183876e-05, 0.00010214187204837799, 0.00010597985237836838, 0.00010981783270835876, 0.00011365581303834915, 0.00011749379336833954, 0.00012133177369832993, 0.0001251697540283203]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 13.0, 16.0, 25.0, 39.0, 83.0, 147.0, 288.0, 712.0, 2463.0, 20264.0, 849496.0, 165694.0, 6994.0, 1311.0, 486.0, 223.0, 135.0, 62.0, 42.0, 27.0, 8.0, 8.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56787109375, -0.5466690063476562, -0.5254669189453125, -0.5042648315429688, -0.483062744140625, -0.46186065673828125, -0.4406585693359375, -0.41945648193359375, -0.39825439453125, -0.37705230712890625, -0.3558502197265625, -0.33464813232421875, -0.313446044921875, -0.29224395751953125, -0.2710418701171875, -0.24983978271484375, -0.2286376953125, -0.20743560791015625, -0.1862335205078125, -0.16503143310546875, -0.143829345703125, -0.12262725830078125, -0.1014251708984375, -0.08022308349609375, -0.05902099609375, -0.03781890869140625, -0.0166168212890625, 0.00458526611328125, 0.025787353515625, 0.04698944091796875, 0.0681915283203125, 0.08939361572265625, 0.110595703125, 0.13179779052734375, 0.1529998779296875, 0.17420196533203125, 0.195404052734375, 0.21660614013671875, 0.2378082275390625, 0.25901031494140625, 0.28021240234375, 0.30141448974609375, 0.3226165771484375, 0.34381866455078125, 0.365020751953125, 0.38622283935546875, 0.4074249267578125, 0.42862701416015625, 0.4498291015625, 0.47103118896484375, 0.4922332763671875, 0.5134353637695312, 0.534637451171875, 0.5558395385742188, 0.5770416259765625, 0.5982437133789062, 0.61944580078125, 0.6406478881835938, 0.6618499755859375, 0.6830520629882812, 0.704254150390625, 0.7254562377929688, 0.7466583251953125, 0.7678604125976562, 0.7890625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 9.0, 5.0, 16.0, 22.0, 27.0, 58.0, 65.0, 136.0, 168.0, 172.0, 124.0, 77.0, 43.0, 32.0, 22.0, 11.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.471923828125, -0.4530067443847656, -0.43408966064453125, -0.4151725769042969, -0.3962554931640625, -0.3773384094238281, -0.35842132568359375, -0.3395042419433594, -0.320587158203125, -0.3016700744628906, -0.28275299072265625, -0.2638359069824219, -0.2449188232421875, -0.22600173950195312, -0.20708465576171875, -0.18816757202148438, -0.16925048828125, -0.15033340454101562, -0.13141632080078125, -0.11249923706054688, -0.0935821533203125, -0.07466506958007812, -0.05574798583984375, -0.036830902099609375, -0.017913818359375, 0.001003265380859375, 0.01992034912109375, 0.038837432861328125, 0.0577545166015625, 0.07667160034179688, 0.09558868408203125, 0.11450576782226562, 0.1334228515625, 0.15233993530273438, 0.17125701904296875, 0.19017410278320312, 0.2090911865234375, 0.22800827026367188, 0.24692535400390625, 0.2658424377441406, 0.284759521484375, 0.3036766052246094, 0.32259368896484375, 0.3415107727050781, 0.3604278564453125, 0.3793449401855469, 0.39826202392578125, 0.4171791076660156, 0.43609619140625, 0.4550132751464844, 0.47393035888671875, 0.4928474426269531, 0.5117645263671875, 0.5306816101074219, 0.5495986938476562, 0.5685157775878906, 0.587432861328125, 0.6063499450683594, 0.6252670288085938, 0.6441841125488281, 0.6631011962890625, 0.6820182800292969, 0.7009353637695312, 0.7198524475097656, 0.73876953125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 34.0, 175.0, 456.0, 269.0, 52.0, 7.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.47958755493164, -17.929616928100586, -17.37964630126953, -16.829673767089844, -16.27970314025879, -15.729732513427734, -15.17976188659668, -14.629790306091309, -14.079818725585938, -13.529848098754883, -12.979876518249512, -12.429905891418457, -11.879934310913086, -11.329963684082031, -10.779993057250977, -10.230021476745605, -9.68005084991455, -9.130080223083496, -8.580108642578125, -8.03013801574707, -7.480166435241699, -6.9301958084106445, -6.380224704742432, -5.830253601074219, -5.280282497406006, -4.730311393737793, -4.18034029006958, -3.6303694248199463, -3.0803983211517334, -2.5304272174835205, -1.9804563522338867, -1.4304852485656738, -0.8805141448974609, -0.3305431008338928, 0.2194279432296753, 0.7693989276885986, 1.3193700313568115, 1.8693411350250244, 2.419312000274658, 2.969283103942871, 3.519254207611084, 4.069225311279297, 4.61919641494751, 5.169167518615723, 5.719138145446777, 6.269109725952148, 6.819080352783203, 7.369051456451416, 7.919022560119629, 8.468993186950684, 9.018964767456055, 9.56893539428711, 10.11890697479248, 10.668877601623535, 11.218849182128906, 11.768819808959961, 12.318790435791016, 12.86876106262207, 13.418732643127441, 13.968703269958496, 14.518674850463867, 15.068645477294922, 15.618616104125977, 16.16858673095703, 16.71855926513672]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 2.0, 5.0, 6.0, 9.0, 6.0, 11.0, 11.0, 9.0, 15.0, 27.0, 28.0, 38.0, 33.0, 44.0, 49.0, 50.0, 50.0, 62.0, 51.0, 47.0, 59.0, 54.0, 39.0, 39.0, 40.0, 29.0, 31.0, 29.0, 20.0, 16.0, 11.0, 13.0, 10.0, 9.0, 11.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0], "bins": [-4.85911750793457, -4.733467102050781, -4.607816696166992, -4.482166290283203, -4.356515884399414, -4.230865478515625, -4.105215072631836, -3.979564666748047, -3.853914260864258, -3.7282638549804688, -3.6026134490966797, -3.4769630432128906, -3.3513126373291016, -3.2256622314453125, -3.1000118255615234, -2.9743614196777344, -2.8487110137939453, -2.7230606079101562, -2.597410202026367, -2.471759796142578, -2.346109390258789, -2.220458984375, -2.094808578491211, -1.9691581726074219, -1.8435077667236328, -1.7178573608398438, -1.5922069549560547, -1.4665565490722656, -1.3409061431884766, -1.2152557373046875, -1.0896053314208984, -0.9639549255371094, -0.8383049964904785, -0.7126545906066895, -0.5870041847229004, -0.46135377883911133, -0.33570337295532227, -0.2100529670715332, -0.08440256118774414, 0.04124784469604492, 0.16689825057983398, 0.29254865646362305, 0.4181990623474121, 0.5438494682312012, 0.6694998741149902, 0.7951502799987793, 0.9208006858825684, 1.0464510917663574, 1.1721014976501465, 1.2977519035339355, 1.4234023094177246, 1.5490527153015137, 1.6747031211853027, 1.8003535270690918, 1.9260039329528809, 2.05165433883667, 2.177304744720459, 2.302955150604248, 2.428605556488037, 2.554255962371826, 2.6799063682556152, 2.8055567741394043, 2.9312071800231934, 3.0568575859069824, 3.1825079917907715]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 0.0, 5.0, 6.0, 3.0, 13.0, 6.0, 14.0, 11.0, 11.0, 15.0, 34.0, 48.0, 74.0, 99.0, 165.0, 284.0, 516.0, 824.0, 1455.0, 3198.0, 7884.0, 25760.0, 170495.0, 3578722.0, 347712.0, 38791.0, 10644.0, 3794.0, 1749.0, 861.0, 464.0, 244.0, 162.0, 79.0, 56.0, 31.0, 15.0, 12.0, 6.0, 8.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.56640625, -0.5513496398925781, -0.5362930297851562, -0.5212364196777344, -0.5061798095703125, -0.4911231994628906, -0.47606658935546875, -0.4610099792480469, -0.445953369140625, -0.4308967590332031, -0.41584014892578125, -0.4007835388183594, -0.3857269287109375, -0.3706703186035156, -0.35561370849609375, -0.3405570983886719, -0.32550048828125, -0.3104438781738281, -0.29538726806640625, -0.2803306579589844, -0.2652740478515625, -0.2502174377441406, -0.23516082763671875, -0.22010421752929688, -0.205047607421875, -0.18999099731445312, -0.17493438720703125, -0.15987777709960938, -0.1448211669921875, -0.12976455688476562, -0.11470794677734375, -0.09965133666992188, -0.0845947265625, -0.06953811645507812, -0.05448150634765625, -0.039424896240234375, -0.0243682861328125, -0.009311676025390625, 0.00574493408203125, 0.020801544189453125, 0.035858154296875, 0.050914764404296875, 0.06597137451171875, 0.08102798461914062, 0.0960845947265625, 0.11114120483398438, 0.12619781494140625, 0.14125442504882812, 0.15631103515625, 0.17136764526367188, 0.18642425537109375, 0.20148086547851562, 0.2165374755859375, 0.23159408569335938, 0.24665069580078125, 0.2617073059082031, 0.276763916015625, 0.2918205261230469, 0.30687713623046875, 0.3219337463378906, 0.3369903564453125, 0.3520469665527344, 0.36710357666015625, 0.3821601867675781, 0.397216796875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 9.0, 8.0, 10.0, 12.0, 19.0, 20.0, 46.0, 56.0, 70.0, 75.0, 85.0, 94.0, 95.0, 77.0, 76.0, 50.0, 47.0, 54.0, 33.0, 29.0, 12.0, 10.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.3583984375, -0.35002708435058594, -0.3416557312011719, -0.3332843780517578, -0.32491302490234375, -0.3165416717529297, -0.3081703186035156, -0.29979896545410156, -0.2914276123046875, -0.28305625915527344, -0.2746849060058594, -0.2663135528564453, -0.25794219970703125, -0.2495708465576172, -0.24119949340820312, -0.23282814025878906, -0.224456787109375, -0.21608543395996094, -0.20771408081054688, -0.1993427276611328, -0.19097137451171875, -0.1826000213623047, -0.17422866821289062, -0.16585731506347656, -0.1574859619140625, -0.14911460876464844, -0.14074325561523438, -0.1323719024658203, -0.12400054931640625, -0.11562919616699219, -0.10725784301757812, -0.09888648986816406, -0.09051513671875, -0.08214378356933594, -0.07377243041992188, -0.06540107727050781, -0.05702972412109375, -0.04865837097167969, -0.040287017822265625, -0.03191566467285156, -0.0235443115234375, -0.015172958374023438, -0.006801605224609375, 0.0015697479248046875, 0.00994110107421875, 0.018312454223632812, 0.026683807373046875, 0.03505516052246094, 0.043426513671875, 0.05179786682128906, 0.060169219970703125, 0.06854057312011719, 0.07691192626953125, 0.08528327941894531, 0.09365463256835938, 0.10202598571777344, 0.1103973388671875, 0.11876869201660156, 0.12714004516601562, 0.1355113983154297, 0.14388275146484375, 0.1522541046142578, 0.16062545776367188, 0.16899681091308594, 0.1773681640625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 4.0, 17.0, 15.0, 26.0, 46.0, 67.0, 122.0, 224.0, 425.0, 1032.0, 2828.0, 9604.0, 57120.0, 3151320.0, 924665.0, 35539.0, 7232.0, 2227.0, 858.0, 397.0, 195.0, 112.0, 66.0, 45.0, 26.0, 15.0, 15.0, 8.0, 7.0, 2.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.802734375, -0.7783279418945312, -0.7539215087890625, -0.7295150756835938, -0.705108642578125, -0.6807022094726562, -0.6562957763671875, -0.6318893432617188, -0.60748291015625, -0.5830764770507812, -0.5586700439453125, -0.5342636108398438, -0.509857177734375, -0.48545074462890625, -0.4610443115234375, -0.43663787841796875, -0.4122314453125, -0.38782501220703125, -0.3634185791015625, -0.33901214599609375, -0.314605712890625, -0.29019927978515625, -0.2657928466796875, -0.24138641357421875, -0.21697998046875, -0.19257354736328125, -0.1681671142578125, -0.14376068115234375, -0.119354248046875, -0.09494781494140625, -0.0705413818359375, -0.04613494873046875, -0.021728515625, 0.00267791748046875, 0.0270843505859375, 0.05149078369140625, 0.075897216796875, 0.10030364990234375, 0.1247100830078125, 0.14911651611328125, 0.17352294921875, 0.19792938232421875, 0.2223358154296875, 0.24674224853515625, 0.271148681640625, 0.29555511474609375, 0.3199615478515625, 0.34436798095703125, 0.3687744140625, 0.39318084716796875, 0.4175872802734375, 0.44199371337890625, 0.466400146484375, 0.49080657958984375, 0.5152130126953125, 0.5396194458007812, 0.56402587890625, 0.5884323120117188, 0.6128387451171875, 0.6372451782226562, 0.661651611328125, 0.6860580444335938, 0.7104644775390625, 0.7348709106445312, 0.75927734375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 1.0, 3.0, 8.0, 13.0, 14.0, 19.0, 32.0, 54.0, 88.0, 168.0, 349.0, 971.0, 1362.0, 489.0, 214.0, 94.0, 75.0, 27.0, 21.0, 20.0, 12.0, 12.0, 5.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7548828125, -0.7327651977539062, -0.7106475830078125, -0.6885299682617188, -0.666412353515625, -0.6442947387695312, -0.6221771240234375, -0.6000595092773438, -0.57794189453125, -0.5558242797851562, -0.5337066650390625, -0.5115890502929688, -0.489471435546875, -0.46735382080078125, -0.4452362060546875, -0.42311859130859375, -0.4010009765625, -0.37888336181640625, -0.3567657470703125, -0.33464813232421875, -0.312530517578125, -0.29041290283203125, -0.2682952880859375, -0.24617767333984375, -0.22406005859375, -0.20194244384765625, -0.1798248291015625, -0.15770721435546875, -0.135589599609375, -0.11347198486328125, -0.0913543701171875, -0.06923675537109375, -0.047119140625, -0.02500152587890625, -0.0028839111328125, 0.01923370361328125, 0.041351318359375, 0.06346893310546875, 0.0855865478515625, 0.10770416259765625, 0.12982177734375, 0.15193939208984375, 0.1740570068359375, 0.19617462158203125, 0.218292236328125, 0.24040985107421875, 0.2625274658203125, 0.28464508056640625, 0.3067626953125, 0.32888031005859375, 0.3509979248046875, 0.37311553955078125, 0.395233154296875, 0.41735076904296875, 0.4394683837890625, 0.46158599853515625, 0.48370361328125, 0.5058212280273438, 0.5279388427734375, 0.5500564575195312, 0.572174072265625, 0.5942916870117188, 0.6164093017578125, 0.6385269165039062, 0.66064453125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 22.0, 94.0, 288.0, 386.0, 148.0, 34.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.180972099304199, -6.842856407165527, -6.5047407150268555, -6.166625022888184, -5.828509330749512, -5.49039363861084, -5.15227746963501, -4.814161777496338, -4.476046085357666, -4.137930393218994, -3.7998147010803223, -3.4616987705230713, -3.1235830783843994, -2.7854673862457275, -2.4473514556884766, -2.1092357635498047, -1.7711200714111328, -1.433004379272461, -1.0948885679244995, -0.7567727565765381, -0.4186570644378662, -0.08054137229919434, 0.25757455825805664, 0.5956902503967285, 0.9338059425354004, 1.2719216346740723, 1.6100374460220337, 1.9481532573699951, 2.286268949508667, 2.624384641647339, 2.96250057220459, 3.3006162643432617, 3.638731002807617, 3.976846694946289, 4.314962387084961, 4.653078079223633, 4.991193771362305, 5.329309463500977, 5.667425632476807, 6.0055413246154785, 6.34365701675415, 6.681772708892822, 7.019888401031494, 7.358004570007324, 7.696120262145996, 8.034235954284668, 8.37235164642334, 8.710467338562012, 9.048583030700684, 9.386698722839355, 9.724814414978027, 10.0629301071167, 10.401045799255371, 10.739161491394043, 11.077278137207031, 11.415393829345703, 11.753509521484375, 12.091625213623047, 12.429740905761719, 12.76785659790039, 13.105972290039062, 13.444087982177734, 13.782203674316406, 14.120319366455078, 14.45843505859375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 4.0, 5.0, 7.0, 7.0, 9.0, 12.0, 11.0, 14.0, 21.0, 19.0, 27.0, 31.0, 30.0, 49.0, 36.0, 27.0, 33.0, 45.0, 32.0, 49.0, 44.0, 50.0, 58.0, 43.0, 40.0, 37.0, 36.0, 24.0, 28.0, 20.0, 29.0, 26.0, 18.0, 18.0, 7.0, 14.0, 8.0, 9.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.060170888900757, -1.991247296333313, -1.9223237037658691, -1.8534002304077148, -1.784476637840271, -1.7155530452728271, -1.6466295719146729, -1.577705979347229, -1.5087823867797852, -1.4398587942123413, -1.3709352016448975, -1.3020117282867432, -1.2330881357192993, -1.1641645431518555, -1.0952410697937012, -1.0263174772262573, -0.9573938846588135, -0.8884702920913696, -0.8195467591285706, -0.7506232261657715, -0.6816996335983276, -0.6127760410308838, -0.5438525080680847, -0.47492894530296326, -0.4060053825378418, -0.33708181977272034, -0.2681582570075989, -0.19923469424247742, -0.13031113147735596, -0.0613875687122345, 0.007535994052886963, 0.07645955681800842, 0.14538335800170898, 0.21430692076683044, 0.2832304835319519, 0.35215404629707336, 0.4210776090621948, 0.4900011718273163, 0.5589247345924377, 0.6278482675552368, 0.6967718601226807, 0.7656954526901245, 0.8346189856529236, 0.9035425186157227, 0.9724661111831665, 1.0413897037506104, 1.1103131771087646, 1.1792367696762085, 1.2481603622436523, 1.3170839548110962, 1.38600754737854, 1.4549310207366943, 1.5238546133041382, 1.592778205871582, 1.6617016792297363, 1.7306252717971802, 1.799548864364624, 1.8684724569320679, 1.9373960494995117, 2.006319522857666, 2.0752429962158203, 2.1441667079925537, 2.213090181350708, 2.2820138931274414, 2.3509373664855957]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 7.0, 9.0, 19.0, 17.0, 33.0, 58.0, 96.0, 150.0, 241.0, 425.0, 773.0, 1536.0, 3157.0, 7367.0, 20199.0, 69340.0, 315976.0, 474402.0, 107676.0, 28874.0, 10054.0, 4095.0, 1875.0, 882.0, 546.0, 289.0, 159.0, 109.0, 65.0, 48.0, 25.0, 16.0, 7.0, 11.0, 7.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64990234375, -0.6328697204589844, -0.6158370971679688, -0.5988044738769531, -0.5817718505859375, -0.5647392272949219, -0.5477066040039062, -0.5306739807128906, -0.513641357421875, -0.4966087341308594, -0.47957611083984375, -0.4625434875488281, -0.4455108642578125, -0.4284782409667969, -0.41144561767578125, -0.3944129943847656, -0.37738037109375, -0.3603477478027344, -0.34331512451171875, -0.3262825012207031, -0.3092498779296875, -0.2922172546386719, -0.27518463134765625, -0.2581520080566406, -0.241119384765625, -0.22408676147460938, -0.20705413818359375, -0.19002151489257812, -0.1729888916015625, -0.15595626831054688, -0.13892364501953125, -0.12189102172851562, -0.1048583984375, -0.08782577514648438, -0.07079315185546875, -0.053760528564453125, -0.0367279052734375, -0.019695281982421875, -0.00266265869140625, 0.014369964599609375, 0.031402587890625, 0.048435211181640625, 0.06546783447265625, 0.08250045776367188, 0.0995330810546875, 0.11656570434570312, 0.13359832763671875, 0.15063095092773438, 0.16766357421875, 0.18469619750976562, 0.20172882080078125, 0.21876144409179688, 0.2357940673828125, 0.2528266906738281, 0.26985931396484375, 0.2868919372558594, 0.303924560546875, 0.3209571838378906, 0.33798980712890625, 0.3550224304199219, 0.3720550537109375, 0.3890876770019531, 0.40612030029296875, 0.4231529235839844, 0.440185546875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 7.0, 11.0, 21.0, 15.0, 27.0, 32.0, 60.0, 49.0, 65.0, 59.0, 76.0, 89.0, 69.0, 70.0, 67.0, 52.0, 49.0, 33.0, 35.0, 27.0, 29.0, 23.0, 4.0, 6.0, 6.0, 0.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26123046875, -0.2538928985595703, -0.24655532836914062, -0.23921775817871094, -0.23188018798828125, -0.22454261779785156, -0.21720504760742188, -0.2098674774169922, -0.2025299072265625, -0.1951923370361328, -0.18785476684570312, -0.18051719665527344, -0.17317962646484375, -0.16584205627441406, -0.15850448608398438, -0.1511669158935547, -0.143829345703125, -0.1364917755126953, -0.12915420532226562, -0.12181663513183594, -0.11447906494140625, -0.10714149475097656, -0.09980392456054688, -0.09246635437011719, -0.0851287841796875, -0.07779121398925781, -0.07045364379882812, -0.06311607360839844, -0.05577850341796875, -0.04844093322753906, -0.041103363037109375, -0.03376579284667969, -0.02642822265625, -0.019090652465820312, -0.011753082275390625, -0.0044155120849609375, 0.00292205810546875, 0.010259628295898438, 0.017597198486328125, 0.024934768676757812, 0.0322723388671875, 0.03960990905761719, 0.046947479248046875, 0.05428504943847656, 0.06162261962890625, 0.06896018981933594, 0.07629776000976562, 0.08363533020019531, 0.090972900390625, 0.09831047058105469, 0.10564804077148438, 0.11298561096191406, 0.12032318115234375, 0.12766075134277344, 0.13499832153320312, 0.1423358917236328, 0.1496734619140625, 0.1570110321044922, 0.16434860229492188, 0.17168617248535156, 0.17902374267578125, 0.18636131286621094, 0.19369888305664062, 0.2010364532470703, 0.2083740234375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 9.0, 6.0, 9.0, 17.0, 21.0, 28.0, 44.0, 65.0, 119.0, 199.0, 392.0, 955.0, 2641.0, 13089.0, 433675.0, 578056.0, 14616.0, 2718.0, 933.0, 437.0, 199.0, 125.0, 79.0, 28.0, 32.0, 13.0, 16.0, 7.0, 7.0, 6.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1689453125, -1.1240234375, -1.0791015625, -1.0341796875, -0.9892578125, -0.9443359375, -0.8994140625, -0.8544921875, -0.8095703125, -0.7646484375, -0.7197265625, -0.6748046875, -0.6298828125, -0.5849609375, -0.5400390625, -0.4951171875, -0.4501953125, -0.4052734375, -0.3603515625, -0.3154296875, -0.2705078125, -0.2255859375, -0.1806640625, -0.1357421875, -0.0908203125, -0.0458984375, -0.0009765625, 0.0439453125, 0.0888671875, 0.1337890625, 0.1787109375, 0.2236328125, 0.2685546875, 0.3134765625, 0.3583984375, 0.4033203125, 0.4482421875, 0.4931640625, 0.5380859375, 0.5830078125, 0.6279296875, 0.6728515625, 0.7177734375, 0.7626953125, 0.8076171875, 0.8525390625, 0.8974609375, 0.9423828125, 0.9873046875, 1.0322265625, 1.0771484375, 1.1220703125, 1.1669921875, 1.2119140625, 1.2568359375, 1.3017578125, 1.3466796875, 1.3916015625, 1.4365234375, 1.4814453125, 1.5263671875, 1.5712890625, 1.6162109375, 1.6611328125, 1.7060546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 12.0, 9.0, 11.0, 18.0, 26.0, 19.0, 22.0, 32.0, 42.0, 51.0, 63.0, 52.0, 63.0, 86.0, 71.0, 58.0, 62.0, 57.0, 44.0, 42.0, 32.0, 25.0, 15.0, 27.0, 17.0, 17.0, 9.0, 8.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9423828125, -0.9064178466796875, -0.870452880859375, -0.8344879150390625, -0.79852294921875, -0.7625579833984375, -0.726593017578125, -0.6906280517578125, -0.6546630859375, -0.6186981201171875, -0.582733154296875, -0.5467681884765625, -0.51080322265625, -0.4748382568359375, -0.438873291015625, -0.4029083251953125, -0.366943359375, -0.3309783935546875, -0.295013427734375, -0.2590484619140625, -0.22308349609375, -0.1871185302734375, -0.151153564453125, -0.1151885986328125, -0.0792236328125, -0.0432586669921875, -0.007293701171875, 0.0286712646484375, 0.06463623046875, 0.1006011962890625, 0.136566162109375, 0.1725311279296875, 0.20849609375, 0.2444610595703125, 0.280426025390625, 0.3163909912109375, 0.35235595703125, 0.3883209228515625, 0.424285888671875, 0.4602508544921875, 0.4962158203125, 0.5321807861328125, 0.568145751953125, 0.6041107177734375, 0.64007568359375, 0.6760406494140625, 0.712005615234375, 0.7479705810546875, 0.783935546875, 0.8199005126953125, 0.855865478515625, 0.8918304443359375, 0.92779541015625, 0.9637603759765625, 0.999725341796875, 1.0356903076171875, 1.0716552734375, 1.1076202392578125, 1.143585205078125, 1.1795501708984375, 1.21551513671875, 1.2514801025390625, 1.287445068359375, 1.3234100341796875, 1.359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 12.0, 16.0, 7.0, 10.0, 34.0, 59.0, 111.0, 249.0, 663.0, 2142.0, 14385.0, 868329.0, 154152.0, 6203.0, 1287.0, 445.0, 181.0, 120.0, 51.0, 29.0, 24.0, 14.0, 5.0, 8.0, 1.0, 4.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8076171875, -0.7785797119140625, -0.749542236328125, -0.7205047607421875, -0.69146728515625, -0.6624298095703125, -0.633392333984375, -0.6043548583984375, -0.5753173828125, -0.5462799072265625, -0.517242431640625, -0.4882049560546875, -0.45916748046875, -0.4301300048828125, -0.401092529296875, -0.3720550537109375, -0.343017578125, -0.3139801025390625, -0.284942626953125, -0.2559051513671875, -0.22686767578125, -0.1978302001953125, -0.168792724609375, -0.1397552490234375, -0.1107177734375, -0.0816802978515625, -0.052642822265625, -0.0236053466796875, 0.00543212890625, 0.0344696044921875, 0.063507080078125, 0.0925445556640625, 0.12158203125, 0.1506195068359375, 0.179656982421875, 0.2086944580078125, 0.23773193359375, 0.2667694091796875, 0.295806884765625, 0.3248443603515625, 0.3538818359375, 0.3829193115234375, 0.411956787109375, 0.4409942626953125, 0.47003173828125, 0.4990692138671875, 0.528106689453125, 0.5571441650390625, 0.586181640625, 0.6152191162109375, 0.644256591796875, 0.6732940673828125, 0.70233154296875, 0.7313690185546875, 0.760406494140625, 0.7894439697265625, 0.8184814453125, 0.8475189208984375, 0.876556396484375, 0.9055938720703125, 0.93463134765625, 0.9636688232421875, 0.992706298828125, 1.0217437744140625, 1.05078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 8.0, 17.0, 20.0, 40.0, 62.0, 86.0, 107.0, 146.0, 128.0, 104.0, 79.0, 60.0, 46.0, 25.0, 21.0, 10.0, 12.0, 2.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021529197692871094, -0.00020461156964302063, -0.00019393116235733032, -0.00018325075507164001, -0.0001725703477859497, -0.0001618899405002594, -0.0001512095332145691, -0.00014052912592887878, -0.00012984871864318848, -0.00011916831135749817, -0.00010848790407180786, -9.780749678611755e-05, -8.712708950042725e-05, -7.644668221473694e-05, -6.576627492904663e-05, -5.508586764335632e-05, -4.4405460357666016e-05, -3.372505307197571e-05, -2.30446457862854e-05, -1.2364238500595093e-05, -1.6838312149047852e-06, 8.996576070785522e-06, 1.967698335647583e-05, 3.0357390642166138e-05, 4.1037797927856445e-05, 5.171820521354675e-05, 6.239861249923706e-05, 7.307901978492737e-05, 8.375942707061768e-05, 9.443983435630798e-05, 0.00010512024164199829, 0.0001158006489276886, 0.0001264810562133789, 0.00013716146349906921, 0.00014784187078475952, 0.00015852227807044983, 0.00016920268535614014, 0.00017988309264183044, 0.00019056349992752075, 0.00020124390721321106, 0.00021192431449890137, 0.00022260472178459167, 0.00023328512907028198, 0.0002439655363559723, 0.0002546459436416626, 0.0002653263509273529, 0.0002760067582130432, 0.0002866871654987335, 0.00029736757278442383, 0.00030804798007011414, 0.00031872838735580444, 0.00032940879464149475, 0.00034008920192718506, 0.00035076960921287537, 0.0003614500164985657, 0.000372130423784256, 0.0003828108310699463, 0.0003934912383556366, 0.0004041716456413269, 0.0004148520529270172, 0.0004255324602127075, 0.00043621286749839783, 0.00044689327478408813, 0.00045757368206977844, 0.00046825408935546875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 4.0, 16.0, 23.0, 38.0, 37.0, 77.0, 90.0, 162.0, 270.0, 505.0, 1018.0, 2762.0, 13351.0, 219298.0, 773084.0, 30374.0, 4470.0, 1408.0, 700.0, 329.0, 186.0, 127.0, 62.0, 51.0, 30.0, 28.0, 13.0, 10.0, 7.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5458984375, -0.52581787109375, -0.5057373046875, -0.48565673828125, -0.465576171875, -0.44549560546875, -0.4254150390625, -0.40533447265625, -0.38525390625, -0.36517333984375, -0.3450927734375, -0.32501220703125, -0.304931640625, -0.28485107421875, -0.2647705078125, -0.24468994140625, -0.224609375, -0.20452880859375, -0.1844482421875, -0.16436767578125, -0.144287109375, -0.12420654296875, -0.1041259765625, -0.08404541015625, -0.06396484375, -0.04388427734375, -0.0238037109375, -0.00372314453125, 0.016357421875, 0.03643798828125, 0.0565185546875, 0.07659912109375, 0.0966796875, 0.11676025390625, 0.1368408203125, 0.15692138671875, 0.177001953125, 0.19708251953125, 0.2171630859375, 0.23724365234375, 0.25732421875, 0.27740478515625, 0.2974853515625, 0.31756591796875, 0.337646484375, 0.35772705078125, 0.3778076171875, 0.39788818359375, 0.41796875, 0.43804931640625, 0.4581298828125, 0.47821044921875, 0.498291015625, 0.51837158203125, 0.5384521484375, 0.55853271484375, 0.57861328125, 0.59869384765625, 0.6187744140625, 0.63885498046875, 0.658935546875, 0.67901611328125, 0.6990966796875, 0.71917724609375, 0.7392578125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 5.0, 6.0, 8.0, 14.0, 8.0, 23.0, 34.0, 33.0, 48.0, 58.0, 63.0, 72.0, 98.0, 87.0, 78.0, 67.0, 67.0, 44.0, 47.0, 32.0, 26.0, 13.0, 10.0, 16.0, 9.0, 4.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32421875, -0.3105316162109375, -0.296844482421875, -0.2831573486328125, -0.26947021484375, -0.2557830810546875, -0.242095947265625, -0.2284088134765625, -0.2147216796875, -0.2010345458984375, -0.187347412109375, -0.1736602783203125, -0.15997314453125, -0.1462860107421875, -0.132598876953125, -0.1189117431640625, -0.105224609375, -0.0915374755859375, -0.077850341796875, -0.0641632080078125, -0.05047607421875, -0.0367889404296875, -0.023101806640625, -0.0094146728515625, 0.0042724609375, 0.0179595947265625, 0.031646728515625, 0.0453338623046875, 0.05902099609375, 0.0727081298828125, 0.086395263671875, 0.1000823974609375, 0.11376953125, 0.1274566650390625, 0.141143798828125, 0.1548309326171875, 0.16851806640625, 0.1822052001953125, 0.195892333984375, 0.2095794677734375, 0.2232666015625, 0.2369537353515625, 0.250640869140625, 0.2643280029296875, 0.27801513671875, 0.2917022705078125, 0.305389404296875, 0.3190765380859375, 0.332763671875, 0.3464508056640625, 0.360137939453125, 0.3738250732421875, 0.38751220703125, 0.4011993408203125, 0.414886474609375, 0.4285736083984375, 0.4422607421875, 0.4559478759765625, 0.469635009765625, 0.4833221435546875, 0.49700927734375, 0.5106964111328125, 0.524383544921875, 0.5380706787109375, 0.5517578125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 11.0, 52.0, 164.0, 389.0, 244.0, 96.0, 26.0, 6.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.409454345703125, -10.003876686096191, -9.598299026489258, -9.192720413208008, -8.787142753601074, -8.38156509399414, -7.975986957550049, -7.570408821105957, -7.164831161499023, -6.75925350189209, -6.353675365447998, -5.948097229003906, -5.542519569396973, -5.136941909790039, -4.731363773345947, -4.3257856369018555, -3.920207977294922, -3.514630079269409, -3.1090521812438965, -2.703474283218384, -2.297896385192871, -1.8923184871673584, -1.4867405891418457, -1.081162691116333, -0.6755847930908203, -0.2700068950653076, 0.13557100296020508, 0.5411489009857178, 0.9467267990112305, 1.3523046970367432, 1.7578825950622559, 2.1634604930877686, 2.5690383911132812, 2.974616289138794, 3.3801941871643066, 3.7857720851898193, 4.191349983215332, 4.596927642822266, 5.002505779266357, 5.408083915710449, 5.813661575317383, 6.219239234924316, 6.624817371368408, 7.0303955078125, 7.435973167419434, 7.841550827026367, 8.247129440307617, 8.65270709991455, 9.058284759521484, 9.463862419128418, 9.869440078735352, 10.275018692016602, 10.680596351623535, 11.086174011230469, 11.491752624511719, 11.897330284118652, 12.302907943725586, 12.70848560333252, 13.114063262939453, 13.519641876220703, 13.925219535827637, 14.33079719543457, 14.73637580871582, 15.141953468322754, 15.547531127929688]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 3.0, 10.0, 4.0, 5.0, 14.0, 9.0, 15.0, 12.0, 24.0, 30.0, 27.0, 40.0, 38.0, 52.0, 49.0, 62.0, 60.0, 64.0, 61.0, 53.0, 47.0, 54.0, 54.0, 35.0, 29.0, 30.0, 26.0, 16.0, 14.0, 16.0, 12.0, 8.0, 8.0, 7.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0], "bins": [-4.932521343231201, -4.801183223724365, -4.669845104217529, -4.538506984710693, -4.407168388366699, -4.275830268859863, -4.144492149353027, -4.013154029846191, -3.8818159103393555, -3.7504777908325195, -3.6191396713256836, -3.4878013134002686, -3.3564631938934326, -3.2251250743865967, -3.0937867164611816, -2.9624485969543457, -2.8311104774475098, -2.699772357940674, -2.568434238433838, -2.437095880508423, -2.305757761001587, -2.174419641494751, -2.043081283569336, -1.9117431640625, -1.780405044555664, -1.6490669250488281, -1.5177286863327026, -1.3863904476165771, -1.2550523281097412, -1.1237142086029053, -0.9923759698867798, -0.8610377907752991, -0.7296993732452393, -0.5983611941337585, -0.46702301502227783, -0.3356848359107971, -0.2043466567993164, -0.0730084776878357, 0.05832970142364502, 0.18966788053512573, 0.32100605964660645, 0.45234423875808716, 0.5836824178695679, 0.7150205969810486, 0.8463587760925293, 0.97769695520401, 1.1090351343154907, 1.2403733730316162, 1.3717114925384521, 1.503049612045288, 1.6343878507614136, 1.765726089477539, 1.897064208984375, 2.028402328491211, 2.159740447998047, 2.291078805923462, 2.422416925430298, 2.553755044937134, 2.685093402862549, 2.8164315223693848, 2.9477696418762207, 3.0791077613830566, 3.2104458808898926, 3.3417842388153076, 3.4731223583221436]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 13.0, 8.0, 10.0, 17.0, 16.0, 29.0, 34.0, 68.0, 140.0, 414.0, 4166860.0, 26001.0, 344.0, 153.0, 78.0, 35.0, 22.0, 12.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.23394775390625, -7.9835205078125, -7.73309326171875, -7.482666015625, -7.23223876953125, -6.9818115234375, -6.73138427734375, -6.48095703125, -6.23052978515625, -5.9801025390625, -5.72967529296875, -5.479248046875, -5.22882080078125, -4.9783935546875, -4.72796630859375, -4.4775390625, -4.22711181640625, -3.9766845703125, -3.72625732421875, -3.475830078125, -3.22540283203125, -2.9749755859375, -2.72454833984375, -2.47412109375, -2.22369384765625, -1.9732666015625, -1.72283935546875, -1.472412109375, -1.22198486328125, -0.9715576171875, -0.72113037109375, -0.470703125, -0.22027587890625, 0.0301513671875, 0.28057861328125, 0.531005859375, 0.78143310546875, 1.0318603515625, 1.28228759765625, 1.53271484375, 1.78314208984375, 2.0335693359375, 2.28399658203125, 2.534423828125, 2.78485107421875, 3.0352783203125, 3.28570556640625, 3.5361328125, 3.78656005859375, 4.0369873046875, 4.28741455078125, 4.537841796875, 4.78826904296875, 5.0386962890625, 5.28912353515625, 5.53955078125, 5.78997802734375, 6.0404052734375, 6.29083251953125, 6.541259765625, 6.79168701171875, 7.0421142578125, 7.29254150390625, 7.54296875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 7.0, 8.0, 10.0, 20.0, 16.0, 21.0, 39.0, 66.0, 77.0, 90.0, 108.0, 113.0, 88.0, 73.0, 67.0, 58.0, 46.0, 36.0, 17.0, 12.0, 8.0, 11.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.45654296875, -0.4466590881347656, -0.43677520751953125, -0.4268913269042969, -0.4170074462890625, -0.4071235656738281, -0.39723968505859375, -0.3873558044433594, -0.377471923828125, -0.3675880432128906, -0.35770416259765625, -0.3478202819824219, -0.3379364013671875, -0.3280525207519531, -0.31816864013671875, -0.3082847595214844, -0.29840087890625, -0.2885169982910156, -0.27863311767578125, -0.2687492370605469, -0.2588653564453125, -0.24898147583007812, -0.23909759521484375, -0.22921371459960938, -0.219329833984375, -0.20944595336914062, -0.19956207275390625, -0.18967819213867188, -0.1797943115234375, -0.16991043090820312, -0.16002655029296875, -0.15014266967773438, -0.1402587890625, -0.13037490844726562, -0.12049102783203125, -0.11060714721679688, -0.1007232666015625, -0.09083938598632812, -0.08095550537109375, -0.07107162475585938, -0.061187744140625, -0.051303863525390625, -0.04141998291015625, -0.031536102294921875, -0.0216522216796875, -0.011768341064453125, -0.00188446044921875, 0.007999420166015625, 0.01788330078125, 0.027767181396484375, 0.03765106201171875, 0.047534942626953125, 0.0574188232421875, 0.06730270385742188, 0.07718658447265625, 0.08707046508789062, 0.096954345703125, 0.10683822631835938, 0.11672210693359375, 0.12660598754882812, 0.1364898681640625, 0.14637374877929688, 0.15625762939453125, 0.16614151000976562, 0.176025390625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 8.0, 10.0, 13.0, 19.0, 27.0, 42.0, 62.0, 117.0, 182.0, 320.0, 583.0, 1057.0, 2172.0, 4560.0, 11104.0, 33615.0, 144002.0, 1693643.0, 2090298.0, 157754.0, 34820.0, 11418.0, 4292.0, 2041.0, 907.0, 484.0, 275.0, 154.0, 99.0, 51.0, 50.0, 23.0, 16.0, 21.0, 11.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.468017578125, -0.45571136474609375, -0.4434051513671875, -0.43109893798828125, -0.418792724609375, -0.40648651123046875, -0.3941802978515625, -0.38187408447265625, -0.36956787109375, -0.35726165771484375, -0.3449554443359375, -0.33264923095703125, -0.320343017578125, -0.30803680419921875, -0.2957305908203125, -0.28342437744140625, -0.2711181640625, -0.25881195068359375, -0.2465057373046875, -0.23419952392578125, -0.221893310546875, -0.20958709716796875, -0.1972808837890625, -0.18497467041015625, -0.17266845703125, -0.16036224365234375, -0.1480560302734375, -0.13574981689453125, -0.123443603515625, -0.11113739013671875, -0.0988311767578125, -0.08652496337890625, -0.07421875, -0.06191253662109375, -0.0496063232421875, -0.03730010986328125, -0.024993896484375, -0.01268768310546875, -0.0003814697265625, 0.01192474365234375, 0.02423095703125, 0.03653717041015625, 0.0488433837890625, 0.06114959716796875, 0.073455810546875, 0.08576202392578125, 0.0980682373046875, 0.11037445068359375, 0.1226806640625, 0.13498687744140625, 0.1472930908203125, 0.15959930419921875, 0.171905517578125, 0.18421173095703125, 0.1965179443359375, 0.20882415771484375, 0.22113037109375, 0.23343658447265625, 0.2457427978515625, 0.25804901123046875, 0.270355224609375, 0.28266143798828125, 0.2949676513671875, 0.30727386474609375, 0.319580078125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 10.0, 9.0, 17.0, 30.0, 23.0, 37.0, 58.0, 123.0, 218.0, 308.0, 668.0, 1123.0, 644.0, 361.0, 149.0, 105.0, 54.0, 46.0, 21.0, 15.0, 10.0, 4.0, 11.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.460693359375, -0.4444999694824219, -0.42830657958984375, -0.4121131896972656, -0.3959197998046875, -0.3797264099121094, -0.36353302001953125, -0.3473396301269531, -0.331146240234375, -0.3149528503417969, -0.29875946044921875, -0.2825660705566406, -0.2663726806640625, -0.2501792907714844, -0.23398590087890625, -0.21779251098632812, -0.20159912109375, -0.18540573120117188, -0.16921234130859375, -0.15301895141601562, -0.1368255615234375, -0.12063217163085938, -0.10443878173828125, -0.08824539184570312, -0.072052001953125, -0.055858612060546875, -0.03966522216796875, -0.023471832275390625, -0.0072784423828125, 0.008914947509765625, 0.02510833740234375, 0.041301727294921875, 0.0574951171875, 0.07368850708007812, 0.08988189697265625, 0.10607528686523438, 0.1222686767578125, 0.13846206665039062, 0.15465545654296875, 0.17084884643554688, 0.187042236328125, 0.20323562622070312, 0.21942901611328125, 0.23562240600585938, 0.2518157958984375, 0.2680091857910156, 0.28420257568359375, 0.3003959655761719, 0.31658935546875, 0.3327827453613281, 0.34897613525390625, 0.3651695251464844, 0.3813629150390625, 0.3975563049316406, 0.41374969482421875, 0.4299430847167969, 0.446136474609375, 0.4623298645019531, 0.47852325439453125, 0.4947166442871094, 0.5109100341796875, 0.5271034240722656, 0.5432968139648438, 0.5594902038574219, 0.57568359375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 4.0, 2.0, 4.0, 9.0, 8.0, 14.0, 63.0, 133.0, 269.0, 260.0, 153.0, 56.0, 11.0, 8.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.224889755249023, -9.033588409423828, -8.842286109924316, -8.650983810424805, -8.45968246459961, -8.268381118774414, -8.077078819274902, -7.885776996612549, -7.694475173950195, -7.503173351287842, -7.311871528625488, -7.120569705963135, -6.929267883300781, -6.737966060638428, -6.546664237976074, -6.355362415313721, -6.164060592651367, -5.972758769989014, -5.78145694732666, -5.590155124664307, -5.398853302001953, -5.2075514793396, -5.016249656677246, -4.824947834014893, -4.633646011352539, -4.4423441886901855, -4.251042366027832, -4.0597405433654785, -3.868438720703125, -3.6771368980407715, -3.485835075378418, -3.2945332527160645, -3.10323166847229, -2.9119298458099365, -2.720628023147583, -2.5293262004852295, -2.338024377822876, -2.1467225551605225, -1.955420732498169, -1.7641189098358154, -1.572817087173462, -1.3815152645111084, -1.1902134418487549, -0.9989116191864014, -0.8076097965240479, -0.6163079738616943, -0.4250061511993408, -0.2337043285369873, -0.04240250587463379, 0.14889931678771973, 0.34020113945007324, 0.5315029621124268, 0.7228047847747803, 0.9141066074371338, 1.1054084300994873, 1.2967102527618408, 1.4880120754241943, 1.6793138980865479, 1.8706157207489014, 2.061917543411255, 2.2532193660736084, 2.444521188735962, 2.6358230113983154, 2.827124834060669, 3.0184266567230225]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 9.0, 13.0, 16.0, 14.0, 10.0, 27.0, 30.0, 27.0, 35.0, 42.0, 51.0, 48.0, 50.0, 57.0, 54.0, 51.0, 59.0, 54.0, 49.0, 42.0, 48.0, 32.0, 35.0, 28.0, 29.0, 20.0, 22.0, 13.0, 15.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1493704319000244, -2.072101593017578, -1.9948326349258423, -1.917563796043396, -1.8402948379516602, -1.7630259990692139, -1.6857571601867676, -1.6084883213043213, -1.5312193632125854, -1.4539505243301392, -1.3766815662384033, -1.299412727355957, -1.2221438884735107, -1.144874930381775, -1.0676060914993286, -0.9903371930122375, -0.9130682945251465, -0.8357993960380554, -0.7585304975509644, -0.6812616586685181, -0.603992760181427, -0.5267238616943359, -0.44945499300956726, -0.3721861243247986, -0.2949172258377075, -0.21764834225177765, -0.14037945866584778, -0.06311057507991791, 0.014158308506011963, 0.09142720699310303, 0.1686960756778717, 0.24596494436264038, 0.32323408126831055, 0.4005029797554016, 0.4777718484401703, 0.555040717124939, 0.63230961561203, 0.7095785140991211, 0.7868473529815674, 0.8641162514686584, 0.9413851499557495, 1.0186539888381958, 1.0959229469299316, 1.173191785812378, 1.2504606246948242, 1.32772958278656, 1.4049984216690063, 1.4822673797607422, 1.5595362186431885, 1.6368050575256348, 1.7140740156173706, 1.791342854499817, 1.8686118125915527, 1.945880651473999, 2.0231494903564453, 2.1004183292388916, 2.177687168121338, 2.254956007003784, 2.3322248458862305, 2.409493923187256, 2.486762762069702, 2.5640316009521484, 2.6413004398345947, 2.718569278717041, 2.7958383560180664]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 6.0, 9.0, 9.0, 10.0, 17.0, 17.0, 41.0, 56.0, 86.0, 154.0, 226.0, 402.0, 742.0, 1244.0, 2476.0, 4875.0, 10753.0, 27938.0, 85719.0, 311572.0, 416518.0, 121543.0, 37714.0, 13917.0, 5928.0, 2880.0, 1535.0, 859.0, 494.0, 313.0, 185.0, 116.0, 65.0, 42.0, 36.0, 19.0, 17.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.5107421875, -0.49620819091796875, -0.4816741943359375, -0.46714019775390625, -0.452606201171875, -0.43807220458984375, -0.4235382080078125, -0.40900421142578125, -0.39447021484375, -0.37993621826171875, -0.3654022216796875, -0.35086822509765625, -0.336334228515625, -0.32180023193359375, -0.3072662353515625, -0.29273223876953125, -0.2781982421875, -0.26366424560546875, -0.2491302490234375, -0.23459625244140625, -0.220062255859375, -0.20552825927734375, -0.1909942626953125, -0.17646026611328125, -0.16192626953125, -0.14739227294921875, -0.1328582763671875, -0.11832427978515625, -0.103790283203125, -0.08925628662109375, -0.0747222900390625, -0.06018829345703125, -0.045654296875, -0.03112030029296875, -0.0165863037109375, -0.00205230712890625, 0.012481689453125, 0.02701568603515625, 0.0415496826171875, 0.05608367919921875, 0.07061767578125, 0.08515167236328125, 0.0996856689453125, 0.11421966552734375, 0.128753662109375, 0.14328765869140625, 0.1578216552734375, 0.17235565185546875, 0.1868896484375, 0.20142364501953125, 0.2159576416015625, 0.23049163818359375, 0.245025634765625, 0.25955963134765625, 0.2740936279296875, 0.28862762451171875, 0.30316162109375, 0.31769561767578125, 0.3322296142578125, 0.34676361083984375, 0.361297607421875, 0.37583160400390625, 0.3903656005859375, 0.40489959716796875, 0.41943359375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 6.0, 3.0, 6.0, 5.0, 10.0, 15.0, 14.0, 15.0, 28.0, 40.0, 32.0, 41.0, 59.0, 37.0, 71.0, 73.0, 73.0, 79.0, 54.0, 54.0, 51.0, 44.0, 33.0, 30.0, 27.0, 22.0, 26.0, 10.0, 11.0, 8.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24365234375, -0.2369537353515625, -0.230255126953125, -0.2235565185546875, -0.21685791015625, -0.2101593017578125, -0.203460693359375, -0.1967620849609375, -0.1900634765625, -0.1833648681640625, -0.176666259765625, -0.1699676513671875, -0.16326904296875, -0.1565704345703125, -0.149871826171875, -0.1431732177734375, -0.136474609375, -0.1297760009765625, -0.123077392578125, -0.1163787841796875, -0.10968017578125, -0.1029815673828125, -0.096282958984375, -0.0895843505859375, -0.0828857421875, -0.0761871337890625, -0.069488525390625, -0.0627899169921875, -0.05609130859375, -0.0493927001953125, -0.042694091796875, -0.0359954833984375, -0.029296875, -0.0225982666015625, -0.015899658203125, -0.0092010498046875, -0.00250244140625, 0.0041961669921875, 0.010894775390625, 0.0175933837890625, 0.0242919921875, 0.0309906005859375, 0.037689208984375, 0.0443878173828125, 0.05108642578125, 0.0577850341796875, 0.064483642578125, 0.0711822509765625, 0.077880859375, 0.0845794677734375, 0.091278076171875, 0.0979766845703125, 0.10467529296875, 0.1113739013671875, 0.118072509765625, 0.1247711181640625, 0.1314697265625, 0.1381683349609375, 0.144866943359375, 0.1515655517578125, 0.15826416015625, 0.1649627685546875, 0.171661376953125, 0.1783599853515625, 0.18505859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 9.0, 12.0, 19.0, 38.0, 54.0, 86.0, 119.0, 238.0, 501.0, 1154.0, 3395.0, 16267.0, 178315.0, 776068.0, 60576.0, 7893.0, 2134.0, 838.0, 387.0, 169.0, 107.0, 59.0, 36.0, 23.0, 13.0, 15.0, 5.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8017578125, -0.7700653076171875, -0.738372802734375, -0.7066802978515625, -0.67498779296875, -0.6432952880859375, -0.611602783203125, -0.5799102783203125, -0.5482177734375, -0.5165252685546875, -0.484832763671875, -0.4531402587890625, -0.42144775390625, -0.3897552490234375, -0.358062744140625, -0.3263702392578125, -0.294677734375, -0.2629852294921875, -0.231292724609375, -0.1996002197265625, -0.16790771484375, -0.1362152099609375, -0.104522705078125, -0.0728302001953125, -0.0411376953125, -0.0094451904296875, 0.022247314453125, 0.0539398193359375, 0.08563232421875, 0.1173248291015625, 0.149017333984375, 0.1807098388671875, 0.21240234375, 0.2440948486328125, 0.275787353515625, 0.3074798583984375, 0.33917236328125, 0.3708648681640625, 0.402557373046875, 0.4342498779296875, 0.4659423828125, 0.4976348876953125, 0.529327392578125, 0.5610198974609375, 0.59271240234375, 0.6244049072265625, 0.656097412109375, 0.6877899169921875, 0.719482421875, 0.7511749267578125, 0.782867431640625, 0.8145599365234375, 0.84625244140625, 0.8779449462890625, 0.909637451171875, 0.9413299560546875, 0.9730224609375, 1.0047149658203125, 1.036407470703125, 1.0680999755859375, 1.09979248046875, 1.1314849853515625, 1.163177490234375, 1.1948699951171875, 1.2265625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 1.0, 4.0, 9.0, 5.0, 17.0, 19.0, 25.0, 28.0, 44.0, 46.0, 45.0, 53.0, 67.0, 67.0, 73.0, 60.0, 77.0, 50.0, 58.0, 46.0, 43.0, 43.0, 33.0, 29.0, 11.0, 13.0, 11.0, 9.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7060546875, -0.672393798828125, -0.63873291015625, -0.605072021484375, -0.5714111328125, -0.537750244140625, -0.50408935546875, -0.470428466796875, -0.436767578125, -0.403106689453125, -0.36944580078125, -0.335784912109375, -0.3021240234375, -0.268463134765625, -0.23480224609375, -0.201141357421875, -0.16748046875, -0.133819580078125, -0.10015869140625, -0.066497802734375, -0.0328369140625, 0.000823974609375, 0.03448486328125, 0.068145751953125, 0.101806640625, 0.135467529296875, 0.16912841796875, 0.202789306640625, 0.2364501953125, 0.270111083984375, 0.30377197265625, 0.337432861328125, 0.37109375, 0.404754638671875, 0.43841552734375, 0.472076416015625, 0.5057373046875, 0.539398193359375, 0.57305908203125, 0.606719970703125, 0.640380859375, 0.674041748046875, 0.70770263671875, 0.741363525390625, 0.7750244140625, 0.808685302734375, 0.84234619140625, 0.876007080078125, 0.90966796875, 0.943328857421875, 0.97698974609375, 1.010650634765625, 1.0443115234375, 1.077972412109375, 1.11163330078125, 1.145294189453125, 1.178955078125, 1.212615966796875, 1.24627685546875, 1.279937744140625, 1.3135986328125, 1.347259521484375, 1.38092041015625, 1.414581298828125, 1.4482421875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 5.0, 4.0, 9.0, 4.0, 8.0, 28.0, 20.0, 36.0, 69.0, 125.0, 218.0, 437.0, 1011.0, 3180.0, 20365.0, 833644.0, 177482.0, 8594.0, 1823.0, 724.0, 327.0, 167.0, 80.0, 70.0, 35.0, 22.0, 18.0, 16.0, 8.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.841796875, -0.8161392211914062, -0.7904815673828125, -0.7648239135742188, -0.739166259765625, -0.7135086059570312, -0.6878509521484375, -0.6621932983398438, -0.63653564453125, -0.6108779907226562, -0.5852203369140625, -0.5595626831054688, -0.533905029296875, -0.5082473754882812, -0.4825897216796875, -0.45693206787109375, -0.4312744140625, -0.40561676025390625, -0.3799591064453125, -0.35430145263671875, -0.328643798828125, -0.30298614501953125, -0.2773284912109375, -0.25167083740234375, -0.22601318359375, -0.20035552978515625, -0.1746978759765625, -0.14904022216796875, -0.123382568359375, -0.09772491455078125, -0.0720672607421875, -0.04640960693359375, -0.020751953125, 0.00490570068359375, 0.0305633544921875, 0.05622100830078125, 0.081878662109375, 0.10753631591796875, 0.1331939697265625, 0.15885162353515625, 0.18450927734375, 0.21016693115234375, 0.2358245849609375, 0.26148223876953125, 0.287139892578125, 0.31279754638671875, 0.3384552001953125, 0.36411285400390625, 0.3897705078125, 0.41542816162109375, 0.4410858154296875, 0.46674346923828125, 0.492401123046875, 0.5180587768554688, 0.5437164306640625, 0.5693740844726562, 0.59503173828125, 0.6206893920898438, 0.6463470458984375, 0.6720046997070312, 0.697662353515625, 0.7233200073242188, 0.7489776611328125, 0.7746353149414062, 0.80029296875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 5.0, 3.0, 11.0, 8.0, 18.0, 9.0, 23.0, 24.0, 28.0, 28.0, 37.0, 52.0, 81.0, 103.0, 119.0, 100.0, 88.0, 62.0, 43.0, 34.0, 24.0, 15.0, 16.0, 16.0, 7.0, 4.0, 4.0, 7.0, 7.0, 2.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013399124145507812, -0.0001301141455769539, -0.00012623704969882965, -0.00012235995382070541, -0.00011848285794258118, -0.00011460576206445694, -0.0001107286661863327, -0.00010685157030820847, -0.00010297447443008423, -9.909737855195999e-05, -9.522028267383575e-05, -9.134318679571152e-05, -8.746609091758728e-05, -8.358899503946304e-05, -7.97118991613388e-05, -7.583480328321457e-05, -7.195770740509033e-05, -6.80806115269661e-05, -6.420351564884186e-05, -6.032641977071762e-05, -5.6449323892593384e-05, -5.257222801446915e-05, -4.869513213634491e-05, -4.481803625822067e-05, -4.0940940380096436e-05, -3.70638445019722e-05, -3.318674862384796e-05, -2.9309652745723724e-05, -2.5432556867599487e-05, -2.155546098947525e-05, -1.7678365111351013e-05, -1.3801269233226776e-05, -9.924173355102539e-06, -6.047077476978302e-06, -2.169981598854065e-06, 1.7071142792701721e-06, 5.584210157394409e-06, 9.461306035518646e-06, 1.3338401913642883e-05, 1.721549779176712e-05, 2.1092593669891357e-05, 2.4969689548015594e-05, 2.884678542613983e-05, 3.272388130426407e-05, 3.6600977182388306e-05, 4.047807306051254e-05, 4.435516893863678e-05, 4.823226481676102e-05, 5.2109360694885254e-05, 5.598645657300949e-05, 5.986355245113373e-05, 6.374064832925797e-05, 6.76177442073822e-05, 7.149484008550644e-05, 7.537193596363068e-05, 7.924903184175491e-05, 8.312612771987915e-05, 8.700322359800339e-05, 9.088031947612762e-05, 9.475741535425186e-05, 9.86345112323761e-05, 0.00010251160711050034, 0.00010638870298862457, 0.00011026579886674881, 0.00011414289474487305]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 8.0, 14.0, 17.0, 38.0, 41.0, 61.0, 85.0, 146.0, 285.0, 483.0, 1091.0, 3219.0, 14736.0, 229280.0, 762668.0, 28458.0, 4949.0, 1538.0, 613.0, 304.0, 190.0, 91.0, 63.0, 44.0, 40.0, 27.0, 9.0, 12.0, 10.0, 5.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.7197265625, -0.6992568969726562, -0.6787872314453125, -0.6583175659179688, -0.637847900390625, -0.6173782348632812, -0.5969085693359375, -0.5764389038085938, -0.55596923828125, -0.5354995727539062, -0.5150299072265625, -0.49456024169921875, -0.474090576171875, -0.45362091064453125, -0.4331512451171875, -0.41268157958984375, -0.3922119140625, -0.37174224853515625, -0.3512725830078125, -0.33080291748046875, -0.310333251953125, -0.28986358642578125, -0.2693939208984375, -0.24892425537109375, -0.22845458984375, -0.20798492431640625, -0.1875152587890625, -0.16704559326171875, -0.146575927734375, -0.12610626220703125, -0.1056365966796875, -0.08516693115234375, -0.064697265625, -0.04422760009765625, -0.0237579345703125, -0.00328826904296875, 0.017181396484375, 0.03765106201171875, 0.0581207275390625, 0.07859039306640625, 0.09906005859375, 0.11952972412109375, 0.1399993896484375, 0.16046905517578125, 0.180938720703125, 0.20140838623046875, 0.2218780517578125, 0.24234771728515625, 0.2628173828125, 0.28328704833984375, 0.3037567138671875, 0.32422637939453125, 0.344696044921875, 0.36516571044921875, 0.3856353759765625, 0.40610504150390625, 0.42657470703125, 0.44704437255859375, 0.4675140380859375, 0.48798370361328125, 0.508453369140625, 0.5289230346679688, 0.5493927001953125, 0.5698623657226562, 0.59033203125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 6.0, 10.0, 11.0, 8.0, 11.0, 14.0, 18.0, 23.0, 38.0, 45.0, 80.0, 99.0, 125.0, 117.0, 123.0, 70.0, 41.0, 53.0, 21.0, 17.0, 19.0, 15.0, 4.0, 10.0, 7.0, 7.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.52685546875, -0.5129890441894531, -0.49912261962890625, -0.4852561950683594, -0.4713897705078125, -0.4575233459472656, -0.44365692138671875, -0.4297904968261719, -0.415924072265625, -0.4020576477050781, -0.38819122314453125, -0.3743247985839844, -0.3604583740234375, -0.3465919494628906, -0.33272552490234375, -0.3188591003417969, -0.30499267578125, -0.2911262512207031, -0.27725982666015625, -0.2633934020996094, -0.2495269775390625, -0.23566055297851562, -0.22179412841796875, -0.20792770385742188, -0.194061279296875, -0.18019485473632812, -0.16632843017578125, -0.15246200561523438, -0.1385955810546875, -0.12472915649414062, -0.11086273193359375, -0.09699630737304688, -0.0831298828125, -0.06926345825195312, -0.05539703369140625, -0.041530609130859375, -0.0276641845703125, -0.013797760009765625, 6.866455078125e-05, 0.013935089111328125, 0.027801513671875, 0.041667938232421875, 0.05553436279296875, 0.06940078735351562, 0.0832672119140625, 0.09713363647460938, 0.11100006103515625, 0.12486648559570312, 0.13873291015625, 0.15259933471679688, 0.16646575927734375, 0.18033218383789062, 0.1941986083984375, 0.20806503295898438, 0.22193145751953125, 0.23579788208007812, 0.249664306640625, 0.2635307312011719, 0.27739715576171875, 0.2912635803222656, 0.3051300048828125, 0.3189964294433594, 0.33286285400390625, 0.3467292785644531, 0.360595703125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 8.0, 29.0, 66.0, 159.0, 274.0, 243.0, 125.0, 37.0, 23.0, 10.0, 8.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.0038423538208, -11.729766845703125, -11.45569133758545, -11.181615829467773, -10.907540321350098, -10.633464813232422, -10.359389305114746, -10.08531379699707, -9.811239242553711, -9.537163734436035, -9.26308822631836, -8.989012718200684, -8.714937210083008, -8.440861701965332, -8.166786193847656, -7.892711162567139, -7.618635177612305, -7.344559669494629, -7.070484161376953, -6.796408653259277, -6.522333145141602, -6.248257637023926, -5.974182605743408, -5.700107097625732, -5.426031589508057, -5.151956081390381, -4.877880573272705, -4.603805065155029, -4.329730033874512, -4.055654525756836, -3.78157901763916, -3.5075035095214844, -3.2334280014038086, -2.959352493286133, -2.685276985168457, -2.4112017154693604, -2.1371262073516846, -1.8630506992340088, -1.5889753103256226, -1.3148999214172363, -1.0408244132995605, -0.7667489647865295, -0.49267351627349854, -0.21859806776046753, 0.05547738075256348, 0.32955288887023926, 0.6036282777786255, 0.8777036666870117, 1.1517791748046875, 1.4258546829223633, 1.6999300718307495, 1.9740054607391357, 2.2480809688568115, 2.5221564769744873, 2.796231746673584, 3.0703072547912598, 3.3443827629089355, 3.6184582710266113, 3.892533779144287, 4.166609287261963, 4.4406843185424805, 4.714759826660156, 4.988835334777832, 5.262910842895508, 5.536986351013184]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 11.0, 7.0, 5.0, 9.0, 11.0, 11.0, 9.0, 22.0, 27.0, 23.0, 33.0, 38.0, 33.0, 32.0, 34.0, 57.0, 62.0, 57.0, 67.0, 61.0, 60.0, 50.0, 32.0, 37.0, 42.0, 19.0, 33.0, 20.0, 24.0, 13.0, 17.0, 11.0, 8.0, 10.0, 9.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.661123752593994, -3.5503969192504883, -3.4396703243255615, -3.3289434909820557, -3.21821665763855, -3.107490062713623, -2.996763229370117, -2.8860363960266113, -2.7753095626831055, -2.6645827293395996, -2.553856134414673, -2.443129301071167, -2.332402467727661, -2.2216758728027344, -2.1109490394592285, -2.0002222061157227, -1.8894954919815063, -1.77876877784729, -1.6680419445037842, -1.5573152303695679, -1.446588397026062, -1.3358616828918457, -1.2251348495483398, -1.1144081354141235, -1.0036814212799072, -0.8929546475410461, -0.7822278738021851, -0.6715011596679688, -0.5607743263244629, -0.4500476121902466, -0.3393208384513855, -0.22859406471252441, -0.11786723136901855, -0.007140465080738068, 0.10358630120754242, 0.2143130600452423, 0.3250398337841034, 0.4357665777206421, 0.5464933514595032, 0.6572201251983643, 0.7679468989372253, 0.8786736726760864, 0.9894004464149475, 1.1001272201538086, 1.210853934288025, 1.3215806484222412, 1.432307481765747, 1.543034315109253, 1.6537610292434692, 1.7644877433776855, 1.8752145767211914, 1.9859412908554077, 2.096668004989624, 2.20739483833313, 2.3181216716766357, 2.4288482666015625, 2.5395750999450684, 2.650301933288574, 2.761028528213501, 2.871755361557007, 2.9824821949005127, 3.0932087898254395, 3.2039356231689453, 3.314662456512451, 3.425389289855957]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 9.0, 20.0, 17.0, 21.0, 28.0, 49.0, 74.0, 174.0, 620.0, 3348.0, 36471.0, 3619891.0, 518704.0, 12440.0, 1680.0, 383.0, 148.0, 71.0, 36.0, 32.0, 19.0, 14.0, 7.0, 7.0, 9.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.904296875, -0.8775482177734375, -0.850799560546875, -0.8240509033203125, -0.79730224609375, -0.7705535888671875, -0.743804931640625, -0.7170562744140625, -0.6903076171875, -0.6635589599609375, -0.636810302734375, -0.6100616455078125, -0.58331298828125, -0.5565643310546875, -0.529815673828125, -0.5030670166015625, -0.476318359375, -0.4495697021484375, -0.422821044921875, -0.3960723876953125, -0.36932373046875, -0.3425750732421875, -0.315826416015625, -0.2890777587890625, -0.2623291015625, -0.2355804443359375, -0.208831787109375, -0.1820831298828125, -0.15533447265625, -0.1285858154296875, -0.101837158203125, -0.0750885009765625, -0.04833984375, -0.0215911865234375, 0.005157470703125, 0.0319061279296875, 0.05865478515625, 0.0854034423828125, 0.112152099609375, 0.1389007568359375, 0.1656494140625, 0.1923980712890625, 0.219146728515625, 0.2458953857421875, 0.27264404296875, 0.2993927001953125, 0.326141357421875, 0.3528900146484375, 0.379638671875, 0.4063873291015625, 0.433135986328125, 0.4598846435546875, 0.48663330078125, 0.5133819580078125, 0.540130615234375, 0.5668792724609375, 0.5936279296875, 0.6203765869140625, 0.647125244140625, 0.6738739013671875, 0.70062255859375, 0.7273712158203125, 0.754119873046875, 0.7808685302734375, 0.8076171875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 10.0, 5.0, 9.0, 8.0, 11.0, 14.0, 37.0, 46.0, 29.0, 49.0, 63.0, 59.0, 55.0, 75.0, 72.0, 65.0, 57.0, 55.0, 49.0, 44.0, 33.0, 29.0, 35.0, 16.0, 16.0, 12.0, 11.0, 11.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.201904296875, -0.1954517364501953, -0.18899917602539062, -0.18254661560058594, -0.17609405517578125, -0.16964149475097656, -0.16318893432617188, -0.1567363739013672, -0.1502838134765625, -0.1438312530517578, -0.13737869262695312, -0.13092613220214844, -0.12447357177734375, -0.11802101135253906, -0.11156845092773438, -0.10511589050292969, -0.098663330078125, -0.09221076965332031, -0.08575820922851562, -0.07930564880371094, -0.07285308837890625, -0.06640052795410156, -0.059947967529296875, -0.05349540710449219, -0.0470428466796875, -0.04059028625488281, -0.034137725830078125, -0.027685165405273438, -0.02123260498046875, -0.014780044555664062, -0.008327484130859375, -0.0018749237060546875, 0.00457763671875, 0.011030197143554688, 0.017482757568359375, 0.023935317993164062, 0.03038787841796875, 0.03684043884277344, 0.043292999267578125, 0.04974555969238281, 0.0561981201171875, 0.06265068054199219, 0.06910324096679688, 0.07555580139160156, 0.08200836181640625, 0.08846092224121094, 0.09491348266601562, 0.10136604309082031, 0.107818603515625, 0.11427116394042969, 0.12072372436523438, 0.12717628479003906, 0.13362884521484375, 0.14008140563964844, 0.14653396606445312, 0.1529865264892578, 0.1594390869140625, 0.1658916473388672, 0.17234420776367188, 0.17879676818847656, 0.18524932861328125, 0.19170188903808594, 0.19815444946289062, 0.2046070098876953, 0.2110595703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 2.0, 1.0, 7.0, 5.0, 14.0, 9.0, 15.0, 20.0, 32.0, 51.0, 83.0, 136.0, 223.0, 380.0, 773.0, 1910.0, 5772.0, 21823.0, 136969.0, 2683311.0, 1242836.0, 79484.0, 14073.0, 3795.0, 1338.0, 534.0, 260.0, 160.0, 74.0, 63.0, 41.0, 15.0, 19.0, 16.0, 11.0, 6.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43017578125, -0.415283203125, -0.400390625, -0.385498046875, -0.37060546875, -0.355712890625, -0.3408203125, -0.325927734375, -0.31103515625, -0.296142578125, -0.28125, -0.266357421875, -0.25146484375, -0.236572265625, -0.2216796875, -0.206787109375, -0.19189453125, -0.177001953125, -0.162109375, -0.147216796875, -0.13232421875, -0.117431640625, -0.1025390625, -0.087646484375, -0.07275390625, -0.057861328125, -0.04296875, -0.028076171875, -0.01318359375, 0.001708984375, 0.0166015625, 0.031494140625, 0.04638671875, 0.061279296875, 0.076171875, 0.091064453125, 0.10595703125, 0.120849609375, 0.1357421875, 0.150634765625, 0.16552734375, 0.180419921875, 0.1953125, 0.210205078125, 0.22509765625, 0.239990234375, 0.2548828125, 0.269775390625, 0.28466796875, 0.299560546875, 0.314453125, 0.329345703125, 0.34423828125, 0.359130859375, 0.3740234375, 0.388916015625, 0.40380859375, 0.418701171875, 0.43359375, 0.448486328125, 0.46337890625, 0.478271484375, 0.4931640625, 0.508056640625, 0.52294921875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 5.0, 3.0, 11.0, 15.0, 12.0, 21.0, 28.0, 22.0, 30.0, 40.0, 47.0, 82.0, 165.0, 196.0, 260.0, 455.0, 641.0, 654.0, 489.0, 280.0, 177.0, 118.0, 98.0, 63.0, 36.0, 31.0, 30.0, 12.0, 12.0, 9.0, 8.0, 7.0, 5.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.419921875, -0.4068260192871094, -0.39373016357421875, -0.3806343078613281, -0.3675384521484375, -0.3544425964355469, -0.34134674072265625, -0.3282508850097656, -0.315155029296875, -0.3020591735839844, -0.28896331787109375, -0.2758674621582031, -0.2627716064453125, -0.24967575073242188, -0.23657989501953125, -0.22348403930664062, -0.21038818359375, -0.19729232788085938, -0.18419647216796875, -0.17110061645507812, -0.1580047607421875, -0.14490890502929688, -0.13181304931640625, -0.11871719360351562, -0.105621337890625, -0.09252548217773438, -0.07942962646484375, -0.06633377075195312, -0.0532379150390625, -0.040142059326171875, -0.02704620361328125, -0.013950347900390625, -0.0008544921875, 0.012241363525390625, 0.02533721923828125, 0.038433074951171875, 0.0515289306640625, 0.06462478637695312, 0.07772064208984375, 0.09081649780273438, 0.103912353515625, 0.11700820922851562, 0.13010406494140625, 0.14319992065429688, 0.1562957763671875, 0.16939163208007812, 0.18248748779296875, 0.19558334350585938, 0.20867919921875, 0.22177505493164062, 0.23487091064453125, 0.24796676635742188, 0.2610626220703125, 0.2741584777832031, 0.28725433349609375, 0.3003501892089844, 0.313446044921875, 0.3265419006347656, 0.33963775634765625, 0.3527336120605469, 0.3658294677734375, 0.3789253234863281, 0.39202117919921875, 0.4051170349121094, 0.418212890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 8.0, 12.0, 34.0, 150.0, 413.0, 301.0, 63.0, 14.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.2432918548584, -16.897762298583984, -16.55223274230957, -16.206703186035156, -15.861173629760742, -15.515644073486328, -15.170114517211914, -14.8245849609375, -14.479055404663086, -14.133525848388672, -13.787996292114258, -13.442466735839844, -13.09693717956543, -12.751407623291016, -12.405878067016602, -12.060348510742188, -11.714818954467773, -11.36928939819336, -11.023759841918945, -10.678230285644531, -10.332700729370117, -9.987171173095703, -9.641641616821289, -9.296112060546875, -8.950581550598145, -8.60505199432373, -8.259522438049316, -7.913992881774902, -7.568463325500488, -7.222933769226074, -6.87740421295166, -6.531874656677246, -6.186345100402832, -5.840815544128418, -5.495285987854004, -5.14975643157959, -4.804226875305176, -4.458697319030762, -4.113167762756348, -3.7676379680633545, -3.4221084117889404, -3.0765788555145264, -2.7310492992401123, -2.385519504547119, -2.039989948272705, -1.6944605112075806, -1.348930835723877, -1.003401279449463, -0.6578717231750488, -0.3123421370983124, 0.03318744897842407, 0.3787170648574829, 0.724246621131897, 1.069776177406311, 1.4153058528900146, 1.7608354091644287, 2.1063649654388428, 2.451894521713257, 2.797424077987671, 3.142953872680664, 3.488483428955078, 3.834012985229492, 4.179542541503906, 4.52507209777832, 4.870601654052734]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 5.0, 2.0, 4.0, 7.0, 7.0, 10.0, 10.0, 20.0, 21.0, 33.0, 22.0, 30.0, 24.0, 32.0, 43.0, 40.0, 27.0, 37.0, 44.0, 45.0, 52.0, 33.0, 52.0, 51.0, 44.0, 43.0, 33.0, 26.0, 33.0, 21.0, 21.0, 17.0, 17.0, 26.0, 9.0, 12.0, 8.0, 5.0, 7.0, 9.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.052689790725708, -1.9804867506027222, -1.9082838296890259, -1.83608078956604, -1.7638778686523438, -1.691674828529358, -1.619471788406372, -1.5472688674926758, -1.47506582736969, -1.402862787246704, -1.3306598663330078, -1.258456826210022, -1.1862537860870361, -1.1140508651733398, -1.041847825050354, -0.9696448445320129, -0.8974418640136719, -0.8252388834953308, -0.7530359029769897, -0.6808328628540039, -0.6086298823356628, -0.5364269018173218, -0.4642238914966583, -0.3920208811759949, -0.3198179006576538, -0.24761490523815155, -0.1754119098186493, -0.10320891439914703, -0.031005918979644775, 0.04119706153869629, 0.11340007185935974, 0.1856030821800232, 0.25780582427978516, 0.3300088047981262, 0.4022118151187897, 0.4744148254394531, 0.5466178059577942, 0.6188207864761353, 0.6910238265991211, 0.7632268071174622, 0.8354297876358032, 0.9076327681541443, 0.9798357486724854, 1.0520387887954712, 1.124241828918457, 1.1964447498321533, 1.2686477899551392, 1.340850830078125, 1.4130537509918213, 1.4852567911148071, 1.5574597120285034, 1.6296627521514893, 1.7018656730651855, 1.7740687131881714, 1.8462717533111572, 1.9184746742248535, 1.9906777143478394, 2.062880754470825, 2.1350836753845215, 2.2072865962982178, 2.279489755630493, 2.3516926765441895, 2.4238955974578857, 2.496098756790161, 2.5683016777038574]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 11.0, 4.0, 8.0, 6.0, 23.0, 23.0, 32.0, 49.0, 61.0, 106.0, 166.0, 299.0, 516.0, 882.0, 1697.0, 3578.0, 8014.0, 19844.0, 52870.0, 151186.0, 385726.0, 271309.0, 94513.0, 33467.0, 12974.0, 5640.0, 2578.0, 1279.0, 648.0, 393.0, 225.0, 132.0, 88.0, 77.0, 44.0, 30.0, 22.0, 8.0, 12.0, 5.0, 3.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.364501953125, -0.35137939453125, -0.3382568359375, -0.32513427734375, -0.31201171875, -0.29888916015625, -0.2857666015625, -0.27264404296875, -0.259521484375, -0.24639892578125, -0.2332763671875, -0.22015380859375, -0.20703125, -0.19390869140625, -0.1807861328125, -0.16766357421875, -0.154541015625, -0.14141845703125, -0.1282958984375, -0.11517333984375, -0.10205078125, -0.08892822265625, -0.0758056640625, -0.06268310546875, -0.049560546875, -0.03643798828125, -0.0233154296875, -0.01019287109375, 0.0029296875, 0.01605224609375, 0.0291748046875, 0.04229736328125, 0.055419921875, 0.06854248046875, 0.0816650390625, 0.09478759765625, 0.10791015625, 0.12103271484375, 0.1341552734375, 0.14727783203125, 0.160400390625, 0.17352294921875, 0.1866455078125, 0.19976806640625, 0.212890625, 0.22601318359375, 0.2391357421875, 0.25225830078125, 0.265380859375, 0.27850341796875, 0.2916259765625, 0.30474853515625, 0.31787109375, 0.33099365234375, 0.3441162109375, 0.35723876953125, 0.370361328125, 0.38348388671875, 0.3966064453125, 0.40972900390625, 0.4228515625, 0.43597412109375, 0.4490966796875, 0.46221923828125, 0.475341796875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 2.0, 5.0, 3.0, 8.0, 10.0, 13.0, 10.0, 17.0, 31.0, 35.0, 32.0, 53.0, 53.0, 58.0, 69.0, 77.0, 61.0, 55.0, 42.0, 53.0, 56.0, 43.0, 39.0, 35.0, 30.0, 16.0, 26.0, 19.0, 7.0, 10.0, 8.0, 4.0, 3.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.199951171875, -0.193603515625, -0.187255859375, -0.180908203125, -0.174560546875, -0.168212890625, -0.161865234375, -0.155517578125, -0.149169921875, -0.142822265625, -0.136474609375, -0.130126953125, -0.123779296875, -0.117431640625, -0.111083984375, -0.104736328125, -0.098388671875, -0.092041015625, -0.085693359375, -0.079345703125, -0.072998046875, -0.066650390625, -0.060302734375, -0.053955078125, -0.047607421875, -0.041259765625, -0.034912109375, -0.028564453125, -0.022216796875, -0.015869140625, -0.009521484375, -0.003173828125, 0.003173828125, 0.009521484375, 0.015869140625, 0.022216796875, 0.028564453125, 0.034912109375, 0.041259765625, 0.047607421875, 0.053955078125, 0.060302734375, 0.066650390625, 0.072998046875, 0.079345703125, 0.085693359375, 0.092041015625, 0.098388671875, 0.104736328125, 0.111083984375, 0.117431640625, 0.123779296875, 0.130126953125, 0.136474609375, 0.142822265625, 0.149169921875, 0.155517578125, 0.161865234375, 0.168212890625, 0.174560546875, 0.180908203125, 0.187255859375, 0.193603515625, 0.199951171875, 0.206298828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 9.0, 7.0, 18.0, 33.0, 44.0, 69.0, 144.0, 264.0, 531.0, 1187.0, 3430.0, 17867.0, 485431.0, 515788.0, 17827.0, 3453.0, 1271.0, 523.0, 277.0, 159.0, 94.0, 45.0, 29.0, 24.0, 12.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2138671875, -1.1720123291015625, -1.130157470703125, -1.0883026123046875, -1.04644775390625, -1.0045928955078125, -0.962738037109375, -0.9208831787109375, -0.8790283203125, -0.8371734619140625, -0.795318603515625, -0.7534637451171875, -0.71160888671875, -0.6697540283203125, -0.627899169921875, -0.5860443115234375, -0.544189453125, -0.5023345947265625, -0.460479736328125, -0.4186248779296875, -0.37677001953125, -0.3349151611328125, -0.293060302734375, -0.2512054443359375, -0.2093505859375, -0.1674957275390625, -0.125640869140625, -0.0837860107421875, -0.04193115234375, -7.62939453125e-05, 0.041778564453125, 0.0836334228515625, 0.12548828125, 0.1673431396484375, 0.209197998046875, 0.2510528564453125, 0.29290771484375, 0.3347625732421875, 0.376617431640625, 0.4184722900390625, 0.4603271484375, 0.5021820068359375, 0.544036865234375, 0.5858917236328125, 0.62774658203125, 0.6696014404296875, 0.711456298828125, 0.7533111572265625, 0.795166015625, 0.8370208740234375, 0.878875732421875, 0.9207305908203125, 0.96258544921875, 1.0044403076171875, 1.046295166015625, 1.0881500244140625, 1.1300048828125, 1.1718597412109375, 1.213714599609375, 1.2555694580078125, 1.29742431640625, 1.3392791748046875, 1.381134033203125, 1.4229888916015625, 1.46484375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 13.0, 10.0, 15.0, 17.0, 21.0, 44.0, 52.0, 61.0, 54.0, 49.0, 52.0, 76.0, 75.0, 67.0, 79.0, 73.0, 50.0, 38.0, 30.0, 21.0, 24.0, 22.0, 11.0, 5.0, 6.0, 9.0, 3.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.5966796875, -1.5577545166015625, -1.518829345703125, -1.4799041748046875, -1.44097900390625, -1.4020538330078125, -1.363128662109375, -1.3242034912109375, -1.2852783203125, -1.2463531494140625, -1.207427978515625, -1.1685028076171875, -1.12957763671875, -1.0906524658203125, -1.051727294921875, -1.0128021240234375, -0.973876953125, -0.9349517822265625, -0.896026611328125, -0.8571014404296875, -0.81817626953125, -0.7792510986328125, -0.740325927734375, -0.7014007568359375, -0.6624755859375, -0.6235504150390625, -0.584625244140625, -0.5457000732421875, -0.50677490234375, -0.4678497314453125, -0.428924560546875, -0.3899993896484375, -0.35107421875, -0.3121490478515625, -0.273223876953125, -0.2342987060546875, -0.19537353515625, -0.1564483642578125, -0.117523193359375, -0.0785980224609375, -0.0396728515625, -0.0007476806640625, 0.038177490234375, 0.0771026611328125, 0.11602783203125, 0.1549530029296875, 0.193878173828125, 0.2328033447265625, 0.271728515625, 0.3106536865234375, 0.349578857421875, 0.3885040283203125, 0.42742919921875, 0.4663543701171875, 0.505279541015625, 0.5442047119140625, 0.5831298828125, 0.6220550537109375, 0.660980224609375, 0.6999053955078125, 0.73883056640625, 0.7777557373046875, 0.816680908203125, 0.8556060791015625, 0.89453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 9.0, 4.0, 12.0, 19.0, 14.0, 32.0, 32.0, 65.0, 134.0, 225.0, 467.0, 1055.0, 3202.0, 15121.0, 174019.0, 800635.0, 43811.0, 6448.0, 1758.0, 695.0, 315.0, 190.0, 103.0, 63.0, 34.0, 29.0, 18.0, 11.0, 7.0, 5.0, 4.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.609375, -0.591583251953125, -0.57379150390625, -0.555999755859375, -0.5382080078125, -0.520416259765625, -0.50262451171875, -0.484832763671875, -0.467041015625, -0.449249267578125, -0.43145751953125, -0.413665771484375, -0.3958740234375, -0.378082275390625, -0.36029052734375, -0.342498779296875, -0.32470703125, -0.306915283203125, -0.28912353515625, -0.271331787109375, -0.2535400390625, -0.235748291015625, -0.21795654296875, -0.200164794921875, -0.182373046875, -0.164581298828125, -0.14678955078125, -0.128997802734375, -0.1112060546875, -0.093414306640625, -0.07562255859375, -0.057830810546875, -0.0400390625, -0.022247314453125, -0.00445556640625, 0.013336181640625, 0.0311279296875, 0.048919677734375, 0.06671142578125, 0.084503173828125, 0.102294921875, 0.120086669921875, 0.13787841796875, 0.155670166015625, 0.1734619140625, 0.191253662109375, 0.20904541015625, 0.226837158203125, 0.24462890625, 0.262420654296875, 0.28021240234375, 0.298004150390625, 0.3157958984375, 0.333587646484375, 0.35137939453125, 0.369171142578125, 0.386962890625, 0.404754638671875, 0.42254638671875, 0.440338134765625, 0.4581298828125, 0.475921630859375, 0.49371337890625, 0.511505126953125, 0.529296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 8.0, 5.0, 9.0, 5.0, 12.0, 8.0, 16.0, 15.0, 19.0, 21.0, 35.0, 30.0, 47.0, 44.0, 59.0, 71.0, 75.0, 77.0, 62.0, 70.0, 62.0, 56.0, 33.0, 29.0, 30.0, 23.0, 14.0, 16.0, 14.0, 15.0, 4.0, 9.0, 9.0, 7.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0001323223114013672, -0.0001287553459405899, -0.00012518838047981262, -0.00012162141501903534, -0.00011805444955825806, -0.00011448748409748077, -0.00011092051863670349, -0.00010735355317592621, -0.00010378658771514893, -0.00010021962225437164, -9.665265679359436e-05, -9.308569133281708e-05, -8.95187258720398e-05, -8.595176041126251e-05, -8.238479495048523e-05, -7.881782948970795e-05, -7.525086402893066e-05, -7.168389856815338e-05, -6.81169331073761e-05, -6.454996764659882e-05, -6.098300218582153e-05, -5.741603672504425e-05, -5.384907126426697e-05, -5.0282105803489685e-05, -4.67151403427124e-05, -4.314817488193512e-05, -3.958120942115784e-05, -3.6014243960380554e-05, -3.244727849960327e-05, -2.888031303882599e-05, -2.5313347578048706e-05, -2.1746382117271423e-05, -1.817941665649414e-05, -1.4612451195716858e-05, -1.1045485734939575e-05, -7.4785202741622925e-06, -3.91155481338501e-06, -3.4458935260772705e-07, 3.2223761081695557e-06, 6.789341568946838e-06, 1.0356307029724121e-05, 1.3923272490501404e-05, 1.7490237951278687e-05, 2.105720341205597e-05, 2.4624168872833252e-05, 2.8191134333610535e-05, 3.175809979438782e-05, 3.53250652551651e-05, 3.889203071594238e-05, 4.2458996176719666e-05, 4.602596163749695e-05, 4.959292709827423e-05, 5.3159892559051514e-05, 5.6726858019828796e-05, 6.029382348060608e-05, 6.386078894138336e-05, 6.742775440216064e-05, 7.099471986293793e-05, 7.456168532371521e-05, 7.812865078449249e-05, 8.169561624526978e-05, 8.526258170604706e-05, 8.882954716682434e-05, 9.239651262760162e-05, 9.59634780883789e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 0.0, 8.0, 8.0, 9.0, 10.0, 15.0, 32.0, 54.0, 83.0, 173.0, 257.0, 686.0, 2007.0, 8895.0, 135885.0, 870459.0, 24248.0, 3801.0, 1047.0, 425.0, 187.0, 97.0, 52.0, 38.0, 25.0, 19.0, 10.0, 9.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.87939453125, -0.8551254272460938, -0.8308563232421875, -0.8065872192382812, -0.782318115234375, -0.7580490112304688, -0.7337799072265625, -0.7095108032226562, -0.68524169921875, -0.6609725952148438, -0.6367034912109375, -0.6124343872070312, -0.588165283203125, -0.5638961791992188, -0.5396270751953125, -0.5153579711914062, -0.4910888671875, -0.46681976318359375, -0.4425506591796875, -0.41828155517578125, -0.394012451171875, -0.36974334716796875, -0.3454742431640625, -0.32120513916015625, -0.29693603515625, -0.27266693115234375, -0.2483978271484375, -0.22412872314453125, -0.199859619140625, -0.17559051513671875, -0.1513214111328125, -0.12705230712890625, -0.102783203125, -0.07851409912109375, -0.0542449951171875, -0.02997589111328125, -0.005706787109375, 0.01856231689453125, 0.0428314208984375, 0.06710052490234375, 0.09136962890625, 0.11563873291015625, 0.1399078369140625, 0.16417694091796875, 0.188446044921875, 0.21271514892578125, 0.2369842529296875, 0.26125335693359375, 0.2855224609375, 0.30979156494140625, 0.3340606689453125, 0.35832977294921875, 0.382598876953125, 0.40686798095703125, 0.4311370849609375, 0.45540618896484375, 0.47967529296875, 0.5039443969726562, 0.5282135009765625, 0.5524826049804688, 0.576751708984375, 0.6010208129882812, 0.6252899169921875, 0.6495590209960938, 0.673828125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 9.0, 13.0, 15.0, 22.0, 30.0, 34.0, 47.0, 61.0, 83.0, 108.0, 99.0, 105.0, 98.0, 78.0, 62.0, 37.0, 21.0, 13.0, 13.0, 9.0, 11.0, 8.0, 3.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.54296875, -0.5287208557128906, -0.5144729614257812, -0.5002250671386719, -0.4859771728515625, -0.4717292785644531, -0.45748138427734375, -0.4432334899902344, -0.428985595703125, -0.4147377014160156, -0.40048980712890625, -0.3862419128417969, -0.3719940185546875, -0.3577461242675781, -0.34349822998046875, -0.3292503356933594, -0.31500244140625, -0.3007545471191406, -0.28650665283203125, -0.2722587585449219, -0.2580108642578125, -0.24376296997070312, -0.22951507568359375, -0.21526718139648438, -0.201019287109375, -0.18677139282226562, -0.17252349853515625, -0.15827560424804688, -0.1440277099609375, -0.12977981567382812, -0.11553192138671875, -0.10128402709960938, -0.0870361328125, -0.07278823852539062, -0.05854034423828125, -0.044292449951171875, -0.0300445556640625, -0.015796661376953125, -0.00154876708984375, 0.012699127197265625, 0.026947021484375, 0.041194915771484375, 0.05544281005859375, 0.06969070434570312, 0.0839385986328125, 0.09818649291992188, 0.11243438720703125, 0.12668228149414062, 0.14093017578125, 0.15517807006835938, 0.16942596435546875, 0.18367385864257812, 0.1979217529296875, 0.21216964721679688, 0.22641754150390625, 0.24066543579101562, 0.254913330078125, 0.2691612243652344, 0.28340911865234375, 0.2976570129394531, 0.3119049072265625, 0.3261528015136719, 0.34040069580078125, 0.3546485900878906, 0.368896484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 9.0, 15.0, 31.0, 72.0, 110.0, 196.0, 250.0, 134.0, 75.0, 35.0, 25.0, 15.0, 9.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.048914909362793, -5.83397102355957, -5.619027137756348, -5.404083251953125, -5.189139366149902, -4.97419548034668, -4.759251594543457, -4.544307708740234, -4.329363822937012, -4.114419937133789, -3.8994760513305664, -3.6845321655273438, -3.469588279724121, -3.2546443939208984, -3.0397002696990967, -2.824756383895874, -2.6098122596740723, -2.3948683738708496, -2.179924488067627, -1.9649804830551147, -1.750036597251892, -1.5350927114486694, -1.3201487064361572, -1.1052048206329346, -0.8902609348297119, -0.6753170490264893, -0.4603731036186218, -0.2454291582107544, -0.03048527240753174, 0.18445861339569092, 0.3994026184082031, 0.6143465042114258, 0.8292899131774902, 1.044233798980713, 1.2591776847839355, 1.4741216897964478, 1.6890655755996704, 1.904009461402893, 2.1189534664154053, 2.333897352218628, 2.5488412380218506, 2.7637851238250732, 2.978729009628296, 3.1936731338500977, 3.4086170196533203, 3.623560905456543, 3.8385047912597656, 4.053448677062988, 4.268392562866211, 4.483336448669434, 4.698280334472656, 4.913224220275879, 5.128168106079102, 5.343111991882324, 5.558055877685547, 5.7729997634887695, 5.987943649291992, 6.202887535095215, 6.4178314208984375, 6.63277530670166, 6.847719192504883, 7.0626630783081055, 7.277606964111328, 7.492550849914551, 7.707495212554932]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 3.0, 4.0, 13.0, 5.0, 9.0, 21.0, 15.0, 19.0, 25.0, 25.0, 23.0, 34.0, 39.0, 40.0, 37.0, 42.0, 40.0, 57.0, 65.0, 56.0, 37.0, 54.0, 37.0, 29.0, 40.0, 39.0, 32.0, 20.0, 14.0, 20.0, 13.0, 15.0, 16.0, 15.0, 9.0, 9.0, 10.0, 7.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.35766339302063, -3.2456111907958984, -3.133558988571167, -3.0215067863464355, -2.909454822540283, -2.7974026203155518, -2.6853504180908203, -2.573298215866089, -2.4612460136413574, -2.349193811416626, -2.2371416091918945, -2.125089645385742, -2.0130374431610107, -1.9009852409362793, -1.7889330387115479, -1.6768808364868164, -1.564828872680664, -1.4527766704559326, -1.3407245874404907, -1.2286723852157593, -1.1166203022003174, -1.004568099975586, -0.8925158977508545, -0.7804637551307678, -0.6684116125106812, -0.5563594698905945, -0.4443072974681854, -0.33225512504577637, -0.2202029824256897, -0.10815083980560303, 0.003901362419128418, 0.11595350503921509, 0.22800588607788086, 0.34005802869796753, 0.4521102011203766, 0.5641623735427856, 0.6762145161628723, 0.788266658782959, 0.9003188610076904, 1.0123710632324219, 1.1244231462478638, 1.2364753484725952, 1.348527431488037, 1.4605796337127686, 1.5726318359375, 1.684683918952942, 1.7967361211776733, 1.9087882041931152, 2.0208404064178467, 2.132892608642578, 2.2449448108673096, 2.356997013092041, 2.4690489768981934, 2.581101179122925, 2.6931533813476562, 2.8052055835723877, 2.917257785797119, 3.0293099880218506, 3.141362190246582, 3.2534141540527344, 3.365466356277466, 3.4775185585021973, 3.5895707607269287, 3.70162296295166, 3.8136749267578125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 13.0, 13.0, 15.0, 29.0, 49.0, 79.0, 157.0, 317.0, 726.0, 1666.0, 4762.0, 17324.0, 111431.0, 2894953.0, 1092376.0, 54001.0, 10574.0, 3231.0, 1248.0, 573.0, 282.0, 196.0, 91.0, 47.0, 37.0, 14.0, 23.0, 14.0, 16.0, 3.0, 5.0, 1.0, 1.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.33251953125, -0.3191375732421875, -0.305755615234375, -0.2923736572265625, -0.27899169921875, -0.2656097412109375, -0.252227783203125, -0.2388458251953125, -0.2254638671875, -0.2120819091796875, -0.198699951171875, -0.1853179931640625, -0.17193603515625, -0.1585540771484375, -0.145172119140625, -0.1317901611328125, -0.118408203125, -0.1050262451171875, -0.091644287109375, -0.0782623291015625, -0.06488037109375, -0.0514984130859375, -0.038116455078125, -0.0247344970703125, -0.0113525390625, 0.0020294189453125, 0.015411376953125, 0.0287933349609375, 0.04217529296875, 0.0555572509765625, 0.068939208984375, 0.0823211669921875, 0.095703125, 0.1090850830078125, 0.122467041015625, 0.1358489990234375, 0.14923095703125, 0.1626129150390625, 0.175994873046875, 0.1893768310546875, 0.2027587890625, 0.2161407470703125, 0.229522705078125, 0.2429046630859375, 0.25628662109375, 0.2696685791015625, 0.283050537109375, 0.2964324951171875, 0.309814453125, 0.3231964111328125, 0.336578369140625, 0.3499603271484375, 0.36334228515625, 0.3767242431640625, 0.390106201171875, 0.4034881591796875, 0.4168701171875, 0.4302520751953125, 0.443634033203125, 0.4570159912109375, 0.47039794921875, 0.4837799072265625, 0.497161865234375, 0.5105438232421875, 0.52392578125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 2.0, 4.0, 4.0, 14.0, 13.0, 12.0, 16.0, 30.0, 30.0, 36.0, 49.0, 53.0, 53.0, 70.0, 62.0, 65.0, 55.0, 74.0, 65.0, 56.0, 37.0, 47.0, 31.0, 27.0, 25.0, 15.0, 15.0, 13.0, 8.0, 5.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.186279296875, -0.17932510375976562, -0.17237091064453125, -0.16541671752929688, -0.1584625244140625, -0.15150833129882812, -0.14455413818359375, -0.13759994506835938, -0.130645751953125, -0.12369155883789062, -0.11673736572265625, -0.10978317260742188, -0.1028289794921875, -0.09587478637695312, -0.08892059326171875, -0.08196640014648438, -0.07501220703125, -0.06805801391601562, -0.06110382080078125, -0.054149627685546875, -0.0471954345703125, -0.040241241455078125, -0.03328704833984375, -0.026332855224609375, -0.019378662109375, -0.012424468994140625, -0.00547027587890625, 0.001483917236328125, 0.0084381103515625, 0.015392303466796875, 0.02234649658203125, 0.029300689697265625, 0.0362548828125, 0.043209075927734375, 0.05016326904296875, 0.057117462158203125, 0.0640716552734375, 0.07102584838867188, 0.07798004150390625, 0.08493423461914062, 0.091888427734375, 0.09884262084960938, 0.10579681396484375, 0.11275100708007812, 0.1197052001953125, 0.12665939331054688, 0.13361358642578125, 0.14056777954101562, 0.14752197265625, 0.15447616577148438, 0.16143035888671875, 0.16838455200195312, 0.1753387451171875, 0.18229293823242188, 0.18924713134765625, 0.19620132446289062, 0.203155517578125, 0.21010971069335938, 0.21706390380859375, 0.22401809692382812, 0.2309722900390625, 0.23792648315429688, 0.24488067626953125, 0.2518348693847656, 0.2587890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 9.0, 7.0, 15.0, 14.0, 34.0, 37.0, 64.0, 104.0, 144.0, 256.0, 497.0, 1019.0, 2422.0, 7580.0, 34120.0, 324734.0, 3518839.0, 265292.0, 29104.0, 6101.0, 1956.0, 816.0, 461.0, 241.0, 125.0, 110.0, 53.0, 32.0, 22.0, 16.0, 9.0, 10.0, 7.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4140625, -0.39898681640625, -0.3839111328125, -0.36883544921875, -0.353759765625, -0.33868408203125, -0.3236083984375, -0.30853271484375, -0.29345703125, -0.27838134765625, -0.2633056640625, -0.24822998046875, -0.233154296875, -0.21807861328125, -0.2030029296875, -0.18792724609375, -0.1728515625, -0.15777587890625, -0.1427001953125, -0.12762451171875, -0.112548828125, -0.09747314453125, -0.0823974609375, -0.06732177734375, -0.05224609375, -0.03717041015625, -0.0220947265625, -0.00701904296875, 0.008056640625, 0.02313232421875, 0.0382080078125, 0.05328369140625, 0.068359375, 0.08343505859375, 0.0985107421875, 0.11358642578125, 0.128662109375, 0.14373779296875, 0.1588134765625, 0.17388916015625, 0.18896484375, 0.20404052734375, 0.2191162109375, 0.23419189453125, 0.249267578125, 0.26434326171875, 0.2794189453125, 0.29449462890625, 0.3095703125, 0.32464599609375, 0.3397216796875, 0.35479736328125, 0.369873046875, 0.38494873046875, 0.4000244140625, 0.41510009765625, 0.43017578125, 0.44525146484375, 0.4603271484375, 0.47540283203125, 0.490478515625, 0.50555419921875, 0.5206298828125, 0.53570556640625, 0.55078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 2.0, 6.0, 8.0, 14.0, 23.0, 38.0, 47.0, 76.0, 115.0, 215.0, 392.0, 913.0, 1033.0, 534.0, 272.0, 140.0, 71.0, 58.0, 34.0, 28.0, 20.0, 8.0, 10.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66015625, -0.6413803100585938, -0.6226043701171875, -0.6038284301757812, -0.585052490234375, -0.5662765502929688, -0.5475006103515625, -0.5287246704101562, -0.50994873046875, -0.49117279052734375, -0.4723968505859375, -0.45362091064453125, -0.434844970703125, -0.41606903076171875, -0.3972930908203125, -0.37851715087890625, -0.3597412109375, -0.34096527099609375, -0.3221893310546875, -0.30341339111328125, -0.284637451171875, -0.26586151123046875, -0.2470855712890625, -0.22830963134765625, -0.20953369140625, -0.19075775146484375, -0.1719818115234375, -0.15320587158203125, -0.134429931640625, -0.11565399169921875, -0.0968780517578125, -0.07810211181640625, -0.059326171875, -0.04055023193359375, -0.0217742919921875, -0.00299835205078125, 0.015777587890625, 0.03455352783203125, 0.0533294677734375, 0.07210540771484375, 0.09088134765625, 0.10965728759765625, 0.1284332275390625, 0.14720916748046875, 0.165985107421875, 0.18476104736328125, 0.2035369873046875, 0.22231292724609375, 0.2410888671875, 0.25986480712890625, 0.2786407470703125, 0.29741668701171875, 0.316192626953125, 0.33496856689453125, 0.3537445068359375, 0.37252044677734375, 0.39129638671875, 0.41007232666015625, 0.4288482666015625, 0.44762420654296875, 0.466400146484375, 0.48517608642578125, 0.5039520263671875, 0.5227279663085938, 0.54150390625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 6.0, 3.0, 6.0, 26.0, 64.0, 161.0, 313.0, 258.0, 102.0, 31.0, 11.0, 8.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.21705961227417, -5.012783527374268, -4.808507919311523, -4.604231834411621, -4.399955749511719, -4.195680141448975, -3.9914040565490723, -3.787128210067749, -3.582852363586426, -3.3785765171051025, -3.1743004322052, -2.970024585723877, -2.7657487392425537, -2.5614728927612305, -2.357196807861328, -2.152920961380005, -1.9486448764801025, -1.7443689107894897, -1.5400930643081665, -1.3358170986175537, -1.1315412521362305, -0.9272652864456177, -0.7229893207550049, -0.5187134742736816, -0.31443750858306885, -0.11016158759593964, 0.09411433339118958, 0.29839026927948, 0.502666175365448, 0.706942081451416, 0.9112180471420288, 1.115493893623352, 1.3197698593139648, 1.5240458250045776, 1.7283216714859009, 1.9325976371765137, 2.136873483657837, 2.34114933013916, 2.5454254150390625, 2.7497012615203857, 2.953977108001709, 3.1582529544830322, 3.3625290393829346, 3.566804885864258, 3.771080732345581, 3.9753565788269043, 4.179632663726807, 4.383908271789551, 4.588184356689453, 4.7924604415893555, 4.9967360496521, 5.201012134552002, 5.405288219451904, 5.609563827514648, 5.813839912414551, 6.018115997314453, 6.2223920822143555, 6.426668167114258, 6.630943775177002, 6.835219860076904, 7.039495944976807, 7.243771553039551, 7.448047637939453, 7.6523237228393555, 7.8565993309021]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 8.0, 3.0, 8.0, 11.0, 10.0, 10.0, 15.0, 19.0, 17.0, 16.0, 25.0, 26.0, 34.0, 30.0, 37.0, 33.0, 45.0, 54.0, 42.0, 59.0, 49.0, 44.0, 38.0, 45.0, 43.0, 36.0, 39.0, 28.0, 32.0, 24.0, 25.0, 19.0, 16.0, 14.0, 8.0, 11.0, 5.0, 7.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.229215621948242, -2.1623589992523193, -2.0955023765563965, -2.0286459922790527, -1.9617893695831299, -1.894932746887207, -1.8280762434005737, -1.7612197399139404, -1.6943631172180176, -1.6275064945220947, -1.5606499910354614, -1.4937934875488281, -1.4269368648529053, -1.3600802421569824, -1.2932237386703491, -1.2263672351837158, -1.159510612487793, -1.0926539897918701, -1.0257974863052368, -0.9589409232139587, -0.8920843601226807, -0.8252277970314026, -0.7583712339401245, -0.6915146708488464, -0.6246581077575684, -0.5578015446662903, -0.4909449815750122, -0.42408841848373413, -0.35723185539245605, -0.290375292301178, -0.2235187292098999, -0.15666216611862183, -0.08980584144592285, -0.022949278354644775, 0.0439072847366333, 0.11076384782791138, 0.17762041091918945, 0.24447697401046753, 0.3113335371017456, 0.3781901001930237, 0.44504666328430176, 0.5119032263755798, 0.5787597894668579, 0.645616352558136, 0.7124729156494141, 0.7793294787406921, 0.8461860418319702, 0.9130426049232483, 0.9798991680145264, 1.0467557907104492, 1.1136122941970825, 1.1804687976837158, 1.2473254203796387, 1.3141820430755615, 1.3810385465621948, 1.4478950500488281, 1.514751672744751, 1.5816082954406738, 1.6484647989273071, 1.7153213024139404, 1.7821779251098633, 1.8490345478057861, 1.9158910512924194, 1.9827475547790527, 2.0496041774749756]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 8.0, 9.0, 20.0, 28.0, 47.0, 84.0, 131.0, 237.0, 472.0, 970.0, 2544.0, 6826.0, 23086.0, 99484.0, 492421.0, 334327.0, 63401.0, 15831.0, 5059.0, 1867.0, 799.0, 400.0, 208.0, 96.0, 66.0, 45.0, 21.0, 16.0, 13.0, 13.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5927734375, -0.5735626220703125, -0.554351806640625, -0.5351409912109375, -0.51593017578125, -0.4967193603515625, -0.477508544921875, -0.4582977294921875, -0.4390869140625, -0.4198760986328125, -0.400665283203125, -0.3814544677734375, -0.36224365234375, -0.3430328369140625, -0.323822021484375, -0.3046112060546875, -0.285400390625, -0.2661895751953125, -0.246978759765625, -0.2277679443359375, -0.20855712890625, -0.1893463134765625, -0.170135498046875, -0.1509246826171875, -0.1317138671875, -0.1125030517578125, -0.093292236328125, -0.0740814208984375, -0.05487060546875, -0.0356597900390625, -0.016448974609375, 0.0027618408203125, 0.02197265625, 0.0411834716796875, 0.060394287109375, 0.0796051025390625, 0.09881591796875, 0.1180267333984375, 0.137237548828125, 0.1564483642578125, 0.1756591796875, 0.1948699951171875, 0.214080810546875, 0.2332916259765625, 0.25250244140625, 0.2717132568359375, 0.290924072265625, 0.3101348876953125, 0.329345703125, 0.3485565185546875, 0.367767333984375, 0.3869781494140625, 0.40618896484375, 0.4253997802734375, 0.444610595703125, 0.4638214111328125, 0.4830322265625, 0.5022430419921875, 0.521453857421875, 0.5406646728515625, 0.55987548828125, 0.5790863037109375, 0.598297119140625, 0.6175079345703125, 0.63671875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 3.0, 5.0, 4.0, 9.0, 18.0, 15.0, 22.0, 35.0, 36.0, 37.0, 51.0, 55.0, 62.0, 48.0, 62.0, 60.0, 75.0, 56.0, 68.0, 54.0, 44.0, 34.0, 33.0, 26.0, 17.0, 17.0, 15.0, 13.0, 7.0, 4.0, 7.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1907958984375, -0.18406295776367188, -0.17733001708984375, -0.17059707641601562, -0.1638641357421875, -0.15713119506835938, -0.15039825439453125, -0.14366531372070312, -0.136932373046875, -0.13019943237304688, -0.12346649169921875, -0.11673355102539062, -0.1100006103515625, -0.10326766967773438, -0.09653472900390625, -0.08980178833007812, -0.08306884765625, -0.07633590698242188, -0.06960296630859375, -0.06287002563476562, -0.0561370849609375, -0.049404144287109375, -0.04267120361328125, -0.035938262939453125, -0.029205322265625, -0.022472381591796875, -0.01573944091796875, -0.009006500244140625, -0.0022735595703125, 0.004459381103515625, 0.01119232177734375, 0.017925262451171875, 0.024658203125, 0.031391143798828125, 0.03812408447265625, 0.044857025146484375, 0.0515899658203125, 0.058322906494140625, 0.06505584716796875, 0.07178878784179688, 0.078521728515625, 0.08525466918945312, 0.09198760986328125, 0.09872055053710938, 0.1054534912109375, 0.11218643188476562, 0.11891937255859375, 0.12565231323242188, 0.13238525390625, 0.13911819458007812, 0.14585113525390625, 0.15258407592773438, 0.1593170166015625, 0.16604995727539062, 0.17278289794921875, 0.17951583862304688, 0.186248779296875, 0.19298171997070312, 0.19971466064453125, 0.20644760131835938, 0.2131805419921875, 0.21991348266601562, 0.22664642333984375, 0.23337936401367188, 0.2401123046875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 4.0, 15.0, 4.0, 26.0, 26.0, 55.0, 87.0, 138.0, 270.0, 604.0, 1554.0, 6946.0, 88050.0, 904599.0, 39638.0, 4354.0, 1174.0, 490.0, 189.0, 121.0, 68.0, 50.0, 22.0, 24.0, 11.0, 10.0, 10.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.576171875, -1.5316162109375, -1.487060546875, -1.4425048828125, -1.39794921875, -1.3533935546875, -1.308837890625, -1.2642822265625, -1.2197265625, -1.1751708984375, -1.130615234375, -1.0860595703125, -1.04150390625, -0.9969482421875, -0.952392578125, -0.9078369140625, -0.86328125, -0.8187255859375, -0.774169921875, -0.7296142578125, -0.68505859375, -0.6405029296875, -0.595947265625, -0.5513916015625, -0.5068359375, -0.4622802734375, -0.417724609375, -0.3731689453125, -0.32861328125, -0.2840576171875, -0.239501953125, -0.1949462890625, -0.150390625, -0.1058349609375, -0.061279296875, -0.0167236328125, 0.02783203125, 0.0723876953125, 0.116943359375, 0.1614990234375, 0.2060546875, 0.2506103515625, 0.295166015625, 0.3397216796875, 0.38427734375, 0.4288330078125, 0.473388671875, 0.5179443359375, 0.5625, 0.6070556640625, 0.651611328125, 0.6961669921875, 0.74072265625, 0.7852783203125, 0.829833984375, 0.8743896484375, 0.9189453125, 0.9635009765625, 1.008056640625, 1.0526123046875, 1.09716796875, 1.1417236328125, 1.186279296875, 1.2308349609375, 1.275390625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 7.0, 4.0, 5.0, 4.0, 4.0, 9.0, 11.0, 6.0, 11.0, 15.0, 17.0, 28.0, 31.0, 44.0, 44.0, 45.0, 54.0, 73.0, 74.0, 61.0, 79.0, 43.0, 63.0, 48.0, 40.0, 40.0, 33.0, 28.0, 12.0, 20.0, 6.0, 10.0, 12.0, 8.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0185546875, -0.9913482666015625, -0.964141845703125, -0.9369354248046875, -0.90972900390625, -0.8825225830078125, -0.855316162109375, -0.8281097412109375, -0.8009033203125, -0.7736968994140625, -0.746490478515625, -0.7192840576171875, -0.69207763671875, -0.6648712158203125, -0.637664794921875, -0.6104583740234375, -0.583251953125, -0.5560455322265625, -0.528839111328125, -0.5016326904296875, -0.47442626953125, -0.4472198486328125, -0.420013427734375, -0.3928070068359375, -0.3656005859375, -0.3383941650390625, -0.311187744140625, -0.2839813232421875, -0.25677490234375, -0.2295684814453125, -0.202362060546875, -0.1751556396484375, -0.14794921875, -0.1207427978515625, -0.093536376953125, -0.0663299560546875, -0.03912353515625, -0.0119171142578125, 0.015289306640625, 0.0424957275390625, 0.0697021484375, 0.0969085693359375, 0.124114990234375, 0.1513214111328125, 0.17852783203125, 0.2057342529296875, 0.232940673828125, 0.2601470947265625, 0.287353515625, 0.3145599365234375, 0.341766357421875, 0.3689727783203125, 0.39617919921875, 0.4233856201171875, 0.450592041015625, 0.4777984619140625, 0.5050048828125, 0.5322113037109375, 0.559417724609375, 0.5866241455078125, 0.61383056640625, 0.6410369873046875, 0.668243408203125, 0.6954498291015625, 0.72265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 2.0, 4.0, 5.0, 8.0, 15.0, 19.0, 35.0, 47.0, 81.0, 157.0, 377.0, 1017.0, 4009.0, 40631.0, 920899.0, 73268.0, 5811.0, 1293.0, 453.0, 174.0, 98.0, 57.0, 33.0, 24.0, 11.0, 3.0, 6.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66064453125, -0.6397323608398438, -0.6188201904296875, -0.5979080200195312, -0.576995849609375, -0.5560836791992188, -0.5351715087890625, -0.5142593383789062, -0.49334716796875, -0.47243499755859375, -0.4515228271484375, -0.43061065673828125, -0.409698486328125, -0.38878631591796875, -0.3678741455078125, -0.34696197509765625, -0.3260498046875, -0.30513763427734375, -0.2842254638671875, -0.26331329345703125, -0.242401123046875, -0.22148895263671875, -0.2005767822265625, -0.17966461181640625, -0.15875244140625, -0.13784027099609375, -0.1169281005859375, -0.09601593017578125, -0.075103759765625, -0.05419158935546875, -0.0332794189453125, -0.01236724853515625, 0.008544921875, 0.02945709228515625, 0.0503692626953125, 0.07128143310546875, 0.092193603515625, 0.11310577392578125, 0.1340179443359375, 0.15493011474609375, 0.17584228515625, 0.19675445556640625, 0.2176666259765625, 0.23857879638671875, 0.259490966796875, 0.28040313720703125, 0.3013153076171875, 0.32222747802734375, 0.3431396484375, 0.36405181884765625, 0.3849639892578125, 0.40587615966796875, 0.426788330078125, 0.44770050048828125, 0.4686126708984375, 0.48952484130859375, 0.51043701171875, 0.5313491821289062, 0.5522613525390625, 0.5731735229492188, 0.594085693359375, 0.6149978637695312, 0.6359100341796875, 0.6568222045898438, 0.677734375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 6.0, 9.0, 6.0, 13.0, 16.0, 17.0, 23.0, 37.0, 39.0, 53.0, 70.0, 117.0, 144.0, 142.0, 76.0, 54.0, 36.0, 29.0, 20.0, 16.0, 17.0, 12.0, 11.0, 6.0, 8.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.910894393920898e-05, -8.535105735063553e-05, -8.159317076206207e-05, -7.783528417348862e-05, -7.407739758491516e-05, -7.03195109963417e-05, -6.656162440776825e-05, -6.28037378191948e-05, -5.904585123062134e-05, -5.528796464204788e-05, -5.1530078053474426e-05, -4.777219146490097e-05, -4.4014304876327515e-05, -4.025641828775406e-05, -3.64985316991806e-05, -3.274064511060715e-05, -2.898275852203369e-05, -2.5224871933460236e-05, -2.146698534488678e-05, -1.7709098756313324e-05, -1.3951212167739868e-05, -1.0193325579166412e-05, -6.4354389905929565e-06, -2.6775524020195007e-06, 1.080334186553955e-06, 4.838220775127411e-06, 8.596107363700867e-06, 1.2353993952274323e-05, 1.611188054084778e-05, 1.9869767129421234e-05, 2.362765371799469e-05, 2.7385540306568146e-05, 3.11434268951416e-05, 3.490131348371506e-05, 3.865920007228851e-05, 4.241708666086197e-05, 4.6174973249435425e-05, 4.993285983800888e-05, 5.3690746426582336e-05, 5.744863301515579e-05, 6.120651960372925e-05, 6.49644061923027e-05, 6.872229278087616e-05, 7.248017936944962e-05, 7.623806595802307e-05, 7.999595254659653e-05, 8.375383913516998e-05, 8.751172572374344e-05, 9.12696123123169e-05, 9.502749890089035e-05, 9.87853854894638e-05, 0.00010254327207803726, 0.00010630115866661072, 0.00011005904525518417, 0.00011381693184375763, 0.00011757481843233109, 0.00012133270502090454, 0.000125090591609478, 0.00012884847819805145, 0.0001326063647866249, 0.00013636425137519836, 0.00014012213796377182, 0.00014388002455234528, 0.00014763791114091873, 0.0001513957977294922]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 3.0, 5.0, 7.0, 18.0, 25.0, 41.0, 67.0, 106.0, 229.0, 407.0, 978.0, 3479.0, 19025.0, 522602.0, 477111.0, 19075.0, 3493.0, 964.0, 431.0, 221.0, 107.0, 51.0, 36.0, 20.0, 14.0, 8.0, 9.0, 6.0, 8.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64404296875, -0.625640869140625, -0.60723876953125, -0.588836669921875, -0.5704345703125, -0.552032470703125, -0.53363037109375, -0.515228271484375, -0.496826171875, -0.478424072265625, -0.46002197265625, -0.441619873046875, -0.4232177734375, -0.404815673828125, -0.38641357421875, -0.368011474609375, -0.349609375, -0.331207275390625, -0.31280517578125, -0.294403076171875, -0.2760009765625, -0.257598876953125, -0.23919677734375, -0.220794677734375, -0.202392578125, -0.183990478515625, -0.16558837890625, -0.147186279296875, -0.1287841796875, -0.110382080078125, -0.09197998046875, -0.073577880859375, -0.05517578125, -0.036773681640625, -0.01837158203125, 3.0517578125e-05, 0.0184326171875, 0.036834716796875, 0.05523681640625, 0.073638916015625, 0.092041015625, 0.110443115234375, 0.12884521484375, 0.147247314453125, 0.1656494140625, 0.184051513671875, 0.20245361328125, 0.220855712890625, 0.2392578125, 0.257659912109375, 0.27606201171875, 0.294464111328125, 0.3128662109375, 0.331268310546875, 0.34967041015625, 0.368072509765625, 0.386474609375, 0.404876708984375, 0.42327880859375, 0.441680908203125, 0.4600830078125, 0.478485107421875, 0.49688720703125, 0.515289306640625, 0.53369140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 7.0, 6.0, 10.0, 8.0, 14.0, 13.0, 9.0, 21.0, 30.0, 39.0, 54.0, 81.0, 106.0, 136.0, 121.0, 92.0, 77.0, 46.0, 23.0, 23.0, 22.0, 13.0, 10.0, 9.0, 5.0, 6.0, 3.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322021484375, -0.3099098205566406, -0.29779815673828125, -0.2856864929199219, -0.2735748291015625, -0.2614631652832031, -0.24935150146484375, -0.23723983764648438, -0.225128173828125, -0.21301651000976562, -0.20090484619140625, -0.18879318237304688, -0.1766815185546875, -0.16456985473632812, -0.15245819091796875, -0.14034652709960938, -0.12823486328125, -0.11612319946289062, -0.10401153564453125, -0.09189987182617188, -0.0797882080078125, -0.06767654418945312, -0.05556488037109375, -0.043453216552734375, -0.031341552734375, -0.019229888916015625, -0.00711822509765625, 0.004993438720703125, 0.0171051025390625, 0.029216766357421875, 0.04132843017578125, 0.053440093994140625, 0.0655517578125, 0.07766342163085938, 0.08977508544921875, 0.10188674926757812, 0.1139984130859375, 0.12611007690429688, 0.13822174072265625, 0.15033340454101562, 0.162445068359375, 0.17455673217773438, 0.18666839599609375, 0.19878005981445312, 0.2108917236328125, 0.22300338745117188, 0.23511505126953125, 0.24722671508789062, 0.25933837890625, 0.2714500427246094, 0.28356170654296875, 0.2956733703613281, 0.3077850341796875, 0.3198966979980469, 0.33200836181640625, 0.3441200256347656, 0.356231689453125, 0.3683433532714844, 0.38045501708984375, 0.3925666809082031, 0.4046783447265625, 0.4167900085449219, 0.42890167236328125, 0.4410133361816406, 0.453125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 0.0, 2.0, 2.0, 8.0, 17.0, 43.0, 66.0, 119.0, 197.0, 251.0, 156.0, 70.0, 28.0, 15.0, 9.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.248492240905762, -7.053330421447754, -6.858168125152588, -6.66300630569458, -6.467844009399414, -6.272682189941406, -6.077520370483398, -5.882358551025391, -5.687196254730225, -5.492034435272217, -5.296872138977051, -5.101710319519043, -4.906548500061035, -4.711386203765869, -4.516224384307861, -4.321062088012695, -4.1259002685546875, -3.9307382106781006, -3.7355761528015137, -3.540414333343506, -3.345252275466919, -3.150090217590332, -2.954928398132324, -2.7597663402557373, -2.5646042823791504, -2.3694422245025635, -2.1742801666259766, -1.9791183471679688, -1.7839562892913818, -1.588794231414795, -1.3936322927474976, -1.1984703540802002, -1.0033082962036133, -0.8081462979316711, -0.612984299659729, -0.41782230138778687, -0.22266030311584473, -0.027498304843902588, 0.16766369342803955, 0.3628256320953369, 0.5579876899719238, 0.753149688243866, 0.9483116865158081, 1.1434736251831055, 1.3386356830596924, 1.5337977409362793, 1.7289596796035767, 1.924121618270874, 2.119283676147461, 2.314445734024048, 2.5096077919006348, 2.7047696113586426, 2.8999316692352295, 3.0950937271118164, 3.290255546569824, 3.485417604446411, 3.680579662322998, 3.875741720199585, 4.070903778076172, 4.26606559753418, 4.4612274169921875, 4.6563897132873535, 4.851551532745361, 5.046713829040527, 5.241875648498535]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 8.0, 13.0, 6.0, 13.0, 10.0, 10.0, 20.0, 35.0, 32.0, 36.0, 43.0, 41.0, 69.0, 80.0, 66.0, 61.0, 72.0, 60.0, 46.0, 46.0, 28.0, 39.0, 34.0, 28.0, 22.0, 18.0, 17.0, 12.0, 5.0, 12.0, 3.0, 4.0, 3.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5050852298736572, -3.396188735961914, -3.287292242050171, -3.1783957481384277, -3.0694992542266846, -2.9606027603149414, -2.8517065048217773, -2.742809772491455, -2.633913516998291, -2.525017023086548, -2.4161205291748047, -2.3072240352630615, -2.1983275413513184, -2.089431047439575, -1.9805346727371216, -1.8716381788253784, -1.7627415657043457, -1.6538450717926025, -1.5449485778808594, -1.4360520839691162, -1.327155590057373, -1.2182590961456299, -1.1093627214431763, -1.000466227531433, -0.8915697336196899, -0.7826732397079468, -0.6737767457962036, -0.5648803114891052, -0.45598381757736206, -0.3470873236656189, -0.2381908893585205, -0.12929439544677734, -0.020397663116455078, 0.08849881589412689, 0.19739529490470886, 0.30629175901412964, 0.4151882529258728, 0.524084746837616, 0.6329811811447144, 0.7418776750564575, 0.8507741689682007, 0.9596706628799438, 1.068567156791687, 1.1774635314941406, 1.2863600254058838, 1.395256519317627, 1.5041530132293701, 1.6130495071411133, 1.7219460010528564, 1.8308424949645996, 1.9397389888763428, 2.048635482788086, 2.157531976699829, 2.2664284706115723, 2.3753247261047363, 2.4842214584350586, 2.5931177139282227, 2.702014207839966, 2.810910701751709, 2.919807195663452, 3.0287036895751953, 3.1376001834869385, 3.2464966773986816, 3.3553929328918457, 3.464289665222168]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 10.0, 17.0, 14.0, 23.0, 48.0, 71.0, 117.0, 250.0, 512.0, 1323.0, 3936.0, 17400.0, 344443.0, 3757122.0, 56495.0, 8276.0, 2429.0, 902.0, 398.0, 168.0, 107.0, 66.0, 41.0, 20.0, 28.0, 12.0, 11.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.552734375, -0.5338516235351562, -0.5149688720703125, -0.49608612060546875, -0.477203369140625, -0.45832061767578125, -0.4394378662109375, -0.42055511474609375, -0.40167236328125, -0.38278961181640625, -0.3639068603515625, -0.34502410888671875, -0.326141357421875, -0.30725860595703125, -0.2883758544921875, -0.26949310302734375, -0.2506103515625, -0.23172760009765625, -0.2128448486328125, -0.19396209716796875, -0.175079345703125, -0.15619659423828125, -0.1373138427734375, -0.11843109130859375, -0.09954833984375, -0.08066558837890625, -0.0617828369140625, -0.04290008544921875, -0.024017333984375, -0.00513458251953125, 0.0137481689453125, 0.03263092041015625, 0.051513671875, 0.07039642333984375, 0.0892791748046875, 0.10816192626953125, 0.127044677734375, 0.14592742919921875, 0.1648101806640625, 0.18369293212890625, 0.20257568359375, 0.22145843505859375, 0.2403411865234375, 0.25922393798828125, 0.278106689453125, 0.29698944091796875, 0.3158721923828125, 0.33475494384765625, 0.3536376953125, 0.37252044677734375, 0.3914031982421875, 0.41028594970703125, 0.429168701171875, 0.44805145263671875, 0.4669342041015625, 0.48581695556640625, 0.50469970703125, 0.5235824584960938, 0.5424652099609375, 0.5613479614257812, 0.580230712890625, 0.5991134643554688, 0.6179962158203125, 0.6368789672851562, 0.65576171875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 13.0, 23.0, 31.0, 52.0, 63.0, 73.0, 97.0, 96.0, 89.0, 112.0, 103.0, 66.0, 55.0, 46.0, 41.0, 12.0, 10.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.396484375, -0.3861656188964844, -0.37584686279296875, -0.3655281066894531, -0.3552093505859375, -0.3448905944824219, -0.33457183837890625, -0.3242530822753906, -0.313934326171875, -0.3036155700683594, -0.29329681396484375, -0.2829780578613281, -0.2726593017578125, -0.2623405456542969, -0.25202178955078125, -0.24170303344726562, -0.23138427734375, -0.22106552124023438, -0.21074676513671875, -0.20042800903320312, -0.1901092529296875, -0.17979049682617188, -0.16947174072265625, -0.15915298461914062, -0.148834228515625, -0.13851547241210938, -0.12819671630859375, -0.11787796020507812, -0.1075592041015625, -0.09724044799804688, -0.08692169189453125, -0.07660293579101562, -0.0662841796875, -0.055965423583984375, -0.04564666748046875, -0.035327911376953125, -0.0250091552734375, -0.014690399169921875, -0.00437164306640625, 0.005947113037109375, 0.016265869140625, 0.026584625244140625, 0.03690338134765625, 0.047222137451171875, 0.0575408935546875, 0.06785964965820312, 0.07817840576171875, 0.08849716186523438, 0.09881591796875, 0.10913467407226562, 0.11945343017578125, 0.12977218627929688, 0.1400909423828125, 0.15040969848632812, 0.16072845458984375, 0.17104721069335938, 0.181365966796875, 0.19168472290039062, 0.20200347900390625, 0.21232223510742188, 0.2226409912109375, 0.23295974731445312, 0.24327850341796875, 0.2535972595214844, 0.263916015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 11.0, 4.0, 8.0, 18.0, 24.0, 17.0, 36.0, 30.0, 58.0, 80.0, 114.0, 196.0, 264.0, 448.0, 799.0, 1565.0, 3700.0, 11946.0, 62166.0, 1745370.0, 2281030.0, 66937.0, 12028.0, 3646.0, 1708.0, 822.0, 423.0, 268.0, 164.0, 128.0, 87.0, 45.0, 42.0, 27.0, 9.0, 22.0, 12.0, 5.0, 8.0, 3.0, 2.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0], "bins": [-0.5068359375, -0.4919395446777344, -0.47704315185546875, -0.4621467590332031, -0.4472503662109375, -0.4323539733886719, -0.41745758056640625, -0.4025611877441406, -0.387664794921875, -0.3727684020996094, -0.35787200927734375, -0.3429756164550781, -0.3280792236328125, -0.3131828308105469, -0.29828643798828125, -0.2833900451660156, -0.26849365234375, -0.2535972595214844, -0.23870086669921875, -0.22380447387695312, -0.2089080810546875, -0.19401168823242188, -0.17911529541015625, -0.16421890258789062, -0.149322509765625, -0.13442611694335938, -0.11952972412109375, -0.10463333129882812, -0.0897369384765625, -0.07484054565429688, -0.05994415283203125, -0.045047760009765625, -0.0301513671875, -0.015254974365234375, -0.00035858154296875, 0.014537811279296875, 0.0294342041015625, 0.044330596923828125, 0.05922698974609375, 0.07412338256835938, 0.089019775390625, 0.10391616821289062, 0.11881256103515625, 0.13370895385742188, 0.1486053466796875, 0.16350173950195312, 0.17839813232421875, 0.19329452514648438, 0.20819091796875, 0.22308731079101562, 0.23798370361328125, 0.2528800964355469, 0.2677764892578125, 0.2826728820800781, 0.29756927490234375, 0.3124656677246094, 0.327362060546875, 0.3422584533691406, 0.35715484619140625, 0.3720512390136719, 0.3869476318359375, 0.4018440246582031, 0.41674041748046875, 0.4316368103027344, 0.446533203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 6.0, 9.0, 12.0, 12.0, 18.0, 23.0, 53.0, 45.0, 87.0, 99.0, 199.0, 502.0, 1024.0, 980.0, 433.0, 203.0, 116.0, 72.0, 53.0, 33.0, 28.0, 12.0, 8.0, 15.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45166015625, -0.43750762939453125, -0.4233551025390625, -0.40920257568359375, -0.395050048828125, -0.38089752197265625, -0.3667449951171875, -0.35259246826171875, -0.33843994140625, -0.32428741455078125, -0.3101348876953125, -0.29598236083984375, -0.281829833984375, -0.26767730712890625, -0.2535247802734375, -0.23937225341796875, -0.2252197265625, -0.21106719970703125, -0.1969146728515625, -0.18276214599609375, -0.168609619140625, -0.15445709228515625, -0.1403045654296875, -0.12615203857421875, -0.11199951171875, -0.09784698486328125, -0.0836944580078125, -0.06954193115234375, -0.055389404296875, -0.04123687744140625, -0.0270843505859375, -0.01293182373046875, 0.001220703125, 0.01537322998046875, 0.0295257568359375, 0.04367828369140625, 0.057830810546875, 0.07198333740234375, 0.0861358642578125, 0.10028839111328125, 0.11444091796875, 0.12859344482421875, 0.1427459716796875, 0.15689849853515625, 0.171051025390625, 0.18520355224609375, 0.1993560791015625, 0.21350860595703125, 0.2276611328125, 0.24181365966796875, 0.2559661865234375, 0.27011871337890625, 0.284271240234375, 0.29842376708984375, 0.3125762939453125, 0.32672882080078125, 0.34088134765625, 0.35503387451171875, 0.3691864013671875, 0.38333892822265625, 0.397491455078125, 0.41164398193359375, 0.4257965087890625, 0.43994903564453125, 0.4541015625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 5.0, 10.0, 16.0, 49.0, 135.0, 283.0, 304.0, 122.0, 47.0, 14.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.207853317260742, -6.019106388092041, -5.83035945892334, -5.6416120529174805, -5.452865123748779, -5.264118194580078, -5.075370788574219, -4.886623859405518, -4.697876930236816, -4.509130001068115, -4.320383071899414, -4.131635665893555, -3.9428887367248535, -3.7541418075561523, -3.565394639968872, -3.376647472381592, -3.1879005432128906, -2.9991536140441895, -2.810406446456909, -2.621659278869629, -2.4329123497009277, -2.2441654205322266, -2.0554182529449463, -1.8666712045669556, -1.6779241561889648, -1.4891771078109741, -1.3004300594329834, -1.1116830110549927, -0.922935962677002, -0.7341889142990112, -0.5454418659210205, -0.3566948175430298, -0.16794776916503906, 0.02079927921295166, 0.20954632759094238, 0.3982933759689331, 0.5870404243469238, 0.7757874727249146, 0.9645345211029053, 1.153281569480896, 1.3420286178588867, 1.5307756662368774, 1.7195227146148682, 1.9082697629928589, 2.0970168113708496, 2.285763740539551, 2.474510908126831, 2.6632580757141113, 2.8520050048828125, 3.0407519340515137, 3.229499101638794, 3.418246269226074, 3.6069931983947754, 3.7957401275634766, 3.984487295150757, 4.173234462738037, 4.361981391906738, 4.5507283210754395, 4.739475250244141, 4.92822265625, 5.116969585418701, 5.305716514587402, 5.494463920593262, 5.683210849761963, 5.871957778930664]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 11.0, 12.0, 10.0, 11.0, 15.0, 21.0, 16.0, 32.0, 32.0, 15.0, 31.0, 36.0, 37.0, 45.0, 37.0, 47.0, 43.0, 41.0, 54.0, 46.0, 35.0, 43.0, 33.0, 29.0, 42.0, 36.0, 34.0, 22.0, 23.0, 16.0, 14.0, 16.0, 8.0, 14.0, 4.0, 8.0, 7.0, 2.0, 3.0, 0.0, 3.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5050184726715088, -1.4553773403167725, -1.4057360887527466, -1.3560948371887207, -1.3064537048339844, -1.256812572479248, -1.2071713209152222, -1.1575300693511963, -1.10788893699646, -1.0582478046417236, -1.0086065530776978, -0.9589653611183167, -0.9093241691589355, -0.8596829771995544, -0.8100417852401733, -0.7604005932807922, -0.7107594013214111, -0.66111820936203, -0.6114770174026489, -0.5618358254432678, -0.5121946334838867, -0.4625534415245056, -0.4129122495651245, -0.3632710576057434, -0.3136298656463623, -0.2639886736869812, -0.2143474817276001, -0.164706289768219, -0.11506509780883789, -0.06542390584945679, -0.015782713890075684, 0.03385847806930542, 0.08349967002868652, 0.13314086198806763, 0.18278205394744873, 0.23242324590682983, 0.28206443786621094, 0.33170562982559204, 0.38134682178497314, 0.43098801374435425, 0.48062920570373535, 0.5302703976631165, 0.5799115896224976, 0.6295527815818787, 0.6791939735412598, 0.7288351655006409, 0.778476357460022, 0.8281175494194031, 0.8777587413787842, 0.9273999333381653, 0.9770411252975464, 1.0266823768615723, 1.0763235092163086, 1.125964641571045, 1.1756058931350708, 1.2252471446990967, 1.274888277053833, 1.3245294094085693, 1.3741706609725952, 1.423811912536621, 1.4734530448913574, 1.5230941772460938, 1.5727354288101196, 1.6223766803741455, 1.6720178127288818]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 3.0, 8.0, 7.0, 13.0, 30.0, 36.0, 58.0, 102.0, 201.0, 444.0, 1398.0, 5727.0, 45333.0, 669596.0, 300414.0, 20293.0, 3228.0, 926.0, 341.0, 165.0, 101.0, 35.0, 29.0, 24.0, 11.0, 11.0, 8.0, 7.0, 5.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.712890625, -0.6863174438476562, -0.6597442626953125, -0.6331710815429688, -0.606597900390625, -0.5800247192382812, -0.5534515380859375, -0.5268783569335938, -0.50030517578125, -0.47373199462890625, -0.4471588134765625, -0.42058563232421875, -0.394012451171875, -0.36743927001953125, -0.3408660888671875, -0.31429290771484375, -0.2877197265625, -0.26114654541015625, -0.2345733642578125, -0.20800018310546875, -0.181427001953125, -0.15485382080078125, -0.1282806396484375, -0.10170745849609375, -0.07513427734375, -0.04856109619140625, -0.0219879150390625, 0.00458526611328125, 0.031158447265625, 0.05773162841796875, 0.0843048095703125, 0.11087799072265625, 0.137451171875, 0.16402435302734375, 0.1905975341796875, 0.21717071533203125, 0.243743896484375, 0.27031707763671875, 0.2968902587890625, 0.32346343994140625, 0.35003662109375, 0.37660980224609375, 0.4031829833984375, 0.42975616455078125, 0.456329345703125, 0.48290252685546875, 0.5094757080078125, 0.5360488891601562, 0.5626220703125, 0.5891952514648438, 0.6157684326171875, 0.6423416137695312, 0.668914794921875, 0.6954879760742188, 0.7220611572265625, 0.7486343383789062, 0.77520751953125, 0.8017807006835938, 0.8283538818359375, 0.8549270629882812, 0.881500244140625, 0.9080734252929688, 0.9346466064453125, 0.9612197875976562, 0.98779296875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 11.0, 14.0, 21.0, 29.0, 48.0, 59.0, 82.0, 87.0, 109.0, 107.0, 82.0, 78.0, 73.0, 71.0, 42.0, 31.0, 27.0, 9.0, 12.0, 6.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.376708984375, -0.366668701171875, -0.35662841796875, -0.346588134765625, -0.3365478515625, -0.326507568359375, -0.31646728515625, -0.306427001953125, -0.29638671875, -0.286346435546875, -0.27630615234375, -0.266265869140625, -0.2562255859375, -0.246185302734375, -0.23614501953125, -0.226104736328125, -0.216064453125, -0.206024169921875, -0.19598388671875, -0.185943603515625, -0.1759033203125, -0.165863037109375, -0.15582275390625, -0.145782470703125, -0.1357421875, -0.125701904296875, -0.11566162109375, -0.105621337890625, -0.0955810546875, -0.085540771484375, -0.07550048828125, -0.065460205078125, -0.055419921875, -0.045379638671875, -0.03533935546875, -0.025299072265625, -0.0152587890625, -0.005218505859375, 0.00482177734375, 0.014862060546875, 0.02490234375, 0.034942626953125, 0.04498291015625, 0.055023193359375, 0.0650634765625, 0.075103759765625, 0.08514404296875, 0.095184326171875, 0.105224609375, 0.115264892578125, 0.12530517578125, 0.135345458984375, 0.1453857421875, 0.155426025390625, 0.16546630859375, 0.175506591796875, 0.185546875, 0.195587158203125, 0.20562744140625, 0.215667724609375, 0.2257080078125, 0.235748291015625, 0.24578857421875, 0.255828857421875, 0.265869140625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 5.0, 5.0, 9.0, 12.0, 12.0, 13.0, 25.0, 38.0, 56.0, 71.0, 114.0, 155.0, 333.0, 784.0, 2113.0, 7827.0, 53837.0, 703657.0, 248922.0, 23514.0, 4439.0, 1371.0, 551.0, 224.0, 167.0, 67.0, 64.0, 38.0, 31.0, 25.0, 15.0, 12.0, 8.0, 11.0, 6.0, 5.0, 7.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7236328125, -0.7039718627929688, -0.6843109130859375, -0.6646499633789062, -0.644989013671875, -0.6253280639648438, -0.6056671142578125, -0.5860061645507812, -0.56634521484375, -0.5466842651367188, -0.5270233154296875, -0.5073623657226562, -0.487701416015625, -0.46804046630859375, -0.4483795166015625, -0.42871856689453125, -0.4090576171875, -0.38939666748046875, -0.3697357177734375, -0.35007476806640625, -0.330413818359375, -0.31075286865234375, -0.2910919189453125, -0.27143096923828125, -0.25177001953125, -0.23210906982421875, -0.2124481201171875, -0.19278717041015625, -0.173126220703125, -0.15346527099609375, -0.1338043212890625, -0.11414337158203125, -0.094482421875, -0.07482147216796875, -0.0551605224609375, -0.03549957275390625, -0.015838623046875, 0.00382232666015625, 0.0234832763671875, 0.04314422607421875, 0.06280517578125, 0.08246612548828125, 0.1021270751953125, 0.12178802490234375, 0.141448974609375, 0.16110992431640625, 0.1807708740234375, 0.20043182373046875, 0.2200927734375, 0.23975372314453125, 0.2594146728515625, 0.27907562255859375, 0.298736572265625, 0.31839752197265625, 0.3380584716796875, 0.35771942138671875, 0.37738037109375, 0.39704132080078125, 0.4167022705078125, 0.43636322021484375, 0.456024169921875, 0.47568511962890625, 0.4953460693359375, 0.5150070190429688, 0.53466796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 11.0, 21.0, 29.0, 43.0, 46.0, 47.0, 54.0, 65.0, 66.0, 72.0, 78.0, 77.0, 62.0, 74.0, 53.0, 47.0, 42.0, 28.0, 21.0, 20.0, 12.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93603515625, -0.9078140258789062, -0.8795928955078125, -0.8513717651367188, -0.823150634765625, -0.7949295043945312, -0.7667083740234375, -0.7384872436523438, -0.71026611328125, -0.6820449829101562, -0.6538238525390625, -0.6256027221679688, -0.597381591796875, -0.5691604614257812, -0.5409393310546875, -0.5127182006835938, -0.4844970703125, -0.45627593994140625, -0.4280548095703125, -0.39983367919921875, -0.371612548828125, -0.34339141845703125, -0.3151702880859375, -0.28694915771484375, -0.25872802734375, -0.23050689697265625, -0.2022857666015625, -0.17406463623046875, -0.145843505859375, -0.11762237548828125, -0.0894012451171875, -0.06118011474609375, -0.032958984375, -0.00473785400390625, 0.0234832763671875, 0.05170440673828125, 0.079925537109375, 0.10814666748046875, 0.1363677978515625, 0.16458892822265625, 0.19281005859375, 0.22103118896484375, 0.2492523193359375, 0.27747344970703125, 0.305694580078125, 0.33391571044921875, 0.3621368408203125, 0.39035797119140625, 0.4185791015625, 0.44680023193359375, 0.4750213623046875, 0.5032424926757812, 0.531463623046875, 0.5596847534179688, 0.5879058837890625, 0.6161270141601562, 0.64434814453125, 0.6725692749023438, 0.7007904052734375, 0.7290115356445312, 0.757232666015625, 0.7854537963867188, 0.8136749267578125, 0.8418960571289062, 0.8701171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 7.0, 9.0, 14.0, 17.0, 44.0, 80.0, 178.0, 474.0, 1778.0, 10743.0, 142688.0, 850764.0, 35758.0, 4511.0, 911.0, 325.0, 109.0, 47.0, 26.0, 21.0, 16.0, 10.0, 10.0, 5.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3798828125, -0.3684654235839844, -0.35704803466796875, -0.3456306457519531, -0.3342132568359375, -0.3227958679199219, -0.31137847900390625, -0.2999610900878906, -0.288543701171875, -0.2771263122558594, -0.26570892333984375, -0.2542915344238281, -0.2428741455078125, -0.23145675659179688, -0.22003936767578125, -0.20862197875976562, -0.19720458984375, -0.18578720092773438, -0.17436981201171875, -0.16295242309570312, -0.1515350341796875, -0.14011764526367188, -0.12870025634765625, -0.11728286743164062, -0.105865478515625, -0.09444808959960938, -0.08303070068359375, -0.07161331176757812, -0.0601959228515625, -0.048778533935546875, -0.03736114501953125, -0.025943756103515625, -0.0145263671875, -0.003108978271484375, 0.00830841064453125, 0.019725799560546875, 0.0311431884765625, 0.042560577392578125, 0.05397796630859375, 0.06539535522460938, 0.076812744140625, 0.08823013305664062, 0.09964752197265625, 0.11106491088867188, 0.1224822998046875, 0.13389968872070312, 0.14531707763671875, 0.15673446655273438, 0.16815185546875, 0.17956924438476562, 0.19098663330078125, 0.20240402221679688, 0.2138214111328125, 0.22523880004882812, 0.23665618896484375, 0.24807357788085938, 0.259490966796875, 0.2709083557128906, 0.28232574462890625, 0.2937431335449219, 0.3051605224609375, 0.3165779113769531, 0.32799530029296875, 0.3394126892089844, 0.350830078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 3.0, 4.0, 6.0, 7.0, 2.0, 10.0, 11.0, 19.0, 31.0, 58.0, 74.0, 101.0, 114.0, 153.0, 136.0, 75.0, 59.0, 32.0, 24.0, 24.0, 17.0, 8.0, 7.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010478496551513672, -0.00010211393237113953, -9.944289922714233e-05, -9.677186608314514e-05, -9.410083293914795e-05, -9.142979979515076e-05, -8.875876665115356e-05, -8.608773350715637e-05, -8.341670036315918e-05, -8.074566721916199e-05, -7.80746340751648e-05, -7.54036009311676e-05, -7.273256778717041e-05, -7.006153464317322e-05, -6.739050149917603e-05, -6.471946835517883e-05, -6.204843521118164e-05, -5.937740206718445e-05, -5.6706368923187256e-05, -5.4035335779190063e-05, -5.136430263519287e-05, -4.869326949119568e-05, -4.6022236347198486e-05, -4.3351203203201294e-05, -4.06801700592041e-05, -3.800913691520691e-05, -3.533810377120972e-05, -3.2667070627212524e-05, -2.9996037483215332e-05, -2.732500433921814e-05, -2.4653971195220947e-05, -2.1982938051223755e-05, -1.9311904907226562e-05, -1.664087176322937e-05, -1.3969838619232178e-05, -1.1298805475234985e-05, -8.627772331237793e-06, -5.956739187240601e-06, -3.285706043243408e-06, -6.146728992462158e-07, 2.0563602447509766e-06, 4.727393388748169e-06, 7.398426532745361e-06, 1.0069459676742554e-05, 1.2740492820739746e-05, 1.541152596473694e-05, 1.808255910873413e-05, 2.0753592252731323e-05, 2.3424625396728516e-05, 2.6095658540725708e-05, 2.87666916847229e-05, 3.143772482872009e-05, 3.4108757972717285e-05, 3.677979111671448e-05, 3.945082426071167e-05, 4.212185740470886e-05, 4.4792890548706055e-05, 4.746392369270325e-05, 5.013495683670044e-05, 5.280598998069763e-05, 5.5477023124694824e-05, 5.8148056268692017e-05, 6.081908941268921e-05, 6.34901225566864e-05, 6.61611557006836e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 0.0, 4.0, 5.0, 6.0, 11.0, 16.0, 39.0, 54.0, 167.0, 571.0, 2757.0, 25498.0, 920559.0, 92083.0, 5431.0, 926.0, 252.0, 81.0, 38.0, 25.0, 9.0, 7.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.373779296875, -0.3579978942871094, -0.34221649169921875, -0.3264350891113281, -0.3106536865234375, -0.2948722839355469, -0.27909088134765625, -0.2633094787597656, -0.247528076171875, -0.23174667358398438, -0.21596527099609375, -0.20018386840820312, -0.1844024658203125, -0.16862106323242188, -0.15283966064453125, -0.13705825805664062, -0.12127685546875, -0.10549545288085938, -0.08971405029296875, -0.07393264770507812, -0.0581512451171875, -0.042369842529296875, -0.02658843994140625, -0.010807037353515625, 0.004974365234375, 0.020755767822265625, 0.03653717041015625, 0.052318572998046875, 0.0680999755859375, 0.08388137817382812, 0.09966278076171875, 0.11544418334960938, 0.1312255859375, 0.14700698852539062, 0.16278839111328125, 0.17856979370117188, 0.1943511962890625, 0.21013259887695312, 0.22591400146484375, 0.24169540405273438, 0.257476806640625, 0.2732582092285156, 0.28903961181640625, 0.3048210144042969, 0.3206024169921875, 0.3363838195800781, 0.35216522216796875, 0.3679466247558594, 0.38372802734375, 0.3995094299316406, 0.41529083251953125, 0.4310722351074219, 0.4468536376953125, 0.4626350402832031, 0.47841644287109375, 0.4941978454589844, 0.509979248046875, 0.5257606506347656, 0.5415420532226562, 0.5573234558105469, 0.5731048583984375, 0.5888862609863281, 0.6046676635742188, 0.6204490661621094, 0.63623046875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 6.0, 8.0, 7.0, 8.0, 7.0, 19.0, 28.0, 44.0, 45.0, 107.0, 125.0, 132.0, 145.0, 114.0, 72.0, 28.0, 39.0, 20.0, 16.0, 10.0, 7.0, 1.0, 4.0, 7.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.315185546875, -0.30636024475097656, -0.2975349426269531, -0.2887096405029297, -0.27988433837890625, -0.2710590362548828, -0.2622337341308594, -0.25340843200683594, -0.2445831298828125, -0.23575782775878906, -0.22693252563476562, -0.2181072235107422, -0.20928192138671875, -0.2004566192626953, -0.19163131713867188, -0.18280601501464844, -0.173980712890625, -0.16515541076660156, -0.15633010864257812, -0.1475048065185547, -0.13867950439453125, -0.1298542022705078, -0.12102890014648438, -0.11220359802246094, -0.1033782958984375, -0.09455299377441406, -0.08572769165039062, -0.07690238952636719, -0.06807708740234375, -0.05925178527832031, -0.050426483154296875, -0.04160118103027344, -0.03277587890625, -0.023950576782226562, -0.015125274658203125, -0.0062999725341796875, 0.00252532958984375, 0.011350631713867188, 0.020175933837890625, 0.029001235961914062, 0.0378265380859375, 0.04665184020996094, 0.055477142333984375, 0.06430244445800781, 0.07312774658203125, 0.08195304870605469, 0.09077835083007812, 0.09960365295410156, 0.108428955078125, 0.11725425720214844, 0.12607955932617188, 0.1349048614501953, 0.14373016357421875, 0.1525554656982422, 0.16138076782226562, 0.17020606994628906, 0.1790313720703125, 0.18785667419433594, 0.19668197631835938, 0.2055072784423828, 0.21433258056640625, 0.2231578826904297, 0.23198318481445312, 0.24080848693847656, 0.2496337890625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 10.0, 5.0, 10.0, 18.0, 30.0, 68.0, 105.0, 145.0, 202.0, 144.0, 98.0, 64.0, 34.0, 22.0, 14.0, 5.0, 2.0, 4.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.164175033569336, -3.0608623027801514, -2.9575493335723877, -2.854236602783203, -2.7509236335754395, -2.647610902786255, -2.5442981719970703, -2.4409852027893066, -2.337672472000122, -2.2343597412109375, -2.131046772003174, -2.0277340412139893, -1.9244211912155151, -1.821108341217041, -1.7177956104278564, -1.6144827604293823, -1.5111699104309082, -1.407857060432434, -1.30454421043396, -1.2012314796447754, -1.0979186296463013, -0.9946057796478271, -0.8912929892539978, -0.7879801988601685, -0.6846673488616943, -0.5813544988632202, -0.47804170846939087, -0.37472888827323914, -0.2714160680770874, -0.16810321807861328, -0.06479042768478394, 0.03852236270904541, 0.14183497428894043, 0.24514779448509216, 0.3484606146812439, 0.45177343487739563, 0.5550862550735474, 0.6583991050720215, 0.7617118954658508, 0.8650246858596802, 0.9683375358581543, 1.0716503858566284, 1.1749632358551025, 1.278275966644287, 1.3815888166427612, 1.4849016666412354, 1.58821439743042, 1.691527247428894, 1.7948400974273682, 1.8981529474258423, 2.0014657974243164, 2.104778528213501, 2.2080912590026855, 2.311404228210449, 2.414716958999634, 2.5180296897888184, 2.621342658996582, 2.7246553897857666, 2.8279683589935303, 2.931281089782715, 3.0345940589904785, 3.137906789779663, 3.2412195205688477, 3.3445324897766113, 3.447845220565796]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 5.0, 6.0, 3.0, 11.0, 7.0, 20.0, 15.0, 15.0, 23.0, 28.0, 21.0, 38.0, 35.0, 54.0, 50.0, 61.0, 66.0, 74.0, 62.0, 61.0, 46.0, 41.0, 31.0, 22.0, 30.0, 38.0, 22.0, 16.0, 16.0, 19.0, 16.0, 9.0, 9.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.1785826683044434, -3.0959415435791016, -3.0133001804351807, -2.930659055709839, -2.848017692565918, -2.765376567840576, -2.6827352046966553, -2.6000940799713135, -2.5174527168273926, -2.434811592102051, -2.35217022895813, -2.269529104232788, -2.186887741088867, -2.1042466163635254, -2.0216052532196045, -1.9389641284942627, -1.856323003768921, -1.7736817598342896, -1.6910405158996582, -1.6083992719650269, -1.5257580280303955, -1.4431169033050537, -1.3604756593704224, -1.277834415435791, -1.1951931715011597, -1.1125519275665283, -1.029910683631897, -0.9472694993019104, -0.864628255367279, -0.7819870114326477, -0.6993458271026611, -0.6167045831680298, -0.5340631008148193, -0.451421856880188, -0.36878064274787903, -0.28613942861557007, -0.20349818468093872, -0.12085694074630737, -0.03821572661399841, 0.04442548751831055, 0.1270667314529419, 0.20970796048641205, 0.2923491895198822, 0.37499040365219116, 0.4576316475868225, 0.5402728915214539, 0.6229140758514404, 0.7055553197860718, 0.7881965637207031, 0.8708378076553345, 0.9534790515899658, 1.0361202955245972, 1.1187615394592285, 1.2014026641845703, 1.2840439081192017, 1.366685152053833, 1.4493263959884644, 1.5319676399230957, 1.614608883857727, 1.6972501277923584, 1.7798912525177002, 1.862532615661621, 1.945173740386963, 2.0278148651123047, 2.1104562282562256]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 5.0, 3.0, 12.0, 10.0, 7.0, 18.0, 34.0, 40.0, 63.0, 93.0, 171.0, 318.0, 674.0, 1662.0, 4597.0, 16369.0, 115491.0, 3390179.0, 613094.0, 37682.0, 8345.0, 2914.0, 1220.0, 521.0, 289.0, 177.0, 79.0, 64.0, 51.0, 24.0, 18.0, 12.0, 10.0, 5.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.359130859375, -0.3478202819824219, -0.33650970458984375, -0.3251991271972656, -0.3138885498046875, -0.3025779724121094, -0.29126739501953125, -0.2799568176269531, -0.268646240234375, -0.2573356628417969, -0.24602508544921875, -0.23471450805664062, -0.2234039306640625, -0.21209335327148438, -0.20078277587890625, -0.18947219848632812, -0.17816162109375, -0.16685104370117188, -0.15554046630859375, -0.14422988891601562, -0.1329193115234375, -0.12160873413085938, -0.11029815673828125, -0.09898757934570312, -0.087677001953125, -0.07636642456054688, -0.06505584716796875, -0.053745269775390625, -0.0424346923828125, -0.031124114990234375, -0.01981353759765625, -0.008502960205078125, 0.0028076171875, 0.014118194580078125, 0.02542877197265625, 0.036739349365234375, 0.0480499267578125, 0.059360504150390625, 0.07067108154296875, 0.08198165893554688, 0.093292236328125, 0.10460281372070312, 0.11591339111328125, 0.12722396850585938, 0.1385345458984375, 0.14984512329101562, 0.16115570068359375, 0.17246627807617188, 0.18377685546875, 0.19508743286132812, 0.20639801025390625, 0.21770858764648438, 0.2290191650390625, 0.24032974243164062, 0.25164031982421875, 0.2629508972167969, 0.274261474609375, 0.2855720520019531, 0.29688262939453125, 0.3081932067871094, 0.3195037841796875, 0.3308143615722656, 0.34212493896484375, 0.3534355163574219, 0.36474609375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 10.0, 18.0, 23.0, 40.0, 57.0, 86.0, 93.0, 112.0, 117.0, 89.0, 79.0, 71.0, 62.0, 53.0, 28.0, 27.0, 12.0, 5.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.382080078125, -0.3721656799316406, -0.36225128173828125, -0.3523368835449219, -0.3424224853515625, -0.3325080871582031, -0.32259368896484375, -0.3126792907714844, -0.302764892578125, -0.2928504943847656, -0.28293609619140625, -0.2730216979980469, -0.2631072998046875, -0.2531929016113281, -0.24327850341796875, -0.23336410522460938, -0.22344970703125, -0.21353530883789062, -0.20362091064453125, -0.19370651245117188, -0.1837921142578125, -0.17387771606445312, -0.16396331787109375, -0.15404891967773438, -0.144134521484375, -0.13422012329101562, -0.12430572509765625, -0.11439132690429688, -0.1044769287109375, -0.09456253051757812, -0.08464813232421875, -0.07473373413085938, -0.0648193359375, -0.054904937744140625, -0.04499053955078125, -0.035076141357421875, -0.0251617431640625, -0.015247344970703125, -0.00533294677734375, 0.004581451416015625, 0.014495849609375, 0.024410247802734375, 0.03432464599609375, 0.044239044189453125, 0.0541534423828125, 0.06406784057617188, 0.07398223876953125, 0.08389663696289062, 0.09381103515625, 0.10372543334960938, 0.11363983154296875, 0.12355422973632812, 0.1334686279296875, 0.14338302612304688, 0.15329742431640625, 0.16321182250976562, 0.173126220703125, 0.18304061889648438, 0.19295501708984375, 0.20286941528320312, 0.2127838134765625, 0.22269821166992188, 0.23261260986328125, 0.24252700805664062, 0.25244140625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 16.0, 17.0, 38.0, 51.0, 87.0, 144.0, 232.0, 535.0, 1763.0, 13596.0, 349777.0, 3777382.0, 44856.0, 4156.0, 861.0, 335.0, 179.0, 92.0, 52.0, 33.0, 26.0, 21.0, 14.0, 5.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.712890625, -0.691436767578125, -0.66998291015625, -0.648529052734375, -0.6270751953125, -0.605621337890625, -0.58416748046875, -0.562713623046875, -0.541259765625, -0.519805908203125, -0.49835205078125, -0.476898193359375, -0.4554443359375, -0.433990478515625, -0.41253662109375, -0.391082763671875, -0.36962890625, -0.348175048828125, -0.32672119140625, -0.305267333984375, -0.2838134765625, -0.262359619140625, -0.24090576171875, -0.219451904296875, -0.197998046875, -0.176544189453125, -0.15509033203125, -0.133636474609375, -0.1121826171875, -0.090728759765625, -0.06927490234375, -0.047821044921875, -0.0263671875, -0.004913330078125, 0.01654052734375, 0.037994384765625, 0.0594482421875, 0.080902099609375, 0.10235595703125, 0.123809814453125, 0.145263671875, 0.166717529296875, 0.18817138671875, 0.209625244140625, 0.2310791015625, 0.252532958984375, 0.27398681640625, 0.295440673828125, 0.31689453125, 0.338348388671875, 0.35980224609375, 0.381256103515625, 0.4027099609375, 0.424163818359375, 0.44561767578125, 0.467071533203125, 0.488525390625, 0.509979248046875, 0.53143310546875, 0.552886962890625, 0.5743408203125, 0.595794677734375, 0.61724853515625, 0.638702392578125, 0.66015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 8.0, 15.0, 12.0, 19.0, 23.0, 31.0, 38.0, 63.0, 120.0, 210.0, 411.0, 1007.0, 1075.0, 503.0, 184.0, 121.0, 62.0, 41.0, 39.0, 29.0, 13.0, 10.0, 10.0, 8.0, 2.0, 2.0, 5.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.433837890625, -0.421112060546875, -0.40838623046875, -0.395660400390625, -0.3829345703125, -0.370208740234375, -0.35748291015625, -0.344757080078125, -0.33203125, -0.319305419921875, -0.30657958984375, -0.293853759765625, -0.2811279296875, -0.268402099609375, -0.25567626953125, -0.242950439453125, -0.230224609375, -0.217498779296875, -0.20477294921875, -0.192047119140625, -0.1793212890625, -0.166595458984375, -0.15386962890625, -0.141143798828125, -0.12841796875, -0.115692138671875, -0.10296630859375, -0.090240478515625, -0.0775146484375, -0.064788818359375, -0.05206298828125, -0.039337158203125, -0.026611328125, -0.013885498046875, -0.00115966796875, 0.011566162109375, 0.0242919921875, 0.037017822265625, 0.04974365234375, 0.062469482421875, 0.0751953125, 0.087921142578125, 0.10064697265625, 0.113372802734375, 0.1260986328125, 0.138824462890625, 0.15155029296875, 0.164276123046875, 0.177001953125, 0.189727783203125, 0.20245361328125, 0.215179443359375, 0.2279052734375, 0.240631103515625, 0.25335693359375, 0.266082763671875, 0.27880859375, 0.291534423828125, 0.30426025390625, 0.316986083984375, 0.3297119140625, 0.342437744140625, 0.35516357421875, 0.367889404296875, 0.380615234375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 6.0, 16.0, 31.0, 67.0, 138.0, 206.0, 206.0, 154.0, 91.0, 40.0, 15.0, 10.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.637744188308716, -3.5208239555358887, -3.4039037227630615, -3.2869834899902344, -3.1700632572174072, -3.05314302444458, -2.936222553253174, -2.819302558898926, -2.7023820877075195, -2.5854618549346924, -2.4685416221618652, -2.351621389389038, -2.234701156616211, -2.117780923843384, -2.0008606910705566, -1.88394033908844, -1.7670202255249023, -1.6500999927520752, -1.533179759979248, -1.416259527206421, -1.2993392944335938, -1.1824190616607666, -1.06549870967865, -0.9485784769058228, -0.8316582441329956, -0.7147380113601685, -0.5978177785873413, -0.4808974862098694, -0.36397725343704224, -0.2470570206642151, -0.13013672828674316, -0.013216495513916016, 0.10370397567749023, 0.22062422335147858, 0.3375444710254669, 0.45446473360061646, 0.5713849663734436, 0.6883051991462708, 0.8052254915237427, 0.9221457242965698, 1.039065957069397, 1.1559861898422241, 1.2729064226150513, 1.389826774597168, 1.5067470073699951, 1.6236672401428223, 1.7405874729156494, 1.8575077056884766, 1.9744279384613037, 2.091348171234131, 2.208268404006958, 2.325188636779785, 2.4421088695526123, 2.5590291023254395, 2.6759495735168457, 2.7928695678710938, 2.9097900390625, 3.026710271835327, 3.1436305046081543, 3.2605507373809814, 3.3774709701538086, 3.4943912029266357, 3.611311435699463, 3.728231906890869, 3.845151901245117]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 3.0, 6.0, 6.0, 9.0, 5.0, 9.0, 11.0, 21.0, 20.0, 17.0, 23.0, 22.0, 37.0, 26.0, 38.0, 31.0, 41.0, 39.0, 43.0, 46.0, 44.0, 45.0, 58.0, 42.0, 29.0, 30.0, 43.0, 33.0, 36.0, 28.0, 21.0, 15.0, 23.0, 13.0, 14.0, 16.0, 11.0, 9.0, 10.0, 6.0, 12.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.1957745552062988, -1.1551610231399536, -1.1145474910736084, -1.0739339590072632, -1.033320426940918, -0.9927068948745728, -0.9520934224128723, -0.9114798903465271, -0.8708663582801819, -0.8302528262138367, -0.7896392941474915, -0.7490257620811462, -0.7084122896194458, -0.6677987575531006, -0.6271852254867554, -0.5865716934204102, -0.5459581613540649, -0.5053446292877197, -0.4647310972213745, -0.4241175949573517, -0.38350406289100647, -0.34289053082466125, -0.3022770285606384, -0.2616634964942932, -0.221049964427948, -0.18043643236160278, -0.13982291519641876, -0.09920939058065414, -0.058595865964889526, -0.01798233389854431, 0.02263118326663971, 0.06324470043182373, 0.10385823249816895, 0.14447176456451416, 0.18508528172969818, 0.2256987988948822, 0.2663123309612274, 0.30692586302757263, 0.34753936529159546, 0.3881528973579407, 0.4287664294242859, 0.4693799614906311, 0.5099934935569763, 0.5506070256233215, 0.591220498085022, 0.6318340301513672, 0.6724475622177124, 0.7130610942840576, 0.7536746263504028, 0.794288158416748, 0.8349016904830933, 0.8755152225494385, 0.9161287546157837, 0.9567422866821289, 0.9973557591438293, 1.0379693508148193, 1.078582763671875, 1.1191962957382202, 1.1598098278045654, 1.2004233598709106, 1.2410368919372559, 1.281650424003601, 1.3222639560699463, 1.362877368927002, 1.4034910202026367]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 20.0, 20.0, 47.0, 88.0, 141.0, 320.0, 867.0, 3034.0, 16633.0, 177840.0, 741914.0, 93769.0, 10408.0, 2171.0, 687.0, 283.0, 139.0, 75.0, 35.0, 15.0, 13.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84814453125, -0.8271408081054688, -0.8061370849609375, -0.7851333618164062, -0.764129638671875, -0.7431259155273438, -0.7221221923828125, -0.7011184692382812, -0.68011474609375, -0.6591110229492188, -0.6381072998046875, -0.6171035766601562, -0.596099853515625, -0.5750961303710938, -0.5540924072265625, -0.5330886840820312, -0.5120849609375, -0.49108123779296875, -0.4700775146484375, -0.44907379150390625, -0.428070068359375, -0.40706634521484375, -0.3860626220703125, -0.36505889892578125, -0.34405517578125, -0.32305145263671875, -0.3020477294921875, -0.28104400634765625, -0.260040283203125, -0.23903656005859375, -0.2180328369140625, -0.19702911376953125, -0.176025390625, -0.15502166748046875, -0.1340179443359375, -0.11301422119140625, -0.092010498046875, -0.07100677490234375, -0.0500030517578125, -0.02899932861328125, -0.00799560546875, 0.01300811767578125, 0.0340118408203125, 0.05501556396484375, 0.076019287109375, 0.09702301025390625, 0.1180267333984375, 0.13903045654296875, 0.1600341796875, 0.18103790283203125, 0.2020416259765625, 0.22304534912109375, 0.244049072265625, 0.26505279541015625, 0.2860565185546875, 0.30706024169921875, 0.32806396484375, 0.34906768798828125, 0.3700714111328125, 0.39107513427734375, 0.412078857421875, 0.43308258056640625, 0.4540863037109375, 0.47509002685546875, 0.49609375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 8.0, 11.0, 11.0, 17.0, 30.0, 47.0, 65.0, 71.0, 92.0, 104.0, 96.0, 100.0, 79.0, 76.0, 62.0, 45.0, 29.0, 22.0, 23.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.380859375, -0.3709678649902344, -0.36107635498046875, -0.3511848449707031, -0.3412933349609375, -0.3314018249511719, -0.32151031494140625, -0.3116188049316406, -0.301727294921875, -0.2918357849121094, -0.28194427490234375, -0.2720527648925781, -0.2621612548828125, -0.2522697448730469, -0.24237823486328125, -0.23248672485351562, -0.22259521484375, -0.21270370483398438, -0.20281219482421875, -0.19292068481445312, -0.1830291748046875, -0.17313766479492188, -0.16324615478515625, -0.15335464477539062, -0.143463134765625, -0.13357162475585938, -0.12368011474609375, -0.11378860473632812, -0.1038970947265625, -0.09400558471679688, -0.08411407470703125, -0.07422256469726562, -0.0643310546875, -0.054439544677734375, -0.04454803466796875, -0.034656524658203125, -0.0247650146484375, -0.014873504638671875, -0.00498199462890625, 0.004909515380859375, 0.014801025390625, 0.024692535400390625, 0.03458404541015625, 0.044475555419921875, 0.0543670654296875, 0.06425857543945312, 0.07415008544921875, 0.08404159545898438, 0.09393310546875, 0.10382461547851562, 0.11371612548828125, 0.12360763549804688, 0.1334991455078125, 0.14339065551757812, 0.15328216552734375, 0.16317367553710938, 0.173065185546875, 0.18295669555664062, 0.19284820556640625, 0.20273971557617188, 0.2126312255859375, 0.22252273559570312, 0.23241424560546875, 0.24230575561523438, 0.252197265625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 9.0, 5.0, 7.0, 17.0, 15.0, 32.0, 50.0, 53.0, 98.0, 161.0, 286.0, 656.0, 1777.0, 7553.0, 64893.0, 862603.0, 97198.0, 9488.0, 2082.0, 736.0, 322.0, 172.0, 101.0, 64.0, 64.0, 35.0, 17.0, 15.0, 10.0, 10.0, 7.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7041015625, -0.6810684204101562, -0.6580352783203125, -0.6350021362304688, -0.611968994140625, -0.5889358520507812, -0.5659027099609375, -0.5428695678710938, -0.51983642578125, -0.49680328369140625, -0.4737701416015625, -0.45073699951171875, -0.427703857421875, -0.40467071533203125, -0.3816375732421875, -0.35860443115234375, -0.3355712890625, -0.31253814697265625, -0.2895050048828125, -0.26647186279296875, -0.243438720703125, -0.22040557861328125, -0.1973724365234375, -0.17433929443359375, -0.15130615234375, -0.12827301025390625, -0.1052398681640625, -0.08220672607421875, -0.059173583984375, -0.03614044189453125, -0.0131072998046875, 0.00992584228515625, 0.032958984375, 0.05599212646484375, 0.0790252685546875, 0.10205841064453125, 0.125091552734375, 0.14812469482421875, 0.1711578369140625, 0.19419097900390625, 0.21722412109375, 0.24025726318359375, 0.2632904052734375, 0.28632354736328125, 0.309356689453125, 0.33238983154296875, 0.3554229736328125, 0.37845611572265625, 0.4014892578125, 0.42452239990234375, 0.4475555419921875, 0.47058868408203125, 0.493621826171875, 0.5166549682617188, 0.5396881103515625, 0.5627212524414062, 0.58575439453125, 0.6087875366210938, 0.6318206787109375, 0.6548538208007812, 0.677886962890625, 0.7009201049804688, 0.7239532470703125, 0.7469863891601562, 0.77001953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 5.0, 1.0, 4.0, 9.0, 8.0, 6.0, 14.0, 22.0, 25.0, 42.0, 39.0, 45.0, 59.0, 44.0, 74.0, 65.0, 73.0, 78.0, 66.0, 60.0, 43.0, 53.0, 28.0, 29.0, 23.0, 21.0, 9.0, 8.0, 9.0, 6.0, 3.0, 5.0, 3.0, 5.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.71435546875, -0.6890487670898438, -0.6637420654296875, -0.6384353637695312, -0.613128662109375, -0.5878219604492188, -0.5625152587890625, -0.5372085571289062, -0.51190185546875, -0.48659515380859375, -0.4612884521484375, -0.43598175048828125, -0.410675048828125, -0.38536834716796875, -0.3600616455078125, -0.33475494384765625, -0.3094482421875, -0.28414154052734375, -0.2588348388671875, -0.23352813720703125, -0.208221435546875, -0.18291473388671875, -0.1576080322265625, -0.13230133056640625, -0.10699462890625, -0.08168792724609375, -0.0563812255859375, -0.03107452392578125, -0.005767822265625, 0.01953887939453125, 0.0448455810546875, 0.07015228271484375, 0.095458984375, 0.12076568603515625, 0.1460723876953125, 0.17137908935546875, 0.196685791015625, 0.22199249267578125, 0.2472991943359375, 0.27260589599609375, 0.29791259765625, 0.32321929931640625, 0.3485260009765625, 0.37383270263671875, 0.399139404296875, 0.42444610595703125, 0.4497528076171875, 0.47505950927734375, 0.5003662109375, 0.5256729125976562, 0.5509796142578125, 0.5762863159179688, 0.601593017578125, 0.6268997192382812, 0.6522064208984375, 0.6775131225585938, 0.70281982421875, 0.7281265258789062, 0.7534332275390625, 0.7787399291992188, 0.804046630859375, 0.8293533325195312, 0.8546600341796875, 0.8799667358398438, 0.9052734375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 7.0, 11.0, 7.0, 19.0, 19.0, 30.0, 60.0, 92.0, 180.0, 415.0, 1041.0, 3900.0, 19236.0, 286148.0, 705022.0, 25461.0, 4679.0, 1293.0, 460.0, 194.0, 110.0, 55.0, 42.0, 21.0, 12.0, 14.0, 10.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2261962890625, -0.21751976013183594, -0.20884323120117188, -0.2001667022705078, -0.19149017333984375, -0.1828136444091797, -0.17413711547851562, -0.16546058654785156, -0.1567840576171875, -0.14810752868652344, -0.13943099975585938, -0.1307544708251953, -0.12207794189453125, -0.11340141296386719, -0.10472488403320312, -0.09604835510253906, -0.087371826171875, -0.07869529724121094, -0.07001876831054688, -0.06134223937988281, -0.05266571044921875, -0.04398918151855469, -0.035312652587890625, -0.026636123657226562, -0.0179595947265625, -0.009283065795898438, -0.000606536865234375, 0.008069992065429688, 0.01674652099609375, 0.025423049926757812, 0.034099578857421875, 0.04277610778808594, 0.05145263671875, 0.06012916564941406, 0.06880569458007812, 0.07748222351074219, 0.08615875244140625, 0.09483528137207031, 0.10351181030273438, 0.11218833923339844, 0.1208648681640625, 0.12954139709472656, 0.13821792602539062, 0.1468944549560547, 0.15557098388671875, 0.1642475128173828, 0.17292404174804688, 0.18160057067871094, 0.190277099609375, 0.19895362854003906, 0.20763015747070312, 0.2163066864013672, 0.22498321533203125, 0.2336597442626953, 0.24233627319335938, 0.25101280212402344, 0.2596893310546875, 0.26836585998535156, 0.2770423889160156, 0.2857189178466797, 0.29439544677734375, 0.3030719757080078, 0.3117485046386719, 0.32042503356933594, 0.3291015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 9.0, 8.0, 15.0, 11.0, 14.0, 24.0, 30.0, 39.0, 65.0, 68.0, 106.0, 131.0, 128.0, 100.0, 45.0, 53.0, 32.0, 20.0, 19.0, 16.0, 14.0, 7.0, 7.0, 7.0, 7.0, 3.0, 0.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3882598876953125e-05, -5.207117646932602e-05, -5.0259754061698914e-05, -4.844833165407181e-05, -4.66369092464447e-05, -4.4825486838817596e-05, -4.301406443119049e-05, -4.1202642023563385e-05, -3.939121961593628e-05, -3.7579797208309174e-05, -3.576837480068207e-05, -3.395695239305496e-05, -3.2145529985427856e-05, -3.033410757780075e-05, -2.8522685170173645e-05, -2.671126276254654e-05, -2.4899840354919434e-05, -2.3088417947292328e-05, -2.1276995539665222e-05, -1.9465573132038116e-05, -1.765415072441101e-05, -1.5842728316783905e-05, -1.40313059091568e-05, -1.2219883501529694e-05, -1.0408461093902588e-05, -8.597038686275482e-06, -6.7856162786483765e-06, -4.974193871021271e-06, -3.162771463394165e-06, -1.3513490557670593e-06, 4.600733518600464e-07, 2.271495759487152e-06, 4.082918167114258e-06, 5.8943405747413635e-06, 7.70576298236847e-06, 9.517185389995575e-06, 1.132860779762268e-05, 1.3140030205249786e-05, 1.4951452612876892e-05, 1.6762875020503998e-05, 1.8574297428131104e-05, 2.038571983575821e-05, 2.2197142243385315e-05, 2.400856465101242e-05, 2.5819987058639526e-05, 2.7631409466266632e-05, 2.9442831873893738e-05, 3.1254254281520844e-05, 3.306567668914795e-05, 3.4877099096775055e-05, 3.668852150440216e-05, 3.8499943912029266e-05, 4.031136631965637e-05, 4.212278872728348e-05, 4.3934211134910583e-05, 4.574563354253769e-05, 4.7557055950164795e-05, 4.93684783577919e-05, 5.1179900765419006e-05, 5.299132317304611e-05, 5.480274558067322e-05, 5.6614167988300323e-05, 5.842559039592743e-05, 6.0237012803554535e-05, 6.204843521118164e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 9.0, 11.0, 12.0, 16.0, 38.0, 30.0, 65.0, 68.0, 117.0, 203.0, 355.0, 747.0, 1546.0, 4044.0, 12658.0, 51933.0, 656707.0, 267466.0, 36784.0, 9591.0, 3272.0, 1322.0, 710.0, 337.0, 181.0, 103.0, 82.0, 52.0, 23.0, 13.0, 15.0, 8.0, 7.0, 9.0, 1.0, 2.0, 7.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1378173828125, -0.1324939727783203, -0.12717056274414062, -0.12184715270996094, -0.11652374267578125, -0.11120033264160156, -0.10587692260742188, -0.10055351257324219, -0.0952301025390625, -0.08990669250488281, -0.08458328247070312, -0.07925987243652344, -0.07393646240234375, -0.06861305236816406, -0.06328964233398438, -0.05796623229980469, -0.052642822265625, -0.04731941223144531, -0.041996002197265625, -0.03667259216308594, -0.03134918212890625, -0.026025772094726562, -0.020702362060546875, -0.015378952026367188, -0.0100555419921875, -0.0047321319580078125, 0.000591278076171875, 0.0059146881103515625, 0.01123809814453125, 0.016561508178710938, 0.021884918212890625, 0.027208328247070312, 0.03253173828125, 0.03785514831542969, 0.043178558349609375, 0.04850196838378906, 0.05382537841796875, 0.05914878845214844, 0.06447219848632812, 0.06979560852050781, 0.0751190185546875, 0.08044242858886719, 0.08576583862304688, 0.09108924865722656, 0.09641265869140625, 0.10173606872558594, 0.10705947875976562, 0.11238288879394531, 0.117706298828125, 0.12302970886230469, 0.12835311889648438, 0.13367652893066406, 0.13899993896484375, 0.14432334899902344, 0.14964675903320312, 0.1549701690673828, 0.1602935791015625, 0.1656169891357422, 0.17094039916992188, 0.17626380920410156, 0.18158721923828125, 0.18691062927246094, 0.19223403930664062, 0.1975574493408203, 0.202880859375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 7.0, 7.0, 6.0, 8.0, 12.0, 15.0, 17.0, 26.0, 35.0, 45.0, 57.0, 97.0, 108.0, 117.0, 124.0, 82.0, 53.0, 39.0, 35.0, 14.0, 17.0, 15.0, 24.0, 6.0, 6.0, 4.0, 4.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.127197265625, -0.12171554565429688, -0.11623382568359375, -0.11075210571289062, -0.1052703857421875, -0.09978866577148438, -0.09430694580078125, -0.08882522583007812, -0.083343505859375, -0.07786178588867188, -0.07238006591796875, -0.06689834594726562, -0.0614166259765625, -0.055934906005859375, -0.05045318603515625, -0.044971466064453125, -0.03948974609375, -0.034008026123046875, -0.02852630615234375, -0.023044586181640625, -0.0175628662109375, -0.012081146240234375, -0.00659942626953125, -0.001117706298828125, 0.004364013671875, 0.009845733642578125, 0.01532745361328125, 0.020809173583984375, 0.0262908935546875, 0.031772613525390625, 0.03725433349609375, 0.042736053466796875, 0.0482177734375, 0.053699493408203125, 0.05918121337890625, 0.06466293334960938, 0.0701446533203125, 0.07562637329101562, 0.08110809326171875, 0.08658981323242188, 0.092071533203125, 0.09755325317382812, 0.10303497314453125, 0.10851669311523438, 0.1139984130859375, 0.11948013305664062, 0.12496185302734375, 0.13044357299804688, 0.13592529296875, 0.14140701293945312, 0.14688873291015625, 0.15237045288085938, 0.1578521728515625, 0.16333389282226562, 0.16881561279296875, 0.17429733276367188, 0.179779052734375, 0.18526077270507812, 0.19074249267578125, 0.19622421264648438, 0.2017059326171875, 0.20718765258789062, 0.21266937255859375, 0.21815109252929688, 0.2236328125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 14.0, 44.0, 141.0, 446.0, 219.0, 81.0, 17.0, 15.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.024956703186035, -8.797606468200684, -8.570255279541016, -8.342905044555664, -8.115553855895996, -7.888203144073486, -7.660852432250977, -7.433501720428467, -7.206151008605957, -6.978800296783447, -6.7514495849609375, -6.524098873138428, -6.296748161315918, -6.069397449493408, -5.842046737670898, -5.614696025848389, -5.387345314025879, -5.159994602203369, -4.932643890380859, -4.70529317855835, -4.47794246673584, -4.25059175491333, -4.02324104309082, -3.7958903312683105, -3.568540096282959, -3.341189384460449, -3.1138386726379395, -2.8864879608154297, -2.65913724899292, -2.43178653717041, -2.2044358253479004, -1.9770852327346802, -1.7497344017028809, -1.522383689880371, -1.2950329780578613, -1.0676822662353516, -0.8403316140174866, -0.6129809617996216, -0.3856302499771118, -0.15827953815460205, 0.06907117366790771, 0.2964218854904175, 0.5237725973129272, 0.7511232495307922, 0.978473961353302, 1.205824613571167, 1.4331753253936768, 1.6605260372161865, 1.8878767490386963, 2.115227460861206, 2.342578172683716, 2.5699288845062256, 2.7972795963287354, 3.024630069732666, 3.251980781555176, 3.4793314933776855, 3.7066822052001953, 3.934032917022705, 4.161383628845215, 4.388734340667725, 4.616085052490234, 4.843435764312744, 5.070786476135254, 5.298137187957764, 5.525487899780273]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 5.0, 3.0, 12.0, 3.0, 13.0, 10.0, 9.0, 18.0, 14.0, 19.0, 21.0, 27.0, 26.0, 37.0, 40.0, 41.0, 43.0, 60.0, 67.0, 85.0, 71.0, 50.0, 55.0, 36.0, 21.0, 25.0, 26.0, 31.0, 27.0, 15.0, 16.0, 11.0, 8.0, 11.0, 12.0, 11.0, 4.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.055661201477051, -1.980941891670227, -1.9062225818634033, -1.8315033912658691, -1.7567840814590454, -1.6820647716522217, -1.6073455810546875, -1.5326262712478638, -1.45790696144104, -1.3831876516342163, -1.3084683418273926, -1.2337491512298584, -1.1590298414230347, -1.084310531616211, -1.0095913410186768, -0.934872031211853, -0.8601527214050293, -0.7854334115982056, -0.7107141613960266, -0.6359949111938477, -0.5612756013870239, -0.4865563213825226, -0.41183704137802124, -0.3371177911758423, -0.26239848136901855, -0.1876792013645172, -0.11295992136001587, -0.038240641355514526, 0.036478638648986816, 0.11119791865348816, 0.1859171986579895, 0.26063644886016846, 0.3353555202484131, 0.41007480025291443, 0.48479408025741577, 0.5595133304595947, 0.6342326402664185, 0.7089519500732422, 0.7836712002754211, 0.8583904504776001, 0.9331097602844238, 1.0078290700912476, 1.0825483798980713, 1.1572675704956055, 1.2319868803024292, 1.306706190109253, 1.381425380706787, 1.4561446905136108, 1.5308640003204346, 1.6055833101272583, 1.680302619934082, 1.7550218105316162, 1.82974112033844, 1.9044604301452637, 1.9791796207427979, 2.053898811340332, 2.1286182403564453, 2.2033374309539795, 2.2780568599700928, 2.352776050567627, 2.4274954795837402, 2.5022146701812744, 2.5769338607788086, 2.651653289794922, 2.726372480392456]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 10.0, 13.0, 9.0, 22.0, 39.0, 48.0, 83.0, 123.0, 232.0, 476.0, 829.0, 1833.0, 4947.0, 15595.0, 78996.0, 1862591.0, 2121040.0, 81630.0, 16362.0, 5117.0, 2055.0, 948.0, 505.0, 286.0, 152.0, 112.0, 68.0, 49.0, 22.0, 19.0, 12.0, 15.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.359375, -0.3469886779785156, -0.33460235595703125, -0.3222160339355469, -0.3098297119140625, -0.2974433898925781, -0.28505706787109375, -0.2726707458496094, -0.260284423828125, -0.24789810180664062, -0.23551177978515625, -0.22312545776367188, -0.2107391357421875, -0.19835281372070312, -0.18596649169921875, -0.17358016967773438, -0.16119384765625, -0.14880752563476562, -0.13642120361328125, -0.12403488159179688, -0.1116485595703125, -0.09926223754882812, -0.08687591552734375, -0.07448959350585938, -0.062103271484375, -0.049716949462890625, -0.03733062744140625, -0.024944305419921875, -0.0125579833984375, -0.000171661376953125, 0.01221466064453125, 0.024600982666015625, 0.0369873046875, 0.049373626708984375, 0.06175994873046875, 0.07414627075195312, 0.0865325927734375, 0.09891891479492188, 0.11130523681640625, 0.12369155883789062, 0.136077880859375, 0.14846420288085938, 0.16085052490234375, 0.17323684692382812, 0.1856231689453125, 0.19800949096679688, 0.21039581298828125, 0.22278213500976562, 0.23516845703125, 0.24755477905273438, 0.25994110107421875, 0.2723274230957031, 0.2847137451171875, 0.2971000671386719, 0.30948638916015625, 0.3218727111816406, 0.334259033203125, 0.3466453552246094, 0.35903167724609375, 0.3714179992675781, 0.3838043212890625, 0.3961906433105469, 0.40857696533203125, 0.4209632873535156, 0.433349609375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 10.0, 9.0, 14.0, 24.0, 31.0, 32.0, 51.0, 58.0, 55.0, 78.0, 100.0, 95.0, 90.0, 56.0, 65.0, 59.0, 46.0, 33.0, 24.0, 23.0, 19.0, 13.0, 8.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.282958984375, -0.2747344970703125, -0.266510009765625, -0.2582855224609375, -0.25006103515625, -0.2418365478515625, -0.233612060546875, -0.2253875732421875, -0.2171630859375, -0.2089385986328125, -0.200714111328125, -0.1924896240234375, -0.18426513671875, -0.1760406494140625, -0.167816162109375, -0.1595916748046875, -0.1513671875, -0.1431427001953125, -0.134918212890625, -0.1266937255859375, -0.11846923828125, -0.1102447509765625, -0.102020263671875, -0.0937957763671875, -0.0855712890625, -0.0773468017578125, -0.069122314453125, -0.0608978271484375, -0.05267333984375, -0.0444488525390625, -0.036224365234375, -0.0279998779296875, -0.019775390625, -0.0115509033203125, -0.003326416015625, 0.0048980712890625, 0.01312255859375, 0.0213470458984375, 0.029571533203125, 0.0377960205078125, 0.0460205078125, 0.0542449951171875, 0.062469482421875, 0.0706939697265625, 0.07891845703125, 0.0871429443359375, 0.095367431640625, 0.1035919189453125, 0.11181640625, 0.1200408935546875, 0.128265380859375, 0.1364898681640625, 0.14471435546875, 0.1529388427734375, 0.161163330078125, 0.1693878173828125, 0.1776123046875, 0.1858367919921875, 0.194061279296875, 0.2022857666015625, 0.21051025390625, 0.2187347412109375, 0.226959228515625, 0.2351837158203125, 0.243408203125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 9.0, 6.0, 8.0, 10.0, 18.0, 20.0, 23.0, 29.0, 55.0, 88.0, 102.0, 207.0, 395.0, 982.0, 3606.0, 19123.0, 223546.0, 3786054.0, 140549.0, 14654.0, 2971.0, 918.0, 346.0, 192.0, 114.0, 79.0, 44.0, 33.0, 27.0, 15.0, 17.0, 14.0, 12.0, 8.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5478515625, -0.52984619140625, -0.5118408203125, -0.49383544921875, -0.475830078125, -0.45782470703125, -0.4398193359375, -0.42181396484375, -0.40380859375, -0.38580322265625, -0.3677978515625, -0.34979248046875, -0.331787109375, -0.31378173828125, -0.2957763671875, -0.27777099609375, -0.259765625, -0.24176025390625, -0.2237548828125, -0.20574951171875, -0.187744140625, -0.16973876953125, -0.1517333984375, -0.13372802734375, -0.11572265625, -0.09771728515625, -0.0797119140625, -0.06170654296875, -0.043701171875, -0.02569580078125, -0.0076904296875, 0.01031494140625, 0.0283203125, 0.04632568359375, 0.0643310546875, 0.08233642578125, 0.100341796875, 0.11834716796875, 0.1363525390625, 0.15435791015625, 0.17236328125, 0.19036865234375, 0.2083740234375, 0.22637939453125, 0.244384765625, 0.26239013671875, 0.2803955078125, 0.29840087890625, 0.31640625, 0.33441162109375, 0.3524169921875, 0.37042236328125, 0.388427734375, 0.40643310546875, 0.4244384765625, 0.44244384765625, 0.46044921875, 0.47845458984375, 0.4964599609375, 0.51446533203125, 0.532470703125, 0.55047607421875, 0.5684814453125, 0.58648681640625, 0.6044921875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 4.0, 6.0, 5.0, 6.0, 6.0, 11.0, 8.0, 19.0, 25.0, 35.0, 42.0, 46.0, 82.0, 108.0, 226.0, 387.0, 707.0, 912.0, 579.0, 306.0, 187.0, 81.0, 79.0, 53.0, 31.0, 36.0, 15.0, 13.0, 13.0, 10.0, 3.0, 5.0, 6.0, 6.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32177734375, -0.3099822998046875, -0.298187255859375, -0.2863922119140625, -0.27459716796875, -0.2628021240234375, -0.251007080078125, -0.2392120361328125, -0.2274169921875, -0.2156219482421875, -0.203826904296875, -0.1920318603515625, -0.18023681640625, -0.1684417724609375, -0.156646728515625, -0.1448516845703125, -0.133056640625, -0.1212615966796875, -0.109466552734375, -0.0976715087890625, -0.08587646484375, -0.0740814208984375, -0.062286376953125, -0.0504913330078125, -0.0386962890625, -0.0269012451171875, -0.015106201171875, -0.0033111572265625, 0.00848388671875, 0.0202789306640625, 0.032073974609375, 0.0438690185546875, 0.0556640625, 0.0674591064453125, 0.079254150390625, 0.0910491943359375, 0.10284423828125, 0.1146392822265625, 0.126434326171875, 0.1382293701171875, 0.1500244140625, 0.1618194580078125, 0.173614501953125, 0.1854095458984375, 0.19720458984375, 0.2089996337890625, 0.220794677734375, 0.2325897216796875, 0.244384765625, 0.2561798095703125, 0.267974853515625, 0.2797698974609375, 0.29156494140625, 0.3033599853515625, 0.315155029296875, 0.3269500732421875, 0.3387451171875, 0.3505401611328125, 0.362335205078125, 0.3741302490234375, 0.38592529296875, 0.3977203369140625, 0.409515380859375, 0.4213104248046875, 0.43310546875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 9.0, 31.0, 58.0, 156.0, 205.0, 197.0, 147.0, 92.0, 38.0, 23.0, 13.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564911365509033, -2.437615394592285, -2.310319185256958, -2.183022975921631, -2.055727005004883, -1.9284309148788452, -1.8011348247528076, -1.67383873462677, -1.5465426445007324, -1.4192465543746948, -1.2919504642486572, -1.1646543741226196, -1.037358283996582, -0.9100621938705444, -0.7827661037445068, -0.6554700136184692, -0.5281739234924316, -0.40087783336639404, -0.27358174324035645, -0.14628565311431885, -0.01898956298828125, 0.10830652713775635, 0.23560261726379395, 0.36289870738983154, 0.49019479751586914, 0.6174908876419067, 0.7447869777679443, 0.8720830678939819, 0.9993791580200195, 1.1266752481460571, 1.2539713382720947, 1.3812674283981323, 1.50856351852417, 1.6358596086502075, 1.7631556987762451, 1.8904517889022827, 2.0177478790283203, 2.1450438499450684, 2.2723400592803955, 2.3996362686157227, 2.5269322395324707, 2.6542282104492188, 2.781524419784546, 2.908820629119873, 3.036116600036621, 3.163412570953369, 3.2907087802886963, 3.4180049896240234, 3.5453009605407715, 3.6725969314575195, 3.7998931407928467, 3.927189350128174, 4.054485321044922, 4.18178129196167, 4.309077262878418, 4.436373710632324, 4.563669681549072, 4.69096565246582, 4.818262100219727, 4.945558071136475, 5.072854042053223, 5.200150012969971, 5.327445983886719, 5.454742431640625, 5.582038402557373]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 3.0, 4.0, 4.0, 7.0, 8.0, 10.0, 9.0, 18.0, 20.0, 17.0, 18.0, 28.0, 25.0, 30.0, 37.0, 38.0, 37.0, 45.0, 51.0, 52.0, 50.0, 53.0, 60.0, 46.0, 36.0, 32.0, 45.0, 23.0, 26.0, 25.0, 21.0, 23.0, 13.0, 18.0, 19.0, 16.0, 5.0, 8.0, 8.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0], "bins": [-1.9096438884735107, -1.860107183456421, -1.8105703592300415, -1.7610336542129517, -1.7114969491958618, -1.661960244178772, -1.6124234199523926, -1.5628867149353027, -1.513350009918213, -1.463813304901123, -1.4142764806747437, -1.3647397756576538, -1.315203070640564, -1.2656663656234741, -1.2161295413970947, -1.1665928363800049, -1.117056131362915, -1.0675194263458252, -1.0179826021194458, -0.968445897102356, -0.9189091920852661, -0.8693724274635315, -0.8198356628417969, -0.770298957824707, -0.7207621335983276, -0.671225368976593, -0.6216886639595032, -0.5721518993377686, -0.5226151943206787, -0.4730784296989441, -0.42354169487953186, -0.37400496006011963, -0.3244682550430298, -0.27493152022361755, -0.22539478540420532, -0.1758580356836319, -0.12632130086421967, -0.07678456604480743, -0.02724781632423401, 0.022288918495178223, 0.07182565331459045, 0.12136238813400269, 0.17089912295341492, 0.22043587267398834, 0.26997262239456177, 0.3195093274116516, 0.36904609203338623, 0.41858282685279846, 0.4681195616722107, 0.5176563262939453, 0.5671930313110352, 0.6167297959327698, 0.6662665009498596, 0.7158032655715942, 0.7653399705886841, 0.8148767352104187, 0.8644134998321533, 0.9139502644538879, 0.9634869694709778, 1.0130237340927124, 1.0625604391098022, 1.112097144126892, 1.1616339683532715, 1.2111706733703613, 1.2607073783874512]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 8.0, 9.0, 16.0, 17.0, 27.0, 40.0, 63.0, 121.0, 211.0, 382.0, 730.0, 1748.0, 4312.0, 13260.0, 49967.0, 262569.0, 557631.0, 118241.0, 26329.0, 7650.0, 2839.0, 1185.0, 519.0, 257.0, 157.0, 83.0, 53.0, 38.0, 27.0, 16.0, 13.0, 10.0, 6.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.55908203125, -0.5432319641113281, -0.5273818969726562, -0.5115318298339844, -0.4956817626953125, -0.4798316955566406, -0.46398162841796875, -0.4481315612792969, -0.432281494140625, -0.4164314270019531, -0.40058135986328125, -0.3847312927246094, -0.3688812255859375, -0.3530311584472656, -0.33718109130859375, -0.3213310241699219, -0.30548095703125, -0.2896308898925781, -0.27378082275390625, -0.2579307556152344, -0.2420806884765625, -0.22623062133789062, -0.21038055419921875, -0.19453048706054688, -0.178680419921875, -0.16283035278320312, -0.14698028564453125, -0.13113021850585938, -0.1152801513671875, -0.09943008422851562, -0.08358001708984375, -0.06772994995117188, -0.0518798828125, -0.036029815673828125, -0.02017974853515625, -0.004329681396484375, 0.0115203857421875, 0.027370452880859375, 0.04322052001953125, 0.059070587158203125, 0.074920654296875, 0.09077072143554688, 0.10662078857421875, 0.12247085571289062, 0.1383209228515625, 0.15417098999023438, 0.17002105712890625, 0.18587112426757812, 0.20172119140625, 0.21757125854492188, 0.23342132568359375, 0.24927139282226562, 0.2651214599609375, 0.2809715270996094, 0.29682159423828125, 0.3126716613769531, 0.328521728515625, 0.3443717956542969, 0.36022186279296875, 0.3760719299316406, 0.3919219970703125, 0.4077720642089844, 0.42362213134765625, 0.4394721984863281, 0.455322265625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 10.0, 6.0, 25.0, 26.0, 31.0, 27.0, 56.0, 57.0, 71.0, 73.0, 74.0, 93.0, 85.0, 66.0, 60.0, 44.0, 42.0, 38.0, 40.0, 25.0, 20.0, 17.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28271484375, -0.2745037078857422, -0.2662925720214844, -0.25808143615722656, -0.24987030029296875, -0.24165916442871094, -0.23344802856445312, -0.2252368927001953, -0.2170257568359375, -0.2088146209716797, -0.20060348510742188, -0.19239234924316406, -0.18418121337890625, -0.17597007751464844, -0.16775894165039062, -0.1595478057861328, -0.151336669921875, -0.1431255340576172, -0.13491439819335938, -0.12670326232910156, -0.11849212646484375, -0.11028099060058594, -0.10206985473632812, -0.09385871887207031, -0.0856475830078125, -0.07743644714355469, -0.06922531127929688, -0.06101417541503906, -0.05280303955078125, -0.04459190368652344, -0.036380767822265625, -0.028169631958007812, -0.01995849609375, -0.011747360229492188, -0.003536224365234375, 0.0046749114990234375, 0.01288604736328125, 0.021097183227539062, 0.029308319091796875, 0.03751945495605469, 0.0457305908203125, 0.05394172668457031, 0.062152862548828125, 0.07036399841308594, 0.07857513427734375, 0.08678627014160156, 0.09499740600585938, 0.10320854187011719, 0.111419677734375, 0.11963081359863281, 0.12784194946289062, 0.13605308532714844, 0.14426422119140625, 0.15247535705566406, 0.16068649291992188, 0.1688976287841797, 0.1771087646484375, 0.1853199005126953, 0.19353103637695312, 0.20174217224121094, 0.20995330810546875, 0.21816444396972656, 0.22637557983398438, 0.2345867156982422, 0.2427978515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 5.0, 3.0, 1.0, 9.0, 7.0, 11.0, 15.0, 26.0, 23.0, 42.0, 83.0, 136.0, 250.0, 541.0, 1324.0, 3884.0, 16296.0, 171782.0, 803394.0, 40124.0, 6954.0, 1986.0, 787.0, 374.0, 200.0, 95.0, 70.0, 39.0, 29.0, 17.0, 11.0, 10.0, 5.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.79931640625, -0.7759628295898438, -0.7526092529296875, -0.7292556762695312, -0.705902099609375, -0.6825485229492188, -0.6591949462890625, -0.6358413696289062, -0.61248779296875, -0.5891342163085938, -0.5657806396484375, -0.5424270629882812, -0.519073486328125, -0.49571990966796875, -0.4723663330078125, -0.44901275634765625, -0.4256591796875, -0.40230560302734375, -0.3789520263671875, -0.35559844970703125, -0.332244873046875, -0.30889129638671875, -0.2855377197265625, -0.26218414306640625, -0.23883056640625, -0.21547698974609375, -0.1921234130859375, -0.16876983642578125, -0.145416259765625, -0.12206268310546875, -0.0987091064453125, -0.07535552978515625, -0.052001953125, -0.02864837646484375, -0.0052947998046875, 0.01805877685546875, 0.041412353515625, 0.06476593017578125, 0.0881195068359375, 0.11147308349609375, 0.13482666015625, 0.15818023681640625, 0.1815338134765625, 0.20488739013671875, 0.228240966796875, 0.25159454345703125, 0.2749481201171875, 0.29830169677734375, 0.3216552734375, 0.34500885009765625, 0.3683624267578125, 0.39171600341796875, 0.415069580078125, 0.43842315673828125, 0.4617767333984375, 0.48513031005859375, 0.50848388671875, 0.5318374633789062, 0.5551910400390625, 0.5785446166992188, 0.601898193359375, 0.6252517700195312, 0.6486053466796875, 0.6719589233398438, 0.6953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 9.0, 6.0, 8.0, 14.0, 18.0, 23.0, 36.0, 26.0, 27.0, 48.0, 52.0, 54.0, 60.0, 68.0, 67.0, 72.0, 69.0, 56.0, 51.0, 47.0, 35.0, 27.0, 25.0, 17.0, 13.0, 16.0, 11.0, 9.0, 3.0, 5.0, 2.0, 3.0, 5.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.73974609375, -0.7147140502929688, -0.6896820068359375, -0.6646499633789062, -0.639617919921875, -0.6145858764648438, -0.5895538330078125, -0.5645217895507812, -0.53948974609375, -0.5144577026367188, -0.4894256591796875, -0.46439361572265625, -0.439361572265625, -0.41432952880859375, -0.3892974853515625, -0.36426544189453125, -0.3392333984375, -0.31420135498046875, -0.2891693115234375, -0.26413726806640625, -0.239105224609375, -0.21407318115234375, -0.1890411376953125, -0.16400909423828125, -0.13897705078125, -0.11394500732421875, -0.0889129638671875, -0.06388092041015625, -0.038848876953125, -0.01381683349609375, 0.0112152099609375, 0.03624725341796875, 0.061279296875, 0.08631134033203125, 0.1113433837890625, 0.13637542724609375, 0.161407470703125, 0.18643951416015625, 0.2114715576171875, 0.23650360107421875, 0.26153564453125, 0.28656768798828125, 0.3115997314453125, 0.33663177490234375, 0.361663818359375, 0.38669586181640625, 0.4117279052734375, 0.43675994873046875, 0.4617919921875, 0.48682403564453125, 0.5118560791015625, 0.5368881225585938, 0.561920166015625, 0.5869522094726562, 0.6119842529296875, 0.6370162963867188, 0.66204833984375, 0.6870803833007812, 0.7121124267578125, 0.7371444702148438, 0.762176513671875, 0.7872085571289062, 0.8122406005859375, 0.8372726440429688, 0.8623046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 5.0, 4.0, 6.0, 7.0, 3.0, 14.0, 16.0, 19.0, 30.0, 53.0, 103.0, 212.0, 497.0, 1451.0, 5098.0, 33994.0, 946305.0, 51821.0, 6161.0, 1601.0, 624.0, 219.0, 107.0, 55.0, 42.0, 19.0, 14.0, 11.0, 11.0, 7.0, 8.0, 6.0, 3.0, 1.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.351806640625, -0.3390464782714844, -0.32628631591796875, -0.3135261535644531, -0.3007659912109375, -0.2880058288574219, -0.27524566650390625, -0.2624855041503906, -0.249725341796875, -0.23696517944335938, -0.22420501708984375, -0.21144485473632812, -0.1986846923828125, -0.18592453002929688, -0.17316436767578125, -0.16040420532226562, -0.14764404296875, -0.13488388061523438, -0.12212371826171875, -0.10936355590820312, -0.0966033935546875, -0.08384323120117188, -0.07108306884765625, -0.058322906494140625, -0.045562744140625, -0.032802581787109375, -0.02004241943359375, -0.007282257080078125, 0.0054779052734375, 0.018238067626953125, 0.03099822998046875, 0.043758392333984375, 0.0565185546875, 0.06927871704101562, 0.08203887939453125, 0.09479904174804688, 0.1075592041015625, 0.12031936645507812, 0.13307952880859375, 0.14583969116210938, 0.158599853515625, 0.17136001586914062, 0.18412017822265625, 0.19688034057617188, 0.2096405029296875, 0.22240066528320312, 0.23516082763671875, 0.24792098999023438, 0.26068115234375, 0.2734413146972656, 0.28620147705078125, 0.2989616394042969, 0.3117218017578125, 0.3244819641113281, 0.33724212646484375, 0.3500022888183594, 0.362762451171875, 0.3755226135253906, 0.38828277587890625, 0.4010429382324219, 0.4138031005859375, 0.4265632629394531, 0.43932342529296875, 0.4520835876464844, 0.46484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 0.0, 3.0, 2.0, 3.0, 8.0, 9.0, 10.0, 8.0, 15.0, 18.0, 14.0, 25.0, 23.0, 29.0, 23.0, 41.0, 69.0, 76.0, 97.0, 105.0, 90.0, 71.0, 44.0, 34.0, 35.0, 23.0, 20.0, 19.0, 14.0, 11.0, 11.0, 12.0, 8.0, 13.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.61611557006836e-05, -6.39650970697403e-05, -6.1769038438797e-05, -5.95729798078537e-05, -5.73769211769104e-05, -5.51808625459671e-05, -5.2984803915023804e-05, -5.0788745284080505e-05, -4.859268665313721e-05, -4.639662802219391e-05, -4.420056939125061e-05, -4.200451076030731e-05, -3.9808452129364014e-05, -3.7612393498420715e-05, -3.541633486747742e-05, -3.322027623653412e-05, -3.102421760559082e-05, -2.8828158974647522e-05, -2.6632100343704224e-05, -2.4436041712760925e-05, -2.2239983081817627e-05, -2.004392445087433e-05, -1.784786581993103e-05, -1.5651807188987732e-05, -1.3455748558044434e-05, -1.1259689927101135e-05, -9.063631296157837e-06, -6.8675726652145386e-06, -4.67151403427124e-06, -2.475455403327942e-06, -2.7939677238464355e-07, 1.9166618585586548e-06, 4.112720489501953e-06, 6.3087791204452515e-06, 8.50483775138855e-06, 1.0700896382331848e-05, 1.2896955013275146e-05, 1.5093013644218445e-05, 1.7289072275161743e-05, 1.948513090610504e-05, 2.168118953704834e-05, 2.3877248167991638e-05, 2.6073306798934937e-05, 2.8269365429878235e-05, 3.0465424060821533e-05, 3.266148269176483e-05, 3.485754132270813e-05, 3.705359995365143e-05, 3.9249658584594727e-05, 4.1445717215538025e-05, 4.364177584648132e-05, 4.583783447742462e-05, 4.803389310836792e-05, 5.022995173931122e-05, 5.2426010370254517e-05, 5.4622069001197815e-05, 5.681812763214111e-05, 5.901418626308441e-05, 6.121024489402771e-05, 6.340630352497101e-05, 6.56023621559143e-05, 6.77984207868576e-05, 6.99944794178009e-05, 7.21905380487442e-05, 7.43865966796875e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 7.0, 8.0, 2.0, 8.0, 9.0, 11.0, 20.0, 29.0, 33.0, 46.0, 61.0, 92.0, 137.0, 213.0, 390.0, 713.0, 1347.0, 2838.0, 8134.0, 51867.0, 906066.0, 61419.0, 8757.0, 3008.0, 1469.0, 716.0, 409.0, 229.0, 148.0, 104.0, 53.0, 66.0, 34.0, 21.0, 16.0, 13.0, 9.0, 11.0, 12.0, 6.0, 1.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.334228515625, -0.3242607116699219, -0.31429290771484375, -0.3043251037597656, -0.2943572998046875, -0.2843894958496094, -0.27442169189453125, -0.2644538879394531, -0.254486083984375, -0.24451828002929688, -0.23455047607421875, -0.22458267211914062, -0.2146148681640625, -0.20464706420898438, -0.19467926025390625, -0.18471145629882812, -0.17474365234375, -0.16477584838867188, -0.15480804443359375, -0.14484024047851562, -0.1348724365234375, -0.12490463256835938, -0.11493682861328125, -0.10496902465820312, -0.095001220703125, -0.08503341674804688, -0.07506561279296875, -0.06509780883789062, -0.0551300048828125, -0.045162200927734375, -0.03519439697265625, -0.025226593017578125, -0.0152587890625, -0.005290985107421875, 0.00467681884765625, 0.014644622802734375, 0.0246124267578125, 0.034580230712890625, 0.04454803466796875, 0.054515838623046875, 0.064483642578125, 0.07445144653320312, 0.08441925048828125, 0.09438705444335938, 0.1043548583984375, 0.11432266235351562, 0.12429046630859375, 0.13425827026367188, 0.14422607421875, 0.15419387817382812, 0.16416168212890625, 0.17412948608398438, 0.1840972900390625, 0.19406509399414062, 0.20403289794921875, 0.21400070190429688, 0.223968505859375, 0.23393630981445312, 0.24390411376953125, 0.2538719177246094, 0.2638397216796875, 0.2738075256347656, 0.28377532958984375, 0.2937431335449219, 0.3037109375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 8.0, 13.0, 17.0, 33.0, 50.0, 114.0, 218.0, 233.0, 127.0, 73.0, 36.0, 16.0, 15.0, 8.0, 6.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39599609375, -0.3840599060058594, -0.37212371826171875, -0.3601875305175781, -0.3482513427734375, -0.3363151550292969, -0.32437896728515625, -0.3124427795410156, -0.300506591796875, -0.2885704040527344, -0.27663421630859375, -0.2646980285644531, -0.2527618408203125, -0.24082565307617188, -0.22888946533203125, -0.21695327758789062, -0.20501708984375, -0.19308090209960938, -0.18114471435546875, -0.16920852661132812, -0.1572723388671875, -0.14533615112304688, -0.13339996337890625, -0.12146377563476562, -0.109527587890625, -0.09759140014648438, -0.08565521240234375, -0.07371902465820312, -0.0617828369140625, -0.049846649169921875, -0.03791046142578125, -0.025974273681640625, -0.0140380859375, -0.002101898193359375, 0.00983428955078125, 0.021770477294921875, 0.0337066650390625, 0.045642852783203125, 0.05757904052734375, 0.06951522827148438, 0.081451416015625, 0.09338760375976562, 0.10532379150390625, 0.11725997924804688, 0.1291961669921875, 0.14113235473632812, 0.15306854248046875, 0.16500473022460938, 0.17694091796875, 0.18887710571289062, 0.20081329345703125, 0.21274948120117188, 0.2246856689453125, 0.23662185668945312, 0.24855804443359375, 0.2604942321777344, 0.272430419921875, 0.2843666076660156, 0.29630279541015625, 0.3082389831542969, 0.3201751708984375, 0.3321113586425781, 0.34404754638671875, 0.3559837341308594, 0.367919921875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 4.0, 17.0, 73.0, 295.0, 436.0, 120.0, 26.0, 10.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.787864685058594, -11.461349487304688, -11.134834289550781, -10.808319091796875, -10.481803894042969, -10.155288696289062, -9.828773498535156, -9.50225830078125, -9.175743103027344, -8.849227905273438, -8.522712707519531, -8.196197509765625, -7.869682312011719, -7.5431671142578125, -7.2166523933410645, -6.890137195587158, -6.56362247467041, -6.237107276916504, -5.910592079162598, -5.584076881408691, -5.257561683654785, -4.931046485900879, -4.604531764984131, -4.278016567230225, -3.9515013694763184, -3.624986171722412, -3.298470973968506, -2.9719560146331787, -2.6454408168792725, -2.318925619125366, -1.9924105405807495, -1.6658954620361328, -1.3393802642822266, -1.0128650665283203, -0.6863499879837036, -0.35983484983444214, -0.033319711685180664, 0.2931954860687256, 0.6197105646133423, 0.946225643157959, 1.2727408409118652, 1.5992560386657715, 1.9257711172103882, 2.252286195755005, 2.578801393508911, 2.9053165912628174, 3.2318315505981445, 3.558346748352051, 3.884861946105957, 4.211377143859863, 4.5378923416137695, 4.864407539367676, 5.190922737121582, 5.517437934875488, 5.843952655792236, 6.170467853546143, 6.496983051300049, 6.823498249053955, 7.150013446807861, 7.476528644561768, 7.803043365478516, 8.129558563232422, 8.456073760986328, 8.782588958740234, 9.10910415649414]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 10.0, 15.0, 9.0, 17.0, 27.0, 26.0, 29.0, 28.0, 46.0, 56.0, 57.0, 84.0, 130.0, 106.0, 81.0, 55.0, 42.0, 32.0, 29.0, 32.0, 24.0, 14.0, 10.0, 13.0, 11.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1053006649017334, -2.9970927238464355, -2.8888845443725586, -2.7806766033172607, -2.672468423843384, -2.564260482788086, -2.456052303314209, -2.347844362258911, -2.2396364212036133, -2.1314284801483154, -2.0232203006744385, -1.9150123596191406, -1.8068042993545532, -1.6985962390899658, -1.5903881788253784, -1.482180118560791, -1.3739720582962036, -1.2657639980316162, -1.1575559377670288, -1.0493478775024414, -0.9411399364471436, -0.8329318761825562, -0.7247238159179688, -0.6165158152580261, -0.5083077549934387, -0.4000997245311737, -0.2918916940689087, -0.1836836338043213, -0.07547560334205627, 0.03273242712020874, 0.14094048738479614, 0.24914848804473877, 0.35735654830932617, 0.4655645787715912, 0.5737726092338562, 0.6819806694984436, 0.7901886701583862, 0.8983967304229736, 1.006604790687561, 1.1148128509521484, 1.2230207920074463, 1.3312288522720337, 1.439436912536621, 1.547644853591919, 1.6558529138565063, 1.7640609741210938, 1.8722690343856812, 1.9804770946502686, 2.0886850357055664, 2.1968929767608643, 2.305101156234741, 2.413309097290039, 2.521517276763916, 2.629725217819214, 2.7379331588745117, 2.8461413383483887, 2.9543495178222656, 3.0625574588775635, 3.1707656383514404, 3.2789735794067383, 3.3871817588806152, 3.495389699935913, 3.603597640991211, 3.711805820465088, 3.8200137615203857]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 8.0, 2.0, 4.0, 6.0, 7.0, 21.0, 12.0, 32.0, 53.0, 81.0, 159.0, 286.0, 649.0, 1619.0, 5699.0, 30079.0, 479366.0, 3471106.0, 180894.0, 17869.0, 3916.0, 1294.0, 530.0, 258.0, 128.0, 68.0, 46.0, 33.0, 26.0, 11.0, 9.0, 5.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89111328125, -0.8651809692382812, -0.8392486572265625, -0.8133163452148438, -0.787384033203125, -0.7614517211914062, -0.7355194091796875, -0.7095870971679688, -0.68365478515625, -0.6577224731445312, -0.6317901611328125, -0.6058578491210938, -0.579925537109375, -0.5539932250976562, -0.5280609130859375, -0.5021286010742188, -0.4761962890625, -0.45026397705078125, -0.4243316650390625, -0.39839935302734375, -0.372467041015625, -0.34653472900390625, -0.3206024169921875, -0.29467010498046875, -0.26873779296875, -0.24280548095703125, -0.2168731689453125, -0.19094085693359375, -0.165008544921875, -0.13907623291015625, -0.1131439208984375, -0.08721160888671875, -0.061279296875, -0.03534698486328125, -0.0094146728515625, 0.01651763916015625, 0.042449951171875, 0.06838226318359375, 0.0943145751953125, 0.12024688720703125, 0.14617919921875, 0.17211151123046875, 0.1980438232421875, 0.22397613525390625, 0.249908447265625, 0.27584075927734375, 0.3017730712890625, 0.32770538330078125, 0.3536376953125, 0.37957000732421875, 0.4055023193359375, 0.43143463134765625, 0.457366943359375, 0.48329925537109375, 0.5092315673828125, 0.5351638793945312, 0.56109619140625, 0.5870285034179688, 0.6129608154296875, 0.6388931274414062, 0.664825439453125, 0.6907577514648438, 0.7166900634765625, 0.7426223754882812, 0.7685546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 10.0, 11.0, 18.0, 29.0, 21.0, 19.0, 32.0, 41.0, 50.0, 57.0, 62.0, 78.0, 62.0, 74.0, 74.0, 56.0, 47.0, 58.0, 34.0, 37.0, 35.0, 22.0, 22.0, 14.0, 13.0, 12.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15185546875, -0.1450042724609375, -0.138153076171875, -0.1313018798828125, -0.12445068359375, -0.1175994873046875, -0.110748291015625, -0.1038970947265625, -0.0970458984375, -0.0901947021484375, -0.083343505859375, -0.0764923095703125, -0.06964111328125, -0.0627899169921875, -0.055938720703125, -0.0490875244140625, -0.042236328125, -0.0353851318359375, -0.028533935546875, -0.0216827392578125, -0.01483154296875, -0.0079803466796875, -0.001129150390625, 0.0057220458984375, 0.0125732421875, 0.0194244384765625, 0.026275634765625, 0.0331268310546875, 0.03997802734375, 0.0468292236328125, 0.053680419921875, 0.0605316162109375, 0.0673828125, 0.0742340087890625, 0.081085205078125, 0.0879364013671875, 0.09478759765625, 0.1016387939453125, 0.108489990234375, 0.1153411865234375, 0.1221923828125, 0.1290435791015625, 0.135894775390625, 0.1427459716796875, 0.14959716796875, 0.1564483642578125, 0.163299560546875, 0.1701507568359375, 0.177001953125, 0.1838531494140625, 0.190704345703125, 0.1975555419921875, 0.20440673828125, 0.2112579345703125, 0.218109130859375, 0.2249603271484375, 0.2318115234375, 0.2386627197265625, 0.245513916015625, 0.2523651123046875, 0.25921630859375, 0.2660675048828125, 0.272918701171875, 0.2797698974609375, 0.28662109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 8.0, 9.0, 11.0, 8.0, 16.0, 11.0, 33.0, 37.0, 68.0, 126.0, 190.0, 354.0, 730.0, 1801.0, 4852.0, 27935.0, 2342841.0, 1780808.0, 26325.0, 4745.0, 1677.0, 797.0, 357.0, 199.0, 103.0, 76.0, 42.0, 22.0, 17.0, 15.0, 12.0, 10.0, 10.0, 4.0, 7.0, 4.0, 1.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3681640625, -1.3290557861328125, -1.289947509765625, -1.2508392333984375, -1.21173095703125, -1.1726226806640625, -1.133514404296875, -1.0944061279296875, -1.0552978515625, -1.0161895751953125, -0.977081298828125, -0.9379730224609375, -0.89886474609375, -0.8597564697265625, -0.820648193359375, -0.7815399169921875, -0.742431640625, -0.7033233642578125, -0.664215087890625, -0.6251068115234375, -0.58599853515625, -0.5468902587890625, -0.507781982421875, -0.4686737060546875, -0.4295654296875, -0.3904571533203125, -0.351348876953125, -0.3122406005859375, -0.27313232421875, -0.2340240478515625, -0.194915771484375, -0.1558074951171875, -0.11669921875, -0.0775909423828125, -0.038482666015625, 0.0006256103515625, 0.03973388671875, 0.0788421630859375, 0.117950439453125, 0.1570587158203125, 0.1961669921875, 0.2352752685546875, 0.274383544921875, 0.3134918212890625, 0.35260009765625, 0.3917083740234375, 0.430816650390625, 0.4699249267578125, 0.509033203125, 0.5481414794921875, 0.587249755859375, 0.6263580322265625, 0.66546630859375, 0.7045745849609375, 0.743682861328125, 0.7827911376953125, 0.8218994140625, 0.8610076904296875, 0.900115966796875, 0.9392242431640625, 0.97833251953125, 1.0174407958984375, 1.056549072265625, 1.0956573486328125, 1.134765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 4.0, 7.0, 22.0, 22.0, 44.0, 74.0, 118.0, 207.0, 425.0, 787.0, 998.0, 607.0, 322.0, 176.0, 113.0, 48.0, 36.0, 15.0, 10.0, 10.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89697265625, -0.8599014282226562, -0.8228302001953125, -0.7857589721679688, -0.748687744140625, -0.7116165161132812, -0.6745452880859375, -0.6374740600585938, -0.60040283203125, -0.5633316040039062, -0.5262603759765625, -0.48918914794921875, -0.452117919921875, -0.41504669189453125, -0.3779754638671875, -0.34090423583984375, -0.3038330078125, -0.26676177978515625, -0.2296905517578125, -0.19261932373046875, -0.155548095703125, -0.11847686767578125, -0.0814056396484375, -0.04433441162109375, -0.00726318359375, 0.02980804443359375, 0.0668792724609375, 0.10395050048828125, 0.141021728515625, 0.17809295654296875, 0.2151641845703125, 0.25223541259765625, 0.289306640625, 0.32637786865234375, 0.3634490966796875, 0.40052032470703125, 0.437591552734375, 0.47466278076171875, 0.5117340087890625, 0.5488052368164062, 0.58587646484375, 0.6229476928710938, 0.6600189208984375, 0.6970901489257812, 0.734161376953125, 0.7712326049804688, 0.8083038330078125, 0.8453750610351562, 0.8824462890625, 0.9195175170898438, 0.9565887451171875, 0.9936599731445312, 1.030731201171875, 1.0678024291992188, 1.1048736572265625, 1.1419448852539062, 1.17901611328125, 1.2160873413085938, 1.2531585693359375, 1.2902297973632812, 1.327301025390625, 1.3643722534179688, 1.4014434814453125, 1.4385147094726562, 1.4755859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 8.0, 3.0, 10.0, 13.0, 35.0, 48.0, 151.0, 269.0, 233.0, 117.0, 54.0, 27.0, 8.0, 9.0, 2.0, 5.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.487607955932617, -14.043328285217285, -13.599048614501953, -13.154767990112305, -12.710488319396973, -12.26620864868164, -11.821928977966309, -11.377649307250977, -10.933368682861328, -10.489089012145996, -10.044809341430664, -9.600528717041016, -9.156249046325684, -8.711969375610352, -8.26768970489502, -7.8234100341796875, -7.3791303634643555, -6.934850692749023, -6.490570545196533, -6.046290874481201, -5.602010726928711, -5.157731056213379, -4.713451385498047, -4.269171714782715, -3.8248915672302246, -3.3806116580963135, -2.9363317489624023, -2.4920520782470703, -2.047772169113159, -1.603492259979248, -1.159212589263916, -0.7149326801300049, -0.27065181732177734, 0.173628032207489, 0.6179078817367554, 1.062187671661377, 1.506467580795288, 1.9507474899291992, 2.3950271606445312, 2.8393070697784424, 3.2835869789123535, 3.7278668880462646, 4.172146797180176, 4.616426467895508, 5.06070613861084, 5.50498628616333, 5.949265956878662, 6.393546104431152, 6.837825775146484, 7.282105445861816, 7.726385593414307, 8.170665740966797, 8.614945411682129, 9.059225082397461, 9.503504753112793, 9.947784423828125, 10.392065048217773, 10.836344718933105, 11.280624389648438, 11.724905014038086, 12.169184684753418, 12.61346435546875, 13.057744026184082, 13.502023696899414, 13.946303367614746]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 3.0, 12.0, 17.0, 19.0, 22.0, 24.0, 43.0, 45.0, 54.0, 70.0, 72.0, 87.0, 87.0, 91.0, 77.0, 70.0, 53.0, 38.0, 31.0, 25.0, 14.0, 20.0, 6.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.083523750305176, -7.839505672454834, -7.595487117767334, -7.351469039916992, -7.10745096206665, -6.863432884216309, -6.619414329528809, -6.375396251678467, -6.131378173828125, -5.887360095977783, -5.643341541290283, -5.399323463439941, -5.1553053855896, -4.911287307739258, -4.667268753051758, -4.423250675201416, -4.179232120513916, -3.935213804244995, -3.6911957263946533, -3.4471774101257324, -3.2031593322753906, -2.9591410160064697, -2.715122699737549, -2.471104621887207, -2.227086305618286, -1.9830681085586548, -1.7390499114990234, -1.4950315952301025, -1.2510133981704712, -1.0069952011108398, -0.762976884841919, -0.5189586877822876, -0.27494049072265625, -0.030922263860702515, 0.21309596300125122, 0.45711421966552734, 0.7011324167251587, 0.94515061378479, 1.189168930053711, 1.4331871271133423, 1.6772053241729736, 1.921223521232605, 2.1652417182922363, 2.4092600345611572, 2.653278350830078, 2.89729642868042, 3.141314744949341, 3.3853330612182617, 3.6293511390686035, 3.8733694553375244, 4.117387771606445, 4.361405849456787, 4.605423927307129, 4.849442481994629, 5.093460559844971, 5.3374786376953125, 5.5814971923828125, 5.825515270233154, 6.069533824920654, 6.313551902770996, 6.557569980621338, 6.80158805847168, 7.04560661315918, 7.2896246910095215, 7.533642768859863]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 6.0, 17.0, 17.0, 30.0, 26.0, 44.0, 77.0, 160.0, 210.0, 353.0, 740.0, 1579.0, 3722.0, 11115.0, 41219.0, 243979.0, 604639.0, 106388.0, 22605.0, 6593.0, 2595.0, 1139.0, 550.0, 303.0, 158.0, 107.0, 56.0, 32.0, 24.0, 23.0, 18.0, 9.0, 10.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.414306640625, -0.40256500244140625, -0.3908233642578125, -0.37908172607421875, -0.367340087890625, -0.35559844970703125, -0.3438568115234375, -0.33211517333984375, -0.32037353515625, -0.30863189697265625, -0.2968902587890625, -0.28514862060546875, -0.273406982421875, -0.26166534423828125, -0.2499237060546875, -0.23818206787109375, -0.2264404296875, -0.21469879150390625, -0.2029571533203125, -0.19121551513671875, -0.179473876953125, -0.16773223876953125, -0.1559906005859375, -0.14424896240234375, -0.13250732421875, -0.12076568603515625, -0.1090240478515625, -0.09728240966796875, -0.085540771484375, -0.07379913330078125, -0.0620574951171875, -0.05031585693359375, -0.03857421875, -0.02683258056640625, -0.0150909423828125, -0.00334930419921875, 0.008392333984375, 0.02013397216796875, 0.0318756103515625, 0.04361724853515625, 0.05535888671875, 0.06710052490234375, 0.0788421630859375, 0.09058380126953125, 0.102325439453125, 0.11406707763671875, 0.1258087158203125, 0.13755035400390625, 0.1492919921875, 0.16103363037109375, 0.1727752685546875, 0.18451690673828125, 0.196258544921875, 0.20800018310546875, 0.2197418212890625, 0.23148345947265625, 0.24322509765625, 0.25496673583984375, 0.2667083740234375, 0.27845001220703125, 0.290191650390625, 0.30193328857421875, 0.3136749267578125, 0.32541656494140625, 0.337158203125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 9.0, 9.0, 20.0, 24.0, 34.0, 52.0, 50.0, 69.0, 81.0, 73.0, 73.0, 110.0, 96.0, 67.0, 64.0, 52.0, 34.0, 31.0, 20.0, 16.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.361083984375, -0.34853363037109375, -0.3359832763671875, -0.32343292236328125, -0.310882568359375, -0.29833221435546875, -0.2857818603515625, -0.27323150634765625, -0.26068115234375, -0.24813079833984375, -0.2355804443359375, -0.22303009033203125, -0.210479736328125, -0.19792938232421875, -0.1853790283203125, -0.17282867431640625, -0.1602783203125, -0.14772796630859375, -0.1351776123046875, -0.12262725830078125, -0.110076904296875, -0.09752655029296875, -0.0849761962890625, -0.07242584228515625, -0.05987548828125, -0.04732513427734375, -0.0347747802734375, -0.02222442626953125, -0.009674072265625, 0.00287628173828125, 0.0154266357421875, 0.02797698974609375, 0.04052734375, 0.05307769775390625, 0.0656280517578125, 0.07817840576171875, 0.090728759765625, 0.10327911376953125, 0.1158294677734375, 0.12837982177734375, 0.14093017578125, 0.15348052978515625, 0.1660308837890625, 0.17858123779296875, 0.191131591796875, 0.20368194580078125, 0.2162322998046875, 0.22878265380859375, 0.2413330078125, 0.25388336181640625, 0.2664337158203125, 0.27898406982421875, 0.291534423828125, 0.30408477783203125, 0.3166351318359375, 0.32918548583984375, 0.34173583984375, 0.35428619384765625, 0.3668365478515625, 0.37938690185546875, 0.391937255859375, 0.40448760986328125, 0.4170379638671875, 0.42958831787109375, 0.442138671875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 6.0, 9.0, 5.0, 11.0, 18.0, 21.0, 57.0, 65.0, 111.0, 217.0, 494.0, 1269.0, 4957.0, 41759.0, 927159.0, 63294.0, 6406.0, 1576.0, 532.0, 257.0, 125.0, 68.0, 54.0, 27.0, 20.0, 15.0, 12.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67919921875, -0.6595535278320312, -0.6399078369140625, -0.6202621459960938, -0.600616455078125, -0.5809707641601562, -0.5613250732421875, -0.5416793823242188, -0.52203369140625, -0.5023880004882812, -0.4827423095703125, -0.46309661865234375, -0.443450927734375, -0.42380523681640625, -0.4041595458984375, -0.38451385498046875, -0.3648681640625, -0.34522247314453125, -0.3255767822265625, -0.30593109130859375, -0.286285400390625, -0.26663970947265625, -0.2469940185546875, -0.22734832763671875, -0.20770263671875, -0.18805694580078125, -0.1684112548828125, -0.14876556396484375, -0.129119873046875, -0.10947418212890625, -0.0898284912109375, -0.07018280029296875, -0.050537109375, -0.03089141845703125, -0.0112457275390625, 0.00839996337890625, 0.028045654296875, 0.04769134521484375, 0.0673370361328125, 0.08698272705078125, 0.10662841796875, 0.12627410888671875, 0.1459197998046875, 0.16556549072265625, 0.185211181640625, 0.20485687255859375, 0.2245025634765625, 0.24414825439453125, 0.2637939453125, 0.28343963623046875, 0.3030853271484375, 0.32273101806640625, 0.342376708984375, 0.36202239990234375, 0.3816680908203125, 0.40131378173828125, 0.42095947265625, 0.44060516357421875, 0.4602508544921875, 0.47989654541015625, 0.499542236328125, 0.5191879272460938, 0.5388336181640625, 0.5584793090820312, 0.578125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 11.0, 5.0, 4.0, 10.0, 14.0, 26.0, 29.0, 33.0, 28.0, 43.0, 80.0, 86.0, 109.0, 120.0, 83.0, 90.0, 54.0, 46.0, 32.0, 27.0, 21.0, 11.0, 10.0, 14.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.490234375, -1.44403076171875, -1.3978271484375, -1.35162353515625, -1.305419921875, -1.25921630859375, -1.2130126953125, -1.16680908203125, -1.12060546875, -1.07440185546875, -1.0281982421875, -0.98199462890625, -0.935791015625, -0.88958740234375, -0.8433837890625, -0.79718017578125, -0.7509765625, -0.70477294921875, -0.6585693359375, -0.61236572265625, -0.566162109375, -0.51995849609375, -0.4737548828125, -0.42755126953125, -0.38134765625, -0.33514404296875, -0.2889404296875, -0.24273681640625, -0.196533203125, -0.15032958984375, -0.1041259765625, -0.05792236328125, -0.01171875, 0.03448486328125, 0.0806884765625, 0.12689208984375, 0.173095703125, 0.21929931640625, 0.2655029296875, 0.31170654296875, 0.35791015625, 0.40411376953125, 0.4503173828125, 0.49652099609375, 0.542724609375, 0.58892822265625, 0.6351318359375, 0.68133544921875, 0.7275390625, 0.77374267578125, 0.8199462890625, 0.86614990234375, 0.912353515625, 0.95855712890625, 1.0047607421875, 1.05096435546875, 1.09716796875, 1.14337158203125, 1.1895751953125, 1.23577880859375, 1.281982421875, 1.32818603515625, 1.3743896484375, 1.42059326171875, 1.466796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 5.0, 7.0, 11.0, 14.0, 15.0, 24.0, 43.0, 31.0, 63.0, 89.0, 149.0, 223.0, 389.0, 735.0, 1512.0, 3619.0, 9903.0, 39305.0, 779845.0, 175079.0, 24639.0, 7394.0, 2721.0, 1173.0, 594.0, 361.0, 202.0, 138.0, 69.0, 51.0, 42.0, 33.0, 20.0, 6.0, 13.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06195068359375, -0.05987548828125, -0.05780029296875, -0.05572509765625, -0.05364990234375, -0.05157470703125, -0.04949951171875, -0.04742431640625, -0.04534912109375, -0.04327392578125, -0.04119873046875, -0.03912353515625, -0.03704833984375, -0.03497314453125, -0.03289794921875, -0.03082275390625, -0.02874755859375, -0.02667236328125, -0.02459716796875, -0.02252197265625, -0.02044677734375, -0.01837158203125, -0.01629638671875, -0.01422119140625, -0.01214599609375, -0.01007080078125, -0.00799560546875, -0.00592041015625, -0.00384521484375, -0.00177001953125, 0.00030517578125, 0.00238037109375, 0.00445556640625, 0.00653076171875, 0.00860595703125, 0.01068115234375, 0.01275634765625, 0.01483154296875, 0.01690673828125, 0.01898193359375, 0.02105712890625, 0.02313232421875, 0.02520751953125, 0.02728271484375, 0.02935791015625, 0.03143310546875, 0.03350830078125, 0.03558349609375, 0.03765869140625, 0.03973388671875, 0.04180908203125, 0.04388427734375, 0.04595947265625, 0.04803466796875, 0.05010986328125, 0.05218505859375, 0.05426025390625, 0.05633544921875, 0.05841064453125, 0.06048583984375, 0.06256103515625, 0.06463623046875, 0.06671142578125, 0.06878662109375, 0.07086181640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 9.0, 5.0, 4.0, 8.0, 5.0, 14.0, 14.0, 20.0, 27.0, 33.0, 59.0, 73.0, 87.0, 92.0, 87.0, 95.0, 89.0, 58.0, 51.0, 29.0, 30.0, 16.0, 14.0, 18.0, 9.0, 9.0, 9.0, 8.0, 1.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3543834686279297e-05, -2.2739171981811523e-05, -2.193450927734375e-05, -2.1129846572875977e-05, -2.0325183868408203e-05, -1.952052116394043e-05, -1.8715858459472656e-05, -1.7911195755004883e-05, -1.710653305053711e-05, -1.6301870346069336e-05, -1.5497207641601562e-05, -1.4692544937133789e-05, -1.3887882232666016e-05, -1.3083219528198242e-05, -1.2278556823730469e-05, -1.1473894119262695e-05, -1.0669231414794922e-05, -9.864568710327148e-06, -9.059906005859375e-06, -8.255243301391602e-06, -7.450580596923828e-06, -6.645917892456055e-06, -5.841255187988281e-06, -5.036592483520508e-06, -4.231929779052734e-06, -3.427267074584961e-06, -2.6226043701171875e-06, -1.817941665649414e-06, -1.0132789611816406e-06, -2.086162567138672e-07, 5.960464477539062e-07, 1.4007091522216797e-06, 2.205371856689453e-06, 3.0100345611572266e-06, 3.814697265625e-06, 4.6193599700927734e-06, 5.424022674560547e-06, 6.22868537902832e-06, 7.033348083496094e-06, 7.838010787963867e-06, 8.64267349243164e-06, 9.447336196899414e-06, 1.0251998901367188e-05, 1.1056661605834961e-05, 1.1861324310302734e-05, 1.2665987014770508e-05, 1.3470649719238281e-05, 1.4275312423706055e-05, 1.5079975128173828e-05, 1.58846378326416e-05, 1.6689300537109375e-05, 1.749396324157715e-05, 1.8298625946044922e-05, 1.9103288650512695e-05, 1.990795135498047e-05, 2.0712614059448242e-05, 2.1517276763916016e-05, 2.232193946838379e-05, 2.3126602172851562e-05, 2.3931264877319336e-05, 2.473592758178711e-05, 2.5540590286254883e-05, 2.6345252990722656e-05, 2.714991569519043e-05, 2.7954578399658203e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 5.0, 4.0, 10.0, 15.0, 12.0, 22.0, 32.0, 47.0, 76.0, 122.0, 217.0, 323.0, 697.0, 1242.0, 2780.0, 6594.0, 20306.0, 93633.0, 819907.0, 73873.0, 17553.0, 6072.0, 2501.0, 1131.0, 586.0, 305.0, 177.0, 106.0, 69.0, 41.0, 20.0, 20.0, 14.0, 11.0, 7.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07025146484375, -0.06815052032470703, -0.06604957580566406, -0.0639486312866211, -0.061847686767578125, -0.059746742248535156, -0.05764579772949219, -0.05554485321044922, -0.05344390869140625, -0.05134296417236328, -0.04924201965332031, -0.047141075134277344, -0.045040130615234375, -0.042939186096191406, -0.04083824157714844, -0.03873729705810547, -0.0366363525390625, -0.03453540802001953, -0.03243446350097656, -0.030333518981933594, -0.028232574462890625, -0.026131629943847656, -0.024030685424804688, -0.02192974090576172, -0.01982879638671875, -0.01772785186767578, -0.015626907348632812, -0.013525962829589844, -0.011425018310546875, -0.009324073791503906, -0.0072231292724609375, -0.005122184753417969, -0.003021240234375, -0.0009202957153320312, 0.0011806488037109375, 0.0032815933227539062, 0.005382537841796875, 0.007483482360839844, 0.009584426879882812, 0.011685371398925781, 0.01378631591796875, 0.01588726043701172, 0.017988204956054688, 0.020089149475097656, 0.022190093994140625, 0.024291038513183594, 0.026391983032226562, 0.02849292755126953, 0.0305938720703125, 0.03269481658935547, 0.03479576110839844, 0.036896705627441406, 0.038997650146484375, 0.041098594665527344, 0.04319953918457031, 0.04530048370361328, 0.04740142822265625, 0.04950237274169922, 0.05160331726074219, 0.053704261779785156, 0.055805206298828125, 0.057906150817871094, 0.06000709533691406, 0.06210803985595703, 0.064208984375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 2.0, 5.0, 4.0, 11.0, 11.0, 9.0, 16.0, 22.0, 33.0, 38.0, 60.0, 123.0, 168.0, 156.0, 114.0, 68.0, 45.0, 26.0, 23.0, 13.0, 18.0, 4.0, 8.0, 4.0, 3.0, 1.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13427734375, -0.1302051544189453, -0.12613296508789062, -0.12206077575683594, -0.11798858642578125, -0.11391639709472656, -0.10984420776367188, -0.10577201843261719, -0.1016998291015625, -0.09762763977050781, -0.09355545043945312, -0.08948326110839844, -0.08541107177734375, -0.08133888244628906, -0.07726669311523438, -0.07319450378417969, -0.069122314453125, -0.06505012512207031, -0.060977935791015625, -0.05690574645996094, -0.05283355712890625, -0.04876136779785156, -0.044689178466796875, -0.04061698913574219, -0.0365447998046875, -0.03247261047363281, -0.028400421142578125, -0.024328231811523438, -0.02025604248046875, -0.016183853149414062, -0.012111663818359375, -0.008039474487304688, -0.00396728515625, 0.0001049041748046875, 0.004177093505859375, 0.008249282836914062, 0.01232147216796875, 0.016393661499023438, 0.020465850830078125, 0.024538040161132812, 0.0286102294921875, 0.03268241882324219, 0.036754608154296875, 0.04082679748535156, 0.04489898681640625, 0.04897117614746094, 0.053043365478515625, 0.05711555480957031, 0.061187744140625, 0.06525993347167969, 0.06933212280273438, 0.07340431213378906, 0.07747650146484375, 0.08154869079589844, 0.08562088012695312, 0.08969306945800781, 0.0937652587890625, 0.09783744812011719, 0.10190963745117188, 0.10598182678222656, 0.11005401611328125, 0.11412620544433594, 0.11819839477539062, 0.12227058410644531, 0.1263427734375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 15.0, 32.0, 70.0, 232.0, 488.0, 104.0, 32.0, 10.0, 9.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5393590927124023, -3.2913997173309326, -3.043440341949463, -2.7954812049865723, -2.5475218296051025, -2.299562454223633, -2.051603317260742, -1.8036439418792725, -1.5556845664978027, -1.307725191116333, -1.0597659349441528, -0.8118066191673279, -0.5638473033905029, -0.3158879280090332, -0.06792867183685303, 0.18003058433532715, 0.4279899597167969, 0.6759492754936218, 0.9239085912704468, 1.171867847442627, 1.4198272228240967, 1.6677865982055664, 1.9157458543777466, 2.1637051105499268, 2.4116644859313965, 2.659623861312866, 2.907583236694336, 3.1555423736572266, 3.4035017490386963, 3.651461124420166, 3.8994202613830566, 4.1473798751831055, 4.395339012145996, 4.643298149108887, 4.8912577629089355, 5.139216899871826, 5.387176513671875, 5.635135650634766, 5.883094787597656, 6.131053924560547, 6.379013538360596, 6.626972675323486, 6.874932289123535, 7.122891426086426, 7.370850563049316, 7.618810176849365, 7.866769313812256, 8.114728927612305, 8.362688064575195, 8.610647201538086, 8.858606338500977, 9.106566429138184, 9.354525566101074, 9.602484703063965, 9.850443840026855, 10.098402976989746, 10.346363067626953, 10.594322204589844, 10.842281341552734, 11.090241432189941, 11.338200569152832, 11.586159706115723, 11.834118843078613, 12.082077980041504, 12.330037117004395]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 11.0, 9.0, 27.0, 22.0, 37.0, 33.0, 47.0, 88.0, 137.0, 181.0, 170.0, 65.0, 51.0, 24.0, 18.0, 15.0, 16.0, 10.0, 14.0, 12.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.862760543823242, -3.698683738708496, -3.53460693359375, -3.370530128479004, -3.206453323364258, -3.0423765182495117, -2.8782994747161865, -2.7142226696014404, -2.5501458644866943, -2.3860690593719482, -2.221992254257202, -2.057915449142456, -1.8938385248184204, -1.7297617197036743, -1.5656847953796387, -1.4016079902648926, -1.2375311851501465, -1.0734543800354004, -0.9093775153160095, -0.7453006505966187, -0.5812238454818726, -0.41714704036712646, -0.2530701756477356, -0.08899331092834473, 0.07508349418640137, 0.23916032910346985, 0.40323716402053833, 0.5673140287399292, 0.7313908338546753, 0.8954676389694214, 1.059544563293457, 1.2236213684082031, 1.3876981735229492, 1.5517749786376953, 1.7158517837524414, 1.879928708076477, 2.0440053939819336, 2.2080821990966797, 2.372159242630005, 2.536236047744751, 2.700312852859497, 2.864389657974243, 3.0284664630889893, 3.1925432682037354, 3.3566203117370605, 3.5206971168518066, 3.6847739219665527, 3.848850727081299, 4.012927532196045, 4.177004337310791, 4.341081142425537, 4.505157947540283, 4.669234752655029, 4.833311557769775, 4.9973883628845215, 5.161465644836426, 5.325542449951172, 5.489619255065918, 5.653696060180664, 5.81777286529541, 5.981849670410156, 6.145926475524902, 6.310003280639648, 6.4740800857543945, 6.638156890869141]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 12.0, 12.0, 9.0, 20.0, 26.0, 27.0, 42.0, 49.0, 55.0, 193.0, 260.0, 63.0, 48.0, 49.0, 43.0, 19.0, 18.0, 12.0, 18.0, 11.0, 5.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.422119140625, -0.4104042053222656, -0.39868927001953125, -0.3869743347167969, -0.3752593994140625, -0.3635444641113281, -0.35182952880859375, -0.3401145935058594, -0.328399658203125, -0.3166847229003906, -0.30496978759765625, -0.2932548522949219, -0.2815399169921875, -0.2698249816894531, -0.25811004638671875, -0.24639511108398438, -0.23468017578125, -0.22296524047851562, -0.21125030517578125, -0.19953536987304688, -0.1878204345703125, -0.17610549926757812, -0.16439056396484375, -0.15267562866210938, -0.140960693359375, -0.12924575805664062, -0.11753082275390625, -0.10581588745117188, -0.0941009521484375, -0.08238601684570312, -0.07067108154296875, -0.058956146240234375, -0.0472412109375, -0.035526275634765625, -0.02381134033203125, -0.012096405029296875, -0.0003814697265625, 0.011333465576171875, 0.02304840087890625, 0.034763336181640625, 0.046478271484375, 0.058193206787109375, 0.06990814208984375, 0.08162307739257812, 0.0933380126953125, 0.10505294799804688, 0.11676788330078125, 0.12848281860351562, 0.14019775390625, 0.15191268920898438, 0.16362762451171875, 0.17534255981445312, 0.1870574951171875, 0.19877243041992188, 0.21048736572265625, 0.22220230102539062, 0.233917236328125, 0.24563217163085938, 0.25734710693359375, 0.2690620422363281, 0.2807769775390625, 0.2924919128417969, 0.30420684814453125, 0.3159217834472656, 0.32763671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 6.0, 20.0, 22.0, 47.0, 50.0, 94.0, 205.0, 469.0, 1528.0, 7696.0, 8334815.0, 38486.0, 3495.0, 904.0, 330.0, 151.0, 89.0, 56.0, 32.0, 23.0, 18.0, 8.0, 1.0, 5.0, 2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.9818265438079834, -3.879146099090576, -3.77646541595459, -3.6737849712371826, -3.5711042881011963, -3.468423843383789, -3.3657431602478027, -3.2630627155303955, -3.1603822708129883, -3.057701826095581, -2.9550211429595947, -2.8523406982421875, -2.749660015106201, -2.646979570388794, -2.5442991256713867, -2.4416184425354004, -2.338937759399414, -2.236257314682007, -2.1335766315460205, -2.0308961868286133, -1.9282156229019165, -1.8255350589752197, -1.722854495048523, -1.6201739311218262, -1.517493486404419, -1.4148129224777222, -1.3121323585510254, -1.2094519138336182, -1.1067713499069214, -1.0040907859802246, -0.9014102220535278, -0.7987297177314758, -0.6960492134094238, -0.593368649482727, -0.49068814516067505, -0.38800758123397827, -0.2853270471096039, -0.1826465129852295, -0.07996594905853271, 0.022714555263519287, 0.12539511919021606, 0.22807565331459045, 0.33075618743896484, 0.4334367513656616, 0.5361173152923584, 0.6387978196144104, 0.7414783835411072, 0.8441588878631592, 0.946839451789856, 1.0495200157165527, 1.1522005796432495, 1.2548811435699463, 1.3575615882873535, 1.4602421522140503, 1.562922716140747, 1.6656031608581543, 1.7682838439941406, 1.8709644079208374, 1.9736449718475342, 2.0763254165649414, 2.1790060997009277, 2.281686544418335, 2.384366989135742, 2.4870476722717285, 2.5897281169891357]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 6.0, 3.0, 4.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 0.0, 3.0, 4.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 1.0, 1.0, 3.0, 8.0, 1.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.363250732421875, -4.21594762802124, -4.068645000457764, -3.921341896057129, -3.7740390300750732, -3.6267361640930176, -3.479433059692383, -3.332130193710327, -3.1848273277282715, -3.037524461746216, -2.89022159576416, -2.7429184913635254, -2.5956156253814697, -2.448312759399414, -2.3010096549987793, -2.1537067890167236, -2.006403923034668, -1.8591010570526123, -1.711798071861267, -1.5644950866699219, -1.4171922206878662, -1.2698893547058105, -1.1225863695144653, -0.9752833843231201, -0.8279805183410645, -0.680677592754364, -0.5333746671676636, -0.38607174158096313, -0.2387688159942627, -0.09146589040756226, 0.055837035179138184, 0.2031400203704834, 0.35044240951538086, 0.4977453351020813, 0.6450482606887817, 0.7923511862754822, 0.9396541118621826, 1.0869569778442383, 1.2342599630355835, 1.3815629482269287, 1.5288658142089844, 1.67616868019104, 1.8234716653823853, 1.9707746505737305, 2.118077516555786, 2.265380382537842, 2.4126834869384766, 2.5599863529205322, 2.707289218902588, 2.8545920848846436, 3.001894950866699, 3.149198055267334, 3.2965009212493896, 3.4438037872314453, 3.59110689163208, 3.7384097576141357, 3.8857126235961914, 4.033015727996826, 4.180318355560303, 4.3276214599609375, 4.474924087524414, 4.622227191925049, 4.769530296325684, 4.91683292388916, 5.064136028289795]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 7.0, 9.0, 6.0, 17.0, 18.0, 18.0, 33.0, 38.0, 74.0, 104.0, 136.0, 238.0, 417.0, 679.0, 1239.0, 2526.0, 5244.0, 11636.0, 25904.0, 58287.0, 122839.0, 148148.0, 80688.0, 35853.0, 15720.0, 7145.0, 3309.0, 1691.0, 896.0, 474.0, 289.0, 180.0, 108.0, 85.0, 46.0, 37.0, 38.0, 22.0, 23.0, 15.0, 14.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.353515625, -1.3087158203125, -1.263916015625, -1.2191162109375, -1.17431640625, -1.1295166015625, -1.084716796875, -1.0399169921875, -0.9951171875, -0.9503173828125, -0.905517578125, -0.8607177734375, -0.81591796875, -0.7711181640625, -0.726318359375, -0.6815185546875, -0.63671875, -0.5919189453125, -0.547119140625, -0.5023193359375, -0.45751953125, -0.4127197265625, -0.367919921875, -0.3231201171875, -0.2783203125, -0.2335205078125, -0.188720703125, -0.1439208984375, -0.09912109375, -0.0543212890625, -0.009521484375, 0.0352783203125, 0.080078125, 0.1248779296875, 0.169677734375, 0.2144775390625, 0.25927734375, 0.3040771484375, 0.348876953125, 0.3936767578125, 0.4384765625, 0.4832763671875, 0.528076171875, 0.5728759765625, 0.61767578125, 0.6624755859375, 0.707275390625, 0.7520751953125, 0.796875, 0.8416748046875, 0.886474609375, 0.9312744140625, 0.97607421875, 1.0208740234375, 1.065673828125, 1.1104736328125, 1.1552734375, 1.2000732421875, 1.244873046875, 1.2896728515625, 1.33447265625, 1.3792724609375, 1.424072265625, 1.4688720703125, 1.513671875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 6.0, 6.0, 9.0, 25.0, 27.0, 43.0, 65.0, 116.0, 99.0, 120.0, 144.0, 89.0, 78.0, 55.0, 34.0, 28.0, 26.0, 12.0, 8.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67041015625, -0.652801513671875, -0.63519287109375, -0.617584228515625, -0.5999755859375, -0.582366943359375, -0.56475830078125, -0.547149658203125, -0.529541015625, -0.511932373046875, -0.49432373046875, -0.476715087890625, -0.4591064453125, -0.441497802734375, -0.42388916015625, -0.406280517578125, -0.388671875, -0.371063232421875, -0.35345458984375, -0.335845947265625, -0.3182373046875, -0.300628662109375, -0.28302001953125, -0.265411376953125, -0.247802734375, -0.230194091796875, -0.21258544921875, -0.194976806640625, -0.1773681640625, -0.159759521484375, -0.14215087890625, -0.124542236328125, -0.10693359375, -0.089324951171875, -0.07171630859375, -0.054107666015625, -0.0364990234375, -0.018890380859375, -0.00128173828125, 0.016326904296875, 0.033935546875, 0.051544189453125, 0.06915283203125, 0.086761474609375, 0.1043701171875, 0.121978759765625, 0.13958740234375, 0.157196044921875, 0.1748046875, 0.192413330078125, 0.21002197265625, 0.227630615234375, 0.2452392578125, 0.262847900390625, 0.28045654296875, 0.298065185546875, 0.315673828125, 0.333282470703125, 0.35089111328125, 0.368499755859375, 0.3861083984375, 0.403717041015625, 0.42132568359375, 0.438934326171875, 0.45654296875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 8.0, 19.0, 25.0, 63.0, 84.0, 109.0, 62.0, 32.0, 29.0, 16.0, 16.0, 8.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.640334129333496, -4.501906394958496, -4.363478183746338, -4.225050449371338, -4.086622714996338, -3.948194742202759, -3.8097667694091797, -3.6713390350341797, -3.5329113006591797, -3.3944833278656006, -3.2560555934906006, -3.1176276206970215, -2.9791998863220215, -2.8407719135284424, -2.7023439407348633, -2.5639162063598633, -2.425488233566284, -2.287060260772705, -2.148632526397705, -2.010204553604126, -1.871776819229126, -1.7333488464355469, -1.5949209928512573, -1.4564931392669678, -1.3180652856826782, -1.1796374320983887, -1.0412095785140991, -0.9027816653251648, -0.7643538117408752, -0.6259259581565857, -0.48749804496765137, -0.3490701913833618, -0.21064233779907227, -0.07221446931362152, 0.06621339917182922, 0.20464128255844116, 0.3430691361427307, 0.48149698972702026, 0.6199249029159546, 0.7583527565002441, 0.8967806100845337, 1.0352084636688232, 1.1736363172531128, 1.3120641708374023, 1.4504921436309814, 1.5889198780059814, 1.7273478507995605, 1.86577570438385, 2.0042035579681396, 2.1426315307617188, 2.2810592651367188, 2.419487237930298, 2.557914972305298, 2.696342945098877, 2.834770679473877, 2.973198652267456, 3.111626625061035, 3.2500545978546143, 3.3884823322296143, 3.5269103050231934, 3.6653380393981934, 3.8037660121917725, 3.9421939849853516, 4.080621719360352, 4.219049453735352]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 5.0, 1.0, 7.0, 8.0, 19.0, 15.0, 28.0, 32.0, 32.0, 52.0, 45.0, 42.0, 51.0, 33.0, 23.0, 17.0, 17.0, 13.0, 11.0, 10.0, 5.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.310678005218506, -3.2163918018341064, -3.122105598449707, -3.0278191566467285, -2.933532953262329, -2.8392467498779297, -2.7449605464935303, -2.650674343109131, -2.5563879013061523, -2.462101697921753, -2.3678154945373535, -2.273529052734375, -2.1792428493499756, -2.084956645965576, -1.9906704425811768, -1.8963841199874878, -1.8020979166030884, -1.707811713218689, -1.613525390625, -1.5192391872406006, -1.4249528646469116, -1.3306666612625122, -1.2363803386688232, -1.1420941352844238, -1.0478079319000244, -0.9535216689109802, -0.859235405921936, -0.7649492025375366, -0.6706628799438477, -0.5763766765594482, -0.48209041357040405, -0.38780415058135986, -0.2935178279876709, -0.1992315649986267, -0.10494531691074371, -0.010659068822860718, 0.08362719416618347, 0.17791345715522766, 0.27219969034194946, 0.36648595333099365, 0.46077221632003784, 0.555058479309082, 0.6493447422981262, 0.7436310052871704, 0.8379172086715698, 0.9322035312652588, 1.0264897346496582, 1.1207759380340576, 1.2150622606277466, 1.309348464012146, 1.403634786605835, 1.4979209899902344, 1.5922073125839233, 1.6864935159683228, 1.7807798385620117, 1.8750660419464111, 1.9693522453308105, 2.06363844871521, 2.1579246520996094, 2.252211093902588, 2.3464972972869873, 2.4407835006713867, 2.535069704055786, 2.6293559074401855, 2.723642349243164]}, "eval/loss": 5.553798675537109, "eval/wer": 2.01330821102737, "eval/runtime": 947.3214, "eval/samples_per_second": 2.789, "eval/steps_per_second": 0.349, "train/train_runtime": 6324.9374, "train/train_samples_per_second": 4.512, "train/train_steps_per_second": 0.141, "train/total_flos": 0.0, "train/train_loss": 4.944881099221952} \ No newline at end of file