diff --git "a/wandb/run-20220303_033953-1eigbhyo/files/wandb-summary.json" "b/wandb/run-20220303_033953-1eigbhyo/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220303_033953-1eigbhyo/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.7246, "train/learning_rate": 0.000996, "train/epoch": 0.56, "train/global_step": 500, "_runtime": 3880, "_timestamp": 1646282673, "_step": 500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [4.0, 237.0, 759.0, 14.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-65.58610534667969, -35.810096740722656, -6.034088134765625, 23.741920471191406, 53.51792907714844, 83.29393005371094, 113.0699462890625, 142.84596252441406, 172.62196350097656, 202.39797973632812, 232.17398071289062, 261.9499816894531, 291.72601318359375, 321.50201416015625, 351.27801513671875, 381.05401611328125, 410.83001708984375, 440.60601806640625, 470.38201904296875, 500.1580505371094, 529.93408203125, 559.7100830078125, 589.486083984375, 619.2620849609375, 649.0380859375, 678.8140869140625, 708.590087890625, 738.3660888671875, 768.14208984375, 797.9180908203125, 827.6941528320312, 857.4701538085938, 887.2462158203125, 917.022216796875, 946.7982177734375, 976.57421875, 1006.3502197265625, 1036.126220703125, 1065.9022216796875, 1095.67822265625, 1125.454345703125, 1155.2303466796875, 1185.00634765625, 1214.7823486328125, 1244.558349609375, 1274.3343505859375, 1304.1103515625, 1333.886474609375, 1363.662353515625, 1393.4383544921875, 1423.21435546875, 1452.9903564453125, 1482.766357421875, 1512.5423583984375, 1542.318359375, 1572.094482421875, 1601.870361328125, 1631.6463623046875, 1661.42236328125, 1691.1983642578125, 1720.974365234375, 1750.7503662109375, 1780.5263671875, 1810.302490234375, 1840.0784912109375]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 5.0, 12.0, 16.0, 23.0, 21.0, 24.0, 28.0, 39.0, 36.0, 71.0, 71.0, 70.0, 70.0, 58.0, 74.0, 56.0, 53.0, 53.0, 29.0, 44.0, 30.0, 25.0, 24.0, 6.0, 11.0, 12.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-252.4993133544922, -243.7826385498047, -235.06597900390625, -226.34930419921875, -217.63262939453125, -208.91595458984375, -200.1992950439453, -191.4826202392578, -182.76596069335938, -174.04928588867188, -165.33262634277344, -156.61595153808594, -147.89927673339844, -139.1826171875, -130.4659423828125, -121.749267578125, -113.0325927734375, -104.31592559814453, -95.59925079345703, -86.88258361816406, -78.16590881347656, -69.4492416381836, -60.732574462890625, -52.01590347290039, -43.299232482910156, -34.58256149291992, -25.86589241027832, -17.14922332763672, -8.432552337646484, 0.28411865234375, 9.000785827636719, 17.717456817626953, 26.43414306640625, 35.150814056396484, 43.86748504638672, 52.58415222167969, 61.30082321166992, 70.01749420166016, 78.73416137695312, 87.45083618164062, 96.1675033569336, 104.88417053222656, 113.60084533691406, 122.31751251220703, 131.0341796875, 139.7508544921875, 148.467529296875, 157.18418884277344, 165.90086364746094, 174.61753845214844, 183.33419799804688, 192.05087280273438, 200.76754760742188, 209.48422241210938, 218.2008819580078, 226.9175567626953, 235.63421630859375, 244.35089111328125, 253.0675506591797, 261.78424072265625, 270.5008850097656, 279.2175598144531, 287.9342346191406, 296.6509094238281, 305.3675842285156]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 6.0, 4.0, 13.0, 25.0, 20.0, 26.0, 30.0, 35.0, 44.0, 64.0, 76.0, 69.0, 61.0, 65.0, 65.0, 70.0, 38.0, 52.0, 34.0, 53.0, 42.0, 20.0, 15.0, 14.0, 10.0, 12.0, 8.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.68359375, -3.55340576171875, -3.4232177734375, -3.29302978515625, -3.162841796875, -3.03265380859375, -2.9024658203125, -2.77227783203125, -2.64208984375, -2.51190185546875, -2.3817138671875, -2.25152587890625, -2.121337890625, -1.99114990234375, -1.8609619140625, -1.73077392578125, -1.6005859375, -1.47039794921875, -1.3402099609375, -1.21002197265625, -1.079833984375, -0.94964599609375, -0.8194580078125, -0.68927001953125, -0.55908203125, -0.42889404296875, -0.2987060546875, -0.16851806640625, -0.038330078125, 0.09185791015625, 0.2220458984375, 0.35223388671875, 0.482421875, 0.61260986328125, 0.7427978515625, 0.87298583984375, 1.003173828125, 1.13336181640625, 1.2635498046875, 1.39373779296875, 1.52392578125, 1.65411376953125, 1.7843017578125, 1.91448974609375, 2.044677734375, 2.17486572265625, 2.3050537109375, 2.43524169921875, 2.5654296875, 2.69561767578125, 2.8258056640625, 2.95599365234375, 3.086181640625, 3.21636962890625, 3.3465576171875, 3.47674560546875, 3.60693359375, 3.73712158203125, 3.8673095703125, 3.99749755859375, 4.127685546875, 4.25787353515625, 4.3880615234375, 4.51824951171875, 4.6484375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 7.0, 14.0, 16.0, 17.0, 36.0, 35.0, 43.0, 90.0, 106.0, 153.0, 232.0, 348.0, 522.0, 967.0, 1656.0, 3255.0, 8921.0, 53525.0, 4012053.0, 93158.0, 10593.0, 3822.0, 1825.0, 1045.0, 641.0, 379.0, 265.0, 150.0, 112.0, 80.0, 55.0, 38.0, 29.0, 22.0, 17.0, 12.0, 9.0, 9.0, 2.0, 8.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.03125, -26.9765625, -25.921875, -24.8671875, -23.8125, -22.7578125, -21.703125, -20.6484375, -19.59375, -18.5390625, -17.484375, -16.4296875, -15.375, -14.3203125, -13.265625, -12.2109375, -11.15625, -10.1015625, -9.046875, -7.9921875, -6.9375, -5.8828125, -4.828125, -3.7734375, -2.71875, -1.6640625, -0.609375, 0.4453125, 1.5, 2.5546875, 3.609375, 4.6640625, 5.71875, 6.7734375, 7.828125, 8.8828125, 9.9375, 10.9921875, 12.046875, 13.1015625, 14.15625, 15.2109375, 16.265625, 17.3203125, 18.375, 19.4296875, 20.484375, 21.5390625, 22.59375, 23.6484375, 24.703125, 25.7578125, 26.8125, 27.8671875, 28.921875, 29.9765625, 31.03125, 32.0859375, 33.140625, 34.1953125, 35.25, 36.3046875, 37.359375, 38.4140625, 39.46875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 5.0, 8.0, 13.0, 16.0, 17.0, 30.0, 57.0, 65.0, 126.0, 246.0, 411.0, 905.0, 974.0, 520.0, 258.0, 158.0, 93.0, 62.0, 44.0, 22.0, 19.0, 6.0, 9.0, 4.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.4375, -18.88330078125, -18.3291015625, -17.77490234375, -17.220703125, -16.66650390625, -16.1123046875, -15.55810546875, -15.00390625, -14.44970703125, -13.8955078125, -13.34130859375, -12.787109375, -12.23291015625, -11.6787109375, -11.12451171875, -10.5703125, -10.01611328125, -9.4619140625, -8.90771484375, -8.353515625, -7.79931640625, -7.2451171875, -6.69091796875, -6.13671875, -5.58251953125, -5.0283203125, -4.47412109375, -3.919921875, -3.36572265625, -2.8115234375, -2.25732421875, -1.703125, -1.14892578125, -0.5947265625, -0.04052734375, 0.513671875, 1.06787109375, 1.6220703125, 2.17626953125, 2.73046875, 3.28466796875, 3.8388671875, 4.39306640625, 4.947265625, 5.50146484375, 6.0556640625, 6.60986328125, 7.1640625, 7.71826171875, 8.2724609375, 8.82666015625, 9.380859375, 9.93505859375, 10.4892578125, 11.04345703125, 11.59765625, 12.15185546875, 12.7060546875, 13.26025390625, 13.814453125, 14.36865234375, 14.9228515625, 15.47705078125, 16.03125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 8.0, 16.0, 18.0, 32.0, 70.0, 103.0, 139.0, 277.0, 607.0, 2123.0, 69665.0, 4099668.0, 19058.0, 1436.0, 466.0, 251.0, 128.0, 78.0, 49.0, 23.0, 18.0, 12.0, 9.0, 7.0, 9.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.875, -49.08203125, -47.2890625, -45.49609375, -43.703125, -41.91015625, -40.1171875, -38.32421875, -36.53125, -34.73828125, -32.9453125, -31.15234375, -29.359375, -27.56640625, -25.7734375, -23.98046875, -22.1875, -20.39453125, -18.6015625, -16.80859375, -15.015625, -13.22265625, -11.4296875, -9.63671875, -7.84375, -6.05078125, -4.2578125, -2.46484375, -0.671875, 1.12109375, 2.9140625, 4.70703125, 6.5, 8.29296875, 10.0859375, 11.87890625, 13.671875, 15.46484375, 17.2578125, 19.05078125, 20.84375, 22.63671875, 24.4296875, 26.22265625, 28.015625, 29.80859375, 31.6015625, 33.39453125, 35.1875, 36.98046875, 38.7734375, 40.56640625, 42.359375, 44.15234375, 45.9453125, 47.73828125, 49.53125, 51.32421875, 53.1171875, 54.91015625, 56.703125, 58.49609375, 60.2890625, 62.08203125, 63.875]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 78.0, 747.0, 182.0, 8.0, 0.0, 0.0, 1.0], "bins": [-363.37139892578125, -357.1737365722656, -350.97607421875, -344.7784423828125, -338.5807800292969, -332.38311767578125, -326.18548583984375, -319.9878234863281, -313.7901611328125, -307.5924987792969, -301.39483642578125, -295.19720458984375, -288.9995422363281, -282.8018798828125, -276.604248046875, -270.4065856933594, -264.20892333984375, -258.0112609863281, -251.81361389160156, -245.615966796875, -239.41830444335938, -233.22064208984375, -227.0229949951172, -220.82534790039062, -214.627685546875, -208.43002319335938, -202.2323760986328, -196.03472900390625, -189.83706665039062, -183.639404296875, -177.44175720214844, -171.24411010742188, -165.04644775390625, -158.84878540039062, -152.65113830566406, -146.4534912109375, -140.25582885742188, -134.05816650390625, -127.86051940917969, -121.6628646850586, -115.4652099609375, -109.2675552368164, -103.06990051269531, -96.87224578857422, -90.67459106445312, -84.47693634033203, -78.27928161621094, -72.08162689208984, -65.88397216796875, -59.686317443847656, -53.48866271972656, -47.29100799560547, -41.093353271484375, -34.89569854736328, -28.698043823242188, -22.500389099121094, -16.302730560302734, -10.10507583618164, -3.907421112060547, 2.290233612060547, 8.48788833618164, 14.685543060302734, 20.883197784423828, 27.080852508544922, 33.278507232666016]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 2.0, 1.0, 9.0, 9.0, 12.0, 19.0, 11.0, 19.0, 19.0, 19.0, 17.0, 44.0, 30.0, 37.0, 29.0, 29.0, 39.0, 32.0, 30.0, 41.0, 41.0, 40.0, 37.0, 38.0, 47.0, 45.0, 25.0, 39.0, 33.0, 28.0, 31.0, 23.0, 15.0, 11.0, 20.0, 19.0, 5.0, 17.0, 8.0, 7.0, 3.0, 9.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.180938720703125, -34.971675872802734, -33.762413024902344, -32.55315017700195, -31.343887329101562, -30.134624481201172, -28.92536163330078, -27.71609878540039, -26.5068359375, -25.29757308959961, -24.08831024169922, -22.879047393798828, -21.669784545898438, -20.460521697998047, -19.251258850097656, -18.041996002197266, -16.832733154296875, -15.623470306396484, -14.414207458496094, -13.204944610595703, -11.995681762695312, -10.786418914794922, -9.577156066894531, -8.36789321899414, -7.15863037109375, -5.949367523193359, -4.740104675292969, -3.530841827392578, -2.3215789794921875, -1.1123161315917969, 0.09694671630859375, 1.3062095642089844, 2.515472412109375, 3.7247352600097656, 4.933998107910156, 6.143260955810547, 7.3525238037109375, 8.561786651611328, 9.771049499511719, 10.98031234741211, 12.1895751953125, 13.39883804321289, 14.608100891113281, 15.817363739013672, 17.026626586914062, 18.235889434814453, 19.445152282714844, 20.654415130615234, 21.863677978515625, 23.072940826416016, 24.282203674316406, 25.491466522216797, 26.700729370117188, 27.909992218017578, 29.11925506591797, 30.32851791381836, 31.53778076171875, 32.74704360961914, 33.95630645751953, 35.16556930541992, 36.37483215332031, 37.5840950012207, 38.793357849121094, 40.002620697021484, 41.211883544921875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 3.0, 5.0, 8.0, 12.0, 22.0, 22.0, 24.0, 27.0, 33.0, 47.0, 55.0, 62.0, 71.0, 62.0, 60.0, 59.0, 63.0, 50.0, 52.0, 41.0, 40.0, 43.0, 42.0, 17.0, 11.0, 13.0, 14.0, 7.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7421875, -3.615966796875, -3.48974609375, -3.363525390625, -3.2373046875, -3.111083984375, -2.98486328125, -2.858642578125, -2.732421875, -2.606201171875, -2.47998046875, -2.353759765625, -2.2275390625, -2.101318359375, -1.97509765625, -1.848876953125, -1.72265625, -1.596435546875, -1.47021484375, -1.343994140625, -1.2177734375, -1.091552734375, -0.96533203125, -0.839111328125, -0.712890625, -0.586669921875, -0.46044921875, -0.334228515625, -0.2080078125, -0.081787109375, 0.04443359375, 0.170654296875, 0.296875, 0.423095703125, 0.54931640625, 0.675537109375, 0.8017578125, 0.927978515625, 1.05419921875, 1.180419921875, 1.306640625, 1.432861328125, 1.55908203125, 1.685302734375, 1.8115234375, 1.937744140625, 2.06396484375, 2.190185546875, 2.31640625, 2.442626953125, 2.56884765625, 2.695068359375, 2.8212890625, 2.947509765625, 3.07373046875, 3.199951171875, 3.326171875, 3.452392578125, 3.57861328125, 3.704833984375, 3.8310546875, 3.957275390625, 4.08349609375, 4.209716796875, 4.3359375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 5.0, 10.0, 13.0, 20.0, 28.0, 39.0, 44.0, 64.0, 72.0, 108.0, 186.0, 255.0, 332.0, 499.0, 831.0, 1275.0, 1952.0, 3235.0, 5302.0, 9157.0, 16816.0, 30462.0, 60081.0, 134801.0, 374003.0, 227760.0, 86716.0, 42041.0, 22027.0, 12174.0, 7066.0, 4086.0, 2419.0, 1539.0, 1039.0, 639.0, 450.0, 334.0, 203.0, 129.0, 110.0, 73.0, 47.0, 31.0, 22.0, 23.0, 14.0, 9.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.189208984375, -0.18324851989746094, -0.17728805541992188, -0.1713275909423828, -0.16536712646484375, -0.1594066619873047, -0.15344619750976562, -0.14748573303222656, -0.1415252685546875, -0.13556480407714844, -0.12960433959960938, -0.12364387512207031, -0.11768341064453125, -0.11172294616699219, -0.10576248168945312, -0.09980201721191406, -0.093841552734375, -0.08788108825683594, -0.08192062377929688, -0.07596015930175781, -0.06999969482421875, -0.06403923034667969, -0.058078765869140625, -0.05211830139160156, -0.0461578369140625, -0.04019737243652344, -0.034236907958984375, -0.028276443481445312, -0.02231597900390625, -0.016355514526367188, -0.010395050048828125, -0.0044345855712890625, 0.00152587890625, 0.0074863433837890625, 0.013446807861328125, 0.019407272338867188, 0.02536773681640625, 0.03132820129394531, 0.037288665771484375, 0.04324913024902344, 0.0492095947265625, 0.05517005920410156, 0.061130523681640625, 0.06709098815917969, 0.07305145263671875, 0.07901191711425781, 0.08497238159179688, 0.09093284606933594, 0.096893310546875, 0.10285377502441406, 0.10881423950195312, 0.11477470397949219, 0.12073516845703125, 0.1266956329345703, 0.13265609741210938, 0.13861656188964844, 0.1445770263671875, 0.15053749084472656, 0.15649795532226562, 0.1624584197998047, 0.16841888427734375, 0.1743793487548828, 0.18033981323242188, 0.18630027770996094, 0.1922607421875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 7.0, 2.0, 12.0, 5.0, 13.0, 6.0, 12.0, 23.0, 19.0, 22.0, 23.0, 24.0, 36.0, 38.0, 26.0, 38.0, 32.0, 48.0, 49.0, 47.0, 1077.0, 32.0, 50.0, 31.0, 45.0, 33.0, 41.0, 36.0, 27.0, 31.0, 27.0, 24.0, 19.0, 11.0, 16.0, 11.0, 5.0, 15.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.463836669921875, -2.38470458984375, -2.305572509765625, -2.2264404296875, -2.147308349609375, -2.06817626953125, -1.989044189453125, -1.909912109375, -1.830780029296875, -1.75164794921875, -1.672515869140625, -1.5933837890625, -1.514251708984375, -1.43511962890625, -1.355987548828125, -1.27685546875, -1.197723388671875, -1.11859130859375, -1.039459228515625, -0.9603271484375, -0.881195068359375, -0.80206298828125, -0.722930908203125, -0.643798828125, -0.564666748046875, -0.48553466796875, -0.406402587890625, -0.3272705078125, -0.248138427734375, -0.16900634765625, -0.089874267578125, -0.0107421875, 0.068389892578125, 0.14752197265625, 0.226654052734375, 0.3057861328125, 0.384918212890625, 0.46405029296875, 0.543182373046875, 0.622314453125, 0.701446533203125, 0.78057861328125, 0.859710693359375, 0.9388427734375, 1.017974853515625, 1.09710693359375, 1.176239013671875, 1.25537109375, 1.334503173828125, 1.41363525390625, 1.492767333984375, 1.5718994140625, 1.651031494140625, 1.73016357421875, 1.809295654296875, 1.888427734375, 1.967559814453125, 2.04669189453125, 2.125823974609375, 2.2049560546875, 2.284088134765625, 2.36322021484375, 2.442352294921875, 2.521484375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 3.0, 13.0, 17.0, 21.0, 33.0, 53.0, 76.0, 139.0, 222.0, 367.0, 577.0, 957.0, 1549.0, 2567.0, 4386.0, 7353.0, 12684.0, 21799.0, 38586.0, 70465.0, 145112.0, 1387471.0, 201591.0, 89195.0, 47447.0, 26909.0, 15378.0, 8929.0, 5263.0, 3119.0, 1882.0, 1136.0, 691.0, 435.0, 284.0, 140.0, 113.0, 59.0, 43.0, 25.0, 15.0, 6.0, 11.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.094482421875, -0.09159088134765625, -0.0886993408203125, -0.08580780029296875, -0.082916259765625, -0.08002471923828125, -0.0771331787109375, -0.07424163818359375, -0.07135009765625, -0.06845855712890625, -0.0655670166015625, -0.06267547607421875, -0.059783935546875, -0.05689239501953125, -0.0540008544921875, -0.05110931396484375, -0.0482177734375, -0.04532623291015625, -0.0424346923828125, -0.03954315185546875, -0.036651611328125, -0.03376007080078125, -0.0308685302734375, -0.02797698974609375, -0.02508544921875, -0.02219390869140625, -0.0193023681640625, -0.01641082763671875, -0.013519287109375, -0.01062774658203125, -0.0077362060546875, -0.00484466552734375, -0.001953125, 0.00093841552734375, 0.0038299560546875, 0.00672149658203125, 0.009613037109375, 0.01250457763671875, 0.0153961181640625, 0.01828765869140625, 0.02117919921875, 0.02407073974609375, 0.0269622802734375, 0.02985382080078125, 0.032745361328125, 0.03563690185546875, 0.0385284423828125, 0.04141998291015625, 0.0443115234375, 0.04720306396484375, 0.0500946044921875, 0.05298614501953125, 0.055877685546875, 0.05876922607421875, 0.0616607666015625, 0.06455230712890625, 0.06744384765625, 0.07033538818359375, 0.0732269287109375, 0.07611846923828125, 0.079010009765625, 0.08190155029296875, 0.0847930908203125, 0.08768463134765625, 0.090576171875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 9.0, 6.0, 9.0, 7.0, 9.0, 16.0, 25.0, 13.0, 13.0, 21.0, 15.0, 25.0, 54.0, 39.0, 39.0, 28.0, 43.0, 48.0, 50.0, 42.0, 46.0, 41.0, 52.0, 47.0, 33.0, 33.0, 36.0, 28.0, 18.0, 14.0, 22.0, 14.0, 15.0, 18.0, 12.0, 11.0, 10.0, 16.0, 6.0, 9.0, 3.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.355741500854492e-05, -3.243889659643173e-05, -3.132037818431854e-05, -3.0201859772205353e-05, -2.9083341360092163e-05, -2.7964822947978973e-05, -2.6846304535865784e-05, -2.5727786123752594e-05, -2.4609267711639404e-05, -2.3490749299526215e-05, -2.2372230887413025e-05, -2.1253712475299835e-05, -2.0135194063186646e-05, -1.9016675651073456e-05, -1.7898157238960266e-05, -1.6779638826847076e-05, -1.5661120414733887e-05, -1.4542602002620697e-05, -1.3424083590507507e-05, -1.2305565178394318e-05, -1.1187046766281128e-05, -1.0068528354167938e-05, -8.950009942054749e-06, -7.831491529941559e-06, -6.712973117828369e-06, -5.5944547057151794e-06, -4.47593629360199e-06, -3.3574178814888e-06, -2.2388994693756104e-06, -1.1203810572624207e-06, -1.862645149230957e-09, 1.1166557669639587e-06, 2.2351741790771484e-06, 3.353692591190338e-06, 4.472211003303528e-06, 5.5907294154167175e-06, 6.709247827529907e-06, 7.827766239643097e-06, 8.946284651756287e-06, 1.0064803063869476e-05, 1.1183321475982666e-05, 1.2301839888095856e-05, 1.3420358300209045e-05, 1.4538876712322235e-05, 1.5657395124435425e-05, 1.6775913536548615e-05, 1.7894431948661804e-05, 1.9012950360774994e-05, 2.0131468772888184e-05, 2.1249987185001373e-05, 2.2368505597114563e-05, 2.3487024009227753e-05, 2.4605542421340942e-05, 2.5724060833454132e-05, 2.6842579245567322e-05, 2.796109765768051e-05, 2.90796160697937e-05, 3.019813448190689e-05, 3.131665289402008e-05, 3.243517130613327e-05, 3.355368971824646e-05, 3.467220813035965e-05, 3.579072654247284e-05, 3.690924495458603e-05, 3.802776336669922e-05]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 8.0, 15.0, 11.0, 15.0, 15.0, 25.0, 30.0, 38.0, 30.0, 41.0, 58.0, 54.0, 89.0, 98.0, 148.0, 175.0, 168.0, 263.0, 319.0, 1035.0, 1036230.0, 7877.0, 415.0, 259.0, 217.0, 155.0, 145.0, 106.0, 92.0, 70.0, 66.0, 66.0, 45.0, 26.0, 19.0, 40.0, 26.0, 13.0, 10.0, 16.0, 10.0, 2.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.0007548332214355469, -0.0007317513227462769, -0.0007086694240570068, -0.0006855875253677368, -0.0006625056266784668, -0.0006394237279891968, -0.0006163418292999268, -0.0005932599306106567, -0.0005701780319213867, -0.0005470961332321167, -0.0005240142345428467, -0.0005009323358535767, -0.00047785043716430664, -0.0004547685384750366, -0.0004316866397857666, -0.0004086047410964966, -0.00038552284240722656, -0.00036244094371795654, -0.0003393590450286865, -0.0003162771463394165, -0.0002931952476501465, -0.00027011334896087646, -0.00024703145027160645, -0.00022394955158233643, -0.0002008676528930664, -0.0001777857542037964, -0.00015470385551452637, -0.00013162195682525635, -0.00010854005813598633, -8.545815944671631e-05, -6.237626075744629e-05, -3.929436206817627e-05, -1.621246337890625e-05, 6.8694353103637695e-06, 2.995133399963379e-05, 5.303323268890381e-05, 7.611513137817383e-05, 9.919703006744385e-05, 0.00012227892875671387, 0.0001453608274459839, 0.0001684427261352539, 0.00019152462482452393, 0.00021460652351379395, 0.00023768842220306396, 0.000260770320892334, 0.000283852219581604, 0.000306934118270874, 0.00033001601696014404, 0.00035309791564941406, 0.0003761798143386841, 0.0003992617130279541, 0.0004223436117172241, 0.00044542551040649414, 0.00046850740909576416, 0.0004915893077850342, 0.0005146712064743042, 0.0005377531051635742, 0.0005608350038528442, 0.0005839169025421143, 0.0006069988012313843, 0.0006300806999206543, 0.0006531625986099243, 0.0006762444972991943, 0.0006993263959884644, 0.0007224082946777344]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 964.0, 54.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003014194662682712, -0.00029057663050480187, -0.000279733823845163, -0.00026889098808169365, -0.00025804818142205477, -0.00024720534565858543, -0.00023636252444703132, -0.0002255197032354772, -0.0002146768820239231, -0.000203834060812369, -0.00019299123960081488, -0.00018214841838926077, -0.00017130558262579143, -0.00016046277596615255, -0.0001496199402026832, -0.0001387771189911291, -0.000127934297779575, -0.00011709147656802088, -0.00010624865535646677, -9.540582686895505e-05, -8.456300565740094e-05, -7.372018444584683e-05, -6.28773559583351e-05, -5.203453474678099e-05, -4.119171353522688e-05, -3.0348890504683368e-05, -1.9506067474139854e-05, -8.663242624606937e-06, 2.179578586947173e-06, 1.3022399798501283e-05, 2.3865228286013007e-05, 3.470804949756712e-05, 4.555084160529077e-05, 5.639366281684488e-05, 6.723648402839899e-05, 7.807931251591071e-05, 8.892213372746482e-05, 9.976495493901893e-05, 0.00011060778342653066, 0.00012145060463808477, 0.00013229342584963888, 0.000143136247061193, 0.0001539790682727471, 0.0001648218894843012, 0.00017566472524777055, 0.00018650753190740943, 0.00019735036767087877, 0.00020819318888243288, 0.000219036010093987, 0.0002298788313055411, 0.0002407216525170952, 0.00025156448828056455, 0.00026240729494020343, 0.00027325013070367277, 0.0002840929664671421, 0.000294935773126781, 0.00030577857978641987, 0.0003166214155498892, 0.0003274642222095281, 0.0003383070579729974, 0.0003491498646326363, 0.00035999270039610565, 0.000370835536159575, 0.00038167834281921387, 0.0003925211785826832]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 12.0, 10.0, 9.0, 9.0, 15.0, 17.0, 29.0, 14.0, 29.0, 25.0, 26.0, 21.0, 28.0, 47.0, 32.0, 41.0, 40.0, 42.0, 52.0, 44.0, 33.0, 46.0, 30.0, 35.0, 42.0, 32.0, 31.0, 47.0, 20.0, 17.0, 16.0, 14.0, 16.0, 15.0, 10.0, 8.0, 6.0, 14.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4139881134033203e-05, -2.342555671930313e-05, -2.271123230457306e-05, -2.1996907889842987e-05, -2.1282583475112915e-05, -2.0568259060382843e-05, -1.985393464565277e-05, -1.91396102309227e-05, -1.8425285816192627e-05, -1.7710961401462555e-05, -1.6996636986732483e-05, -1.628231257200241e-05, -1.556798815727234e-05, -1.4853663742542267e-05, -1.4139339327812195e-05, -1.3425014913082123e-05, -1.271069049835205e-05, -1.1996366083621979e-05, -1.1282041668891907e-05, -1.0567717254161835e-05, -9.853392839431763e-06, -9.13906842470169e-06, -8.424744009971619e-06, -7.710419595241547e-06, -6.996095180511475e-06, -6.281770765781403e-06, -5.5674463510513306e-06, -4.8531219363212585e-06, -4.1387975215911865e-06, -3.4244731068611145e-06, -2.7101486921310425e-06, -1.9958242774009705e-06, -1.2814998626708984e-06, -5.671754479408264e-07, 1.471489667892456e-07, 8.614733815193176e-07, 1.5757977962493896e-06, 2.2901222109794617e-06, 3.0044466257095337e-06, 3.7187710404396057e-06, 4.433095455169678e-06, 5.14741986989975e-06, 5.861744284629822e-06, 6.576068699359894e-06, 7.290393114089966e-06, 8.004717528820038e-06, 8.71904194355011e-06, 9.433366358280182e-06, 1.0147690773010254e-05, 1.0862015187740326e-05, 1.1576339602470398e-05, 1.229066401720047e-05, 1.3004988431930542e-05, 1.3719312846660614e-05, 1.4433637261390686e-05, 1.5147961676120758e-05, 1.586228609085083e-05, 1.6576610505580902e-05, 1.7290934920310974e-05, 1.8005259335041046e-05, 1.8719583749771118e-05, 1.943390816450119e-05, 2.0148232579231262e-05, 2.0862556993961334e-05, 2.1576881408691406e-05]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 3.0, 5.0, 8.0, 12.0, 22.0, 22.0, 24.0, 27.0, 33.0, 47.0, 55.0, 62.0, 71.0, 62.0, 60.0, 59.0, 63.0, 50.0, 52.0, 41.0, 40.0, 43.0, 42.0, 17.0, 11.0, 13.0, 14.0, 7.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7421875, -3.615966796875, -3.48974609375, -3.363525390625, -3.2373046875, -3.111083984375, -2.98486328125, -2.858642578125, -2.732421875, -2.606201171875, -2.47998046875, -2.353759765625, -2.2275390625, -2.101318359375, -1.97509765625, -1.848876953125, -1.72265625, -1.596435546875, -1.47021484375, -1.343994140625, -1.2177734375, -1.091552734375, -0.96533203125, -0.839111328125, -0.712890625, -0.586669921875, -0.46044921875, -0.334228515625, -0.2080078125, -0.081787109375, 0.04443359375, 0.170654296875, 0.296875, 0.423095703125, 0.54931640625, 0.675537109375, 0.8017578125, 0.927978515625, 1.05419921875, 1.180419921875, 1.306640625, 1.432861328125, 1.55908203125, 1.685302734375, 1.8115234375, 1.937744140625, 2.06396484375, 2.190185546875, 2.31640625, 2.442626953125, 2.56884765625, 2.695068359375, 2.8212890625, 2.947509765625, 3.07373046875, 3.199951171875, 3.326171875, 3.452392578125, 3.57861328125, 3.704833984375, 3.8310546875, 3.957275390625, 4.08349609375, 4.209716796875, 4.3359375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 8.0, 9.0, 9.0, 16.0, 21.0, 31.0, 34.0, 53.0, 67.0, 89.0, 101.0, 159.0, 234.0, 310.0, 488.0, 752.0, 1322.0, 2216.0, 3753.0, 8146.0, 25050.0, 240498.0, 705189.0, 38173.0, 10542.0, 4543.0, 2540.0, 1499.0, 880.0, 552.0, 322.0, 252.0, 196.0, 119.0, 95.0, 75.0, 47.0, 42.0, 32.0, 17.0, 12.0, 15.0, 11.0, 8.0, 3.0, 7.0, 3.0, 6.0, 2.0, 1.0, 1.0, 4.0], "bins": [-30.46875, -29.576171875, -28.68359375, -27.791015625, -26.8984375, -26.005859375, -25.11328125, -24.220703125, -23.328125, -22.435546875, -21.54296875, -20.650390625, -19.7578125, -18.865234375, -17.97265625, -17.080078125, -16.1875, -15.294921875, -14.40234375, -13.509765625, -12.6171875, -11.724609375, -10.83203125, -9.939453125, -9.046875, -8.154296875, -7.26171875, -6.369140625, -5.4765625, -4.583984375, -3.69140625, -2.798828125, -1.90625, -1.013671875, -0.12109375, 0.771484375, 1.6640625, 2.556640625, 3.44921875, 4.341796875, 5.234375, 6.126953125, 7.01953125, 7.912109375, 8.8046875, 9.697265625, 10.58984375, 11.482421875, 12.375, 13.267578125, 14.16015625, 15.052734375, 15.9453125, 16.837890625, 17.73046875, 18.623046875, 19.515625, 20.408203125, 21.30078125, 22.193359375, 23.0859375, 23.978515625, 24.87109375, 25.763671875, 26.65625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 10.0, 8.0, 10.0, 8.0, 16.0, 10.0, 12.0, 33.0, 18.0, 21.0, 27.0, 42.0, 34.0, 43.0, 51.0, 46.0, 74.0, 131.0, 1632.0, 233.0, 85.0, 56.0, 53.0, 63.0, 37.0, 49.0, 38.0, 31.0, 28.0, 34.0, 18.0, 19.0, 15.0, 15.0, 9.0, 10.0, 9.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.65625, -9.331298828125, -9.00634765625, -8.681396484375, -8.3564453125, -8.031494140625, -7.70654296875, -7.381591796875, -7.056640625, -6.731689453125, -6.40673828125, -6.081787109375, -5.7568359375, -5.431884765625, -5.10693359375, -4.781982421875, -4.45703125, -4.132080078125, -3.80712890625, -3.482177734375, -3.1572265625, -2.832275390625, -2.50732421875, -2.182373046875, -1.857421875, -1.532470703125, -1.20751953125, -0.882568359375, -0.5576171875, -0.232666015625, 0.09228515625, 0.417236328125, 0.7421875, 1.067138671875, 1.39208984375, 1.717041015625, 2.0419921875, 2.366943359375, 2.69189453125, 3.016845703125, 3.341796875, 3.666748046875, 3.99169921875, 4.316650390625, 4.6416015625, 4.966552734375, 5.29150390625, 5.616455078125, 5.94140625, 6.266357421875, 6.59130859375, 6.916259765625, 7.2412109375, 7.566162109375, 7.89111328125, 8.216064453125, 8.541015625, 8.865966796875, 9.19091796875, 9.515869140625, 9.8408203125, 10.165771484375, 10.49072265625, 10.815673828125, 11.140625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 8.0, 6.0, 12.0, 18.0, 12.0, 21.0, 16.0, 20.0, 31.0, 35.0, 40.0, 77.0, 78.0, 111.0, 271.0, 743.0, 7270.0, 3013481.0, 120248.0, 2208.0, 397.0, 185.0, 98.0, 68.0, 48.0, 36.0, 33.0, 12.0, 20.0, 22.0, 9.0, 8.0, 15.0, 12.0, 8.0, 6.0, 6.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.78125, -48.30810546875, -46.8349609375, -45.36181640625, -43.888671875, -42.41552734375, -40.9423828125, -39.46923828125, -37.99609375, -36.52294921875, -35.0498046875, -33.57666015625, -32.103515625, -30.63037109375, -29.1572265625, -27.68408203125, -26.2109375, -24.73779296875, -23.2646484375, -21.79150390625, -20.318359375, -18.84521484375, -17.3720703125, -15.89892578125, -14.42578125, -12.95263671875, -11.4794921875, -10.00634765625, -8.533203125, -7.06005859375, -5.5869140625, -4.11376953125, -2.640625, -1.16748046875, 0.3056640625, 1.77880859375, 3.251953125, 4.72509765625, 6.1982421875, 7.67138671875, 9.14453125, 10.61767578125, 12.0908203125, 13.56396484375, 15.037109375, 16.51025390625, 17.9833984375, 19.45654296875, 20.9296875, 22.40283203125, 23.8759765625, 25.34912109375, 26.822265625, 28.29541015625, 29.7685546875, 31.24169921875, 32.71484375, 34.18798828125, 35.6611328125, 37.13427734375, 38.607421875, 40.08056640625, 41.5537109375, 43.02685546875, 44.5]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 81.0, 607.0, 287.0, 32.0, 6.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-183.40023803710938, -179.775146484375, -176.1500701904297, -172.5249786376953, -168.89988708496094, -165.27479553222656, -161.64971923828125, -158.02462768554688, -154.3995361328125, -150.77444458007812, -147.1493682861328, -143.52427673339844, -139.89918518066406, -136.2740936279297, -132.64901733398438, -129.02392578125, -125.39884185791016, -121.77375793457031, -118.14866638183594, -114.5235824584961, -110.89849090576172, -107.27340698242188, -103.6483154296875, -100.02323150634766, -96.39814758300781, -92.77306365966797, -89.1479721069336, -85.52288818359375, -81.89779663085938, -78.27271270751953, -74.64762878417969, -71.02253723144531, -67.3974380493164, -63.7723503112793, -60.14726257324219, -56.522178649902344, -52.89708709716797, -49.272003173828125, -45.646915435791016, -42.021827697753906, -38.3967399597168, -34.77165222167969, -31.146564483642578, -27.5214786529541, -23.896390914916992, -20.271303176879883, -16.646217346191406, -13.021129608154297, -9.396041870117188, -5.770954608917236, -2.145867347717285, 1.4792194366455078, 5.104307174682617, 8.729394912719727, 12.354480743408203, 15.979568481445312, 19.604656219482422, 23.22974395751953, 26.85483169555664, 30.479917526245117, 34.105003356933594, 37.73009490966797, 41.35517883300781, 44.98026657104492, 48.60535430908203]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 2.0, 10.0, 13.0, 13.0, 12.0, 21.0, 21.0, 21.0, 20.0, 27.0, 24.0, 33.0, 41.0, 45.0, 41.0, 44.0, 41.0, 33.0, 31.0, 38.0, 39.0, 40.0, 39.0, 44.0, 32.0, 37.0, 21.0, 28.0, 29.0, 26.0, 25.0, 19.0, 17.0, 17.0, 9.0, 7.0, 5.0, 14.0, 2.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0], "bins": [-46.847984313964844, -45.650413513183594, -44.452842712402344, -43.25527572631836, -42.05770492553711, -40.86013412475586, -39.66256332397461, -38.464996337890625, -37.267425537109375, -36.069854736328125, -34.872283935546875, -33.67471694946289, -32.47714614868164, -31.27957534790039, -30.08200454711914, -28.884435653686523, -27.686864852905273, -26.489294052124023, -25.291725158691406, -24.094154357910156, -22.89658546447754, -21.69901466369629, -20.501445770263672, -19.303874969482422, -18.106304168701172, -16.908733367919922, -15.711164474487305, -14.513593673706055, -13.316024780273438, -12.118453979492188, -10.920884132385254, -9.72331428527832, -8.525745391845703, -7.3281755447387695, -6.130605697631836, -4.933035373687744, -3.7354655265808105, -2.537895679473877, -1.3403253555297852, -0.14275550842285156, 1.054814338684082, 2.2523841857910156, 3.4499542713165283, 4.647524356842041, 5.845094203948975, 7.042664051055908, 8.240234375, 9.437804222106934, 10.635374069213867, 11.8329439163208, 13.030513763427734, 14.228084564208984, 15.425653457641602, 16.62322425842285, 17.82079315185547, 19.01836395263672, 20.21593475341797, 21.41350555419922, 22.611074447631836, 23.808645248413086, 25.006214141845703, 26.203784942626953, 27.401355743408203, 28.59892463684082, 29.796493530273438]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 1.0, 4.0, 10.0, 12.0, 18.0, 16.0, 32.0, 20.0, 42.0, 26.0, 60.0, 55.0, 69.0, 67.0, 61.0, 54.0, 59.0, 56.0, 61.0, 42.0, 38.0, 41.0, 44.0, 28.0, 15.0, 14.0, 9.0, 7.0, 9.0, 6.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.765625, -3.63592529296875, -3.5062255859375, -3.37652587890625, -3.246826171875, -3.11712646484375, -2.9874267578125, -2.85772705078125, -2.72802734375, -2.59832763671875, -2.4686279296875, -2.33892822265625, -2.209228515625, -2.07952880859375, -1.9498291015625, -1.82012939453125, -1.6904296875, -1.56072998046875, -1.4310302734375, -1.30133056640625, -1.171630859375, -1.04193115234375, -0.9122314453125, -0.78253173828125, -0.65283203125, -0.52313232421875, -0.3934326171875, -0.26373291015625, -0.134033203125, -0.00433349609375, 0.1253662109375, 0.25506591796875, 0.384765625, 0.51446533203125, 0.6441650390625, 0.77386474609375, 0.903564453125, 1.03326416015625, 1.1629638671875, 1.29266357421875, 1.42236328125, 1.55206298828125, 1.6817626953125, 1.81146240234375, 1.941162109375, 2.07086181640625, 2.2005615234375, 2.33026123046875, 2.4599609375, 2.58966064453125, 2.7193603515625, 2.84906005859375, 2.978759765625, 3.10845947265625, 3.2381591796875, 3.36785888671875, 3.49755859375, 3.62725830078125, 3.7569580078125, 3.88665771484375, 4.016357421875, 4.14605712890625, 4.2757568359375, 4.40545654296875, 4.53515625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 4.0, 1.0, 5.0, 3.0, 4.0, 8.0, 5.0, 21.0, 26.0, 43.0, 51.0, 85.0, 108.0, 178.0, 353.0, 657.0, 1463.0, 4000.0, 29359.0, 3998291.0, 148669.0, 7003.0, 2000.0, 876.0, 420.0, 244.0, 134.0, 87.0, 57.0, 28.0, 18.0, 22.0, 18.0, 9.0, 6.0, 3.0, 7.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.21875, -37.8515625, -36.484375, -35.1171875, -33.75, -32.3828125, -31.015625, -29.6484375, -28.28125, -26.9140625, -25.546875, -24.1796875, -22.8125, -21.4453125, -20.078125, -18.7109375, -17.34375, -15.9765625, -14.609375, -13.2421875, -11.875, -10.5078125, -9.140625, -7.7734375, -6.40625, -5.0390625, -3.671875, -2.3046875, -0.9375, 0.4296875, 1.796875, 3.1640625, 4.53125, 5.8984375, 7.265625, 8.6328125, 10.0, 11.3671875, 12.734375, 14.1015625, 15.46875, 16.8359375, 18.203125, 19.5703125, 20.9375, 22.3046875, 23.671875, 25.0390625, 26.40625, 27.7734375, 29.140625, 30.5078125, 31.875, 33.2421875, 34.609375, 35.9765625, 37.34375, 38.7109375, 40.078125, 41.4453125, 42.8125, 44.1796875, 45.546875, 46.9140625, 48.28125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 9.0, 13.0, 14.0, 23.0, 27.0, 54.0, 67.0, 133.0, 150.0, 251.0, 440.0, 702.0, 834.0, 495.0, 285.0, 201.0, 114.0, 87.0, 60.0, 33.0, 33.0, 16.0, 10.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.96875, -10.51318359375, -10.0576171875, -9.60205078125, -9.146484375, -8.69091796875, -8.2353515625, -7.77978515625, -7.32421875, -6.86865234375, -6.4130859375, -5.95751953125, -5.501953125, -5.04638671875, -4.5908203125, -4.13525390625, -3.6796875, -3.22412109375, -2.7685546875, -2.31298828125, -1.857421875, -1.40185546875, -0.9462890625, -0.49072265625, -0.03515625, 0.42041015625, 0.8759765625, 1.33154296875, 1.787109375, 2.24267578125, 2.6982421875, 3.15380859375, 3.609375, 4.06494140625, 4.5205078125, 4.97607421875, 5.431640625, 5.88720703125, 6.3427734375, 6.79833984375, 7.25390625, 7.70947265625, 8.1650390625, 8.62060546875, 9.076171875, 9.53173828125, 9.9873046875, 10.44287109375, 10.8984375, 11.35400390625, 11.8095703125, 12.26513671875, 12.720703125, 13.17626953125, 13.6318359375, 14.08740234375, 14.54296875, 14.99853515625, 15.4541015625, 15.90966796875, 16.365234375, 16.82080078125, 17.2763671875, 17.73193359375, 18.1875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 2.0, 11.0, 17.0, 49.0, 43.0, 91.0, 153.0, 270.0, 478.0, 1108.0, 2627.0, 8487.0, 34944.0, 285525.0, 3389806.0, 410570.0, 44501.0, 9911.0, 3166.0, 1303.0, 511.0, 305.0, 144.0, 103.0, 66.0, 31.0, 15.0, 18.0, 8.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.953125, -21.094482421875, -20.23583984375, -19.377197265625, -18.5185546875, -17.659912109375, -16.80126953125, -15.942626953125, -15.083984375, -14.225341796875, -13.36669921875, -12.508056640625, -11.6494140625, -10.790771484375, -9.93212890625, -9.073486328125, -8.21484375, -7.356201171875, -6.49755859375, -5.638916015625, -4.7802734375, -3.921630859375, -3.06298828125, -2.204345703125, -1.345703125, -0.487060546875, 0.37158203125, 1.230224609375, 2.0888671875, 2.947509765625, 3.80615234375, 4.664794921875, 5.5234375, 6.382080078125, 7.24072265625, 8.099365234375, 8.9580078125, 9.816650390625, 10.67529296875, 11.533935546875, 12.392578125, 13.251220703125, 14.10986328125, 14.968505859375, 15.8271484375, 16.685791015625, 17.54443359375, 18.403076171875, 19.26171875, 20.120361328125, 20.97900390625, 21.837646484375, 22.6962890625, 23.554931640625, 24.41357421875, 25.272216796875, 26.130859375, 26.989501953125, 27.84814453125, 28.706787109375, 29.5654296875, 30.424072265625, 31.28271484375, 32.141357421875, 33.0]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 11.0, 42.0, 166.0, 319.0, 329.0, 115.0, 20.0, 11.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.693973541259766, -32.02808380126953, -27.362192153930664, -22.696300506591797, -18.030410766601562, -13.364521026611328, -8.698629379272461, -4.032737731933594, 0.6331520080566406, 5.299042701721191, 9.964933395385742, 14.630824089050293, 19.296714782714844, 23.962604522705078, 28.628496170043945, 33.29438781738281, 37.96027755737305, 42.62616729736328, 47.29206085205078, 51.957950592041016, 56.62384033203125, 61.289730072021484, 65.95561981201172, 70.62151336669922, 75.28739929199219, 79.95329284667969, 84.61917877197266, 89.28507232666016, 93.95095825195312, 98.61685180664062, 103.28274536132812, 107.94863891601562, 112.61453247070312, 117.28042602539062, 121.9463119506836, 126.6122055053711, 131.27809143066406, 135.94398498535156, 140.60987854003906, 145.27577209472656, 149.941650390625, 154.6075439453125, 159.2734375, 163.93931579589844, 168.60520935058594, 173.27110290527344, 177.93699645996094, 182.60289001464844, 187.26878356933594, 191.93467712402344, 196.60057067871094, 201.26644897460938, 205.93234252929688, 210.59823608398438, 215.26412963867188, 219.93002319335938, 224.59591674804688, 229.26181030273438, 233.92770385742188, 238.5935821533203, 243.2594757080078, 247.9253692626953, 252.5912628173828, 257.25714111328125, 261.92303466796875]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 11.0, 5.0, 7.0, 24.0, 25.0, 20.0, 16.0, 36.0, 33.0, 30.0, 32.0, 32.0, 38.0, 48.0, 47.0, 39.0, 48.0, 37.0, 39.0, 39.0, 39.0, 45.0, 47.0, 36.0, 35.0, 35.0, 32.0, 26.0, 14.0, 20.0, 14.0, 10.0, 8.0, 9.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.860904693603516, -38.67665481567383, -37.492401123046875, -36.30815124511719, -35.1239013671875, -33.93965148925781, -32.75539779663086, -31.571147918701172, -30.38689613342285, -29.20264434814453, -28.018394470214844, -26.834142684936523, -25.649890899658203, -24.465641021728516, -23.281389236450195, -22.097137451171875, -20.912887573242188, -19.728635787963867, -18.54438591003418, -17.36013412475586, -16.175884246826172, -14.991632461547852, -13.807380676269531, -12.623129844665527, -11.438879013061523, -10.25462818145752, -9.070377349853516, -7.886125564575195, -6.701874732971191, -5.5176239013671875, -4.333372592926025, -3.1491212844848633, -1.9648666381835938, -0.7806155681610107, 0.40363550186157227, 1.5878865718841553, 2.7721376419067383, 3.956388473510742, 5.140639781951904, 6.324891090393066, 7.50914192199707, 8.693392753601074, 9.877643585205078, 11.061895370483398, 12.246146202087402, 13.430397033691406, 14.614648818969727, 15.79889965057373, 16.983150482177734, 18.167402267456055, 19.351652145385742, 20.535903930664062, 21.72015380859375, 22.90440559387207, 24.08865737915039, 25.272907257080078, 26.4571590423584, 27.64141082763672, 28.825660705566406, 30.009912490844727, 31.194164276123047, 32.378414154052734, 33.56266403198242, 34.746917724609375, 35.93116760253906]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 2.0, 3.0, 3.0, 4.0, 15.0, 19.0, 22.0, 22.0, 31.0, 37.0, 40.0, 40.0, 42.0, 54.0, 54.0, 51.0, 63.0, 59.0, 57.0, 48.0, 52.0, 59.0, 37.0, 35.0, 26.0, 29.0, 12.0, 19.0, 15.0, 10.0, 10.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.814453125, -3.690277099609375, -3.56610107421875, -3.441925048828125, -3.3177490234375, -3.193572998046875, -3.06939697265625, -2.945220947265625, -2.821044921875, -2.696868896484375, -2.57269287109375, -2.448516845703125, -2.3243408203125, -2.200164794921875, -2.07598876953125, -1.951812744140625, -1.82763671875, -1.703460693359375, -1.57928466796875, -1.455108642578125, -1.3309326171875, -1.206756591796875, -1.08258056640625, -0.958404541015625, -0.834228515625, -0.710052490234375, -0.58587646484375, -0.461700439453125, -0.3375244140625, -0.213348388671875, -0.08917236328125, 0.035003662109375, 0.1591796875, 0.283355712890625, 0.40753173828125, 0.531707763671875, 0.6558837890625, 0.780059814453125, 0.90423583984375, 1.028411865234375, 1.152587890625, 1.276763916015625, 1.40093994140625, 1.525115966796875, 1.6492919921875, 1.773468017578125, 1.89764404296875, 2.021820068359375, 2.14599609375, 2.270172119140625, 2.39434814453125, 2.518524169921875, 2.6427001953125, 2.766876220703125, 2.89105224609375, 3.015228271484375, 3.139404296875, 3.263580322265625, 3.38775634765625, 3.511932373046875, 3.6361083984375, 3.760284423828125, 3.88446044921875, 4.008636474609375, 4.1328125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 7.0, 9.0, 12.0, 21.0, 18.0, 37.0, 44.0, 76.0, 102.0, 145.0, 178.0, 259.0, 362.0, 516.0, 770.0, 1213.0, 1784.0, 2747.0, 4432.0, 7326.0, 12256.0, 21300.0, 38351.0, 73943.0, 167287.0, 381444.0, 167703.0, 74377.0, 38180.0, 21286.0, 12278.0, 7355.0, 4444.0, 2714.0, 1815.0, 1161.0, 759.0, 561.0, 377.0, 248.0, 194.0, 150.0, 78.0, 67.0, 45.0, 40.0, 24.0, 16.0, 12.0, 9.0, 7.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.17041015625, -0.16516685485839844, -0.15992355346679688, -0.1546802520751953, -0.14943695068359375, -0.1441936492919922, -0.13895034790039062, -0.13370704650878906, -0.1284637451171875, -0.12322044372558594, -0.11797714233398438, -0.11273384094238281, -0.10749053955078125, -0.10224723815917969, -0.09700393676757812, -0.09176063537597656, -0.086517333984375, -0.08127403259277344, -0.07603073120117188, -0.07078742980957031, -0.06554412841796875, -0.06030082702636719, -0.055057525634765625, -0.04981422424316406, -0.0445709228515625, -0.03932762145996094, -0.034084320068359375, -0.028841018676757812, -0.02359771728515625, -0.018354415893554688, -0.013111114501953125, -0.007867813110351562, -0.00262451171875, 0.0026187896728515625, 0.007862091064453125, 0.013105392456054688, 0.01834869384765625, 0.023591995239257812, 0.028835296630859375, 0.03407859802246094, 0.0393218994140625, 0.04456520080566406, 0.049808502197265625, 0.05505180358886719, 0.06029510498046875, 0.06553840637207031, 0.07078170776367188, 0.07602500915527344, 0.081268310546875, 0.08651161193847656, 0.09175491333007812, 0.09699821472167969, 0.10224151611328125, 0.10748481750488281, 0.11272811889648438, 0.11797142028808594, 0.1232147216796875, 0.12845802307128906, 0.13370132446289062, 0.1389446258544922, 0.14418792724609375, 0.1494312286376953, 0.15467453002929688, 0.15991783142089844, 0.1651611328125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 1.0, 4.0, 7.0, 5.0, 8.0, 11.0, 8.0, 9.0, 12.0, 19.0, 25.0, 25.0, 23.0, 21.0, 30.0, 28.0, 33.0, 31.0, 35.0, 35.0, 35.0, 24.0, 31.0, 47.0, 1059.0, 42.0, 35.0, 28.0, 45.0, 29.0, 32.0, 27.0, 34.0, 22.0, 15.0, 27.0, 19.0, 21.0, 12.0, 9.0, 13.0, 14.0, 4.0, 8.0, 8.0, 9.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-2.435546875, -2.3642578125, -2.29296875, -2.2216796875, -2.150390625, -2.0791015625, -2.0078125, -1.9365234375, -1.865234375, -1.7939453125, -1.72265625, -1.6513671875, -1.580078125, -1.5087890625, -1.4375, -1.3662109375, -1.294921875, -1.2236328125, -1.15234375, -1.0810546875, -1.009765625, -0.9384765625, -0.8671875, -0.7958984375, -0.724609375, -0.6533203125, -0.58203125, -0.5107421875, -0.439453125, -0.3681640625, -0.296875, -0.2255859375, -0.154296875, -0.0830078125, -0.01171875, 0.0595703125, 0.130859375, 0.2021484375, 0.2734375, 0.3447265625, 0.416015625, 0.4873046875, 0.55859375, 0.6298828125, 0.701171875, 0.7724609375, 0.84375, 0.9150390625, 0.986328125, 1.0576171875, 1.12890625, 1.2001953125, 1.271484375, 1.3427734375, 1.4140625, 1.4853515625, 1.556640625, 1.6279296875, 1.69921875, 1.7705078125, 1.841796875, 1.9130859375, 1.984375, 2.0556640625, 2.126953125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 1.0, 5.0, 13.0, 21.0, 27.0, 46.0, 56.0, 113.0, 170.0, 272.0, 440.0, 682.0, 1061.0, 1625.0, 2707.0, 4259.0, 6952.0, 11342.0, 18354.0, 30352.0, 50682.0, 89929.0, 185379.0, 1356142.0, 148150.0, 76623.0, 43434.0, 26301.0, 15918.0, 9888.0, 6123.0, 3728.0, 2366.0, 1442.0, 954.0, 577.0, 374.0, 204.0, 157.0, 98.0, 61.0, 29.0, 26.0, 19.0, 16.0, 9.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0931396484375, -0.09042930603027344, -0.08771896362304688, -0.08500862121582031, -0.08229827880859375, -0.07958793640136719, -0.07687759399414062, -0.07416725158691406, -0.0714569091796875, -0.06874656677246094, -0.06603622436523438, -0.06332588195800781, -0.06061553955078125, -0.05790519714355469, -0.055194854736328125, -0.05248451232910156, -0.049774169921875, -0.04706382751464844, -0.044353485107421875, -0.04164314270019531, -0.03893280029296875, -0.03622245788574219, -0.033512115478515625, -0.030801773071289062, -0.0280914306640625, -0.025381088256835938, -0.022670745849609375, -0.019960403442382812, -0.01725006103515625, -0.014539718627929688, -0.011829376220703125, -0.009119033813476562, -0.00640869140625, -0.0036983489990234375, -0.000988006591796875, 0.0017223358154296875, 0.00443267822265625, 0.0071430206298828125, 0.009853363037109375, 0.012563705444335938, 0.0152740478515625, 0.017984390258789062, 0.020694732666015625, 0.023405075073242188, 0.02611541748046875, 0.028825759887695312, 0.031536102294921875, 0.03424644470214844, 0.036956787109375, 0.03966712951660156, 0.042377471923828125, 0.04508781433105469, 0.04779815673828125, 0.05050849914550781, 0.053218841552734375, 0.05592918395996094, 0.0586395263671875, 0.06134986877441406, 0.06406021118164062, 0.06677055358886719, 0.06948089599609375, 0.07219123840332031, 0.07490158081054688, 0.07761192321777344, 0.080322265625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 13.0, 6.0, 8.0, 16.0, 20.0, 14.0, 29.0, 21.0, 38.0, 48.0, 38.0, 48.0, 51.0, 40.0, 43.0, 48.0, 54.0, 44.0, 53.0, 46.0, 46.0, 25.0, 30.0, 39.0, 30.0, 20.0, 23.0, 14.0, 12.0, 19.0, 15.0, 7.0, 9.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.629922866821289e-05, -3.520585596561432e-05, -3.411248326301575e-05, -3.3019110560417175e-05, -3.1925737857818604e-05, -3.083236515522003e-05, -2.973899245262146e-05, -2.8645619750022888e-05, -2.7552247047424316e-05, -2.6458874344825745e-05, -2.5365501642227173e-05, -2.42721289396286e-05, -2.317875623703003e-05, -2.2085383534431458e-05, -2.0992010831832886e-05, -1.9898638129234314e-05, -1.8805265426635742e-05, -1.771189272403717e-05, -1.66185200214386e-05, -1.5525147318840027e-05, -1.4431774616241455e-05, -1.3338401913642883e-05, -1.2245029211044312e-05, -1.115165650844574e-05, -1.0058283805847168e-05, -8.964911103248596e-06, -7.871538400650024e-06, -6.778165698051453e-06, -5.684792995452881e-06, -4.591420292854309e-06, -3.4980475902557373e-06, -2.4046748876571655e-06, -1.3113021850585938e-06, -2.1792948246002197e-07, 8.754432201385498e-07, 1.9688159227371216e-06, 3.0621886253356934e-06, 4.155561327934265e-06, 5.248934030532837e-06, 6.342306733131409e-06, 7.4356794357299805e-06, 8.529052138328552e-06, 9.622424840927124e-06, 1.0715797543525696e-05, 1.1809170246124268e-05, 1.290254294872284e-05, 1.3995915651321411e-05, 1.5089288353919983e-05, 1.6182661056518555e-05, 1.7276033759117126e-05, 1.8369406461715698e-05, 1.946277916431427e-05, 2.0556151866912842e-05, 2.1649524569511414e-05, 2.2742897272109985e-05, 2.3836269974708557e-05, 2.492964267730713e-05, 2.60230153799057e-05, 2.7116388082504272e-05, 2.8209760785102844e-05, 2.9303133487701416e-05, 3.0396506190299988e-05, 3.148987889289856e-05, 3.258325159549713e-05, 3.36766242980957e-05]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 6.0, 10.0, 4.0, 8.0, 7.0, 10.0, 12.0, 16.0, 25.0, 34.0, 33.0, 50.0, 49.0, 59.0, 80.0, 110.0, 104.0, 136.0, 140.0, 175.0, 331.0, 2120.0, 193166.0, 838969.0, 11151.0, 578.0, 207.0, 172.0, 123.0, 98.0, 92.0, 89.0, 58.0, 62.0, 46.0, 49.0, 50.0, 21.0, 26.0, 23.0, 11.0, 15.0, 9.0, 2.0, 5.0, 4.0, 2.0, 5.0, 3.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005736351013183594, -0.0005552619695663452, -0.0005368888378143311, -0.0005185157060623169, -0.0005001425743103027, -0.0004817694425582886, -0.0004633963108062744, -0.00044502317905426025, -0.0004266500473022461, -0.00040827691555023193, -0.0003899037837982178, -0.0003715306520462036, -0.00035315752029418945, -0.0003347843885421753, -0.00031641125679016113, -0.00029803812503814697, -0.0002796649932861328, -0.00026129186153411865, -0.0002429187297821045, -0.00022454559803009033, -0.00020617246627807617, -0.000187799334526062, -0.00016942620277404785, -0.0001510530710220337, -0.00013267993927001953, -0.00011430680751800537, -9.593367576599121e-05, -7.756054401397705e-05, -5.918741226196289e-05, -4.081428050994873e-05, -2.244114875793457e-05, -4.06801700592041e-06, 1.430511474609375e-05, 3.267824649810791e-05, 5.105137825012207e-05, 6.942451000213623e-05, 8.779764175415039e-05, 0.00010617077350616455, 0.0001245439052581787, 0.00014291703701019287, 0.00016129016876220703, 0.0001796633005142212, 0.00019803643226623535, 0.0002164095640182495, 0.00023478269577026367, 0.00025315582752227783, 0.000271528959274292, 0.00028990209102630615, 0.0003082752227783203, 0.00032664835453033447, 0.00034502148628234863, 0.0003633946180343628, 0.00038176774978637695, 0.0004001408815383911, 0.0004185140132904053, 0.00043688714504241943, 0.0004552602767944336, 0.00047363340854644775, 0.0004920065402984619, 0.0005103796720504761, 0.0005287528038024902, 0.0005471259355545044, 0.0005654990673065186, 0.0005838721990585327, 0.0006022453308105469]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 23.0, 37.0, 130.0, 315.0, 326.0, 127.0, 42.0, 8.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.350548210320994e-05, -5.9986017731716856e-05, -5.646655336022377e-05, -5.2947088988730684e-05, -4.94276246172376e-05, -4.590816024574451e-05, -4.2388695874251425e-05, -3.886923150275834e-05, -3.534976713126525e-05, -3.1830302759772167e-05, -2.831083838827908e-05, -2.4791374016785994e-05, -2.1271909645292908e-05, -1.7752445273799822e-05, -1.4232980902306736e-05, -1.071351653081365e-05, -7.194052159320563e-06, -3.674587787827477e-06, -1.5512341633439064e-07, 3.3643409551586956e-06, 6.883805326651782e-06, 1.0403269698144868e-05, 1.3922734069637954e-05, 1.744219844113104e-05, 2.0961662812624127e-05, 2.4481127184117213e-05, 2.80005915556103e-05, 3.1520055927103385e-05, 3.503952029859647e-05, 3.855898467008956e-05, 4.2078449041582644e-05, 4.559791341307573e-05, 4.911738506052643e-05, 5.263684943201952e-05, 5.61563138035126e-05, 5.967577817500569e-05, 6.319524254649878e-05, 6.671471055597067e-05, 7.023417128948495e-05, 7.375363202299923e-05, 7.727310003247112e-05, 8.079256804194301e-05, 8.431202877545729e-05, 8.783148950897157e-05, 9.135095751844347e-05, 9.487042552791536e-05, 9.838988626142964e-05, 0.00010190934699494392, 0.00010542881500441581, 0.0001089482830138877, 0.00011246774374740198, 0.00011598720448091626, 0.00011950667249038815, 0.00012302614049986005, 0.00012654560850933194, 0.0001300650619668886, 0.0001335845299763605, 0.0001371039979858324, 0.00014062345144338906, 0.00014414291945286095, 0.00014766238746233284, 0.00015118185547180474, 0.00015470132348127663, 0.0001582207769388333, 0.0001617402449483052]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 7.0, 9.0, 17.0, 24.0, 27.0, 31.0, 35.0, 41.0, 33.0, 43.0, 47.0, 44.0, 49.0, 71.0, 54.0, 55.0, 53.0, 45.0, 40.0, 41.0, 50.0, 36.0, 29.0, 29.0, 23.0, 15.0, 12.0, 7.0, 9.0, 3.0, 4.0, 2.0, 3.0, 5.0, 0.0, 4.0], "bins": [-4.178285598754883e-05, -4.078727215528488e-05, -3.9791688323020935e-05, -3.879610449075699e-05, -3.780052065849304e-05, -3.6804936826229095e-05, -3.580935299396515e-05, -3.48137691617012e-05, -3.3818185329437256e-05, -3.282260149717331e-05, -3.182701766490936e-05, -3.0831433832645416e-05, -2.983585000038147e-05, -2.8840266168117523e-05, -2.7844682335853577e-05, -2.684909850358963e-05, -2.5853514671325684e-05, -2.4857930839061737e-05, -2.386234700679779e-05, -2.2866763174533844e-05, -2.1871179342269897e-05, -2.087559551000595e-05, -1.9880011677742004e-05, -1.8884427845478058e-05, -1.788884401321411e-05, -1.6893260180950165e-05, -1.5897676348686218e-05, -1.4902092516422272e-05, -1.3906508684158325e-05, -1.2910924851894379e-05, -1.1915341019630432e-05, -1.0919757187366486e-05, -9.924173355102539e-06, -8.928589522838593e-06, -7.933005690574646e-06, -6.9374218583106995e-06, -5.941838026046753e-06, -4.946254193782806e-06, -3.95067036151886e-06, -2.9550865292549133e-06, -1.959502696990967e-06, -9.639188647270203e-07, 3.166496753692627e-08, 1.0272487998008728e-06, 2.0228326320648193e-06, 3.018416464328766e-06, 4.014000296592712e-06, 5.009584128856659e-06, 6.0051679611206055e-06, 7.000751793384552e-06, 7.996335625648499e-06, 8.991919457912445e-06, 9.987503290176392e-06, 1.0983087122440338e-05, 1.1978670954704285e-05, 1.2974254786968231e-05, 1.3969838619232178e-05, 1.4965422451496124e-05, 1.596100628376007e-05, 1.6956590116024017e-05, 1.7952173948287964e-05, 1.894775778055191e-05, 1.9943341612815857e-05, 2.0938925445079803e-05, 2.193450927734375e-05]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 2.0, 3.0, 3.0, 4.0, 15.0, 19.0, 22.0, 22.0, 31.0, 37.0, 40.0, 40.0, 42.0, 54.0, 54.0, 51.0, 63.0, 59.0, 57.0, 48.0, 52.0, 59.0, 37.0, 35.0, 26.0, 29.0, 12.0, 19.0, 15.0, 10.0, 10.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.814453125, -3.690277099609375, -3.56610107421875, -3.441925048828125, -3.3177490234375, -3.193572998046875, -3.06939697265625, -2.945220947265625, -2.821044921875, -2.696868896484375, -2.57269287109375, -2.448516845703125, -2.3243408203125, -2.200164794921875, -2.07598876953125, -1.951812744140625, -1.82763671875, -1.703460693359375, -1.57928466796875, -1.455108642578125, -1.3309326171875, -1.206756591796875, -1.08258056640625, -0.958404541015625, -0.834228515625, -0.710052490234375, -0.58587646484375, -0.461700439453125, -0.3375244140625, -0.213348388671875, -0.08917236328125, 0.035003662109375, 0.1591796875, 0.283355712890625, 0.40753173828125, 0.531707763671875, 0.6558837890625, 0.780059814453125, 0.90423583984375, 1.028411865234375, 1.152587890625, 1.276763916015625, 1.40093994140625, 1.525115966796875, 1.6492919921875, 1.773468017578125, 1.89764404296875, 2.021820068359375, 2.14599609375, 2.270172119140625, 2.39434814453125, 2.518524169921875, 2.6427001953125, 2.766876220703125, 2.89105224609375, 3.015228271484375, 3.139404296875, 3.263580322265625, 3.38775634765625, 3.511932373046875, 3.6361083984375, 3.760284423828125, 3.88446044921875, 4.008636474609375, 4.1328125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 14.0, 19.0, 10.0, 14.0, 32.0, 36.0, 66.0, 107.0, 128.0, 261.0, 394.0, 692.0, 1155.0, 1950.0, 3639.0, 7437.0, 16537.0, 44904.0, 163382.0, 547517.0, 177570.0, 48302.0, 17704.0, 7744.0, 3960.0, 2047.0, 1081.0, 674.0, 399.0, 270.0, 150.0, 123.0, 76.0, 50.0, 33.0, 20.0, 7.0, 15.0, 6.0, 6.0, 0.0, 1.0, 3.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.734375, -3.612060546875, -3.48974609375, -3.367431640625, -3.2451171875, -3.122802734375, -3.00048828125, -2.878173828125, -2.755859375, -2.633544921875, -2.51123046875, -2.388916015625, -2.2666015625, -2.144287109375, -2.02197265625, -1.899658203125, -1.77734375, -1.655029296875, -1.53271484375, -1.410400390625, -1.2880859375, -1.165771484375, -1.04345703125, -0.921142578125, -0.798828125, -0.676513671875, -0.55419921875, -0.431884765625, -0.3095703125, -0.187255859375, -0.06494140625, 0.057373046875, 0.1796875, 0.302001953125, 0.42431640625, 0.546630859375, 0.6689453125, 0.791259765625, 0.91357421875, 1.035888671875, 1.158203125, 1.280517578125, 1.40283203125, 1.525146484375, 1.6474609375, 1.769775390625, 1.89208984375, 2.014404296875, 2.13671875, 2.259033203125, 2.38134765625, 2.503662109375, 2.6259765625, 2.748291015625, 2.87060546875, 2.992919921875, 3.115234375, 3.237548828125, 3.35986328125, 3.482177734375, 3.6044921875, 3.726806640625, 3.84912109375, 3.971435546875, 4.09375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 6.0, 6.0, 7.0, 9.0, 10.0, 13.0, 13.0, 18.0, 19.0, 19.0, 29.0, 37.0, 31.0, 33.0, 39.0, 49.0, 46.0, 60.0, 126.0, 1810.0, 172.0, 76.0, 50.0, 54.0, 43.0, 36.0, 42.0, 28.0, 22.0, 22.0, 22.0, 28.0, 16.0, 15.0, 8.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.5234375, -13.14306640625, -12.7626953125, -12.38232421875, -12.001953125, -11.62158203125, -11.2412109375, -10.86083984375, -10.48046875, -10.10009765625, -9.7197265625, -9.33935546875, -8.958984375, -8.57861328125, -8.1982421875, -7.81787109375, -7.4375, -7.05712890625, -6.6767578125, -6.29638671875, -5.916015625, -5.53564453125, -5.1552734375, -4.77490234375, -4.39453125, -4.01416015625, -3.6337890625, -3.25341796875, -2.873046875, -2.49267578125, -2.1123046875, -1.73193359375, -1.3515625, -0.97119140625, -0.5908203125, -0.21044921875, 0.169921875, 0.55029296875, 0.9306640625, 1.31103515625, 1.69140625, 2.07177734375, 2.4521484375, 2.83251953125, 3.212890625, 3.59326171875, 3.9736328125, 4.35400390625, 4.734375, 5.11474609375, 5.4951171875, 5.87548828125, 6.255859375, 6.63623046875, 7.0166015625, 7.39697265625, 7.77734375, 8.15771484375, 8.5380859375, 8.91845703125, 9.298828125, 9.67919921875, 10.0595703125, 10.43994140625, 10.8203125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 11.0, 13.0, 13.0, 28.0, 23.0, 22.0, 24.0, 39.0, 48.0, 61.0, 90.0, 170.0, 315.0, 968.0, 8565.0, 3025223.0, 106440.0, 2382.0, 527.0, 225.0, 120.0, 72.0, 55.0, 50.0, 37.0, 30.0, 18.0, 18.0, 20.0, 11.0, 15.0, 7.0, 7.0, 7.0, 8.0, 4.0, 8.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.921875, -21.102783203125, -20.28369140625, -19.464599609375, -18.6455078125, -17.826416015625, -17.00732421875, -16.188232421875, -15.369140625, -14.550048828125, -13.73095703125, -12.911865234375, -12.0927734375, -11.273681640625, -10.45458984375, -9.635498046875, -8.81640625, -7.997314453125, -7.17822265625, -6.359130859375, -5.5400390625, -4.720947265625, -3.90185546875, -3.082763671875, -2.263671875, -1.444580078125, -0.62548828125, 0.193603515625, 1.0126953125, 1.831787109375, 2.65087890625, 3.469970703125, 4.2890625, 5.108154296875, 5.92724609375, 6.746337890625, 7.5654296875, 8.384521484375, 9.20361328125, 10.022705078125, 10.841796875, 11.660888671875, 12.47998046875, 13.299072265625, 14.1181640625, 14.937255859375, 15.75634765625, 16.575439453125, 17.39453125, 18.213623046875, 19.03271484375, 19.851806640625, 20.6708984375, 21.489990234375, 22.30908203125, 23.128173828125, 23.947265625, 24.766357421875, 25.58544921875, 26.404541015625, 27.2236328125, 28.042724609375, 28.86181640625, 29.680908203125, 30.5]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [3.0, 96.0, 917.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.43546199798584, -6.46983528137207, -1.5042085647583008, 3.4614181518554688, 8.427044868469238, 13.392670631408691, 18.358299255371094, 23.323925018310547, 28.28955078125, 33.25517654418945, 38.220802307128906, 43.186431884765625, 48.15205764770508, 53.11768341064453, 58.08331298828125, 63.0489387512207, 68.01456451416016, 72.98019409179688, 77.94581604003906, 82.91144561767578, 87.8770751953125, 92.84269714355469, 97.8083267211914, 102.77395629882812, 107.73957824707031, 112.70520782470703, 117.67082977294922, 122.63645935058594, 127.60208129882812, 132.56771850585938, 137.53334045410156, 142.49896240234375, 147.464599609375, 152.4302215576172, 157.39585876464844, 162.36148071289062, 167.3271026611328, 172.292724609375, 177.25836181640625, 182.22398376464844, 187.18960571289062, 192.1552276611328, 197.12086486816406, 202.08648681640625, 207.05210876464844, 212.01773071289062, 216.98336791992188, 221.94898986816406, 226.9146270751953, 231.8802490234375, 236.84588623046875, 241.81150817871094, 246.77713012695312, 251.74276733398438, 256.7083740234375, 261.67401123046875, 266.6396484375, 271.60528564453125, 276.5708923339844, 281.5365295410156, 286.5021667480469, 291.4677734375, 296.43341064453125, 301.3990478515625, 306.3646545410156]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 3.0, 7.0, 16.0, 14.0, 10.0, 15.0, 21.0, 28.0, 24.0, 31.0, 32.0, 31.0, 43.0, 49.0, 32.0, 49.0, 33.0, 51.0, 43.0, 37.0, 45.0, 46.0, 51.0, 34.0, 38.0, 34.0, 29.0, 32.0, 15.0, 19.0, 15.0, 23.0, 13.0, 6.0, 6.0, 3.0, 4.0, 0.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.51384735107422, -37.267852783203125, -36.0218620300293, -34.77587127685547, -33.529876708984375, -32.28388214111328, -31.037891387939453, -29.791898727416992, -28.54590606689453, -27.29991340637207, -26.05392074584961, -24.80792808532715, -23.561935424804688, -22.315942764282227, -21.069950103759766, -19.823957443237305, -18.577964782714844, -17.331972122192383, -16.085979461669922, -14.839986801147461, -13.593994140625, -12.348001480102539, -11.102008819580078, -9.856016159057617, -8.610023498535156, -7.364030838012695, -6.118038177490234, -4.872045516967773, -3.6260528564453125, -2.3800601959228516, -1.1340675354003906, 0.11192512512207031, 1.3579216003417969, 2.603914260864258, 3.8499069213867188, 5.09589958190918, 6.341892242431641, 7.587884902954102, 8.833877563476562, 10.079870223999023, 11.325862884521484, 12.571855545043945, 13.817848205566406, 15.063840866088867, 16.309833526611328, 17.55582618713379, 18.80181884765625, 20.04781150817871, 21.293804168701172, 22.539796829223633, 23.785789489746094, 25.031782150268555, 26.277774810791016, 27.523767471313477, 28.769760131835938, 30.0157527923584, 31.26174545288086, 32.50773620605469, 33.75373077392578, 34.999725341796875, 36.2457160949707, 37.49170684814453, 38.737701416015625, 39.98369598388672, 41.22968673706055]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 2.0, 5.0, 2.0, 2.0, 5.0, 4.0, 14.0, 19.0, 22.0, 24.0, 30.0, 33.0, 34.0, 51.0, 38.0, 49.0, 57.0, 52.0, 55.0, 65.0, 55.0, 46.0, 60.0, 50.0, 45.0, 31.0, 31.0, 24.0, 17.0, 21.0, 11.0, 12.0, 10.0, 5.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.853515625, -3.728424072265625, -3.60333251953125, -3.478240966796875, -3.3531494140625, -3.228057861328125, -3.10296630859375, -2.977874755859375, -2.852783203125, -2.727691650390625, -2.60260009765625, -2.477508544921875, -2.3524169921875, -2.227325439453125, -2.10223388671875, -1.977142333984375, -1.85205078125, -1.726959228515625, -1.60186767578125, -1.476776123046875, -1.3516845703125, -1.226593017578125, -1.10150146484375, -0.976409912109375, -0.851318359375, -0.726226806640625, -0.60113525390625, -0.476043701171875, -0.3509521484375, -0.225860595703125, -0.10076904296875, 0.024322509765625, 0.1494140625, 0.274505615234375, 0.39959716796875, 0.524688720703125, 0.6497802734375, 0.774871826171875, 0.89996337890625, 1.025054931640625, 1.150146484375, 1.275238037109375, 1.40032958984375, 1.525421142578125, 1.6505126953125, 1.775604248046875, 1.90069580078125, 2.025787353515625, 2.15087890625, 2.275970458984375, 2.40106201171875, 2.526153564453125, 2.6512451171875, 2.776336669921875, 2.90142822265625, 3.026519775390625, 3.151611328125, 3.276702880859375, 3.40179443359375, 3.526885986328125, 3.6519775390625, 3.777069091796875, 3.90216064453125, 4.027252197265625, 4.15234375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 8.0, 12.0, 12.0, 21.0, 20.0, 24.0, 60.0, 70.0, 132.0, 220.0, 346.0, 673.0, 1483.0, 4891.0, 46422.0, 3867666.0, 257849.0, 10115.0, 2146.0, 954.0, 475.0, 251.0, 160.0, 101.0, 46.0, 45.0, 23.0, 20.0, 9.0, 7.0, 5.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.46875, -33.446044921875, -32.42333984375, -31.400634765625, -30.3779296875, -29.355224609375, -28.33251953125, -27.309814453125, -26.287109375, -25.264404296875, -24.24169921875, -23.218994140625, -22.1962890625, -21.173583984375, -20.15087890625, -19.128173828125, -18.10546875, -17.082763671875, -16.06005859375, -15.037353515625, -14.0146484375, -12.991943359375, -11.96923828125, -10.946533203125, -9.923828125, -8.901123046875, -7.87841796875, -6.855712890625, -5.8330078125, -4.810302734375, -3.78759765625, -2.764892578125, -1.7421875, -0.719482421875, 0.30322265625, 1.325927734375, 2.3486328125, 3.371337890625, 4.39404296875, 5.416748046875, 6.439453125, 7.462158203125, 8.48486328125, 9.507568359375, 10.5302734375, 11.552978515625, 12.57568359375, 13.598388671875, 14.62109375, 15.643798828125, 16.66650390625, 17.689208984375, 18.7119140625, 19.734619140625, 20.75732421875, 21.780029296875, 22.802734375, 23.825439453125, 24.84814453125, 25.870849609375, 26.8935546875, 27.916259765625, 28.93896484375, 29.961669921875, 30.984375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 5.0, 5.0, 11.0, 15.0, 18.0, 20.0, 37.0, 45.0, 53.0, 58.0, 101.0, 131.0, 196.0, 259.0, 342.0, 477.0, 597.0, 405.0, 347.0, 242.0, 161.0, 127.0, 98.0, 87.0, 60.0, 38.0, 26.0, 24.0, 22.0, 11.0, 12.0, 5.0, 10.0, 10.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.890625, -9.5948486328125, -9.299072265625, -9.0032958984375, -8.70751953125, -8.4117431640625, -8.115966796875, -7.8201904296875, -7.5244140625, -7.2286376953125, -6.932861328125, -6.6370849609375, -6.34130859375, -6.0455322265625, -5.749755859375, -5.4539794921875, -5.158203125, -4.8624267578125, -4.566650390625, -4.2708740234375, -3.97509765625, -3.6793212890625, -3.383544921875, -3.0877685546875, -2.7919921875, -2.4962158203125, -2.200439453125, -1.9046630859375, -1.60888671875, -1.3131103515625, -1.017333984375, -0.7215576171875, -0.42578125, -0.1300048828125, 0.165771484375, 0.4615478515625, 0.75732421875, 1.0531005859375, 1.348876953125, 1.6446533203125, 1.9404296875, 2.2362060546875, 2.531982421875, 2.8277587890625, 3.12353515625, 3.4193115234375, 3.715087890625, 4.0108642578125, 4.306640625, 4.6024169921875, 4.898193359375, 5.1939697265625, 5.48974609375, 5.7855224609375, 6.081298828125, 6.3770751953125, 6.6728515625, 6.9686279296875, 7.264404296875, 7.5601806640625, 7.85595703125, 8.1517333984375, 8.447509765625, 8.7432861328125, 9.0390625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 7.0, 7.0, 10.0, 11.0, 20.0, 35.0, 53.0, 63.0, 110.0, 153.0, 277.0, 463.0, 782.0, 1347.0, 2513.0, 5393.0, 12594.0, 34346.0, 119232.0, 649131.0, 2726503.0, 492161.0, 98073.0, 29513.0, 11190.0, 4877.0, 2387.0, 1224.0, 723.0, 406.0, 259.0, 145.0, 88.0, 67.0, 38.0, 30.0, 13.0, 15.0, 5.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.09375, -17.5682373046875, -17.042724609375, -16.5172119140625, -15.99169921875, -15.4661865234375, -14.940673828125, -14.4151611328125, -13.8896484375, -13.3641357421875, -12.838623046875, -12.3131103515625, -11.78759765625, -11.2620849609375, -10.736572265625, -10.2110595703125, -9.685546875, -9.1600341796875, -8.634521484375, -8.1090087890625, -7.58349609375, -7.0579833984375, -6.532470703125, -6.0069580078125, -5.4814453125, -4.9559326171875, -4.430419921875, -3.9049072265625, -3.37939453125, -2.8538818359375, -2.328369140625, -1.8028564453125, -1.27734375, -0.7518310546875, -0.226318359375, 0.2991943359375, 0.82470703125, 1.3502197265625, 1.875732421875, 2.4012451171875, 2.9267578125, 3.4522705078125, 3.977783203125, 4.5032958984375, 5.02880859375, 5.5543212890625, 6.079833984375, 6.6053466796875, 7.130859375, 7.6563720703125, 8.181884765625, 8.7073974609375, 9.23291015625, 9.7584228515625, 10.283935546875, 10.8094482421875, 11.3349609375, 11.8604736328125, 12.385986328125, 12.9114990234375, 13.43701171875, 13.9625244140625, 14.488037109375, 15.0135498046875, 15.5390625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 9.0, 17.0, 23.0, 24.0, 24.0, 50.0, 57.0, 63.0, 72.0, 89.0, 84.0, 84.0, 61.0, 57.0, 73.0, 45.0, 38.0, 24.0, 29.0, 15.0, 8.0, 10.0, 16.0, 7.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.29800796508789, -47.07801818847656, -45.858028411865234, -44.638038635253906, -43.41804885864258, -42.19805908203125, -40.97806930541992, -39.758079528808594, -38.538089752197266, -37.31809997558594, -36.09811019897461, -34.87812042236328, -33.65813064575195, -32.438140869140625, -31.218151092529297, -29.99816131591797, -28.778169631958008, -27.55817985534668, -26.33819007873535, -25.118200302124023, -23.898210525512695, -22.678220748901367, -21.458229064941406, -20.238239288330078, -19.01824951171875, -17.798259735107422, -16.578269958496094, -15.358280181884766, -14.138290405273438, -12.91830062866211, -11.698309898376465, -10.478320121765137, -9.258329391479492, -8.038339614868164, -6.818349838256836, -5.59835958480835, -4.3783698081970215, -3.1583800315856934, -1.938389778137207, -0.7184000015258789, 0.5015897750854492, 1.721579670906067, 2.9415695667266846, 4.161559581756592, 5.38154935836792, 6.601539134979248, 7.821529388427734, 9.041519165039062, 10.26150894165039, 11.481498718261719, 12.701488494873047, 13.921478271484375, 15.141468048095703, 16.36145782470703, 17.58144760131836, 18.801437377929688, 20.021427154541016, 21.241416931152344, 22.461406707763672, 23.681396484375, 24.901386260986328, 26.121376037597656, 27.341365814208984, 28.561355590820312, 29.781347274780273]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 2.0, 3.0, 10.0, 10.0, 14.0, 12.0, 13.0, 18.0, 18.0, 18.0, 27.0, 27.0, 25.0, 32.0, 40.0, 53.0, 39.0, 34.0, 52.0, 36.0, 44.0, 44.0, 41.0, 34.0, 34.0, 43.0, 43.0, 32.0, 35.0, 34.0, 19.0, 19.0, 19.0, 18.0, 9.0, 5.0, 7.0, 8.0, 14.0, 4.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.27893829345703, -34.19860076904297, -33.118263244628906, -32.03792953491211, -30.957592010498047, -29.877254486083984, -28.796918869018555, -27.716583251953125, -26.636245727539062, -25.555908203125, -24.47557258605957, -23.39523696899414, -22.314899444580078, -21.234561920166016, -20.154226303100586, -19.073890686035156, -17.993553161621094, -16.91321563720703, -15.832880020141602, -14.752543449401855, -13.67220687866211, -12.591870307922363, -11.511533737182617, -10.431197166442871, -9.350860595703125, -8.270524024963379, -7.190187454223633, -6.109850883483887, -5.029514312744141, -3.9491777420043945, -2.8688411712646484, -1.7885046005249023, -0.7081718444824219, 0.3721647262573242, 1.4525012969970703, 2.5328378677368164, 3.6131744384765625, 4.693511009216309, 5.773847579956055, 6.854184150695801, 7.934520721435547, 9.014857292175293, 10.095193862915039, 11.175530433654785, 12.255867004394531, 13.336203575134277, 14.416540145874023, 15.49687671661377, 16.577213287353516, 17.657550811767578, 18.737886428833008, 19.818222045898438, 20.8985595703125, 21.978897094726562, 23.059232711791992, 24.139568328857422, 25.219905853271484, 26.300243377685547, 27.380578994750977, 28.460914611816406, 29.54125213623047, 30.62158966064453, 31.70192527770996, 32.78226089477539, 33.86259841918945]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 5.0, 2.0, 13.0, 14.0, 13.0, 13.0, 23.0, 26.0, 35.0, 30.0, 45.0, 63.0, 48.0, 47.0, 54.0, 47.0, 43.0, 54.0, 49.0, 61.0, 51.0, 50.0, 43.0, 36.0, 32.0, 22.0, 15.0, 15.0, 10.0, 10.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0078125, -3.87908935546875, -3.7503662109375, -3.62164306640625, -3.492919921875, -3.36419677734375, -3.2354736328125, -3.10675048828125, -2.97802734375, -2.84930419921875, -2.7205810546875, -2.59185791015625, -2.463134765625, -2.33441162109375, -2.2056884765625, -2.07696533203125, -1.9482421875, -1.81951904296875, -1.6907958984375, -1.56207275390625, -1.433349609375, -1.30462646484375, -1.1759033203125, -1.04718017578125, -0.91845703125, -0.78973388671875, -0.6610107421875, -0.53228759765625, -0.403564453125, -0.27484130859375, -0.1461181640625, -0.01739501953125, 0.111328125, 0.24005126953125, 0.3687744140625, 0.49749755859375, 0.626220703125, 0.75494384765625, 0.8836669921875, 1.01239013671875, 1.14111328125, 1.26983642578125, 1.3985595703125, 1.52728271484375, 1.656005859375, 1.78472900390625, 1.9134521484375, 2.04217529296875, 2.1708984375, 2.29962158203125, 2.4283447265625, 2.55706787109375, 2.685791015625, 2.81451416015625, 2.9432373046875, 3.07196044921875, 3.20068359375, 3.32940673828125, 3.4581298828125, 3.58685302734375, 3.715576171875, 3.84429931640625, 3.9730224609375, 4.10174560546875, 4.23046875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 6.0, 10.0, 10.0, 12.0, 14.0, 29.0, 23.0, 39.0, 58.0, 91.0, 123.0, 179.0, 226.0, 356.0, 485.0, 666.0, 997.0, 1523.0, 2328.0, 3473.0, 5645.0, 9071.0, 14842.0, 26161.0, 46669.0, 89180.0, 193891.0, 326692.0, 153572.0, 74716.0, 39622.0, 22377.0, 13117.0, 7870.0, 4935.0, 3119.0, 2084.0, 1357.0, 929.0, 636.0, 420.0, 272.0, 220.0, 144.0, 93.0, 78.0, 59.0, 43.0, 30.0, 19.0, 23.0, 13.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0], "bins": [-0.14599609375, -0.14148521423339844, -0.13697433471679688, -0.1324634552001953, -0.12795257568359375, -0.12344169616699219, -0.11893081665039062, -0.11441993713378906, -0.1099090576171875, -0.10539817810058594, -0.10088729858398438, -0.09637641906738281, -0.09186553955078125, -0.08735466003417969, -0.08284378051757812, -0.07833290100097656, -0.073822021484375, -0.06931114196777344, -0.06480026245117188, -0.06028938293457031, -0.05577850341796875, -0.05126762390136719, -0.046756744384765625, -0.04224586486816406, -0.0377349853515625, -0.03322410583496094, -0.028713226318359375, -0.024202346801757812, -0.01969146728515625, -0.015180587768554688, -0.010669708251953125, -0.0061588287353515625, -0.00164794921875, 0.0028629302978515625, 0.007373809814453125, 0.011884689331054688, 0.01639556884765625, 0.020906448364257812, 0.025417327880859375, 0.029928207397460938, 0.0344390869140625, 0.03894996643066406, 0.043460845947265625, 0.04797172546386719, 0.05248260498046875, 0.05699348449707031, 0.061504364013671875, 0.06601524353027344, 0.070526123046875, 0.07503700256347656, 0.07954788208007812, 0.08405876159667969, 0.08856964111328125, 0.09308052062988281, 0.09759140014648438, 0.10210227966308594, 0.1066131591796875, 0.11112403869628906, 0.11563491821289062, 0.12014579772949219, 0.12465667724609375, 0.1291675567626953, 0.13367843627929688, 0.13818931579589844, 0.1427001953125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 10.0, 7.0, 4.0, 5.0, 3.0, 10.0, 17.0, 10.0, 17.0, 16.0, 19.0, 28.0, 28.0, 24.0, 28.0, 25.0, 30.0, 29.0, 34.0, 34.0, 40.0, 36.0, 40.0, 1062.0, 34.0, 35.0, 35.0, 38.0, 32.0, 37.0, 18.0, 34.0, 27.0, 30.0, 28.0, 20.0, 20.0, 14.0, 8.0, 12.0, 11.0, 9.0, 7.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0], "bins": [-2.537109375, -2.462982177734375, -2.38885498046875, -2.314727783203125, -2.2406005859375, -2.166473388671875, -2.09234619140625, -2.018218994140625, -1.944091796875, -1.869964599609375, -1.79583740234375, -1.721710205078125, -1.6475830078125, -1.573455810546875, -1.49932861328125, -1.425201416015625, -1.35107421875, -1.276947021484375, -1.20281982421875, -1.128692626953125, -1.0545654296875, -0.980438232421875, -0.90631103515625, -0.832183837890625, -0.758056640625, -0.683929443359375, -0.60980224609375, -0.535675048828125, -0.4615478515625, -0.387420654296875, -0.31329345703125, -0.239166259765625, -0.1650390625, -0.090911865234375, -0.01678466796875, 0.057342529296875, 0.1314697265625, 0.205596923828125, 0.27972412109375, 0.353851318359375, 0.427978515625, 0.502105712890625, 0.57623291015625, 0.650360107421875, 0.7244873046875, 0.798614501953125, 0.87274169921875, 0.946868896484375, 1.02099609375, 1.095123291015625, 1.16925048828125, 1.243377685546875, 1.3175048828125, 1.391632080078125, 1.46575927734375, 1.539886474609375, 1.614013671875, 1.688140869140625, 1.76226806640625, 1.836395263671875, 1.9105224609375, 1.984649658203125, 2.05877685546875, 2.132904052734375, 2.20703125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 9.0, 10.0, 27.0, 31.0, 41.0, 61.0, 92.0, 168.0, 223.0, 355.0, 583.0, 873.0, 1236.0, 1945.0, 3136.0, 4818.0, 7752.0, 12431.0, 20251.0, 32867.0, 54987.0, 97655.0, 208681.0, 1337840.0, 133417.0, 69802.0, 41526.0, 25050.0, 15091.0, 9646.0, 5929.0, 3785.0, 2357.0, 1549.0, 957.0, 699.0, 427.0, 268.0, 208.0, 127.0, 76.0, 50.0, 31.0, 22.0, 24.0, 8.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 4.0], "bins": [-0.09344482421875, -0.0907144546508789, -0.08798408508300781, -0.08525371551513672, -0.08252334594726562, -0.07979297637939453, -0.07706260681152344, -0.07433223724365234, -0.07160186767578125, -0.06887149810791016, -0.06614112854003906, -0.06341075897216797, -0.060680389404296875, -0.05795001983642578, -0.05521965026855469, -0.052489280700683594, -0.0497589111328125, -0.047028541564941406, -0.04429817199707031, -0.04156780242919922, -0.038837432861328125, -0.03610706329345703, -0.03337669372558594, -0.030646324157714844, -0.02791595458984375, -0.025185585021972656, -0.022455215454101562, -0.01972484588623047, -0.016994476318359375, -0.014264106750488281, -0.011533737182617188, -0.008803367614746094, -0.006072998046875, -0.0033426284790039062, -0.0006122589111328125, 0.0021181106567382812, 0.004848480224609375, 0.007578849792480469, 0.010309219360351562, 0.013039588928222656, 0.01576995849609375, 0.018500328063964844, 0.021230697631835938, 0.02396106719970703, 0.026691436767578125, 0.02942180633544922, 0.03215217590332031, 0.034882545471191406, 0.0376129150390625, 0.040343284606933594, 0.04307365417480469, 0.04580402374267578, 0.048534393310546875, 0.05126476287841797, 0.05399513244628906, 0.056725502014160156, 0.05945587158203125, 0.062186241149902344, 0.06491661071777344, 0.06764698028564453, 0.07037734985351562, 0.07310771942138672, 0.07583808898925781, 0.0785684585571289, 0.081298828125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 4.0, 4.0, 3.0, 15.0, 13.0, 17.0, 17.0, 26.0, 27.0, 31.0, 36.0, 38.0, 35.0, 37.0, 42.0, 38.0, 63.0, 58.0, 52.0, 48.0, 46.0, 36.0, 48.0, 43.0, 32.0, 28.0, 28.0, 25.0, 22.0, 18.0, 16.0, 12.0, 7.0, 9.0, 2.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.24249267578125e-05, -3.144051879644394e-05, -3.045611083507538e-05, -2.9471702873706818e-05, -2.8487294912338257e-05, -2.7502886950969696e-05, -2.6518478989601135e-05, -2.5534071028232574e-05, -2.4549663066864014e-05, -2.3565255105495453e-05, -2.2580847144126892e-05, -2.159643918275833e-05, -2.061203122138977e-05, -1.962762326002121e-05, -1.864321529865265e-05, -1.7658807337284088e-05, -1.6674399375915527e-05, -1.5689991414546967e-05, -1.4705583453178406e-05, -1.3721175491809845e-05, -1.2736767530441284e-05, -1.1752359569072723e-05, -1.0767951607704163e-05, -9.783543646335602e-06, -8.799135684967041e-06, -7.81472772359848e-06, -6.8303197622299194e-06, -5.845911800861359e-06, -4.861503839492798e-06, -3.877095878124237e-06, -2.8926879167556763e-06, -1.9082799553871155e-06, -9.238719940185547e-07, 6.05359673500061e-08, 1.044943928718567e-06, 2.0293518900871277e-06, 3.0137598514556885e-06, 3.998167812824249e-06, 4.98257577419281e-06, 5.966983735561371e-06, 6.951391696929932e-06, 7.935799658298492e-06, 8.920207619667053e-06, 9.904615581035614e-06, 1.0889023542404175e-05, 1.1873431503772736e-05, 1.2857839465141296e-05, 1.3842247426509857e-05, 1.4826655387878418e-05, 1.581106334924698e-05, 1.679547131061554e-05, 1.77798792719841e-05, 1.876428723335266e-05, 1.9748695194721222e-05, 2.0733103156089783e-05, 2.1717511117458344e-05, 2.2701919078826904e-05, 2.3686327040195465e-05, 2.4670735001564026e-05, 2.5655142962932587e-05, 2.6639550924301147e-05, 2.7623958885669708e-05, 2.860836684703827e-05, 2.959277480840683e-05, 3.057718276977539e-05]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 7.0, 0.0, 8.0, 13.0, 8.0, 18.0, 17.0, 20.0, 30.0, 23.0, 35.0, 43.0, 52.0, 72.0, 93.0, 115.0, 132.0, 129.0, 205.0, 416.0, 1738.0, 28865.0, 682789.0, 321816.0, 9637.0, 979.0, 326.0, 181.0, 141.0, 112.0, 92.0, 81.0, 69.0, 70.0, 60.0, 37.0, 27.0, 13.0, 17.0, 12.0, 11.0, 14.0, 7.0, 4.0, 5.0, 1.0, 5.0, 1.0, 4.0, 5.0, 2.0, 2.0, 1.0], "bins": [-0.0004813671112060547, -0.00046714022755622864, -0.0004529133439064026, -0.00043868646025657654, -0.0004244595766067505, -0.00041023269295692444, -0.0003960058093070984, -0.00038177892565727234, -0.0003675520420074463, -0.00035332515835762024, -0.0003390982747077942, -0.00032487139105796814, -0.0003106445074081421, -0.00029641762375831604, -0.00028219074010849, -0.00026796385645866394, -0.0002537369728088379, -0.00023951008915901184, -0.0002252832055091858, -0.00021105632185935974, -0.0001968294382095337, -0.00018260255455970764, -0.0001683756709098816, -0.00015414878726005554, -0.0001399219036102295, -0.00012569501996040344, -0.00011146813631057739, -9.724125266075134e-05, -8.301436901092529e-05, -6.878748536109924e-05, -5.456060171127319e-05, -4.0333718061447144e-05, -2.6106834411621094e-05, -1.1879950761795044e-05, 2.346932888031006e-06, 1.6573816537857056e-05, 3.0800700187683105e-05, 4.5027583837509155e-05, 5.9254467487335205e-05, 7.348135113716125e-05, 8.77082347869873e-05, 0.00010193511843681335, 0.0001161620020866394, 0.00013038888573646545, 0.0001446157693862915, 0.00015884265303611755, 0.0001730695366859436, 0.00018729642033576965, 0.0002015233039855957, 0.00021575018763542175, 0.0002299770712852478, 0.00024420395493507385, 0.0002584308385848999, 0.00027265772223472595, 0.000286884605884552, 0.00030111148953437805, 0.0003153383731842041, 0.00032956525683403015, 0.0003437921404838562, 0.00035801902413368225, 0.0003722459077835083, 0.00038647279143333435, 0.0004006996750831604, 0.00041492655873298645, 0.0004291534423828125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 8.0, 50.0, 188.0, 383.0, 289.0, 76.0, 12.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.816213863203302e-05, -6.351246702251956e-05, -5.886279177502729e-05, -5.421312016551383e-05, -4.956344491802156e-05, -4.49137733085081e-05, -4.0264101698994637e-05, -3.561442645150237e-05, -3.0964754841988906e-05, -2.631508141348604e-05, -2.1665407984983176e-05, -1.7015736375469714e-05, -1.236606294696685e-05, -7.716389518463984e-06, -3.0667179089505225e-06, 1.5829573385417461e-06, 6.232628948055208e-06, 1.0882302376558073e-05, 1.5531975805060938e-05, 2.01816474145744e-05, 2.4831320843077265e-05, 2.948099427158013e-05, 3.413066588109359e-05, 3.878034112858586e-05, 4.343001273809932e-05, 4.807968434761278e-05, 5.272935959510505e-05, 5.7379031204618514e-05, 6.202870281413198e-05, 6.667837442364544e-05, 7.13280460331589e-05, 7.597772491862997e-05, 8.062738925218582e-05, 8.527706086169928e-05, 8.992673247121274e-05, 9.45764040807262e-05, 9.922608296619728e-05, 0.00010387575457571074, 0.0001085254261852242, 0.00011317510507069528, 0.00011782477668020874, 0.0001224744482897222, 0.00012712411989923567, 0.00013177379150874913, 0.0001364234631182626, 0.00014107313472777605, 0.00014572282088920474, 0.0001503724924987182, 0.00015502216410823166, 0.00015967183571774513, 0.0001643215073272586, 0.00016897117893677205, 0.0001736208505462855, 0.0001782705367077142, 0.00018292019376531243, 0.00018756987992674112, 0.00019221953698433936, 0.00019686920859385282, 0.00020151888020336628, 0.00020616855181287974, 0.0002108182234223932, 0.0002154679095838219, 0.00022011756664142013, 0.00022476725280284882, 0.00022941692441236228]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 4.0, 6.0, 5.0, 5.0, 7.0, 9.0, 11.0, 17.0, 10.0, 15.0, 21.0, 24.0, 43.0, 35.0, 35.0, 30.0, 31.0, 25.0, 33.0, 45.0, 44.0, 34.0, 50.0, 31.0, 42.0, 45.0, 37.0, 38.0, 35.0, 43.0, 23.0, 26.0, 23.0, 21.0, 12.0, 20.0, 15.0, 12.0, 9.0, 5.0, 6.0, 4.0, 6.0, 0.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.0265579223632812e-05, -1.968536525964737e-05, -1.9105151295661926e-05, -1.8524937331676483e-05, -1.794472336769104e-05, -1.7364509403705597e-05, -1.6784295439720154e-05, -1.620408147573471e-05, -1.5623867511749268e-05, -1.5043653547763824e-05, -1.4463439583778381e-05, -1.3883225619792938e-05, -1.3303011655807495e-05, -1.2722797691822052e-05, -1.2142583727836609e-05, -1.1562369763851166e-05, -1.0982155799865723e-05, -1.040194183588028e-05, -9.821727871894836e-06, -9.241513907909393e-06, -8.66129994392395e-06, -8.081085979938507e-06, -7.500872015953064e-06, -6.920658051967621e-06, -6.340444087982178e-06, -5.760230123996735e-06, -5.1800161600112915e-06, -4.599802196025848e-06, -4.019588232040405e-06, -3.439374268054962e-06, -2.859160304069519e-06, -2.278946340084076e-06, -1.6987323760986328e-06, -1.1185184121131897e-06, -5.383044481277466e-07, 4.190951585769653e-08, 6.221234798431396e-07, 1.2023374438285828e-06, 1.7825514078140259e-06, 2.362765371799469e-06, 2.942979335784912e-06, 3.5231932997703552e-06, 4.103407263755798e-06, 4.6836212277412415e-06, 5.2638351917266846e-06, 5.844049155712128e-06, 6.424263119697571e-06, 7.004477083683014e-06, 7.584691047668457e-06, 8.1649050116539e-06, 8.745118975639343e-06, 9.325332939624786e-06, 9.90554690361023e-06, 1.0485760867595673e-05, 1.1065974831581116e-05, 1.1646188795566559e-05, 1.2226402759552002e-05, 1.2806616723537445e-05, 1.3386830687522888e-05, 1.3967044651508331e-05, 1.4547258615493774e-05, 1.5127472579479218e-05, 1.570768654346466e-05, 1.6287900507450104e-05, 1.6868114471435547e-05]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 5.0, 2.0, 13.0, 14.0, 13.0, 13.0, 23.0, 26.0, 35.0, 30.0, 45.0, 63.0, 48.0, 47.0, 54.0, 47.0, 43.0, 54.0, 49.0, 61.0, 51.0, 50.0, 43.0, 36.0, 32.0, 22.0, 15.0, 15.0, 10.0, 10.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0078125, -3.87908935546875, -3.7503662109375, -3.62164306640625, -3.492919921875, -3.36419677734375, -3.2354736328125, -3.10675048828125, -2.97802734375, -2.84930419921875, -2.7205810546875, -2.59185791015625, -2.463134765625, -2.33441162109375, -2.2056884765625, -2.07696533203125, -1.9482421875, -1.81951904296875, -1.6907958984375, -1.56207275390625, -1.433349609375, -1.30462646484375, -1.1759033203125, -1.04718017578125, -0.91845703125, -0.78973388671875, -0.6610107421875, -0.53228759765625, -0.403564453125, -0.27484130859375, -0.1461181640625, -0.01739501953125, 0.111328125, 0.24005126953125, 0.3687744140625, 0.49749755859375, 0.626220703125, 0.75494384765625, 0.8836669921875, 1.01239013671875, 1.14111328125, 1.26983642578125, 1.3985595703125, 1.52728271484375, 1.656005859375, 1.78472900390625, 1.9134521484375, 2.04217529296875, 2.1708984375, 2.29962158203125, 2.4283447265625, 2.55706787109375, 2.685791015625, 2.81451416015625, 2.9432373046875, 3.07196044921875, 3.20068359375, 3.32940673828125, 3.4581298828125, 3.58685302734375, 3.715576171875, 3.84429931640625, 3.9730224609375, 4.10174560546875, 4.23046875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 5.0, 11.0, 16.0, 15.0, 21.0, 31.0, 48.0, 71.0, 111.0, 173.0, 273.0, 434.0, 812.0, 1555.0, 3019.0, 6489.0, 14187.0, 35086.0, 107381.0, 509123.0, 258646.0, 66680.0, 23959.0, 10385.0, 4753.0, 2382.0, 1208.0, 674.0, 356.0, 217.0, 136.0, 63.0, 50.0, 46.0, 37.0, 18.0, 21.0, 15.0, 11.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.9921875, -2.900970458984375, -2.80975341796875, -2.718536376953125, -2.6273193359375, -2.536102294921875, -2.44488525390625, -2.353668212890625, -2.262451171875, -2.171234130859375, -2.08001708984375, -1.988800048828125, -1.8975830078125, -1.806365966796875, -1.71514892578125, -1.623931884765625, -1.53271484375, -1.441497802734375, -1.35028076171875, -1.259063720703125, -1.1678466796875, -1.076629638671875, -0.98541259765625, -0.894195556640625, -0.802978515625, -0.711761474609375, -0.62054443359375, -0.529327392578125, -0.4381103515625, -0.346893310546875, -0.25567626953125, -0.164459228515625, -0.0732421875, 0.017974853515625, 0.10919189453125, 0.200408935546875, 0.2916259765625, 0.382843017578125, 0.47406005859375, 0.565277099609375, 0.656494140625, 0.747711181640625, 0.83892822265625, 0.930145263671875, 1.0213623046875, 1.112579345703125, 1.20379638671875, 1.295013427734375, 1.38623046875, 1.477447509765625, 1.56866455078125, 1.659881591796875, 1.7510986328125, 1.842315673828125, 1.93353271484375, 2.024749755859375, 2.115966796875, 2.207183837890625, 2.29840087890625, 2.389617919921875, 2.4808349609375, 2.572052001953125, 2.66326904296875, 2.754486083984375, 2.845703125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 3.0, 10.0, 10.0, 11.0, 17.0, 17.0, 12.0, 21.0, 23.0, 23.0, 37.0, 48.0, 33.0, 50.0, 45.0, 44.0, 62.0, 85.0, 1976.0, 72.0, 53.0, 37.0, 42.0, 36.0, 41.0, 41.0, 29.0, 26.0, 20.0, 21.0, 16.0, 10.0, 11.0, 13.0, 11.0, 7.0, 5.0, 10.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.171875, -11.7840576171875, -11.396240234375, -11.0084228515625, -10.62060546875, -10.2327880859375, -9.844970703125, -9.4571533203125, -9.0693359375, -8.6815185546875, -8.293701171875, -7.9058837890625, -7.51806640625, -7.1302490234375, -6.742431640625, -6.3546142578125, -5.966796875, -5.5789794921875, -5.191162109375, -4.8033447265625, -4.41552734375, -4.0277099609375, -3.639892578125, -3.2520751953125, -2.8642578125, -2.4764404296875, -2.088623046875, -1.7008056640625, -1.31298828125, -0.9251708984375, -0.537353515625, -0.1495361328125, 0.23828125, 0.6260986328125, 1.013916015625, 1.4017333984375, 1.78955078125, 2.1773681640625, 2.565185546875, 2.9530029296875, 3.3408203125, 3.7286376953125, 4.116455078125, 4.5042724609375, 4.89208984375, 5.2799072265625, 5.667724609375, 6.0555419921875, 6.443359375, 6.8311767578125, 7.218994140625, 7.6068115234375, 7.99462890625, 8.3824462890625, 8.770263671875, 9.1580810546875, 9.5458984375, 9.9337158203125, 10.321533203125, 10.7093505859375, 11.09716796875, 11.4849853515625, 11.872802734375, 12.2606201171875, 12.6484375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 11.0, 3.0, 6.0, 11.0, 15.0, 7.0, 16.0, 16.0, 17.0, 25.0, 27.0, 31.0, 44.0, 67.0, 86.0, 157.0, 351.0, 983.0, 8534.0, 3084602.0, 47605.0, 1898.0, 519.0, 203.0, 136.0, 53.0, 67.0, 38.0, 29.0, 24.0, 19.0, 13.0, 18.0, 17.0, 13.0, 11.0, 8.0, 7.0, 1.0, 8.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-27.296875, -26.462158203125, -25.62744140625, -24.792724609375, -23.9580078125, -23.123291015625, -22.28857421875, -21.453857421875, -20.619140625, -19.784423828125, -18.94970703125, -18.114990234375, -17.2802734375, -16.445556640625, -15.61083984375, -14.776123046875, -13.94140625, -13.106689453125, -12.27197265625, -11.437255859375, -10.6025390625, -9.767822265625, -8.93310546875, -8.098388671875, -7.263671875, -6.428955078125, -5.59423828125, -4.759521484375, -3.9248046875, -3.090087890625, -2.25537109375, -1.420654296875, -0.5859375, 0.248779296875, 1.08349609375, 1.918212890625, 2.7529296875, 3.587646484375, 4.42236328125, 5.257080078125, 6.091796875, 6.926513671875, 7.76123046875, 8.595947265625, 9.4306640625, 10.265380859375, 11.10009765625, 11.934814453125, 12.76953125, 13.604248046875, 14.43896484375, 15.273681640625, 16.1083984375, 16.943115234375, 17.77783203125, 18.612548828125, 19.447265625, 20.281982421875, 21.11669921875, 21.951416015625, 22.7861328125, 23.620849609375, 24.45556640625, 25.290283203125, 26.125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [32.0, 973.0, 15.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.357064247131348, -2.43745756149292, 3.482149124145508, 9.401755332946777, 15.321362495422363, 21.240970611572266, 27.16057586669922, 33.08018493652344, 38.99979019165039, 44.919395446777344, 50.83900451660156, 56.758609771728516, 62.67821502685547, 68.59782409667969, 74.51742553710938, 80.43704223632812, 86.35664367675781, 92.27625274658203, 98.19585418701172, 104.11546325683594, 110.03507232666016, 115.95468139648438, 121.87428283691406, 127.79389190673828, 133.7135009765625, 139.6331024169922, 145.55271911621094, 151.47232055664062, 157.3919219970703, 163.31153869628906, 169.23114013671875, 175.1507568359375, 181.0703582763672, 186.98995971679688, 192.90957641601562, 198.8291778564453, 204.748779296875, 210.66839599609375, 216.58799743652344, 222.50759887695312, 228.42721557617188, 234.34681701660156, 240.2664337158203, 246.18603515625, 252.1056365966797, 258.0252380371094, 263.9448547363281, 269.8644714355469, 275.7840576171875, 281.70367431640625, 287.6232604980469, 293.5428771972656, 299.4624938964844, 305.382080078125, 311.30169677734375, 317.2213134765625, 323.14093017578125, 329.060546875, 334.9801330566406, 340.8997497558594, 346.8193664550781, 352.73895263671875, 358.6585693359375, 364.57818603515625, 370.4977722167969]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 3.0, 6.0, 5.0, 9.0, 8.0, 14.0, 24.0, 19.0, 23.0, 22.0, 23.0, 35.0, 25.0, 28.0, 24.0, 46.0, 60.0, 36.0, 36.0, 40.0, 41.0, 38.0, 37.0, 49.0, 43.0, 38.0, 28.0, 33.0, 33.0, 26.0, 22.0, 19.0, 14.0, 15.0, 19.0, 16.0, 8.0, 11.0, 3.0, 9.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.23114776611328, -36.970375061035156, -35.7096061706543, -34.44883728027344, -33.18806457519531, -31.92729377746582, -30.666522979736328, -29.405752182006836, -28.144981384277344, -26.88421058654785, -25.62343978881836, -24.362668991088867, -23.101898193359375, -21.841127395629883, -20.58035659790039, -19.3195858001709, -18.058815002441406, -16.798044204711914, -15.537273406982422, -14.27650260925293, -13.015731811523438, -11.754961013793945, -10.494190216064453, -9.233419418334961, -7.972648620605469, -6.711877822875977, -5.451107025146484, -4.190336227416992, -2.9295654296875, -1.6687946319580078, -0.4080238342285156, 0.8527469635009766, 2.113513946533203, 3.3742847442626953, 4.6350555419921875, 5.89582633972168, 7.156597137451172, 8.417367935180664, 9.678138732910156, 10.938909530639648, 12.19968032836914, 13.460451126098633, 14.721221923828125, 15.981992721557617, 17.24276351928711, 18.5035343170166, 19.764305114746094, 21.025075912475586, 22.285846710205078, 23.54661750793457, 24.807388305664062, 26.068159103393555, 27.328929901123047, 28.58970069885254, 29.85047149658203, 31.111242294311523, 32.372013092041016, 33.632781982421875, 34.8935546875, 36.154327392578125, 37.415096282958984, 38.675865173339844, 39.93663787841797, 41.197410583496094, 42.45817947387695]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 5.0, 2.0, 2.0, 4.0, 8.0, 13.0, 13.0, 14.0, 21.0, 23.0, 28.0, 35.0, 27.0, 50.0, 56.0, 54.0, 48.0, 45.0, 53.0, 48.0, 54.0, 53.0, 55.0, 49.0, 52.0, 34.0, 41.0, 28.0, 18.0, 15.0, 14.0, 7.0, 11.0, 8.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.998046875, -3.868194580078125, -3.73834228515625, -3.608489990234375, -3.4786376953125, -3.348785400390625, -3.21893310546875, -3.089080810546875, -2.959228515625, -2.829376220703125, -2.69952392578125, -2.569671630859375, -2.4398193359375, -2.309967041015625, -2.18011474609375, -2.050262451171875, -1.92041015625, -1.790557861328125, -1.66070556640625, -1.530853271484375, -1.4010009765625, -1.271148681640625, -1.14129638671875, -1.011444091796875, -0.881591796875, -0.751739501953125, -0.62188720703125, -0.492034912109375, -0.3621826171875, -0.232330322265625, -0.10247802734375, 0.027374267578125, 0.1572265625, 0.287078857421875, 0.41693115234375, 0.546783447265625, 0.6766357421875, 0.806488037109375, 0.93634033203125, 1.066192626953125, 1.196044921875, 1.325897216796875, 1.45574951171875, 1.585601806640625, 1.7154541015625, 1.845306396484375, 1.97515869140625, 2.105010986328125, 2.23486328125, 2.364715576171875, 2.49456787109375, 2.624420166015625, 2.7542724609375, 2.884124755859375, 3.01397705078125, 3.143829345703125, 3.273681640625, 3.403533935546875, 3.53338623046875, 3.663238525390625, 3.7930908203125, 3.922943115234375, 4.05279541015625, 4.182647705078125, 4.3125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 5.0, 15.0, 15.0, 22.0, 27.0, 38.0, 60.0, 70.0, 104.0, 143.0, 192.0, 299.0, 476.0, 773.0, 1520.0, 3456.0, 10084.0, 51824.0, 795749.0, 3169264.0, 131434.0, 18727.0, 5194.0, 2057.0, 1022.0, 581.0, 345.0, 237.0, 156.0, 119.0, 83.0, 51.0, 38.0, 30.0, 20.0, 8.0, 16.0, 6.0, 8.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.984375, -19.400146484375, -18.81591796875, -18.231689453125, -17.6474609375, -17.063232421875, -16.47900390625, -15.894775390625, -15.310546875, -14.726318359375, -14.14208984375, -13.557861328125, -12.9736328125, -12.389404296875, -11.80517578125, -11.220947265625, -10.63671875, -10.052490234375, -9.46826171875, -8.884033203125, -8.2998046875, -7.715576171875, -7.13134765625, -6.547119140625, -5.962890625, -5.378662109375, -4.79443359375, -4.210205078125, -3.6259765625, -3.041748046875, -2.45751953125, -1.873291015625, -1.2890625, -0.704833984375, -0.12060546875, 0.463623046875, 1.0478515625, 1.632080078125, 2.21630859375, 2.800537109375, 3.384765625, 3.968994140625, 4.55322265625, 5.137451171875, 5.7216796875, 6.305908203125, 6.89013671875, 7.474365234375, 8.05859375, 8.642822265625, 9.22705078125, 9.811279296875, 10.3955078125, 10.979736328125, 11.56396484375, 12.148193359375, 12.732421875, 13.316650390625, 13.90087890625, 14.485107421875, 15.0693359375, 15.653564453125, 16.23779296875, 16.822021484375, 17.40625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 7.0, 7.0, 11.0, 13.0, 25.0, 28.0, 48.0, 84.0, 114.0, 201.0, 259.0, 421.0, 692.0, 733.0, 521.0, 311.0, 200.0, 141.0, 88.0, 59.0, 27.0, 22.0, 25.0, 11.0, 10.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0, -17.5623779296875, -17.124755859375, -16.6871337890625, -16.24951171875, -15.8118896484375, -15.374267578125, -14.9366455078125, -14.4990234375, -14.0614013671875, -13.623779296875, -13.1861572265625, -12.74853515625, -12.3109130859375, -11.873291015625, -11.4356689453125, -10.998046875, -10.5604248046875, -10.122802734375, -9.6851806640625, -9.24755859375, -8.8099365234375, -8.372314453125, -7.9346923828125, -7.4970703125, -7.0594482421875, -6.621826171875, -6.1842041015625, -5.74658203125, -5.3089599609375, -4.871337890625, -4.4337158203125, -3.99609375, -3.5584716796875, -3.120849609375, -2.6832275390625, -2.24560546875, -1.8079833984375, -1.370361328125, -0.9327392578125, -0.4951171875, -0.0574951171875, 0.380126953125, 0.8177490234375, 1.25537109375, 1.6929931640625, 2.130615234375, 2.5682373046875, 3.005859375, 3.4434814453125, 3.881103515625, 4.3187255859375, 4.75634765625, 5.1939697265625, 5.631591796875, 6.0692138671875, 6.5068359375, 6.9444580078125, 7.382080078125, 7.8197021484375, 8.25732421875, 8.6949462890625, 9.132568359375, 9.5701904296875, 10.0078125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 9.0, 25.0, 26.0, 52.0, 81.0, 129.0, 228.0, 484.0, 1026.0, 2355.0, 6422.0, 22540.0, 124853.0, 1828834.0, 2039116.0, 133362.0, 23529.0, 6668.0, 2445.0, 989.0, 492.0, 216.0, 157.0, 87.0, 68.0, 33.0, 12.0, 10.0, 9.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.328125, -19.481689453125, -18.63525390625, -17.788818359375, -16.9423828125, -16.095947265625, -15.24951171875, -14.403076171875, -13.556640625, -12.710205078125, -11.86376953125, -11.017333984375, -10.1708984375, -9.324462890625, -8.47802734375, -7.631591796875, -6.78515625, -5.938720703125, -5.09228515625, -4.245849609375, -3.3994140625, -2.552978515625, -1.70654296875, -0.860107421875, -0.013671875, 0.832763671875, 1.67919921875, 2.525634765625, 3.3720703125, 4.218505859375, 5.06494140625, 5.911376953125, 6.7578125, 7.604248046875, 8.45068359375, 9.297119140625, 10.1435546875, 10.989990234375, 11.83642578125, 12.682861328125, 13.529296875, 14.375732421875, 15.22216796875, 16.068603515625, 16.9150390625, 17.761474609375, 18.60791015625, 19.454345703125, 20.30078125, 21.147216796875, 21.99365234375, 22.840087890625, 23.6865234375, 24.532958984375, 25.37939453125, 26.225830078125, 27.072265625, 27.918701171875, 28.76513671875, 29.611572265625, 30.4580078125, 31.304443359375, 32.15087890625, 32.997314453125, 33.84375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 13.0, 22.0, 39.0, 67.0, 98.0, 151.0, 152.0, 163.0, 111.0, 76.0, 58.0, 28.0, 18.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.28873825073242, -34.372779846191406, -31.456823348999023, -28.540864944458008, -25.624908447265625, -22.70895004272461, -19.792991638183594, -16.87703514099121, -13.961076736450195, -11.045119285583496, -8.129161834716797, -5.213203430175781, -2.297245979309082, 0.6187114715576172, 3.534669876098633, 6.450626373291016, 9.366584777832031, 12.28254222869873, 15.19849967956543, 18.114458084106445, 21.030414581298828, 23.946372985839844, 26.86233139038086, 29.778287887573242, 32.694244384765625, 35.61020278930664, 38.526161193847656, 41.442115783691406, 44.35807418823242, 47.27403259277344, 50.18999099731445, 53.10594940185547, 56.02190399169922, 58.937862396240234, 61.85382080078125, 64.769775390625, 67.68573760986328, 70.60169219970703, 73.51765441894531, 76.43360900878906, 79.34956359863281, 82.26551818847656, 85.18148040771484, 88.0974349975586, 91.01339721679688, 93.92935180664062, 96.84530639648438, 99.76126861572266, 102.67723083496094, 105.59318542480469, 108.50914764404297, 111.42510223388672, 114.341064453125, 117.25701904296875, 120.1729736328125, 123.08893585205078, 126.00489044189453, 128.9208526611328, 131.83680725097656, 134.7527618408203, 137.66871643066406, 140.58468627929688, 143.50064086914062, 146.41659545898438, 149.33255004882812]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 0.0, 4.0, 10.0, 8.0, 4.0, 10.0, 10.0, 13.0, 17.0, 16.0, 23.0, 29.0, 25.0, 23.0, 26.0, 26.0, 29.0, 38.0, 36.0, 26.0, 34.0, 42.0, 36.0, 43.0, 32.0, 38.0, 32.0, 40.0, 29.0, 27.0, 40.0, 29.0, 27.0, 28.0, 26.0, 14.0, 15.0, 8.0, 9.0, 13.0, 12.0, 11.0, 12.0, 6.0, 6.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-32.762451171875, -31.75228500366211, -30.74212074279785, -29.73195457458496, -28.72178840637207, -27.711624145507812, -26.701457977294922, -25.69129180908203, -24.68112564086914, -23.67095947265625, -22.660795211791992, -21.6506290435791, -20.64046287536621, -19.630298614501953, -18.620132446289062, -17.609966278076172, -16.599802017211914, -15.58963680267334, -14.57947063446045, -13.569305419921875, -12.559139251708984, -11.54897403717041, -10.538808822631836, -9.528642654418945, -8.518477439880371, -7.508311748504639, -6.498146057128906, -5.487980842590332, -4.4778151512146, -3.467649459838867, -2.457484245300293, -1.4473185539245605, -0.4371528625488281, 0.5730127096176147, 1.5831782817840576, 2.593343734741211, 3.6035094261169434, 4.613675117492676, 5.62384033203125, 6.634006023406982, 7.644171714782715, 8.654336929321289, 9.66450309753418, 10.674668312072754, 11.684833526611328, 12.694999694824219, 13.705164909362793, 14.715330123901367, 15.725496292114258, 16.73566246032715, 17.745826721191406, 18.755992889404297, 19.766159057617188, 20.776325225830078, 21.786489486694336, 22.796655654907227, 23.806819915771484, 24.816986083984375, 25.827150344848633, 26.837316513061523, 27.847482681274414, 28.857646942138672, 29.867813110351562, 30.877979278564453, 31.888145446777344]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 9.0, 4.0, 8.0, 6.0, 14.0, 13.0, 24.0, 20.0, 32.0, 32.0, 37.0, 29.0, 54.0, 45.0, 44.0, 60.0, 47.0, 61.0, 47.0, 45.0, 49.0, 36.0, 46.0, 46.0, 30.0, 36.0, 29.0, 23.0, 18.0, 9.0, 10.0, 10.0, 5.0, 4.0, 1.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.943359375, -3.817108154296875, -3.69085693359375, -3.564605712890625, -3.4383544921875, -3.312103271484375, -3.18585205078125, -3.059600830078125, -2.933349609375, -2.807098388671875, -2.68084716796875, -2.554595947265625, -2.4283447265625, -2.302093505859375, -2.17584228515625, -2.049591064453125, -1.92333984375, -1.797088623046875, -1.67083740234375, -1.544586181640625, -1.4183349609375, -1.292083740234375, -1.16583251953125, -1.039581298828125, -0.913330078125, -0.787078857421875, -0.66082763671875, -0.534576416015625, -0.4083251953125, -0.282073974609375, -0.15582275390625, -0.029571533203125, 0.0966796875, 0.222930908203125, 0.34918212890625, 0.475433349609375, 0.6016845703125, 0.727935791015625, 0.85418701171875, 0.980438232421875, 1.106689453125, 1.232940673828125, 1.35919189453125, 1.485443115234375, 1.6116943359375, 1.737945556640625, 1.86419677734375, 1.990447998046875, 2.11669921875, 2.242950439453125, 2.36920166015625, 2.495452880859375, 2.6217041015625, 2.747955322265625, 2.87420654296875, 3.000457763671875, 3.126708984375, 3.252960205078125, 3.37921142578125, 3.505462646484375, 3.6317138671875, 3.757965087890625, 3.88421630859375, 4.010467529296875, 4.13671875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 4.0, 5.0, 7.0, 16.0, 17.0, 33.0, 56.0, 81.0, 92.0, 158.0, 230.0, 345.0, 491.0, 778.0, 1162.0, 1830.0, 2839.0, 4751.0, 7932.0, 13744.0, 24261.0, 44829.0, 86853.0, 202127.0, 360837.0, 141689.0, 68681.0, 36248.0, 19681.0, 11333.0, 6627.0, 3933.0, 2398.0, 1510.0, 957.0, 696.0, 457.0, 276.0, 186.0, 131.0, 96.0, 63.0, 37.0, 18.0, 27.0, 16.0, 12.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.16455078125, -0.15946006774902344, -0.15436935424804688, -0.1492786407470703, -0.14418792724609375, -0.1390972137451172, -0.13400650024414062, -0.12891578674316406, -0.1238250732421875, -0.11873435974121094, -0.11364364624023438, -0.10855293273925781, -0.10346221923828125, -0.09837150573730469, -0.09328079223632812, -0.08819007873535156, -0.083099365234375, -0.07800865173339844, -0.07291793823242188, -0.06782722473144531, -0.06273651123046875, -0.05764579772949219, -0.052555084228515625, -0.04746437072753906, -0.0423736572265625, -0.03728294372558594, -0.032192230224609375, -0.027101516723632812, -0.02201080322265625, -0.016920089721679688, -0.011829376220703125, -0.0067386627197265625, -0.00164794921875, 0.0034427642822265625, 0.008533477783203125, 0.013624191284179688, 0.01871490478515625, 0.023805618286132812, 0.028896331787109375, 0.03398704528808594, 0.0390777587890625, 0.04416847229003906, 0.049259185791015625, 0.05434989929199219, 0.05944061279296875, 0.06453132629394531, 0.06962203979492188, 0.07471275329589844, 0.079803466796875, 0.08489418029785156, 0.08998489379882812, 0.09507560729980469, 0.10016632080078125, 0.10525703430175781, 0.11034774780273438, 0.11543846130371094, 0.1205291748046875, 0.12561988830566406, 0.13071060180664062, 0.1358013153076172, 0.14089202880859375, 0.1459827423095703, 0.15107345581054688, 0.15616416931152344, 0.1612548828125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 1.0, 5.0, 3.0, 7.0, 8.0, 5.0, 11.0, 18.0, 19.0, 15.0, 29.0, 14.0, 28.0, 23.0, 26.0, 28.0, 38.0, 39.0, 31.0, 35.0, 34.0, 49.0, 1066.0, 35.0, 38.0, 44.0, 40.0, 37.0, 30.0, 29.0, 34.0, 23.0, 25.0, 24.0, 21.0, 22.0, 23.0, 14.0, 11.0, 8.0, 7.0, 5.0, 7.0, 2.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-2.70703125, -2.62725830078125, -2.5474853515625, -2.46771240234375, -2.387939453125, -2.30816650390625, -2.2283935546875, -2.14862060546875, -2.06884765625, -1.98907470703125, -1.9093017578125, -1.82952880859375, -1.749755859375, -1.66998291015625, -1.5902099609375, -1.51043701171875, -1.4306640625, -1.35089111328125, -1.2711181640625, -1.19134521484375, -1.111572265625, -1.03179931640625, -0.9520263671875, -0.87225341796875, -0.79248046875, -0.71270751953125, -0.6329345703125, -0.55316162109375, -0.473388671875, -0.39361572265625, -0.3138427734375, -0.23406982421875, -0.154296875, -0.07452392578125, 0.0052490234375, 0.08502197265625, 0.164794921875, 0.24456787109375, 0.3243408203125, 0.40411376953125, 0.48388671875, 0.56365966796875, 0.6434326171875, 0.72320556640625, 0.802978515625, 0.88275146484375, 0.9625244140625, 1.04229736328125, 1.1220703125, 1.20184326171875, 1.2816162109375, 1.36138916015625, 1.441162109375, 1.52093505859375, 1.6007080078125, 1.68048095703125, 1.76025390625, 1.84002685546875, 1.9197998046875, 1.99957275390625, 2.079345703125, 2.15911865234375, 2.2388916015625, 2.31866455078125, 2.3984375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 5.0, 15.0, 18.0, 30.0, 42.0, 65.0, 106.0, 172.0, 251.0, 391.0, 566.0, 935.0, 1407.0, 2345.0, 3780.0, 5881.0, 9740.0, 16122.0, 26587.0, 44801.0, 79425.0, 165451.0, 1367679.0, 173045.0, 82262.0, 45954.0, 27384.0, 16249.0, 9897.0, 6220.0, 3755.0, 2341.0, 1514.0, 950.0, 610.0, 413.0, 253.0, 167.0, 101.0, 85.0, 40.0, 25.0, 12.0, 15.0, 11.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0986328125, -0.09569072723388672, -0.09274864196777344, -0.08980655670166016, -0.08686447143554688, -0.0839223861694336, -0.08098030090332031, -0.07803821563720703, -0.07509613037109375, -0.07215404510498047, -0.06921195983886719, -0.0662698745727539, -0.06332778930664062, -0.060385704040527344, -0.05744361877441406, -0.05450153350830078, -0.0515594482421875, -0.04861736297607422, -0.04567527770996094, -0.042733192443847656, -0.039791107177734375, -0.036849021911621094, -0.03390693664550781, -0.03096485137939453, -0.02802276611328125, -0.02508068084716797, -0.022138595581054688, -0.019196510314941406, -0.016254425048828125, -0.013312339782714844, -0.010370254516601562, -0.007428169250488281, -0.004486083984375, -0.0015439987182617188, 0.0013980865478515625, 0.004340171813964844, 0.007282257080078125, 0.010224342346191406, 0.013166427612304688, 0.01610851287841797, 0.01905059814453125, 0.02199268341064453, 0.024934768676757812, 0.027876853942871094, 0.030818939208984375, 0.033761024475097656, 0.03670310974121094, 0.03964519500732422, 0.0425872802734375, 0.04552936553955078, 0.04847145080566406, 0.051413536071777344, 0.054355621337890625, 0.057297706604003906, 0.06023979187011719, 0.06318187713623047, 0.06612396240234375, 0.06906604766845703, 0.07200813293457031, 0.0749502182006836, 0.07789230346679688, 0.08083438873291016, 0.08377647399902344, 0.08671855926513672, 0.08966064453125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 2.0, 1.0, 6.0, 5.0, 4.0, 7.0, 13.0, 7.0, 14.0, 13.0, 12.0, 23.0, 10.0, 26.0, 20.0, 23.0, 31.0, 35.0, 39.0, 51.0, 48.0, 45.0, 55.0, 55.0, 39.0, 53.0, 27.0, 37.0, 34.0, 46.0, 24.0, 17.0, 28.0, 32.0, 19.0, 19.0, 12.0, 12.0, 17.0, 7.0, 9.0, 7.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.5881996154785156e-05, -3.4800730645656586e-05, -3.3719465136528015e-05, -3.2638199627399445e-05, -3.1556934118270874e-05, -3.0475668609142303e-05, -2.9394403100013733e-05, -2.8313137590885162e-05, -2.7231872081756592e-05, -2.615060657262802e-05, -2.506934106349945e-05, -2.398807555437088e-05, -2.290681004524231e-05, -2.182554453611374e-05, -2.074427902698517e-05, -1.9663013517856598e-05, -1.8581748008728027e-05, -1.7500482499599457e-05, -1.6419216990470886e-05, -1.5337951481342316e-05, -1.4256685972213745e-05, -1.3175420463085175e-05, -1.2094154953956604e-05, -1.1012889444828033e-05, -9.931623935699463e-06, -8.850358426570892e-06, -7.769092917442322e-06, -6.687827408313751e-06, -5.606561899185181e-06, -4.52529639005661e-06, -3.4440308809280396e-06, -2.362765371799469e-06, -1.2814998626708984e-06, -2.0023435354232788e-07, 8.810311555862427e-07, 1.9622966647148132e-06, 3.043562173843384e-06, 4.124827682971954e-06, 5.206093192100525e-06, 6.2873587012290955e-06, 7.368624210357666e-06, 8.449889719486237e-06, 9.531155228614807e-06, 1.0612420737743378e-05, 1.1693686246871948e-05, 1.2774951756000519e-05, 1.385621726512909e-05, 1.493748277425766e-05, 1.601874828338623e-05, 1.71000137925148e-05, 1.818127930164337e-05, 1.9262544810771942e-05, 2.0343810319900513e-05, 2.1425075829029083e-05, 2.2506341338157654e-05, 2.3587606847286224e-05, 2.4668872356414795e-05, 2.5750137865543365e-05, 2.6831403374671936e-05, 2.7912668883800507e-05, 2.8993934392929077e-05, 3.0075199902057648e-05, 3.115646541118622e-05, 3.223773092031479e-05, 3.331899642944336e-05]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 10.0, 9.0, 8.0, 14.0, 19.0, 16.0, 26.0, 35.0, 31.0, 47.0, 59.0, 63.0, 67.0, 75.0, 142.0, 151.0, 241.0, 447.0, 2517.0, 58363.0, 761932.0, 215289.0, 7065.0, 764.0, 299.0, 174.0, 131.0, 113.0, 93.0, 74.0, 63.0, 40.0, 28.0, 29.0, 24.0, 23.0, 14.0, 11.0, 10.0, 17.0, 5.0, 5.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-0.0005521774291992188, -0.0005357861518859863, -0.0005193948745727539, -0.0005030035972595215, -0.00048661231994628906, -0.00047022104263305664, -0.0004538297653198242, -0.0004374384880065918, -0.0004210472106933594, -0.00040465593338012695, -0.00038826465606689453, -0.0003718733787536621, -0.0003554821014404297, -0.00033909082412719727, -0.00032269954681396484, -0.0003063082695007324, -0.0002899169921875, -0.0002735257148742676, -0.00025713443756103516, -0.00024074316024780273, -0.0002243518829345703, -0.0002079606056213379, -0.00019156932830810547, -0.00017517805099487305, -0.00015878677368164062, -0.0001423954963684082, -0.00012600421905517578, -0.00010961294174194336, -9.322166442871094e-05, -7.683038711547852e-05, -6.0439109802246094e-05, -4.404783248901367e-05, -2.765655517578125e-05, -1.1265277862548828e-05, 5.125999450683594e-06, 2.1517276763916016e-05, 3.790855407714844e-05, 5.429983139038086e-05, 7.069110870361328e-05, 8.70823860168457e-05, 0.00010347366333007812, 0.00011986494064331055, 0.00013625621795654297, 0.0001526474952697754, 0.0001690387725830078, 0.00018543004989624023, 0.00020182132720947266, 0.00021821260452270508, 0.0002346038818359375, 0.0002509951591491699, 0.00026738643646240234, 0.00028377771377563477, 0.0003001689910888672, 0.0003165602684020996, 0.00033295154571533203, 0.00034934282302856445, 0.0003657341003417969, 0.0003821253776550293, 0.0003985166549682617, 0.00041490793228149414, 0.00043129920959472656, 0.000447690486907959, 0.0004640817642211914, 0.00048047304153442383, 0.0004968643188476562]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 14.0, 38.0, 138.0, 291.0, 313.0, 149.0, 57.0, 12.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.985628664959222e-05, -8.512732165399939e-05, -8.039835665840656e-05, -7.566939166281372e-05, -7.094042666722089e-05, -6.621146167162806e-05, -6.148248940007761e-05, -5.675352440448478e-05, -5.2024559408891946e-05, -4.7295594413299114e-05, -4.256662941770628e-05, -3.783766078413464e-05, -3.310869578854181e-05, -2.8379730792948976e-05, -2.365076397836674e-05, -1.8921797163784504e-05, -1.4192832168191671e-05, -9.463866263104137e-06, -4.734900358016603e-06, -5.934452929068357e-09, 4.723031452158466e-06, 9.451996447751299e-06, 1.4180963262333535e-05, 1.890993007691577e-05, 2.3638895072508603e-05, 2.8367860068101436e-05, 3.309682506369427e-05, 3.782579369726591e-05, 4.255475869285874e-05, 4.728372368845157e-05, 5.201269232202321e-05, 5.6741657317616045e-05, 6.14706368651241e-05, 6.619960186071694e-05, 7.092856685630977e-05, 7.56575318519026e-05, 8.038649684749544e-05, 8.511546184308827e-05, 8.984443411463872e-05, 9.457339911023155e-05, 9.930236410582438e-05, 0.00010403132910141721, 0.00010876029409701005, 0.00011348925909260288, 0.00011821823136415333, 0.00012294719635974616, 0.000127676161355339, 0.00013240512635093182, 0.00013713409134652466, 0.0001418630563421175, 0.00014659202133771032, 0.00015132098633330315, 0.00015604995132889599, 0.00016077891632448882, 0.00016550788132008165, 0.0001702368608675897, 0.00017496582586318254, 0.00017969479085877538, 0.0001844237558543682, 0.00018915272084996104, 0.00019388168584555387, 0.0001986106508411467, 0.00020333961583673954, 0.00020806858083233237, 0.0002127975458279252]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 9.0, 2.0, 17.0, 12.0, 10.0, 16.0, 24.0, 16.0, 19.0, 24.0, 28.0, 32.0, 25.0, 39.0, 35.0, 43.0, 38.0, 46.0, 39.0, 42.0, 32.0, 30.0, 42.0, 36.0, 34.0, 29.0, 32.0, 35.0, 25.0, 26.0, 28.0, 20.0, 22.0, 17.0, 8.0, 8.0, 10.0, 7.0, 16.0, 6.0, 7.0, 3.0, 0.0, 8.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.6524066925048828e-05, -2.5663524866104126e-05, -2.4802982807159424e-05, -2.394244074821472e-05, -2.308189868927002e-05, -2.2221356630325317e-05, -2.1360814571380615e-05, -2.0500272512435913e-05, -1.963973045349121e-05, -1.877918839454651e-05, -1.7918646335601807e-05, -1.7058104276657104e-05, -1.6197562217712402e-05, -1.53370201587677e-05, -1.4476478099822998e-05, -1.3615936040878296e-05, -1.2755393981933594e-05, -1.1894851922988892e-05, -1.103430986404419e-05, -1.0173767805099487e-05, -9.313225746154785e-06, -8.452683687210083e-06, -7.592141628265381e-06, -6.731599569320679e-06, -5.8710575103759766e-06, -5.010515451431274e-06, -4.149973392486572e-06, -3.28943133354187e-06, -2.428889274597168e-06, -1.5683472156524658e-06, -7.078051567077637e-07, 1.5273690223693848e-07, 1.0132789611816406e-06, 1.8738210201263428e-06, 2.734363079071045e-06, 3.594905138015747e-06, 4.455447196960449e-06, 5.315989255905151e-06, 6.1765313148498535e-06, 7.037073373794556e-06, 7.897615432739258e-06, 8.75815749168396e-06, 9.618699550628662e-06, 1.0479241609573364e-05, 1.1339783668518066e-05, 1.2200325727462769e-05, 1.306086778640747e-05, 1.3921409845352173e-05, 1.4781951904296875e-05, 1.5642493963241577e-05, 1.650303602218628e-05, 1.736357808113098e-05, 1.8224120140075684e-05, 1.9084662199020386e-05, 1.9945204257965088e-05, 2.080574631690979e-05, 2.1666288375854492e-05, 2.2526830434799194e-05, 2.3387372493743896e-05, 2.42479145526886e-05, 2.51084566116333e-05, 2.5968998670578003e-05, 2.6829540729522705e-05, 2.7690082788467407e-05, 2.855062484741211e-05]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 9.0, 4.0, 8.0, 6.0, 14.0, 13.0, 24.0, 20.0, 32.0, 32.0, 37.0, 29.0, 54.0, 45.0, 44.0, 60.0, 47.0, 61.0, 47.0, 45.0, 49.0, 36.0, 46.0, 46.0, 30.0, 36.0, 29.0, 23.0, 18.0, 9.0, 10.0, 10.0, 5.0, 4.0, 1.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.943359375, -3.817108154296875, -3.69085693359375, -3.564605712890625, -3.4383544921875, -3.312103271484375, -3.18585205078125, -3.059600830078125, -2.933349609375, -2.807098388671875, -2.68084716796875, -2.554595947265625, -2.4283447265625, -2.302093505859375, -2.17584228515625, -2.049591064453125, -1.92333984375, -1.797088623046875, -1.67083740234375, -1.544586181640625, -1.4183349609375, -1.292083740234375, -1.16583251953125, -1.039581298828125, -0.913330078125, -0.787078857421875, -0.66082763671875, -0.534576416015625, -0.4083251953125, -0.282073974609375, -0.15582275390625, -0.029571533203125, 0.0966796875, 0.222930908203125, 0.34918212890625, 0.475433349609375, 0.6016845703125, 0.727935791015625, 0.85418701171875, 0.980438232421875, 1.106689453125, 1.232940673828125, 1.35919189453125, 1.485443115234375, 1.6116943359375, 1.737945556640625, 1.86419677734375, 1.990447998046875, 2.11669921875, 2.242950439453125, 2.36920166015625, 2.495452880859375, 2.6217041015625, 2.747955322265625, 2.87420654296875, 3.000457763671875, 3.126708984375, 3.252960205078125, 3.37921142578125, 3.505462646484375, 3.6317138671875, 3.757965087890625, 3.88421630859375, 4.010467529296875, 4.13671875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 1.0, 4.0, 5.0, 2.0, 6.0, 8.0, 6.0, 13.0, 15.0, 18.0, 19.0, 27.0, 71.0, 73.0, 160.0, 258.0, 516.0, 976.0, 1994.0, 4427.0, 11258.0, 37488.0, 286310.0, 628004.0, 52285.0, 14460.0, 5299.0, 2318.0, 1160.0, 592.0, 298.0, 197.0, 88.0, 58.0, 41.0, 22.0, 16.0, 20.0, 9.0, 11.0, 7.0, 3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.203125, -7.939453125, -7.67578125, -7.412109375, -7.1484375, -6.884765625, -6.62109375, -6.357421875, -6.09375, -5.830078125, -5.56640625, -5.302734375, -5.0390625, -4.775390625, -4.51171875, -4.248046875, -3.984375, -3.720703125, -3.45703125, -3.193359375, -2.9296875, -2.666015625, -2.40234375, -2.138671875, -1.875, -1.611328125, -1.34765625, -1.083984375, -0.8203125, -0.556640625, -0.29296875, -0.029296875, 0.234375, 0.498046875, 0.76171875, 1.025390625, 1.2890625, 1.552734375, 1.81640625, 2.080078125, 2.34375, 2.607421875, 2.87109375, 3.134765625, 3.3984375, 3.662109375, 3.92578125, 4.189453125, 4.453125, 4.716796875, 4.98046875, 5.244140625, 5.5078125, 5.771484375, 6.03515625, 6.298828125, 6.5625, 6.826171875, 7.08984375, 7.353515625, 7.6171875, 7.880859375, 8.14453125, 8.408203125, 8.671875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 8.0, 3.0, 10.0, 7.0, 11.0, 8.0, 22.0, 14.0, 19.0, 21.0, 18.0, 24.0, 36.0, 37.0, 45.0, 44.0, 36.0, 47.0, 66.0, 89.0, 1688.0, 243.0, 98.0, 64.0, 48.0, 42.0, 46.0, 41.0, 24.0, 20.0, 33.0, 29.0, 18.0, 21.0, 11.0, 13.0, 18.0, 10.0, 5.0, 5.0, 7.0, 4.0, 4.0, 2.0, 1.0], "bins": [-14.859375, -14.487060546875, -14.11474609375, -13.742431640625, -13.3701171875, -12.997802734375, -12.62548828125, -12.253173828125, -11.880859375, -11.508544921875, -11.13623046875, -10.763916015625, -10.3916015625, -10.019287109375, -9.64697265625, -9.274658203125, -8.90234375, -8.530029296875, -8.15771484375, -7.785400390625, -7.4130859375, -7.040771484375, -6.66845703125, -6.296142578125, -5.923828125, -5.551513671875, -5.17919921875, -4.806884765625, -4.4345703125, -4.062255859375, -3.68994140625, -3.317626953125, -2.9453125, -2.572998046875, -2.20068359375, -1.828369140625, -1.4560546875, -1.083740234375, -0.71142578125, -0.339111328125, 0.033203125, 0.405517578125, 0.77783203125, 1.150146484375, 1.5224609375, 1.894775390625, 2.26708984375, 2.639404296875, 3.01171875, 3.384033203125, 3.75634765625, 4.128662109375, 4.5009765625, 4.873291015625, 5.24560546875, 5.617919921875, 5.990234375, 6.362548828125, 6.73486328125, 7.107177734375, 7.4794921875, 7.851806640625, 8.22412109375, 8.596435546875, 8.96875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 7.0, 12.0, 12.0, 10.0, 11.0, 16.0, 18.0, 20.0, 27.0, 48.0, 46.0, 65.0, 149.0, 244.0, 506.0, 1011.0, 2394.0, 6506.0, 24956.0, 191066.0, 2782992.0, 108203.0, 17973.0, 5430.0, 2012.0, 876.0, 437.0, 227.0, 117.0, 74.0, 47.0, 30.0, 23.0, 24.0, 23.0, 18.0, 18.0, 10.0, 10.0, 7.0, 6.0, 4.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.046875, -11.59033203125, -11.1337890625, -10.67724609375, -10.220703125, -9.76416015625, -9.3076171875, -8.85107421875, -8.39453125, -7.93798828125, -7.4814453125, -7.02490234375, -6.568359375, -6.11181640625, -5.6552734375, -5.19873046875, -4.7421875, -4.28564453125, -3.8291015625, -3.37255859375, -2.916015625, -2.45947265625, -2.0029296875, -1.54638671875, -1.08984375, -0.63330078125, -0.1767578125, 0.27978515625, 0.736328125, 1.19287109375, 1.6494140625, 2.10595703125, 2.5625, 3.01904296875, 3.4755859375, 3.93212890625, 4.388671875, 4.84521484375, 5.3017578125, 5.75830078125, 6.21484375, 6.67138671875, 7.1279296875, 7.58447265625, 8.041015625, 8.49755859375, 8.9541015625, 9.41064453125, 9.8671875, 10.32373046875, 10.7802734375, 11.23681640625, 11.693359375, 12.14990234375, 12.6064453125, 13.06298828125, 13.51953125, 13.97607421875, 14.4326171875, 14.88916015625, 15.345703125, 15.80224609375, 16.2587890625, 16.71533203125, 17.171875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [476.0, 542.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4761323928833, -0.3498659133911133, 11.776400566101074, 23.902667999267578, 36.028934478759766, 48.15520095825195, 60.28146743774414, 72.40773010253906, 84.53399658203125, 96.66026306152344, 108.78652954101562, 120.91279602050781, 133.0390625, 145.1653289794922, 157.29159545898438, 169.41786193847656, 181.54412841796875, 193.67039489746094, 205.79666137695312, 217.9229278564453, 230.0491943359375, 242.1754608154297, 254.30172729492188, 266.427978515625, 278.55426025390625, 290.6805419921875, 302.8067932128906, 314.93304443359375, 327.059326171875, 339.18560791015625, 351.3118591308594, 363.4381103515625, 375.56439208984375, 387.690673828125, 399.8169250488281, 411.94317626953125, 424.0694580078125, 436.19573974609375, 448.3219909667969, 460.4482421875, 472.57452392578125, 484.7008056640625, 496.8270568847656, 508.95330810546875, 521.07958984375, 533.2058715820312, 545.3321533203125, 557.4583740234375, 569.5846557617188, 581.7109375, 593.837158203125, 605.9634399414062, 618.0897216796875, 630.2160034179688, 642.34228515625, 654.468505859375, 666.5947875976562, 678.7210693359375, 690.8472900390625, 702.9735717773438, 715.099853515625, 727.2261352539062, 739.3524169921875, 751.4786376953125, 763.6049194335938]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 4.0, 10.0, 12.0, 13.0, 9.0, 15.0, 22.0, 19.0, 21.0, 24.0, 27.0, 38.0, 33.0, 36.0, 37.0, 43.0, 46.0, 45.0, 41.0, 31.0, 35.0, 37.0, 47.0, 36.0, 29.0, 35.0, 39.0, 22.0, 34.0, 14.0, 27.0, 15.0, 19.0, 9.0, 8.0, 6.0, 12.0, 11.0, 8.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.21539306640625, -32.09511184692383, -30.974830627441406, -29.854549407958984, -28.734268188476562, -27.61398696899414, -26.49370574951172, -25.373424530029297, -24.253143310546875, -23.132862091064453, -22.01258087158203, -20.89229965209961, -19.772018432617188, -18.651737213134766, -17.531455993652344, -16.411174774169922, -15.2908935546875, -14.170612335205078, -13.050331115722656, -11.930049896240234, -10.809768676757812, -9.68948745727539, -8.569206237792969, -7.448925018310547, -6.328643798828125, -5.208362579345703, -4.088081359863281, -2.9678001403808594, -1.8475189208984375, -0.7272377014160156, 0.39304351806640625, 1.5133247375488281, 2.6336021423339844, 3.7538833618164062, 4.874164581298828, 5.99444580078125, 7.114727020263672, 8.235008239746094, 9.355289459228516, 10.475570678710938, 11.59585189819336, 12.716133117675781, 13.836414337158203, 14.956695556640625, 16.076976776123047, 17.19725799560547, 18.31753921508789, 19.437820434570312, 20.558101654052734, 21.678382873535156, 22.798664093017578, 23.9189453125, 25.039226531982422, 26.159507751464844, 27.279788970947266, 28.400070190429688, 29.52035140991211, 30.64063262939453, 31.760913848876953, 32.881195068359375, 34.0014762878418, 35.12175750732422, 36.24203872680664, 37.36231994628906, 38.482601165771484]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 7.0, 6.0, 4.0, 16.0, 13.0, 14.0, 25.0, 24.0, 36.0, 37.0, 36.0, 40.0, 48.0, 52.0, 55.0, 46.0, 54.0, 51.0, 53.0, 58.0, 42.0, 41.0, 37.0, 43.0, 36.0, 25.0, 28.0, 12.0, 12.0, 12.0, 8.0, 7.0, 2.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.140625, -4.00933837890625, -3.8780517578125, -3.74676513671875, -3.615478515625, -3.48419189453125, -3.3529052734375, -3.22161865234375, -3.09033203125, -2.95904541015625, -2.8277587890625, -2.69647216796875, -2.565185546875, -2.43389892578125, -2.3026123046875, -2.17132568359375, -2.0400390625, -1.90875244140625, -1.7774658203125, -1.64617919921875, -1.514892578125, -1.38360595703125, -1.2523193359375, -1.12103271484375, -0.98974609375, -0.85845947265625, -0.7271728515625, -0.59588623046875, -0.464599609375, -0.33331298828125, -0.2020263671875, -0.07073974609375, 0.060546875, 0.19183349609375, 0.3231201171875, 0.45440673828125, 0.585693359375, 0.71697998046875, 0.8482666015625, 0.97955322265625, 1.11083984375, 1.24212646484375, 1.3734130859375, 1.50469970703125, 1.635986328125, 1.76727294921875, 1.8985595703125, 2.02984619140625, 2.1611328125, 2.29241943359375, 2.4237060546875, 2.55499267578125, 2.686279296875, 2.81756591796875, 2.9488525390625, 3.08013916015625, 3.21142578125, 3.34271240234375, 3.4739990234375, 3.60528564453125, 3.736572265625, 3.86785888671875, 3.9991455078125, 4.13043212890625, 4.26171875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 10.0, 8.0, 10.0, 12.0, 20.0, 20.0, 37.0, 63.0, 80.0, 115.0, 213.0, 310.0, 519.0, 1024.0, 2377.0, 7127.0, 33864.0, 385613.0, 3541840.0, 189311.0, 22389.0, 5332.0, 1949.0, 853.0, 432.0, 263.0, 163.0, 109.0, 69.0, 49.0, 30.0, 19.0, 21.0, 15.0, 4.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.75, -20.146484375, -19.54296875, -18.939453125, -18.3359375, -17.732421875, -17.12890625, -16.525390625, -15.921875, -15.318359375, -14.71484375, -14.111328125, -13.5078125, -12.904296875, -12.30078125, -11.697265625, -11.09375, -10.490234375, -9.88671875, -9.283203125, -8.6796875, -8.076171875, -7.47265625, -6.869140625, -6.265625, -5.662109375, -5.05859375, -4.455078125, -3.8515625, -3.248046875, -2.64453125, -2.041015625, -1.4375, -0.833984375, -0.23046875, 0.373046875, 0.9765625, 1.580078125, 2.18359375, 2.787109375, 3.390625, 3.994140625, 4.59765625, 5.201171875, 5.8046875, 6.408203125, 7.01171875, 7.615234375, 8.21875, 8.822265625, 9.42578125, 10.029296875, 10.6328125, 11.236328125, 11.83984375, 12.443359375, 13.046875, 13.650390625, 14.25390625, 14.857421875, 15.4609375, 16.064453125, 16.66796875, 17.271484375, 17.875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 6.0, 5.0, 4.0, 6.0, 9.0, 11.0, 11.0, 20.0, 36.0, 46.0, 60.0, 103.0, 126.0, 240.0, 319.0, 556.0, 714.0, 631.0, 391.0, 251.0, 156.0, 113.0, 64.0, 52.0, 36.0, 40.0, 18.0, 9.0, 14.0, 7.0, 5.0, 2.0, 6.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0, -12.613525390625, -12.22705078125, -11.840576171875, -11.4541015625, -11.067626953125, -10.68115234375, -10.294677734375, -9.908203125, -9.521728515625, -9.13525390625, -8.748779296875, -8.3623046875, -7.975830078125, -7.58935546875, -7.202880859375, -6.81640625, -6.429931640625, -6.04345703125, -5.656982421875, -5.2705078125, -4.884033203125, -4.49755859375, -4.111083984375, -3.724609375, -3.338134765625, -2.95166015625, -2.565185546875, -2.1787109375, -1.792236328125, -1.40576171875, -1.019287109375, -0.6328125, -0.246337890625, 0.14013671875, 0.526611328125, 0.9130859375, 1.299560546875, 1.68603515625, 2.072509765625, 2.458984375, 2.845458984375, 3.23193359375, 3.618408203125, 4.0048828125, 4.391357421875, 4.77783203125, 5.164306640625, 5.55078125, 5.937255859375, 6.32373046875, 6.710205078125, 7.0966796875, 7.483154296875, 7.86962890625, 8.256103515625, 8.642578125, 9.029052734375, 9.41552734375, 9.802001953125, 10.1884765625, 10.574951171875, 10.96142578125, 11.347900390625, 11.734375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 13.0, 7.0, 9.0, 22.0, 19.0, 30.0, 46.0, 72.0, 106.0, 137.0, 233.0, 387.0, 561.0, 876.0, 1571.0, 2805.0, 5018.0, 10631.0, 25361.0, 75727.0, 323234.0, 2324375.0, 1154188.0, 183175.0, 49902.0, 18122.0, 7968.0, 4109.0, 2209.0, 1274.0, 761.0, 469.0, 303.0, 182.0, 115.0, 89.0, 59.0, 38.0, 25.0, 14.0, 14.0, 8.0, 6.0, 8.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-15.6328125, -15.1256103515625, -14.618408203125, -14.1112060546875, -13.60400390625, -13.0968017578125, -12.589599609375, -12.0823974609375, -11.5751953125, -11.0679931640625, -10.560791015625, -10.0535888671875, -9.54638671875, -9.0391845703125, -8.531982421875, -8.0247802734375, -7.517578125, -7.0103759765625, -6.503173828125, -5.9959716796875, -5.48876953125, -4.9815673828125, -4.474365234375, -3.9671630859375, -3.4599609375, -2.9527587890625, -2.445556640625, -1.9383544921875, -1.43115234375, -0.9239501953125, -0.416748046875, 0.0904541015625, 0.59765625, 1.1048583984375, 1.612060546875, 2.1192626953125, 2.62646484375, 3.1336669921875, 3.640869140625, 4.1480712890625, 4.6552734375, 5.1624755859375, 5.669677734375, 6.1768798828125, 6.68408203125, 7.1912841796875, 7.698486328125, 8.2056884765625, 8.712890625, 9.2200927734375, 9.727294921875, 10.2344970703125, 10.74169921875, 11.2489013671875, 11.756103515625, 12.2633056640625, 12.7705078125, 13.2777099609375, 13.784912109375, 14.2921142578125, 14.79931640625, 15.3065185546875, 15.813720703125, 16.3209228515625, 16.828125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 11.0, 11.0, 11.0, 24.0, 26.0, 36.0, 59.0, 72.0, 86.0, 93.0, 111.0, 68.0, 98.0, 81.0, 65.0, 42.0, 32.0, 26.0, 19.0, 14.0, 11.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.32262420654297, -39.52180480957031, -37.720985412597656, -35.920166015625, -34.119346618652344, -32.31852722167969, -30.51770782470703, -28.716888427734375, -26.91606903076172, -25.115249633789062, -23.314430236816406, -21.51361083984375, -19.712791442871094, -17.911972045898438, -16.11115264892578, -14.310334205627441, -12.509515762329102, -10.708696365356445, -8.907876968383789, -7.107058048248291, -5.306238651275635, -3.5054197311401367, -1.7046003341674805, 0.09621906280517578, 1.897038459777832, 3.6978578567504883, 5.4986772537231445, 7.299496173858643, 9.10031509399414, 10.901134490966797, 12.701953887939453, 14.50277328491211, 16.303592681884766, 18.104412078857422, 19.905231475830078, 21.706050872802734, 23.50687026977539, 25.307689666748047, 27.108509063720703, 28.90932846069336, 30.710147857666016, 32.51096725463867, 34.31178665161133, 36.112606048583984, 37.91342544555664, 39.7142448425293, 41.51506423950195, 43.31588363647461, 45.11669921875, 46.917518615722656, 48.71833801269531, 50.51915740966797, 52.319976806640625, 54.12079620361328, 55.92161560058594, 57.722434997558594, 59.52325439453125, 61.324073791503906, 63.12489318847656, 64.92571258544922, 66.72653198242188, 68.52735137939453, 70.32817077636719, 72.12899017333984, 73.9298095703125]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 3.0, 8.0, 9.0, 9.0, 10.0, 10.0, 9.0, 12.0, 20.0, 17.0, 20.0, 18.0, 21.0, 22.0, 27.0, 36.0, 26.0, 25.0, 23.0, 31.0, 35.0, 45.0, 31.0, 53.0, 39.0, 35.0, 36.0, 28.0, 29.0, 35.0, 27.0, 23.0, 25.0, 28.0, 20.0, 19.0, 13.0, 25.0, 14.0, 14.0, 12.0, 8.0, 9.0, 9.0, 9.0, 4.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0], "bins": [-32.93708038330078, -31.973960876464844, -31.010839462280273, -30.047718048095703, -29.084598541259766, -28.121479034423828, -27.158357620239258, -26.195236206054688, -25.23211669921875, -24.268997192382812, -23.305875778198242, -22.342754364013672, -21.379634857177734, -20.416515350341797, -19.453393936157227, -18.490272521972656, -17.52715301513672, -16.56403350830078, -15.600912094116211, -14.637791633605957, -13.674671173095703, -12.71155071258545, -11.748430252075195, -10.785309791564941, -9.822189331054688, -8.859068870544434, -7.89594841003418, -6.932827949523926, -5.969707489013672, -5.006587028503418, -4.043466567993164, -3.08034610748291, -2.1172256469726562, -1.1541051864624023, -0.19098472595214844, 0.7721357345581055, 1.7352561950683594, 2.6983766555786133, 3.661497116088867, 4.624617576599121, 5.587738037109375, 6.550858497619629, 7.513978958129883, 8.477099418640137, 9.44021987915039, 10.403340339660645, 11.366460800170898, 12.329581260681152, 13.292701721191406, 14.25582218170166, 15.218942642211914, 16.182064056396484, 17.145183563232422, 18.10830307006836, 19.07142448425293, 20.0345458984375, 20.997665405273438, 21.960784912109375, 22.923906326293945, 23.887027740478516, 24.850147247314453, 25.81326675415039, 26.77638816833496, 27.73950958251953, 28.70262908935547]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 6.0, 5.0, 12.0, 17.0, 17.0, 23.0, 20.0, 32.0, 29.0, 35.0, 38.0, 60.0, 46.0, 52.0, 49.0, 57.0, 54.0, 47.0, 60.0, 57.0, 33.0, 41.0, 33.0, 31.0, 29.0, 29.0, 12.0, 15.0, 12.0, 11.0, 8.0, 3.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.888671875, -3.753387451171875, -3.61810302734375, -3.482818603515625, -3.3475341796875, -3.212249755859375, -3.07696533203125, -2.941680908203125, -2.806396484375, -2.671112060546875, -2.53582763671875, -2.400543212890625, -2.2652587890625, -2.129974365234375, -1.99468994140625, -1.859405517578125, -1.72412109375, -1.588836669921875, -1.45355224609375, -1.318267822265625, -1.1829833984375, -1.047698974609375, -0.91241455078125, -0.777130126953125, -0.641845703125, -0.506561279296875, -0.37127685546875, -0.235992431640625, -0.1007080078125, 0.034576416015625, 0.16986083984375, 0.305145263671875, 0.4404296875, 0.575714111328125, 0.71099853515625, 0.846282958984375, 0.9815673828125, 1.116851806640625, 1.25213623046875, 1.387420654296875, 1.522705078125, 1.657989501953125, 1.79327392578125, 1.928558349609375, 2.0638427734375, 2.199127197265625, 2.33441162109375, 2.469696044921875, 2.60498046875, 2.740264892578125, 2.87554931640625, 3.010833740234375, 3.1461181640625, 3.281402587890625, 3.41668701171875, 3.551971435546875, 3.687255859375, 3.822540283203125, 3.95782470703125, 4.093109130859375, 4.2283935546875, 4.363677978515625, 4.49896240234375, 4.634246826171875, 4.76953125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 6.0, 9.0, 3.0, 19.0, 18.0, 29.0, 40.0, 67.0, 86.0, 121.0, 180.0, 262.0, 419.0, 610.0, 880.0, 1434.0, 2221.0, 3443.0, 5736.0, 9151.0, 15231.0, 25663.0, 44516.0, 82539.0, 179696.0, 335406.0, 161136.0, 76462.0, 41338.0, 24251.0, 14168.0, 8681.0, 5327.0, 3287.0, 2164.0, 1330.0, 898.0, 581.0, 382.0, 261.0, 169.0, 113.0, 80.0, 56.0, 29.0, 20.0, 12.0, 12.0, 6.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1368408203125, -0.13219261169433594, -0.12754440307617188, -0.12289619445800781, -0.11824798583984375, -0.11359977722167969, -0.10895156860351562, -0.10430335998535156, -0.0996551513671875, -0.09500694274902344, -0.09035873413085938, -0.08571052551269531, -0.08106231689453125, -0.07641410827636719, -0.07176589965820312, -0.06711769104003906, -0.062469482421875, -0.05782127380371094, -0.053173065185546875, -0.04852485656738281, -0.04387664794921875, -0.03922843933105469, -0.034580230712890625, -0.029932022094726562, -0.0252838134765625, -0.020635604858398438, -0.015987396240234375, -0.011339187622070312, -0.00669097900390625, -0.0020427703857421875, 0.002605438232421875, 0.0072536468505859375, 0.01190185546875, 0.016550064086914062, 0.021198272705078125, 0.025846481323242188, 0.03049468994140625, 0.03514289855957031, 0.039791107177734375, 0.04443931579589844, 0.0490875244140625, 0.05373573303222656, 0.058383941650390625, 0.06303215026855469, 0.06768035888671875, 0.07232856750488281, 0.07697677612304688, 0.08162498474121094, 0.086273193359375, 0.09092140197753906, 0.09556961059570312, 0.10021781921386719, 0.10486602783203125, 0.10951423645019531, 0.11416244506835938, 0.11881065368652344, 0.1234588623046875, 0.12810707092285156, 0.13275527954101562, 0.1374034881591797, 0.14205169677734375, 0.1466999053955078, 0.15134811401367188, 0.15599632263183594, 0.16064453125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 7.0, 6.0, 5.0, 4.0, 2.0, 12.0, 15.0, 14.0, 12.0, 16.0, 17.0, 18.0, 21.0, 30.0, 20.0, 32.0, 41.0, 26.0, 35.0, 37.0, 31.0, 41.0, 42.0, 1064.0, 32.0, 36.0, 35.0, 39.0, 36.0, 39.0, 26.0, 27.0, 25.0, 31.0, 14.0, 17.0, 24.0, 15.0, 12.0, 6.0, 8.0, 13.0, 11.0, 5.0, 4.0, 5.0, 3.0, 5.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.46484375, -2.38568115234375, -2.3065185546875, -2.22735595703125, -2.148193359375, -2.06903076171875, -1.9898681640625, -1.91070556640625, -1.83154296875, -1.75238037109375, -1.6732177734375, -1.59405517578125, -1.514892578125, -1.43572998046875, -1.3565673828125, -1.27740478515625, -1.1982421875, -1.11907958984375, -1.0399169921875, -0.96075439453125, -0.881591796875, -0.80242919921875, -0.7232666015625, -0.64410400390625, -0.56494140625, -0.48577880859375, -0.4066162109375, -0.32745361328125, -0.248291015625, -0.16912841796875, -0.0899658203125, -0.01080322265625, 0.068359375, 0.14752197265625, 0.2266845703125, 0.30584716796875, 0.385009765625, 0.46417236328125, 0.5433349609375, 0.62249755859375, 0.70166015625, 0.78082275390625, 0.8599853515625, 0.93914794921875, 1.018310546875, 1.09747314453125, 1.1766357421875, 1.25579833984375, 1.3349609375, 1.41412353515625, 1.4932861328125, 1.57244873046875, 1.651611328125, 1.73077392578125, 1.8099365234375, 1.88909912109375, 1.96826171875, 2.04742431640625, 2.1265869140625, 2.20574951171875, 2.284912109375, 2.36407470703125, 2.4432373046875, 2.52239990234375, 2.6015625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 14.0, 16.0, 26.0, 40.0, 49.0, 104.0, 137.0, 197.0, 305.0, 436.0, 687.0, 1036.0, 1437.0, 2214.0, 3465.0, 5139.0, 7939.0, 12158.0, 19333.0, 30943.0, 51656.0, 91474.0, 190019.0, 1341728.0, 144494.0, 74943.0, 43106.0, 26353.0, 16652.0, 10681.0, 6866.0, 4546.0, 2918.0, 1977.0, 1347.0, 843.0, 639.0, 421.0, 236.0, 186.0, 125.0, 93.0, 51.0, 31.0, 24.0, 12.0, 9.0, 10.0, 5.0, 1.0, 4.0, 0.0, 3.0, 2.0, 3.0], "bins": [-0.0919189453125, -0.08907604217529297, -0.08623313903808594, -0.0833902359008789, -0.08054733276367188, -0.07770442962646484, -0.07486152648925781, -0.07201862335205078, -0.06917572021484375, -0.06633281707763672, -0.06348991394042969, -0.060647010803222656, -0.057804107666015625, -0.054961204528808594, -0.05211830139160156, -0.04927539825439453, -0.0464324951171875, -0.04358959197998047, -0.04074668884277344, -0.037903785705566406, -0.035060882568359375, -0.032217979431152344, -0.029375076293945312, -0.02653217315673828, -0.02368927001953125, -0.02084636688232422, -0.018003463745117188, -0.015160560607910156, -0.012317657470703125, -0.009474754333496094, -0.0066318511962890625, -0.0037889480590820312, -0.000946044921875, 0.0018968582153320312, 0.0047397613525390625, 0.007582664489746094, 0.010425567626953125, 0.013268470764160156, 0.016111373901367188, 0.01895427703857422, 0.02179718017578125, 0.02464008331298828, 0.027482986450195312, 0.030325889587402344, 0.033168792724609375, 0.036011695861816406, 0.03885459899902344, 0.04169750213623047, 0.0445404052734375, 0.04738330841064453, 0.05022621154785156, 0.053069114685058594, 0.055912017822265625, 0.058754920959472656, 0.06159782409667969, 0.06444072723388672, 0.06728363037109375, 0.07012653350830078, 0.07296943664550781, 0.07581233978271484, 0.07865524291992188, 0.0814981460571289, 0.08434104919433594, 0.08718395233154297, 0.09002685546875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 3.0, 3.0, 7.0, 12.0, 16.0, 9.0, 17.0, 19.0, 19.0, 29.0, 35.0, 33.0, 49.0, 36.0, 55.0, 51.0, 61.0, 69.0, 54.0, 50.0, 50.0, 48.0, 45.0, 44.0, 30.0, 24.0, 30.0, 24.0, 26.0, 12.0, 11.0, 6.0, 8.0, 11.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.83393669128418e-05, -4.682410508394241e-05, -4.530884325504303e-05, -4.3793581426143646e-05, -4.227831959724426e-05, -4.076305776834488e-05, -3.9247795939445496e-05, -3.773253411054611e-05, -3.621727228164673e-05, -3.4702010452747345e-05, -3.318674862384796e-05, -3.167148679494858e-05, -3.0156224966049194e-05, -2.864096313714981e-05, -2.7125701308250427e-05, -2.5610439479351044e-05, -2.409517765045166e-05, -2.2579915821552277e-05, -2.1064653992652893e-05, -1.954939216375351e-05, -1.8034130334854126e-05, -1.6518868505954742e-05, -1.5003606677055359e-05, -1.3488344848155975e-05, -1.1973083019256592e-05, -1.0457821190357208e-05, -8.942559361457825e-06, -7.427297532558441e-06, -5.912035703659058e-06, -4.396773874759674e-06, -2.8815120458602905e-06, -1.366250216960907e-06, 1.4901161193847656e-07, 1.6642734408378601e-06, 3.1795352697372437e-06, 4.694797098636627e-06, 6.210058927536011e-06, 7.725320756435394e-06, 9.240582585334778e-06, 1.0755844414234161e-05, 1.2271106243133545e-05, 1.3786368072032928e-05, 1.5301629900932312e-05, 1.6816891729831696e-05, 1.833215355873108e-05, 1.9847415387630463e-05, 2.1362677216529846e-05, 2.287793904542923e-05, 2.4393200874328613e-05, 2.5908462703227997e-05, 2.742372453212738e-05, 2.8938986361026764e-05, 3.0454248189926147e-05, 3.196951001882553e-05, 3.3484771847724915e-05, 3.50000336766243e-05, 3.651529550552368e-05, 3.8030557334423065e-05, 3.954581916332245e-05, 4.106108099222183e-05, 4.2576342821121216e-05, 4.40916046500206e-05, 4.560686647891998e-05, 4.7122128307819366e-05, 4.863739013671875e-05]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 4.0, 7.0, 13.0, 12.0, 11.0, 35.0, 26.0, 28.0, 45.0, 67.0, 76.0, 90.0, 129.0, 167.0, 301.0, 838.0, 5846.0, 115159.0, 797818.0, 119979.0, 5964.0, 880.0, 310.0, 176.0, 140.0, 96.0, 76.0, 53.0, 46.0, 41.0, 22.0, 24.0, 18.0, 14.0, 7.0, 13.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0006532669067382812, -0.0006343349814414978, -0.0006154030561447144, -0.0005964711308479309, -0.0005775392055511475, -0.000558607280254364, -0.0005396753549575806, -0.0005207434296607971, -0.0005018115043640137, -0.0004828795790672302, -0.0004639476537704468, -0.00044501572847366333, -0.0004260838031768799, -0.00040715187788009644, -0.000388219952583313, -0.00036928802728652954, -0.0003503561019897461, -0.00033142417669296265, -0.0003124922513961792, -0.00029356032609939575, -0.0002746284008026123, -0.00025569647550582886, -0.0002367645502090454, -0.00021783262491226196, -0.00019890069961547852, -0.00017996877431869507, -0.00016103684902191162, -0.00014210492372512817, -0.00012317299842834473, -0.00010424107313156128, -8.530914783477783e-05, -6.637722253799438e-05, -4.744529724121094e-05, -2.851337194442749e-05, -9.581446647644043e-06, 9.350478649139404e-06, 2.828240394592285e-05, 4.72143292427063e-05, 6.614625453948975e-05, 8.50781798362732e-05, 0.00010401010513305664, 0.0001229420304298401, 0.00014187395572662354, 0.00016080588102340698, 0.00017973780632019043, 0.00019866973161697388, 0.00021760165691375732, 0.00023653358221054077, 0.0002554655075073242, 0.00027439743280410767, 0.0002933293581008911, 0.00031226128339767456, 0.000331193208694458, 0.00035012513399124146, 0.0003690570592880249, 0.00038798898458480835, 0.0004069209098815918, 0.00042585283517837524, 0.0004447847604751587, 0.00046371668577194214, 0.0004826486110687256, 0.000501580536365509, 0.0005205124616622925, 0.0005394443869590759, 0.0005583763122558594]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 6.0, 8.0, 9.0, 19.0, 23.0, 19.0, 42.0, 42.0, 54.0, 59.0, 82.0, 82.0, 79.0, 94.0, 58.0, 57.0, 54.0, 42.0, 38.0, 27.0, 30.0, 13.0, 10.0, 12.0, 10.0, 8.0, 3.0, 6.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.65196137863677e-05, -3.532379196258262e-05, -3.4127973776776344e-05, -3.293215195299126e-05, -3.173633012920618e-05, -3.0540511943399906e-05, -2.9344690119614825e-05, -2.8148870114819147e-05, -2.695305011002347e-05, -2.575723010522779e-05, -2.4561410100432113e-05, -2.336558827664703e-05, -2.2169768271851353e-05, -2.0973948267055675e-05, -1.9778126443270594e-05, -1.8582306438474916e-05, -1.7386486433679238e-05, -1.619066642888356e-05, -1.499484551459318e-05, -1.37990246003028e-05, -1.2603204595507123e-05, -1.1407384590711445e-05, -1.0211563676421065e-05, -9.015742762130685e-06, -7.819922757335007e-06, -6.624102297791978e-06, -5.4282818382489495e-06, -4.232461378705921e-06, -3.036640919162892e-06, -1.840820459619863e-06, -6.450000000768341e-07, 5.508209142135456e-07, 1.7466445569880307e-06, 2.9424650165310595e-06, 4.138285476074088e-06, 5.334105935617117e-06, 6.529926395160146e-06, 7.725746399955824e-06, 8.921567314246204e-06, 1.0117388228536583e-05, 1.1313208233332261e-05, 1.250902823812794e-05, 1.3704849152418319e-05, 1.4900670066708699e-05, 1.6096490071504377e-05, 1.7292310076300055e-05, 1.8488131900085136e-05, 1.9683951904880814e-05, 2.0879771909676492e-05, 2.207559191447217e-05, 2.3271411919267848e-05, 2.446723374305293e-05, 2.5663053747848608e-05, 2.6858873752644286e-05, 2.8054695576429367e-05, 2.9250515581225045e-05, 3.0446335586020723e-05, 3.1642157409805804e-05, 3.283797559561208e-05, 3.403379741939716e-05, 3.522961924318224e-05, 3.6425437428988516e-05, 3.76212592527736e-05, 3.881708107655868e-05, 4.0012899262364954e-05]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 8.0, 4.0, 10.0, 6.0, 12.0, 13.0, 12.0, 16.0, 13.0, 30.0, 30.0, 29.0, 32.0, 26.0, 40.0, 45.0, 50.0, 46.0, 64.0, 42.0, 48.0, 51.0, 32.0, 36.0, 49.0, 33.0, 32.0, 34.0, 29.0, 17.0, 24.0, 21.0, 9.0, 14.0, 12.0, 8.0, 10.0, 8.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9921531677246094e-05, -2.8954818844795227e-05, -2.798810601234436e-05, -2.7021393179893494e-05, -2.6054680347442627e-05, -2.508796751499176e-05, -2.4121254682540894e-05, -2.3154541850090027e-05, -2.218782901763916e-05, -2.1221116185188293e-05, -2.0254403352737427e-05, -1.928769052028656e-05, -1.8320977687835693e-05, -1.7354264855384827e-05, -1.638755202293396e-05, -1.5420839190483093e-05, -1.4454126358032227e-05, -1.348741352558136e-05, -1.2520700693130493e-05, -1.1553987860679626e-05, -1.058727502822876e-05, -9.620562195777893e-06, -8.653849363327026e-06, -7.68713653087616e-06, -6.720423698425293e-06, -5.753710865974426e-06, -4.7869980335235596e-06, -3.820285201072693e-06, -2.853572368621826e-06, -1.8868595361709595e-06, -9.201467037200928e-07, 4.6566128730773926e-08, 1.0132789611816406e-06, 1.9799917936325073e-06, 2.946704626083374e-06, 3.913417458534241e-06, 4.880130290985107e-06, 5.846843123435974e-06, 6.813555955886841e-06, 7.780268788337708e-06, 8.746981620788574e-06, 9.713694453239441e-06, 1.0680407285690308e-05, 1.1647120118141174e-05, 1.2613832950592041e-05, 1.3580545783042908e-05, 1.4547258615493774e-05, 1.551397144794464e-05, 1.6480684280395508e-05, 1.7447397112846375e-05, 1.841410994529724e-05, 1.9380822777748108e-05, 2.0347535610198975e-05, 2.131424844264984e-05, 2.2280961275100708e-05, 2.3247674107551575e-05, 2.421438694000244e-05, 2.5181099772453308e-05, 2.6147812604904175e-05, 2.711452543735504e-05, 2.8081238269805908e-05, 2.9047951102256775e-05, 3.001466393470764e-05, 3.098137676715851e-05, 3.1948089599609375e-05]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 6.0, 5.0, 12.0, 17.0, 17.0, 23.0, 20.0, 32.0, 29.0, 35.0, 38.0, 60.0, 46.0, 52.0, 49.0, 57.0, 54.0, 47.0, 60.0, 57.0, 33.0, 41.0, 33.0, 31.0, 29.0, 29.0, 12.0, 15.0, 12.0, 11.0, 8.0, 3.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.888671875, -3.753387451171875, -3.61810302734375, -3.482818603515625, -3.3475341796875, -3.212249755859375, -3.07696533203125, -2.941680908203125, -2.806396484375, -2.671112060546875, -2.53582763671875, -2.400543212890625, -2.2652587890625, -2.129974365234375, -1.99468994140625, -1.859405517578125, -1.72412109375, -1.588836669921875, -1.45355224609375, -1.318267822265625, -1.1829833984375, -1.047698974609375, -0.91241455078125, -0.777130126953125, -0.641845703125, -0.506561279296875, -0.37127685546875, -0.235992431640625, -0.1007080078125, 0.034576416015625, 0.16986083984375, 0.305145263671875, 0.4404296875, 0.575714111328125, 0.71099853515625, 0.846282958984375, 0.9815673828125, 1.116851806640625, 1.25213623046875, 1.387420654296875, 1.522705078125, 1.657989501953125, 1.79327392578125, 1.928558349609375, 2.0638427734375, 2.199127197265625, 2.33441162109375, 2.469696044921875, 2.60498046875, 2.740264892578125, 2.87554931640625, 3.010833740234375, 3.1461181640625, 3.281402587890625, 3.41668701171875, 3.551971435546875, 3.687255859375, 3.822540283203125, 3.95782470703125, 4.093109130859375, 4.2283935546875, 4.363677978515625, 4.49896240234375, 4.634246826171875, 4.76953125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 6.0, 5.0, 10.0, 16.0, 17.0, 29.0, 26.0, 45.0, 71.0, 108.0, 202.0, 373.0, 649.0, 1314.0, 2906.0, 6914.0, 17908.0, 61423.0, 654826.0, 243003.0, 36821.0, 12499.0, 4984.0, 2082.0, 1024.0, 516.0, 306.0, 161.0, 91.0, 63.0, 38.0, 32.0, 13.0, 19.0, 8.0, 5.0, 11.0, 2.0, 4.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5625, -6.3424072265625, -6.122314453125, -5.9022216796875, -5.68212890625, -5.4620361328125, -5.241943359375, -5.0218505859375, -4.8017578125, -4.5816650390625, -4.361572265625, -4.1414794921875, -3.92138671875, -3.7012939453125, -3.481201171875, -3.2611083984375, -3.041015625, -2.8209228515625, -2.600830078125, -2.3807373046875, -2.16064453125, -1.9405517578125, -1.720458984375, -1.5003662109375, -1.2802734375, -1.0601806640625, -0.840087890625, -0.6199951171875, -0.39990234375, -0.1798095703125, 0.040283203125, 0.2603759765625, 0.48046875, 0.7005615234375, 0.920654296875, 1.1407470703125, 1.36083984375, 1.5809326171875, 1.801025390625, 2.0211181640625, 2.2412109375, 2.4613037109375, 2.681396484375, 2.9014892578125, 3.12158203125, 3.3416748046875, 3.561767578125, 3.7818603515625, 4.001953125, 4.2220458984375, 4.442138671875, 4.6622314453125, 4.88232421875, 5.1024169921875, 5.322509765625, 5.5426025390625, 5.7626953125, 5.9827880859375, 6.202880859375, 6.4229736328125, 6.64306640625, 6.8631591796875, 7.083251953125, 7.3033447265625, 7.5234375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 12.0, 12.0, 15.0, 10.0, 21.0, 23.0, 24.0, 33.0, 30.0, 35.0, 40.0, 29.0, 55.0, 47.0, 75.0, 164.0, 1811.0, 146.0, 54.0, 45.0, 54.0, 40.0, 39.0, 35.0, 26.0, 29.0, 18.0, 15.0, 19.0, 18.0, 12.0, 14.0, 5.0, 6.0, 8.0, 7.0, 3.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4140625, -12.972900390625, -12.53173828125, -12.090576171875, -11.6494140625, -11.208251953125, -10.76708984375, -10.325927734375, -9.884765625, -9.443603515625, -9.00244140625, -8.561279296875, -8.1201171875, -7.678955078125, -7.23779296875, -6.796630859375, -6.35546875, -5.914306640625, -5.47314453125, -5.031982421875, -4.5908203125, -4.149658203125, -3.70849609375, -3.267333984375, -2.826171875, -2.385009765625, -1.94384765625, -1.502685546875, -1.0615234375, -0.620361328125, -0.17919921875, 0.261962890625, 0.703125, 1.144287109375, 1.58544921875, 2.026611328125, 2.4677734375, 2.908935546875, 3.35009765625, 3.791259765625, 4.232421875, 4.673583984375, 5.11474609375, 5.555908203125, 5.9970703125, 6.438232421875, 6.87939453125, 7.320556640625, 7.76171875, 8.202880859375, 8.64404296875, 9.085205078125, 9.5263671875, 9.967529296875, 10.40869140625, 10.849853515625, 11.291015625, 11.732177734375, 12.17333984375, 12.614501953125, 13.0556640625, 13.496826171875, 13.93798828125, 14.379150390625, 14.8203125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 7.0, 5.0, 11.0, 16.0, 22.0, 11.0, 12.0, 20.0, 32.0, 39.0, 65.0, 87.0, 143.0, 225.0, 511.0, 1799.0, 13369.0, 1161683.0, 1950115.0, 14508.0, 1769.0, 525.0, 242.0, 135.0, 83.0, 56.0, 45.0, 27.0, 32.0, 21.0, 17.0, 19.0, 10.0, 10.0, 8.0, 8.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.046875, -24.310546875, -23.57421875, -22.837890625, -22.1015625, -21.365234375, -20.62890625, -19.892578125, -19.15625, -18.419921875, -17.68359375, -16.947265625, -16.2109375, -15.474609375, -14.73828125, -14.001953125, -13.265625, -12.529296875, -11.79296875, -11.056640625, -10.3203125, -9.583984375, -8.84765625, -8.111328125, -7.375, -6.638671875, -5.90234375, -5.166015625, -4.4296875, -3.693359375, -2.95703125, -2.220703125, -1.484375, -0.748046875, -0.01171875, 0.724609375, 1.4609375, 2.197265625, 2.93359375, 3.669921875, 4.40625, 5.142578125, 5.87890625, 6.615234375, 7.3515625, 8.087890625, 8.82421875, 9.560546875, 10.296875, 11.033203125, 11.76953125, 12.505859375, 13.2421875, 13.978515625, 14.71484375, 15.451171875, 16.1875, 16.923828125, 17.66015625, 18.396484375, 19.1328125, 19.869140625, 20.60546875, 21.341796875, 22.078125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 11.0, 93.0, 464.0, 379.0, 66.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.226112365722656, -37.10015869140625, -33.974205017089844, -30.84825325012207, -27.722299575805664, -24.596345901489258, -21.470394134521484, -18.344440460205078, -15.218486785888672, -12.092533111572266, -8.966580390930176, -5.840627670288086, -2.7146739959716797, 0.41127967834472656, 3.5372314453125, 6.663185119628906, 9.789138793945312, 12.915092468261719, 16.041046142578125, 19.1669979095459, 22.292951583862305, 25.41890525817871, 28.544857025146484, 31.67081069946289, 34.7967643737793, 37.9227180480957, 41.04867172241211, 44.17462158203125, 47.300575256347656, 50.42652893066406, 53.55248260498047, 56.678436279296875, 59.80438232421875, 62.930335998535156, 66.05628967285156, 69.18224334716797, 72.30819702148438, 75.43415069580078, 78.56010437011719, 81.68605041503906, 84.81201171875, 87.9379653930664, 91.06391906738281, 94.18987274169922, 97.31582641601562, 100.44178009033203, 103.56773376464844, 106.69367980957031, 109.81963348388672, 112.94558715820312, 116.07154083251953, 119.19749450683594, 122.32344818115234, 125.44940185546875, 128.57534790039062, 131.70130920410156, 134.82725524902344, 137.9532012939453, 141.07916259765625, 144.20510864257812, 147.33106994628906, 150.45701599121094, 153.58297729492188, 156.70892333984375, 159.8348846435547]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 16.0, 5.0, 6.0, 7.0, 11.0, 8.0, 21.0, 22.0, 22.0, 23.0, 36.0, 26.0, 23.0, 38.0, 32.0, 30.0, 30.0, 41.0, 34.0, 54.0, 46.0, 45.0, 48.0, 52.0, 45.0, 44.0, 27.0, 25.0, 41.0, 21.0, 25.0, 23.0, 14.0, 10.0, 8.0, 15.0, 10.0, 11.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.94865417480469, -44.49686813354492, -43.045082092285156, -41.593299865722656, -40.14151382446289, -38.689727783203125, -37.23794174194336, -35.786155700683594, -34.334373474121094, -32.88258743286133, -31.430803298950195, -29.97901725769043, -28.527233123779297, -27.07544708251953, -25.623661041259766, -24.171875, -22.720088958740234, -21.26830291748047, -19.816518783569336, -18.36473274230957, -16.912948608398438, -15.461162567138672, -14.009376525878906, -12.557591438293457, -11.105806350708008, -9.654021263122559, -8.20223617553711, -6.750450134277344, -5.2986650466918945, -3.8468799591064453, -2.3950939178466797, -0.9433088302612305, 0.5084800720214844, 1.9602653980255127, 3.412050724029541, 4.863836288452148, 6.315621376037598, 7.767406463623047, 9.219192504882812, 10.670977592468262, 12.122762680053711, 13.57454776763916, 15.02633285522461, 16.478118896484375, 17.92990493774414, 19.381689071655273, 20.83347511291504, 22.285259246826172, 23.737045288085938, 25.188831329345703, 26.640615463256836, 28.0924015045166, 29.544185638427734, 30.9959716796875, 32.447757720947266, 33.89954376220703, 35.35132598876953, 36.8031120300293, 38.25489807128906, 39.70668029785156, 41.15846633911133, 42.610252380371094, 44.06203842163086, 45.513824462890625, 46.96561050415039]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 4.0, 14.0, 13.0, 17.0, 15.0, 20.0, 21.0, 36.0, 36.0, 29.0, 53.0, 54.0, 46.0, 59.0, 47.0, 53.0, 58.0, 50.0, 58.0, 38.0, 40.0, 38.0, 37.0, 32.0, 21.0, 31.0, 8.0, 11.0, 12.0, 12.0, 5.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.912109375, -3.773773193359375, -3.63543701171875, -3.497100830078125, -3.3587646484375, -3.220428466796875, -3.08209228515625, -2.943756103515625, -2.805419921875, -2.667083740234375, -2.52874755859375, -2.390411376953125, -2.2520751953125, -2.113739013671875, -1.97540283203125, -1.837066650390625, -1.69873046875, -1.560394287109375, -1.42205810546875, -1.283721923828125, -1.1453857421875, -1.007049560546875, -0.86871337890625, -0.730377197265625, -0.592041015625, -0.453704833984375, -0.31536865234375, -0.177032470703125, -0.0386962890625, 0.099639892578125, 0.23797607421875, 0.376312255859375, 0.5146484375, 0.652984619140625, 0.79132080078125, 0.929656982421875, 1.0679931640625, 1.206329345703125, 1.34466552734375, 1.483001708984375, 1.621337890625, 1.759674072265625, 1.89801025390625, 2.036346435546875, 2.1746826171875, 2.313018798828125, 2.45135498046875, 2.589691162109375, 2.72802734375, 2.866363525390625, 3.00469970703125, 3.143035888671875, 3.2813720703125, 3.419708251953125, 3.55804443359375, 3.696380615234375, 3.834716796875, 3.973052978515625, 4.11138916015625, 4.249725341796875, 4.3880615234375, 4.526397705078125, 4.66473388671875, 4.803070068359375, 4.94140625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 5.0, 3.0, 9.0, 10.0, 16.0, 13.0, 24.0, 24.0, 36.0, 42.0, 54.0, 90.0, 108.0, 162.0, 236.0, 352.0, 570.0, 953.0, 1874.0, 4088.0, 10835.0, 37135.0, 194947.0, 2483680.0, 1296123.0, 120783.0, 26298.0, 8408.0, 3365.0, 1655.0, 854.0, 489.0, 317.0, 204.0, 141.0, 97.0, 81.0, 46.0, 45.0, 36.0, 17.0, 15.0, 9.0, 12.0, 6.0, 3.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.9375, -13.5260009765625, -13.114501953125, -12.7030029296875, -12.29150390625, -11.8800048828125, -11.468505859375, -11.0570068359375, -10.6455078125, -10.2340087890625, -9.822509765625, -9.4110107421875, -8.99951171875, -8.5880126953125, -8.176513671875, -7.7650146484375, -7.353515625, -6.9420166015625, -6.530517578125, -6.1190185546875, -5.70751953125, -5.2960205078125, -4.884521484375, -4.4730224609375, -4.0615234375, -3.6500244140625, -3.238525390625, -2.8270263671875, -2.41552734375, -2.0040283203125, -1.592529296875, -1.1810302734375, -0.76953125, -0.3580322265625, 0.053466796875, 0.4649658203125, 0.87646484375, 1.2879638671875, 1.699462890625, 2.1109619140625, 2.5224609375, 2.9339599609375, 3.345458984375, 3.7569580078125, 4.16845703125, 4.5799560546875, 4.991455078125, 5.4029541015625, 5.814453125, 6.2259521484375, 6.637451171875, 7.0489501953125, 7.46044921875, 7.8719482421875, 8.283447265625, 8.6949462890625, 9.1064453125, 9.5179443359375, 9.929443359375, 10.3409423828125, 10.75244140625, 11.1639404296875, 11.575439453125, 11.9869384765625, 12.3984375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 1.0, 6.0, 6.0, 7.0, 10.0, 14.0, 16.0, 24.0, 29.0, 30.0, 43.0, 64.0, 88.0, 126.0, 164.0, 270.0, 345.0, 495.0, 608.0, 494.0, 341.0, 256.0, 167.0, 108.0, 98.0, 75.0, 50.0, 35.0, 30.0, 20.0, 13.0, 7.0, 7.0, 6.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-12.15625, -11.83935546875, -11.5224609375, -11.20556640625, -10.888671875, -10.57177734375, -10.2548828125, -9.93798828125, -9.62109375, -9.30419921875, -8.9873046875, -8.67041015625, -8.353515625, -8.03662109375, -7.7197265625, -7.40283203125, -7.0859375, -6.76904296875, -6.4521484375, -6.13525390625, -5.818359375, -5.50146484375, -5.1845703125, -4.86767578125, -4.55078125, -4.23388671875, -3.9169921875, -3.60009765625, -3.283203125, -2.96630859375, -2.6494140625, -2.33251953125, -2.015625, -1.69873046875, -1.3818359375, -1.06494140625, -0.748046875, -0.43115234375, -0.1142578125, 0.20263671875, 0.51953125, 0.83642578125, 1.1533203125, 1.47021484375, 1.787109375, 2.10400390625, 2.4208984375, 2.73779296875, 3.0546875, 3.37158203125, 3.6884765625, 4.00537109375, 4.322265625, 4.63916015625, 4.9560546875, 5.27294921875, 5.58984375, 5.90673828125, 6.2236328125, 6.54052734375, 6.857421875, 7.17431640625, 7.4912109375, 7.80810546875, 8.125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 9.0, 28.0, 44.0, 53.0, 102.0, 163.0, 308.0, 548.0, 936.0, 1830.0, 3944.0, 9193.0, 26594.0, 99671.0, 543485.0, 2767601.0, 588887.0, 105367.0, 28030.0, 9535.0, 3939.0, 1722.0, 982.0, 540.0, 326.0, 176.0, 99.0, 65.0, 49.0, 19.0, 11.0, 10.0, 6.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.453125, -15.895751953125, -15.33837890625, -14.781005859375, -14.2236328125, -13.666259765625, -13.10888671875, -12.551513671875, -11.994140625, -11.436767578125, -10.87939453125, -10.322021484375, -9.7646484375, -9.207275390625, -8.64990234375, -8.092529296875, -7.53515625, -6.977783203125, -6.42041015625, -5.863037109375, -5.3056640625, -4.748291015625, -4.19091796875, -3.633544921875, -3.076171875, -2.518798828125, -1.96142578125, -1.404052734375, -0.8466796875, -0.289306640625, 0.26806640625, 0.825439453125, 1.3828125, 1.940185546875, 2.49755859375, 3.054931640625, 3.6123046875, 4.169677734375, 4.72705078125, 5.284423828125, 5.841796875, 6.399169921875, 6.95654296875, 7.513916015625, 8.0712890625, 8.628662109375, 9.18603515625, 9.743408203125, 10.30078125, 10.858154296875, 11.41552734375, 11.972900390625, 12.5302734375, 13.087646484375, 13.64501953125, 14.202392578125, 14.759765625, 15.317138671875, 15.87451171875, 16.431884765625, 16.9892578125, 17.546630859375, 18.10400390625, 18.661376953125, 19.21875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 8.0, 13.0, 21.0, 25.0, 59.0, 78.0, 75.0, 132.0, 129.0, 120.0, 111.0, 80.0, 73.0, 30.0, 23.0, 11.0, 11.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.62012481689453, -88.22784423828125, -85.83556365966797, -83.44329071044922, -81.05101013183594, -78.65872955322266, -76.26644897460938, -73.8741683959961, -71.48188781738281, -69.08960723876953, -66.69732666015625, -64.3050537109375, -61.91277313232422, -59.52049255371094, -57.128211975097656, -54.735931396484375, -52.343658447265625, -49.951377868652344, -47.55910110473633, -45.16682052612305, -42.77454376220703, -40.38226318359375, -37.98998260498047, -35.59770202636719, -33.20542526245117, -30.813146591186523, -28.420867919921875, -26.028587341308594, -23.636308670043945, -21.244029998779297, -18.851749420166016, -16.459470748901367, -14.06719970703125, -11.674921035766602, -9.282641410827637, -6.89036226272583, -4.498083114624023, -2.105804443359375, 0.28647518157958984, 2.6787548065185547, 5.071033477783203, 7.46331262588501, 9.855591773986816, 12.247871398925781, 14.64015007019043, 17.032428741455078, 19.42470932006836, 21.816987991333008, 24.209266662597656, 26.601545333862305, 28.993824005126953, 31.386104583740234, 33.77838134765625, 36.17066192626953, 38.56294250488281, 40.955223083496094, 43.34749984741211, 45.73978042602539, 48.132057189941406, 50.52433776855469, 52.91661834716797, 55.308895111083984, 57.701175689697266, 60.09345245361328, 62.48573303222656]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 7.0, 4.0, 9.0, 11.0, 19.0, 16.0, 13.0, 14.0, 21.0, 25.0, 31.0, 28.0, 34.0, 34.0, 47.0, 35.0, 50.0, 44.0, 48.0, 52.0, 46.0, 45.0, 33.0, 44.0, 41.0, 31.0, 33.0, 32.0, 29.0, 25.0, 22.0, 10.0, 17.0, 13.0, 10.0, 6.0, 5.0, 10.0, 2.0, 7.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.43781280517578, -27.305179595947266, -26.17254638671875, -25.039913177490234, -23.90727996826172, -22.774646759033203, -21.64201545715332, -20.509382247924805, -19.37674903869629, -18.244115829467773, -17.111482620239258, -15.978850364685059, -14.846217155456543, -13.713583946228027, -12.580951690673828, -11.448318481445312, -10.315685272216797, -9.183052062988281, -8.050418853759766, -6.917786598205566, -5.785153388977051, -4.652520179748535, -3.5198874473571777, -2.3872547149658203, -1.2546215057373047, -0.12198853492736816, 1.0106444358825684, 2.143277406692505, 3.2759103775024414, 4.408543586730957, 5.5411763191223145, 6.673809051513672, 7.8064422607421875, 8.939075469970703, 10.071708679199219, 11.204340934753418, 12.336974143981934, 13.46960735321045, 14.602239608764648, 15.734872817993164, 16.86750602722168, 18.000139236450195, 19.13277244567871, 20.265405654907227, 21.39803695678711, 22.530670166015625, 23.66330337524414, 24.795936584472656, 25.928569793701172, 27.061203002929688, 28.193836212158203, 29.32646942138672, 30.459102630615234, 31.59173583984375, 32.724369049072266, 33.85700225830078, 34.98963165283203, 36.12226486206055, 37.25489807128906, 38.38753128051758, 39.520164489746094, 40.65279769897461, 41.785430908203125, 42.918060302734375, 44.050697326660156]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 11.0, 8.0, 18.0, 12.0, 19.0, 23.0, 22.0, 28.0, 26.0, 39.0, 47.0, 57.0, 55.0, 49.0, 60.0, 57.0, 66.0, 59.0, 45.0, 47.0, 46.0, 39.0, 26.0, 25.0, 24.0, 16.0, 13.0, 5.0, 12.0, 9.0, 7.0, 6.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.928955078125, -3.78369140625, -3.638427734375, -3.4931640625, -3.347900390625, -3.20263671875, -3.057373046875, -2.912109375, -2.766845703125, -2.62158203125, -2.476318359375, -2.3310546875, -2.185791015625, -2.04052734375, -1.895263671875, -1.75, -1.604736328125, -1.45947265625, -1.314208984375, -1.1689453125, -1.023681640625, -0.87841796875, -0.733154296875, -0.587890625, -0.442626953125, -0.29736328125, -0.152099609375, -0.0068359375, 0.138427734375, 0.28369140625, 0.428955078125, 0.57421875, 0.719482421875, 0.86474609375, 1.010009765625, 1.1552734375, 1.300537109375, 1.44580078125, 1.591064453125, 1.736328125, 1.881591796875, 2.02685546875, 2.172119140625, 2.3173828125, 2.462646484375, 2.60791015625, 2.753173828125, 2.8984375, 3.043701171875, 3.18896484375, 3.334228515625, 3.4794921875, 3.624755859375, 3.77001953125, 3.915283203125, 4.060546875, 4.205810546875, 4.35107421875, 4.496337890625, 4.6416015625, 4.786865234375, 4.93212890625, 5.077392578125, 5.22265625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 17.0, 12.0, 24.0, 47.0, 72.0, 79.0, 144.0, 217.0, 314.0, 566.0, 848.0, 1409.0, 2380.0, 3919.0, 6377.0, 10913.0, 19197.0, 35894.0, 71492.0, 173669.0, 401817.0, 167831.0, 70319.0, 34976.0, 18902.0, 10935.0, 6340.0, 3791.0, 2297.0, 1395.0, 880.0, 512.0, 329.0, 234.0, 137.0, 86.0, 55.0, 36.0, 21.0, 25.0, 12.0, 12.0, 4.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1732177734375, -0.1673431396484375, -0.161468505859375, -0.1555938720703125, -0.14971923828125, -0.1438446044921875, -0.137969970703125, -0.1320953369140625, -0.126220703125, -0.1203460693359375, -0.114471435546875, -0.1085968017578125, -0.10272216796875, -0.0968475341796875, -0.090972900390625, -0.0850982666015625, -0.0792236328125, -0.0733489990234375, -0.067474365234375, -0.0615997314453125, -0.05572509765625, -0.0498504638671875, -0.043975830078125, -0.0381011962890625, -0.0322265625, -0.0263519287109375, -0.020477294921875, -0.0146026611328125, -0.00872802734375, -0.0028533935546875, 0.003021240234375, 0.0088958740234375, 0.0147705078125, 0.0206451416015625, 0.026519775390625, 0.0323944091796875, 0.03826904296875, 0.0441436767578125, 0.050018310546875, 0.0558929443359375, 0.061767578125, 0.0676422119140625, 0.073516845703125, 0.0793914794921875, 0.08526611328125, 0.0911407470703125, 0.097015380859375, 0.1028900146484375, 0.1087646484375, 0.1146392822265625, 0.120513916015625, 0.1263885498046875, 0.13226318359375, 0.1381378173828125, 0.144012451171875, 0.1498870849609375, 0.15576171875, 0.1616363525390625, 0.167510986328125, 0.1733856201171875, 0.17926025390625, 0.1851348876953125, 0.191009521484375, 0.1968841552734375, 0.2027587890625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 5.0, 5.0, 1.0, 6.0, 4.0, 7.0, 5.0, 4.0, 15.0, 18.0, 22.0, 15.0, 19.0, 19.0, 26.0, 32.0, 26.0, 32.0, 15.0, 36.0, 38.0, 33.0, 32.0, 45.0, 40.0, 1062.0, 45.0, 37.0, 38.0, 39.0, 29.0, 34.0, 30.0, 25.0, 23.0, 17.0, 26.0, 13.0, 16.0, 14.0, 13.0, 9.0, 16.0, 5.0, 13.0, 5.0, 3.0, 2.0, 4.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.4140625, -2.337371826171875, -2.26068115234375, -2.183990478515625, -2.1072998046875, -2.030609130859375, -1.95391845703125, -1.877227783203125, -1.800537109375, -1.723846435546875, -1.64715576171875, -1.570465087890625, -1.4937744140625, -1.417083740234375, -1.34039306640625, -1.263702392578125, -1.18701171875, -1.110321044921875, -1.03363037109375, -0.956939697265625, -0.8802490234375, -0.803558349609375, -0.72686767578125, -0.650177001953125, -0.573486328125, -0.496795654296875, -0.42010498046875, -0.343414306640625, -0.2667236328125, -0.190032958984375, -0.11334228515625, -0.036651611328125, 0.0400390625, 0.116729736328125, 0.19342041015625, 0.270111083984375, 0.3468017578125, 0.423492431640625, 0.50018310546875, 0.576873779296875, 0.653564453125, 0.730255126953125, 0.80694580078125, 0.883636474609375, 0.9603271484375, 1.037017822265625, 1.11370849609375, 1.190399169921875, 1.26708984375, 1.343780517578125, 1.42047119140625, 1.497161865234375, 1.5738525390625, 1.650543212890625, 1.72723388671875, 1.803924560546875, 1.880615234375, 1.957305908203125, 2.03399658203125, 2.110687255859375, 2.1873779296875, 2.264068603515625, 2.34075927734375, 2.417449951171875, 2.494140625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 3.0, 12.0, 13.0, 18.0, 31.0, 56.0, 96.0, 122.0, 195.0, 282.0, 393.0, 624.0, 920.0, 1398.0, 2062.0, 3192.0, 4920.0, 7545.0, 11559.0, 18265.0, 28626.0, 47529.0, 82902.0, 170920.0, 1348750.0, 163330.0, 79823.0, 45600.0, 28087.0, 17304.0, 11259.0, 7372.0, 4710.0, 3104.0, 2043.0, 1362.0, 872.0, 607.0, 423.0, 267.0, 167.0, 131.0, 81.0, 65.0, 32.0, 16.0, 12.0, 9.0, 11.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.087158203125, -0.08438873291015625, -0.0816192626953125, -0.07884979248046875, -0.076080322265625, -0.07331085205078125, -0.0705413818359375, -0.06777191162109375, -0.06500244140625, -0.06223297119140625, -0.0594635009765625, -0.05669403076171875, -0.053924560546875, -0.05115509033203125, -0.0483856201171875, -0.04561614990234375, -0.0428466796875, -0.04007720947265625, -0.0373077392578125, -0.03453826904296875, -0.031768798828125, -0.02899932861328125, -0.0262298583984375, -0.02346038818359375, -0.02069091796875, -0.01792144775390625, -0.0151519775390625, -0.01238250732421875, -0.009613037109375, -0.00684356689453125, -0.0040740966796875, -0.00130462646484375, 0.00146484375, 0.00423431396484375, 0.0070037841796875, 0.00977325439453125, 0.012542724609375, 0.01531219482421875, 0.0180816650390625, 0.02085113525390625, 0.02362060546875, 0.02639007568359375, 0.0291595458984375, 0.03192901611328125, 0.034698486328125, 0.03746795654296875, 0.0402374267578125, 0.04300689697265625, 0.0457763671875, 0.04854583740234375, 0.0513153076171875, 0.05408477783203125, 0.056854248046875, 0.05962371826171875, 0.0623931884765625, 0.06516265869140625, 0.06793212890625, 0.07070159912109375, 0.0734710693359375, 0.07624053955078125, 0.079010009765625, 0.08177947998046875, 0.0845489501953125, 0.08731842041015625, 0.090087890625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 2.0, 5.0, 5.0, 7.0, 8.0, 14.0, 14.0, 15.0, 19.0, 18.0, 26.0, 16.0, 27.0, 37.0, 35.0, 51.0, 38.0, 38.0, 38.0, 39.0, 39.0, 37.0, 39.0, 40.0, 39.0, 39.0, 39.0, 31.0, 18.0, 29.0, 35.0, 27.0, 22.0, 20.0, 20.0, 14.0, 8.0, 12.0, 11.0, 1.0, 5.0, 5.0, 5.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.1365623474121094e-05, -4.0121376514434814e-05, -3.8877129554748535e-05, -3.7632882595062256e-05, -3.6388635635375977e-05, -3.51443886756897e-05, -3.390014171600342e-05, -3.265589475631714e-05, -3.141164779663086e-05, -3.016740083694458e-05, -2.89231538772583e-05, -2.767890691757202e-05, -2.6434659957885742e-05, -2.5190412998199463e-05, -2.3946166038513184e-05, -2.2701919078826904e-05, -2.1457672119140625e-05, -2.0213425159454346e-05, -1.8969178199768066e-05, -1.7724931240081787e-05, -1.6480684280395508e-05, -1.5236437320709229e-05, -1.399219036102295e-05, -1.274794340133667e-05, -1.150369644165039e-05, -1.0259449481964111e-05, -9.015202522277832e-06, -7.770955562591553e-06, -6.5267086029052734e-06, -5.282461643218994e-06, -4.038214683532715e-06, -2.7939677238464355e-06, -1.5497207641601562e-06, -3.0547380447387695e-07, 9.387731552124023e-07, 2.1830201148986816e-06, 3.427267074584961e-06, 4.67151403427124e-06, 5.9157609939575195e-06, 7.160007953643799e-06, 8.404254913330078e-06, 9.648501873016357e-06, 1.0892748832702637e-05, 1.2136995792388916e-05, 1.3381242752075195e-05, 1.4625489711761475e-05, 1.5869736671447754e-05, 1.7113983631134033e-05, 1.8358230590820312e-05, 1.9602477550506592e-05, 2.084672451019287e-05, 2.209097146987915e-05, 2.333521842956543e-05, 2.457946538925171e-05, 2.5823712348937988e-05, 2.7067959308624268e-05, 2.8312206268310547e-05, 2.9556453227996826e-05, 3.0800700187683105e-05, 3.2044947147369385e-05, 3.3289194107055664e-05, 3.453344106674194e-05, 3.577768802642822e-05, 3.70219349861145e-05, 3.826618194580078e-05]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 6.0, 5.0, 3.0, 5.0, 14.0, 4.0, 18.0, 38.0, 24.0, 43.0, 42.0, 55.0, 69.0, 80.0, 117.0, 154.0, 254.0, 473.0, 2195.0, 30540.0, 521802.0, 463598.0, 25702.0, 1839.0, 509.0, 274.0, 171.0, 111.0, 92.0, 58.0, 49.0, 46.0, 26.0, 30.0, 22.0, 18.0, 14.0, 8.0, 9.0, 8.0, 5.0, 4.0, 2.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005526542663574219, -0.0005342140793800354, -0.0005157738924026489, -0.0004973337054252625, -0.000478893518447876, -0.0004604533314704895, -0.00044201314449310303, -0.00042357295751571655, -0.0004051327705383301, -0.0003866925835609436, -0.00036825239658355713, -0.00034981220960617065, -0.0003313720226287842, -0.0003129318356513977, -0.00029449164867401123, -0.00027605146169662476, -0.0002576112747192383, -0.0002391710877418518, -0.00022073090076446533, -0.00020229071378707886, -0.00018385052680969238, -0.0001654103398323059, -0.00014697015285491943, -0.00012852996587753296, -0.00011008977890014648, -9.164959192276001e-05, -7.320940494537354e-05, -5.476921796798706e-05, -3.6329030990600586e-05, -1.788884401321411e-05, 5.513429641723633e-07, 1.8991529941558838e-05, 3.743171691894531e-05, 5.587190389633179e-05, 7.431209087371826e-05, 9.275227785110474e-05, 0.00011119246482849121, 0.00012963265180587769, 0.00014807283878326416, 0.00016651302576065063, 0.0001849532127380371, 0.00020339339971542358, 0.00022183358669281006, 0.00024027377367019653, 0.000258713960647583, 0.0002771541476249695, 0.00029559433460235596, 0.00031403452157974243, 0.0003324747085571289, 0.0003509148955345154, 0.00036935508251190186, 0.00038779526948928833, 0.0004062354564666748, 0.0004246756434440613, 0.00044311583042144775, 0.00046155601739883423, 0.0004799962043762207, 0.0004984363913536072, 0.0005168765783309937, 0.0005353167653083801, 0.0005537569522857666, 0.0005721971392631531, 0.0005906373262405396, 0.000609077513217926, 0.0006275177001953125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 33.0, 224.0, 521.0, 197.0, 33.0, 3.0, 1.0, 1.0], "bins": [-0.0005321917124092579, -0.0005230947863310575, -0.0005139978602528572, -0.0005049009341746569, -0.0004958040080964565, -0.0004867070820182562, -0.00047761015594005585, -0.0004685132298618555, -0.00045941630378365517, -0.0004503193777054548, -0.0004412224516272545, -0.00043212552554905415, -0.0004230285994708538, -0.00041393167339265347, -0.0004048347473144531, -0.0003957378212362528, -0.000386640866054222, -0.00037754393997602165, -0.0003684470138978213, -0.00035935008781962097, -0.0003502531617414206, -0.0003411562356632203, -0.00033205930958501995, -0.00032296235440298915, -0.0003138654283247888, -0.00030476850224658847, -0.00029567157616838813, -0.0002865746500901878, -0.00027747772401198745, -0.0002683807979337871, -0.00025928387185558677, -0.0002501869457773864, -0.0002410900196991861, -0.00023199309362098575, -0.0002228961675427854, -0.00021379924146458507, -0.00020470231538638473, -0.00019560538930818439, -0.00018650844867806882, -0.00017741152259986848, -0.00016831459652166814, -0.0001592176704434678, -0.00015012074436526746, -0.00014102381828706712, -0.00013192687765695155, -0.0001228299515787512, -0.00011373302550055087, -0.00010463609942235053, -9.553917334415019e-05, -8.644224726594985e-05, -7.73453211877495e-05, -6.824838783359155e-05, -5.915146175539121e-05, -5.005453567719087e-05, -4.095760596101172e-05, -3.1860676244832575e-05, -2.2763750166632235e-05, -1.3666822269442491e-05, -4.569894372252747e-06, 4.527033524936996e-06, 1.362396142212674e-05, 2.272088750032708e-05, 3.181781721650623e-05, 4.0914746932685375e-05, 5.0011673010885715e-05]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 4.0, 12.0, 12.0, 12.0, 12.0, 14.0, 19.0, 23.0, 27.0, 39.0, 38.0, 23.0, 48.0, 36.0, 45.0, 38.0, 40.0, 37.0, 37.0, 38.0, 37.0, 44.0, 39.0, 41.0, 40.0, 27.0, 31.0, 29.0, 34.0, 12.0, 18.0, 15.0, 10.0, 13.0, 15.0, 13.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.950429916381836e-05, -2.8464943170547485e-05, -2.742558717727661e-05, -2.6386231184005737e-05, -2.5346875190734863e-05, -2.430751919746399e-05, -2.3268163204193115e-05, -2.222880721092224e-05, -2.1189451217651367e-05, -2.0150095224380493e-05, -1.911073923110962e-05, -1.8071383237838745e-05, -1.703202724456787e-05, -1.5992671251296997e-05, -1.4953315258026123e-05, -1.3913959264755249e-05, -1.2874603271484375e-05, -1.1835247278213501e-05, -1.0795891284942627e-05, -9.756535291671753e-06, -8.717179298400879e-06, -7.677823305130005e-06, -6.638467311859131e-06, -5.599111318588257e-06, -4.559755325317383e-06, -3.520399332046509e-06, -2.4810433387756348e-06, -1.4416873455047607e-06, -4.023313522338867e-07, 6.370246410369873e-07, 1.6763806343078613e-06, 2.7157366275787354e-06, 3.7550926208496094e-06, 4.794448614120483e-06, 5.833804607391357e-06, 6.8731606006622314e-06, 7.912516593933105e-06, 8.95187258720398e-06, 9.991228580474854e-06, 1.1030584573745728e-05, 1.2069940567016602e-05, 1.3109296560287476e-05, 1.414865255355835e-05, 1.5188008546829224e-05, 1.6227364540100098e-05, 1.726672053337097e-05, 1.8306076526641846e-05, 1.934543251991272e-05, 2.0384788513183594e-05, 2.1424144506454468e-05, 2.2463500499725342e-05, 2.3502856492996216e-05, 2.454221248626709e-05, 2.5581568479537964e-05, 2.6620924472808838e-05, 2.7660280466079712e-05, 2.8699636459350586e-05, 2.973899245262146e-05, 3.0778348445892334e-05, 3.181770443916321e-05, 3.285706043243408e-05, 3.3896416425704956e-05, 3.493577241897583e-05, 3.5975128412246704e-05, 3.701448440551758e-05]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 11.0, 8.0, 18.0, 12.0, 19.0, 23.0, 22.0, 28.0, 26.0, 39.0, 47.0, 57.0, 55.0, 49.0, 60.0, 57.0, 66.0, 59.0, 45.0, 47.0, 46.0, 39.0, 26.0, 25.0, 24.0, 16.0, 13.0, 5.0, 12.0, 9.0, 7.0, 6.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.928955078125, -3.78369140625, -3.638427734375, -3.4931640625, -3.347900390625, -3.20263671875, -3.057373046875, -2.912109375, -2.766845703125, -2.62158203125, -2.476318359375, -2.3310546875, -2.185791015625, -2.04052734375, -1.895263671875, -1.75, -1.604736328125, -1.45947265625, -1.314208984375, -1.1689453125, -1.023681640625, -0.87841796875, -0.733154296875, -0.587890625, -0.442626953125, -0.29736328125, -0.152099609375, -0.0068359375, 0.138427734375, 0.28369140625, 0.428955078125, 0.57421875, 0.719482421875, 0.86474609375, 1.010009765625, 1.1552734375, 1.300537109375, 1.44580078125, 1.591064453125, 1.736328125, 1.881591796875, 2.02685546875, 2.172119140625, 2.3173828125, 2.462646484375, 2.60791015625, 2.753173828125, 2.8984375, 3.043701171875, 3.18896484375, 3.334228515625, 3.4794921875, 3.624755859375, 3.77001953125, 3.915283203125, 4.060546875, 4.205810546875, 4.35107421875, 4.496337890625, 4.6416015625, 4.786865234375, 4.93212890625, 5.077392578125, 5.22265625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 9.0, 10.0, 16.0, 20.0, 27.0, 34.0, 53.0, 82.0, 127.0, 156.0, 231.0, 383.0, 556.0, 820.0, 1283.0, 1919.0, 3054.0, 4938.0, 8307.0, 15069.0, 29085.0, 61713.0, 156102.0, 399820.0, 208913.0, 77165.0, 35325.0, 17937.0, 9815.0, 5843.0, 3380.0, 2184.0, 1372.0, 921.0, 579.0, 410.0, 265.0, 180.0, 154.0, 75.0, 67.0, 60.0, 21.0, 17.0, 18.0, 14.0, 10.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8046875, -2.713134765625, -2.62158203125, -2.530029296875, -2.4384765625, -2.346923828125, -2.25537109375, -2.163818359375, -2.072265625, -1.980712890625, -1.88916015625, -1.797607421875, -1.7060546875, -1.614501953125, -1.52294921875, -1.431396484375, -1.33984375, -1.248291015625, -1.15673828125, -1.065185546875, -0.9736328125, -0.882080078125, -0.79052734375, -0.698974609375, -0.607421875, -0.515869140625, -0.42431640625, -0.332763671875, -0.2412109375, -0.149658203125, -0.05810546875, 0.033447265625, 0.125, 0.216552734375, 0.30810546875, 0.399658203125, 0.4912109375, 0.582763671875, 0.67431640625, 0.765869140625, 0.857421875, 0.948974609375, 1.04052734375, 1.132080078125, 1.2236328125, 1.315185546875, 1.40673828125, 1.498291015625, 1.58984375, 1.681396484375, 1.77294921875, 1.864501953125, 1.9560546875, 2.047607421875, 2.13916015625, 2.230712890625, 2.322265625, 2.413818359375, 2.50537109375, 2.596923828125, 2.6884765625, 2.780029296875, 2.87158203125, 2.963134765625, 3.0546875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 8.0, 5.0, 3.0, 4.0, 9.0, 5.0, 7.0, 14.0, 16.0, 22.0, 18.0, 24.0, 17.0, 24.0, 29.0, 24.0, 27.0, 32.0, 28.0, 42.0, 47.0, 57.0, 77.0, 150.0, 1530.0, 269.0, 119.0, 53.0, 40.0, 29.0, 42.0, 29.0, 36.0, 28.0, 32.0, 29.0, 11.0, 22.0, 11.0, 8.0, 11.0, 6.0, 6.0, 10.0, 7.0, 11.0, 8.0, 5.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0], "bins": [-11.4921875, -11.1513671875, -10.810546875, -10.4697265625, -10.12890625, -9.7880859375, -9.447265625, -9.1064453125, -8.765625, -8.4248046875, -8.083984375, -7.7431640625, -7.40234375, -7.0615234375, -6.720703125, -6.3798828125, -6.0390625, -5.6982421875, -5.357421875, -5.0166015625, -4.67578125, -4.3349609375, -3.994140625, -3.6533203125, -3.3125, -2.9716796875, -2.630859375, -2.2900390625, -1.94921875, -1.6083984375, -1.267578125, -0.9267578125, -0.5859375, -0.2451171875, 0.095703125, 0.4365234375, 0.77734375, 1.1181640625, 1.458984375, 1.7998046875, 2.140625, 2.4814453125, 2.822265625, 3.1630859375, 3.50390625, 3.8447265625, 4.185546875, 4.5263671875, 4.8671875, 5.2080078125, 5.548828125, 5.8896484375, 6.23046875, 6.5712890625, 6.912109375, 7.2529296875, 7.59375, 7.9345703125, 8.275390625, 8.6162109375, 8.95703125, 9.2978515625, 9.638671875, 9.9794921875, 10.3203125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 10.0, 7.0, 10.0, 6.0, 8.0, 9.0, 13.0, 14.0, 17.0, 33.0, 26.0, 44.0, 58.0, 77.0, 100.0, 175.0, 214.0, 449.0, 1119.0, 4205.0, 28873.0, 966115.0, 2099111.0, 37332.0, 5038.0, 1214.0, 481.0, 263.0, 180.0, 113.0, 65.0, 58.0, 45.0, 45.0, 32.0, 29.0, 24.0, 23.0, 14.0, 10.0, 4.0, 7.0, 7.0, 5.0, 3.0, 7.0, 3.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-16.625, -16.07177734375, -15.5185546875, -14.96533203125, -14.412109375, -13.85888671875, -13.3056640625, -12.75244140625, -12.19921875, -11.64599609375, -11.0927734375, -10.53955078125, -9.986328125, -9.43310546875, -8.8798828125, -8.32666015625, -7.7734375, -7.22021484375, -6.6669921875, -6.11376953125, -5.560546875, -5.00732421875, -4.4541015625, -3.90087890625, -3.34765625, -2.79443359375, -2.2412109375, -1.68798828125, -1.134765625, -0.58154296875, -0.0283203125, 0.52490234375, 1.078125, 1.63134765625, 2.1845703125, 2.73779296875, 3.291015625, 3.84423828125, 4.3974609375, 4.95068359375, 5.50390625, 6.05712890625, 6.6103515625, 7.16357421875, 7.716796875, 8.27001953125, 8.8232421875, 9.37646484375, 9.9296875, 10.48291015625, 11.0361328125, 11.58935546875, 12.142578125, 12.69580078125, 13.2490234375, 13.80224609375, 14.35546875, 14.90869140625, 15.4619140625, 16.01513671875, 16.568359375, 17.12158203125, 17.6748046875, 18.22802734375, 18.78125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 53.0, 520.0, 425.0, 22.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.337419509887695, -9.378410339355469, -4.419402122497559, 0.5396060943603516, 5.498615264892578, 10.457624435424805, 15.416631698608398, 20.375642776489258, 25.33465003967285, 30.293659210205078, 35.25266647338867, 40.21167755126953, 45.170684814453125, 50.12969207763672, 55.08869934082031, 60.04771423339844, 65.00672149658203, 69.96572875976562, 74.92473602294922, 79.88374328613281, 84.84275817871094, 89.80176544189453, 94.76077270507812, 99.71978759765625, 104.67878723144531, 109.6377944946289, 114.5968017578125, 119.55581665039062, 124.51482391357422, 129.4738311767578, 134.43283081054688, 139.391845703125, 144.35084533691406, 149.3098602294922, 154.26885986328125, 159.22787475585938, 164.18687438964844, 169.14588928222656, 174.10488891601562, 179.06390380859375, 184.02291870117188, 188.98193359375, 193.94093322753906, 198.8999481201172, 203.85894775390625, 208.81796264648438, 213.7769775390625, 218.73597717285156, 223.69497680664062, 228.65399169921875, 233.6129913330078, 238.57200622558594, 243.531005859375, 248.49002075195312, 253.44903564453125, 258.4080505371094, 263.3670654296875, 268.3260803222656, 273.28509521484375, 278.24407958984375, 283.2030944824219, 288.162109375, 293.1211242675781, 298.08013916015625, 303.03912353515625]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 4.0, 11.0, 12.0, 4.0, 13.0, 13.0, 12.0, 20.0, 13.0, 22.0, 21.0, 31.0, 26.0, 25.0, 40.0, 45.0, 47.0, 44.0, 25.0, 36.0, 37.0, 36.0, 30.0, 48.0, 31.0, 41.0, 31.0, 36.0, 26.0, 28.0, 28.0, 21.0, 26.0, 20.0, 15.0, 12.0, 15.0, 13.0, 3.0, 5.0, 9.0, 8.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.43107604980469, -36.24427032470703, -35.05746078491211, -33.87065124511719, -32.68384552001953, -31.497037887573242, -30.310230255126953, -29.123422622680664, -27.936614990234375, -26.749807357788086, -25.562999725341797, -24.376192092895508, -23.18938446044922, -22.00257682800293, -20.81576919555664, -19.62896156311035, -18.442153930664062, -17.255346298217773, -16.068538665771484, -14.881731033325195, -13.694923400878906, -12.508115768432617, -11.321308135986328, -10.134500503540039, -8.94769287109375, -7.760885238647461, -6.574077606201172, -5.387269973754883, -4.200462341308594, -3.0136547088623047, -1.8268470764160156, -0.6400394439697266, 0.5467720031738281, 1.7335796356201172, 2.9203872680664062, 4.107194900512695, 5.294002532958984, 6.480810165405273, 7.6676177978515625, 8.854425430297852, 10.04123306274414, 11.22804069519043, 12.414848327636719, 13.601655960083008, 14.788463592529297, 15.975271224975586, 17.162078857421875, 18.348886489868164, 19.535694122314453, 20.722501754760742, 21.90930938720703, 23.09611701965332, 24.28292465209961, 25.4697322845459, 26.656539916992188, 27.843347549438477, 29.030155181884766, 30.216962814331055, 31.403770446777344, 32.590576171875, 33.77738571166992, 34.964195251464844, 36.1510009765625, 37.337806701660156, 38.52461624145508]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 10.0, 6.0, 8.0, 9.0, 11.0, 22.0, 18.0, 15.0, 21.0, 19.0, 26.0, 38.0, 29.0, 43.0, 66.0, 51.0, 44.0, 57.0, 54.0, 61.0, 55.0, 48.0, 39.0, 46.0, 33.0, 31.0, 20.0, 19.0, 22.0, 19.0, 10.0, 8.0, 7.0, 8.0, 4.0, 7.0, 6.0, 2.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.93359375, -3.79736328125, -3.6611328125, -3.52490234375, -3.388671875, -3.25244140625, -3.1162109375, -2.97998046875, -2.84375, -2.70751953125, -2.5712890625, -2.43505859375, -2.298828125, -2.16259765625, -2.0263671875, -1.89013671875, -1.75390625, -1.61767578125, -1.4814453125, -1.34521484375, -1.208984375, -1.07275390625, -0.9365234375, -0.80029296875, -0.6640625, -0.52783203125, -0.3916015625, -0.25537109375, -0.119140625, 0.01708984375, 0.1533203125, 0.28955078125, 0.42578125, 0.56201171875, 0.6982421875, 0.83447265625, 0.970703125, 1.10693359375, 1.2431640625, 1.37939453125, 1.515625, 1.65185546875, 1.7880859375, 1.92431640625, 2.060546875, 2.19677734375, 2.3330078125, 2.46923828125, 2.60546875, 2.74169921875, 2.8779296875, 3.01416015625, 3.150390625, 3.28662109375, 3.4228515625, 3.55908203125, 3.6953125, 3.83154296875, 3.9677734375, 4.10400390625, 4.240234375, 4.37646484375, 4.5126953125, 4.64892578125, 4.78515625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 5.0, 4.0, 14.0, 10.0, 27.0, 31.0, 35.0, 55.0, 96.0, 140.0, 218.0, 489.0, 871.0, 2081.0, 6880.0, 30870.0, 272511.0, 3409860.0, 416115.0, 40825.0, 8569.0, 2562.0, 917.0, 441.0, 246.0, 137.0, 84.0, 60.0, 46.0, 35.0, 18.0, 18.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.46875, -19.876708984375, -19.28466796875, -18.692626953125, -18.1005859375, -17.508544921875, -16.91650390625, -16.324462890625, -15.732421875, -15.140380859375, -14.54833984375, -13.956298828125, -13.3642578125, -12.772216796875, -12.18017578125, -11.588134765625, -10.99609375, -10.404052734375, -9.81201171875, -9.219970703125, -8.6279296875, -8.035888671875, -7.44384765625, -6.851806640625, -6.259765625, -5.667724609375, -5.07568359375, -4.483642578125, -3.8916015625, -3.299560546875, -2.70751953125, -2.115478515625, -1.5234375, -0.931396484375, -0.33935546875, 0.252685546875, 0.8447265625, 1.436767578125, 2.02880859375, 2.620849609375, 3.212890625, 3.804931640625, 4.39697265625, 4.989013671875, 5.5810546875, 6.173095703125, 6.76513671875, 7.357177734375, 7.94921875, 8.541259765625, 9.13330078125, 9.725341796875, 10.3173828125, 10.909423828125, 11.50146484375, 12.093505859375, 12.685546875, 13.277587890625, 13.86962890625, 14.461669921875, 15.0537109375, 15.645751953125, 16.23779296875, 16.829833984375, 17.421875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 4.0, 9.0, 11.0, 15.0, 24.0, 24.0, 35.0, 38.0, 71.0, 96.0, 118.0, 143.0, 259.0, 326.0, 453.0, 573.0, 503.0, 390.0, 274.0, 198.0, 139.0, 92.0, 79.0, 55.0, 39.0, 33.0, 21.0, 15.0, 10.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8671875, -10.5338134765625, -10.200439453125, -9.8670654296875, -9.53369140625, -9.2003173828125, -8.866943359375, -8.5335693359375, -8.2001953125, -7.8668212890625, -7.533447265625, -7.2000732421875, -6.86669921875, -6.5333251953125, -6.199951171875, -5.8665771484375, -5.533203125, -5.1998291015625, -4.866455078125, -4.5330810546875, -4.19970703125, -3.8663330078125, -3.532958984375, -3.1995849609375, -2.8662109375, -2.5328369140625, -2.199462890625, -1.8660888671875, -1.53271484375, -1.1993408203125, -0.865966796875, -0.5325927734375, -0.19921875, 0.1341552734375, 0.467529296875, 0.8009033203125, 1.13427734375, 1.4676513671875, 1.801025390625, 2.1343994140625, 2.4677734375, 2.8011474609375, 3.134521484375, 3.4678955078125, 3.80126953125, 4.1346435546875, 4.468017578125, 4.8013916015625, 5.134765625, 5.4681396484375, 5.801513671875, 6.1348876953125, 6.46826171875, 6.8016357421875, 7.135009765625, 7.4683837890625, 7.8017578125, 8.1351318359375, 8.468505859375, 8.8018798828125, 9.13525390625, 9.4686279296875, 9.802001953125, 10.1353759765625, 10.46875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 12.0, 12.0, 19.0, 45.0, 70.0, 83.0, 149.0, 244.0, 369.0, 624.0, 1063.0, 2008.0, 4012.0, 8599.0, 20123.0, 54053.0, 173617.0, 710912.0, 2291608.0, 672942.0, 165671.0, 52058.0, 19403.0, 8184.0, 3747.0, 1950.0, 1108.0, 601.0, 369.0, 218.0, 149.0, 79.0, 54.0, 45.0, 27.0, 16.0, 17.0, 6.0, 0.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.390625, -11.9703369140625, -11.550048828125, -11.1297607421875, -10.70947265625, -10.2891845703125, -9.868896484375, -9.4486083984375, -9.0283203125, -8.6080322265625, -8.187744140625, -7.7674560546875, -7.34716796875, -6.9268798828125, -6.506591796875, -6.0863037109375, -5.666015625, -5.2457275390625, -4.825439453125, -4.4051513671875, -3.98486328125, -3.5645751953125, -3.144287109375, -2.7239990234375, -2.3037109375, -1.8834228515625, -1.463134765625, -1.0428466796875, -0.62255859375, -0.2022705078125, 0.218017578125, 0.6383056640625, 1.05859375, 1.4788818359375, 1.899169921875, 2.3194580078125, 2.73974609375, 3.1600341796875, 3.580322265625, 4.0006103515625, 4.4208984375, 4.8411865234375, 5.261474609375, 5.6817626953125, 6.10205078125, 6.5223388671875, 6.942626953125, 7.3629150390625, 7.783203125, 8.2034912109375, 8.623779296875, 9.0440673828125, 9.46435546875, 9.8846435546875, 10.304931640625, 10.7252197265625, 11.1455078125, 11.5657958984375, 11.986083984375, 12.4063720703125, 12.82666015625, 13.2469482421875, 13.667236328125, 14.0875244140625, 14.5078125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 11.0, 15.0, 40.0, 79.0, 114.0, 136.0, 161.0, 150.0, 111.0, 88.0, 50.0, 21.0, 16.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-107.01962280273438, -104.02365112304688, -101.0276870727539, -98.0317153930664, -95.0357437133789, -92.0397720336914, -89.04380798339844, -86.04783630371094, -83.05186462402344, -80.05589294433594, -77.05992889404297, -74.06395721435547, -71.06798553466797, -68.07201385498047, -65.0760498046875, -62.080078125, -59.084110260009766, -56.08814239501953, -53.09217071533203, -50.0962028503418, -47.1002311706543, -44.10426330566406, -41.10829162597656, -38.11232376098633, -35.116355895996094, -32.12038803100586, -29.12441635131836, -26.128448486328125, -23.132476806640625, -20.13650894165039, -17.140539169311523, -14.144569396972656, -11.148597717285156, -8.152627944946289, -5.15665864944458, -2.160689353942871, 0.8352804183959961, 3.8312501907348633, 6.827219009399414, 9.823188781738281, 12.819158554077148, 15.815128326416016, 18.811098098754883, 21.80706787109375, 24.803035736083984, 27.799007415771484, 30.79497528076172, 33.79094696044922, 36.78691482543945, 39.78288269042969, 42.77885437011719, 45.77482223510742, 48.77079391479492, 51.766761779785156, 54.762733459472656, 57.75870132446289, 60.754669189453125, 63.75063705444336, 66.7466049194336, 69.7425765991211, 72.7385482788086, 75.7345199584961, 78.73048400878906, 81.72645568847656, 84.72242736816406]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 2.0, 2.0, 5.0, 9.0, 8.0, 10.0, 12.0, 16.0, 20.0, 20.0, 18.0, 24.0, 25.0, 30.0, 40.0, 27.0, 29.0, 43.0, 34.0, 38.0, 37.0, 42.0, 30.0, 49.0, 41.0, 45.0, 36.0, 39.0, 31.0, 23.0, 30.0, 29.0, 17.0, 18.0, 27.0, 14.0, 12.0, 16.0, 15.0, 8.0, 7.0, 5.0, 5.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-34.2264404296875, -33.20804214477539, -32.18964767456055, -31.17125129699707, -30.152854919433594, -29.134456634521484, -28.116060256958008, -27.09766387939453, -26.079267501831055, -25.060871124267578, -24.0424747467041, -23.024078369140625, -22.005680084228516, -20.987285614013672, -19.968887329101562, -18.950490951538086, -17.93209457397461, -16.913698196411133, -15.895301818847656, -14.876904487609863, -13.858508110046387, -12.84011173248291, -11.821714401245117, -10.80331802368164, -9.784921646118164, -8.766525268554688, -7.748128414154053, -6.729731559753418, -5.711335182189941, -4.692938804626465, -3.67454195022583, -2.6561450958251953, -1.6377487182617188, -0.6193521022796631, 0.3990445137023926, 1.4174411296844482, 2.435837745666504, 3.4542341232299805, 4.472630977630615, 5.49102783203125, 6.509424209594727, 7.527820587158203, 8.54621696472168, 9.564614295959473, 10.58301067352295, 11.601407051086426, 12.619804382324219, 13.638200759887695, 14.656597137451172, 15.674993515014648, 16.693389892578125, 17.7117862701416, 18.730182647705078, 19.748580932617188, 20.766977310180664, 21.78537368774414, 22.803770065307617, 23.822166442871094, 24.84056282043457, 25.858959197998047, 26.877357482910156, 27.895751953125, 28.91415023803711, 29.932546615600586, 30.950942993164062]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 10.0, 7.0, 12.0, 12.0, 14.0, 19.0, 11.0, 24.0, 23.0, 38.0, 48.0, 49.0, 34.0, 43.0, 54.0, 43.0, 63.0, 63.0, 57.0, 37.0, 48.0, 42.0, 40.0, 29.0, 35.0, 23.0, 25.0, 23.0, 13.0, 12.0, 7.0, 5.0, 5.0, 8.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.47265625, -4.33099365234375, -4.1893310546875, -4.04766845703125, -3.906005859375, -3.76434326171875, -3.6226806640625, -3.48101806640625, -3.33935546875, -3.19769287109375, -3.0560302734375, -2.91436767578125, -2.772705078125, -2.63104248046875, -2.4893798828125, -2.34771728515625, -2.2060546875, -2.06439208984375, -1.9227294921875, -1.78106689453125, -1.639404296875, -1.49774169921875, -1.3560791015625, -1.21441650390625, -1.07275390625, -0.93109130859375, -0.7894287109375, -0.64776611328125, -0.506103515625, -0.36444091796875, -0.2227783203125, -0.08111572265625, 0.060546875, 0.20220947265625, 0.3438720703125, 0.48553466796875, 0.627197265625, 0.76885986328125, 0.9105224609375, 1.05218505859375, 1.19384765625, 1.33551025390625, 1.4771728515625, 1.61883544921875, 1.760498046875, 1.90216064453125, 2.0438232421875, 2.18548583984375, 2.3271484375, 2.46881103515625, 2.6104736328125, 2.75213623046875, 2.893798828125, 3.03546142578125, 3.1771240234375, 3.31878662109375, 3.46044921875, 3.60211181640625, 3.7437744140625, 3.88543701171875, 4.027099609375, 4.16876220703125, 4.3104248046875, 4.45208740234375, 4.59375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 7.0, 15.0, 16.0, 28.0, 33.0, 44.0, 95.0, 121.0, 151.0, 230.0, 345.0, 572.0, 790.0, 1283.0, 1993.0, 3209.0, 5252.0, 8830.0, 15010.0, 26915.0, 51252.0, 106727.0, 291301.0, 304120.0, 110772.0, 52800.0, 27622.0, 15670.0, 8928.0, 5266.0, 3230.0, 2038.0, 1354.0, 821.0, 561.0, 361.0, 245.0, 174.0, 109.0, 85.0, 54.0, 42.0, 21.0, 15.0, 15.0, 7.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1788330078125, -0.173248291015625, -0.16766357421875, -0.162078857421875, -0.156494140625, -0.150909423828125, -0.14532470703125, -0.139739990234375, -0.1341552734375, -0.128570556640625, -0.12298583984375, -0.117401123046875, -0.11181640625, -0.106231689453125, -0.10064697265625, -0.095062255859375, -0.0894775390625, -0.083892822265625, -0.07830810546875, -0.072723388671875, -0.067138671875, -0.061553955078125, -0.05596923828125, -0.050384521484375, -0.0447998046875, -0.039215087890625, -0.03363037109375, -0.028045654296875, -0.0224609375, -0.016876220703125, -0.01129150390625, -0.005706787109375, -0.0001220703125, 0.005462646484375, 0.01104736328125, 0.016632080078125, 0.022216796875, 0.027801513671875, 0.03338623046875, 0.038970947265625, 0.0445556640625, 0.050140380859375, 0.05572509765625, 0.061309814453125, 0.06689453125, 0.072479248046875, 0.07806396484375, 0.083648681640625, 0.0892333984375, 0.094818115234375, 0.10040283203125, 0.105987548828125, 0.111572265625, 0.117156982421875, 0.12274169921875, 0.128326416015625, 0.1339111328125, 0.139495849609375, 0.14508056640625, 0.150665283203125, 0.15625, 0.161834716796875, 0.16741943359375, 0.173004150390625, 0.1785888671875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 7.0, 13.0, 5.0, 13.0, 13.0, 12.0, 16.0, 28.0, 27.0, 25.0, 39.0, 34.0, 43.0, 38.0, 38.0, 38.0, 34.0, 1063.0, 33.0, 44.0, 50.0, 31.0, 33.0, 37.0, 41.0, 30.0, 37.0, 31.0, 22.0, 18.0, 17.0, 13.0, 21.0, 10.0, 16.0, 9.0, 11.0, 7.0, 6.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.716796875, -2.63177490234375, -2.5467529296875, -2.46173095703125, -2.376708984375, -2.29168701171875, -2.2066650390625, -2.12164306640625, -2.03662109375, -1.95159912109375, -1.8665771484375, -1.78155517578125, -1.696533203125, -1.61151123046875, -1.5264892578125, -1.44146728515625, -1.3564453125, -1.27142333984375, -1.1864013671875, -1.10137939453125, -1.016357421875, -0.93133544921875, -0.8463134765625, -0.76129150390625, -0.67626953125, -0.59124755859375, -0.5062255859375, -0.42120361328125, -0.336181640625, -0.25115966796875, -0.1661376953125, -0.08111572265625, 0.00390625, 0.08892822265625, 0.1739501953125, 0.25897216796875, 0.343994140625, 0.42901611328125, 0.5140380859375, 0.59906005859375, 0.68408203125, 0.76910400390625, 0.8541259765625, 0.93914794921875, 1.024169921875, 1.10919189453125, 1.1942138671875, 1.27923583984375, 1.3642578125, 1.44927978515625, 1.5343017578125, 1.61932373046875, 1.704345703125, 1.78936767578125, 1.8743896484375, 1.95941162109375, 2.04443359375, 2.12945556640625, 2.2144775390625, 2.29949951171875, 2.384521484375, 2.46954345703125, 2.5545654296875, 2.63958740234375, 2.724609375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 10.0, 5.0, 12.0, 23.0, 37.0, 51.0, 71.0, 111.0, 202.0, 317.0, 464.0, 761.0, 1179.0, 1870.0, 2889.0, 4740.0, 7753.0, 12763.0, 21273.0, 36231.0, 65661.0, 127659.0, 1324445.0, 240167.0, 108662.0, 57744.0, 32338.0, 19404.0, 11401.0, 7089.0, 4390.0, 2716.0, 1700.0, 1099.0, 684.0, 439.0, 260.0, 180.0, 106.0, 78.0, 52.0, 34.0, 27.0, 10.0, 11.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0982666015625, -0.0951852798461914, -0.09210395812988281, -0.08902263641357422, -0.08594131469726562, -0.08285999298095703, -0.07977867126464844, -0.07669734954833984, -0.07361602783203125, -0.07053470611572266, -0.06745338439941406, -0.06437206268310547, -0.061290740966796875, -0.05820941925048828, -0.05512809753417969, -0.052046775817871094, -0.0489654541015625, -0.045884132385253906, -0.04280281066894531, -0.03972148895263672, -0.036640167236328125, -0.03355884552001953, -0.030477523803710938, -0.027396202087402344, -0.02431488037109375, -0.021233558654785156, -0.018152236938476562, -0.015070915222167969, -0.011989593505859375, -0.008908271789550781, -0.0058269500732421875, -0.0027456283569335938, 0.000335693359375, 0.0034170150756835938, 0.0064983367919921875, 0.009579658508300781, 0.012660980224609375, 0.01574230194091797, 0.018823623657226562, 0.021904945373535156, 0.02498626708984375, 0.028067588806152344, 0.031148910522460938, 0.03423023223876953, 0.037311553955078125, 0.04039287567138672, 0.04347419738769531, 0.046555519104003906, 0.0496368408203125, 0.052718162536621094, 0.05579948425292969, 0.05888080596923828, 0.061962127685546875, 0.06504344940185547, 0.06812477111816406, 0.07120609283447266, 0.07428741455078125, 0.07736873626708984, 0.08045005798339844, 0.08353137969970703, 0.08661270141601562, 0.08969402313232422, 0.09277534484863281, 0.0958566665649414, 0.09893798828125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 9.0, 9.0, 13.0, 19.0, 29.0, 24.0, 32.0, 25.0, 37.0, 42.0, 40.0, 57.0, 68.0, 57.0, 53.0, 61.0, 53.0, 42.0, 41.0, 41.0, 36.0, 33.0, 34.0, 30.0, 27.0, 14.0, 13.0, 18.0, 8.0, 8.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.875659942626953e-05, -4.7369860112667084e-05, -4.5983120799064636e-05, -4.459638148546219e-05, -4.320964217185974e-05, -4.1822902858257294e-05, -4.0436163544654846e-05, -3.90494242310524e-05, -3.766268491744995e-05, -3.6275945603847504e-05, -3.4889206290245056e-05, -3.350246697664261e-05, -3.211572766304016e-05, -3.0728988349437714e-05, -2.9342249035835266e-05, -2.795550972223282e-05, -2.656877040863037e-05, -2.5182031095027924e-05, -2.3795291781425476e-05, -2.240855246782303e-05, -2.102181315422058e-05, -1.9635073840618134e-05, -1.8248334527015686e-05, -1.686159521341324e-05, -1.547485589981079e-05, -1.4088116586208344e-05, -1.2701377272605896e-05, -1.1314637959003448e-05, -9.927898645401001e-06, -8.541159331798553e-06, -7.154420018196106e-06, -5.7676807045936584e-06, -4.380941390991211e-06, -2.9942020773887634e-06, -1.607462763786316e-06, -2.207234501838684e-07, 1.166015863418579e-06, 2.5527551770210266e-06, 3.939494490623474e-06, 5.326233804225922e-06, 6.712973117828369e-06, 8.099712431430817e-06, 9.486451745033264e-06, 1.0873191058635712e-05, 1.225993037223816e-05, 1.3646669685840607e-05, 1.5033408999443054e-05, 1.6420148313045502e-05, 1.780688762664795e-05, 1.9193626940250397e-05, 2.0580366253852844e-05, 2.1967105567455292e-05, 2.335384488105774e-05, 2.4740584194660187e-05, 2.6127323508262634e-05, 2.7514062821865082e-05, 2.890080213546753e-05, 3.0287541449069977e-05, 3.1674280762672424e-05, 3.306102007627487e-05, 3.444775938987732e-05, 3.583449870347977e-05, 3.7221238017082214e-05, 3.860797733068466e-05, 3.999471664428711e-05]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 14.0, 12.0, 14.0, 15.0, 19.0, 22.0, 16.0, 27.0, 32.0, 43.0, 61.0, 105.0, 162.0, 372.0, 1433.0, 19053.0, 409140.0, 580801.0, 34058.0, 2136.0, 451.0, 176.0, 107.0, 62.0, 52.0, 34.0, 30.0, 23.0, 25.0, 14.0, 16.0, 5.0, 0.0, 10.0, 4.0, 1.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006575584411621094, -0.0006357058882713318, -0.0006138533353805542, -0.0005920007824897766, -0.000570148229598999, -0.0005482956767082214, -0.0005264431238174438, -0.0005045905709266663, -0.00048273801803588867, -0.0004608854651451111, -0.0004390329122543335, -0.0004171803593635559, -0.0003953278064727783, -0.00037347525358200073, -0.00035162270069122314, -0.00032977014780044556, -0.00030791759490966797, -0.0002860650420188904, -0.0002642124891281128, -0.0002423599362373352, -0.00022050738334655762, -0.00019865483045578003, -0.00017680227756500244, -0.00015494972467422485, -0.00013309717178344727, -0.00011124461889266968, -8.939206600189209e-05, -6.75395131111145e-05, -4.5686960220336914e-05, -2.3834407329559326e-05, -1.9818544387817383e-06, 1.987069845199585e-05, 4.172325134277344e-05, 6.357580423355103e-05, 8.542835712432861e-05, 0.0001072809100151062, 0.0001291334629058838, 0.00015098601579666138, 0.00017283856868743896, 0.00019469112157821655, 0.00021654367446899414, 0.00023839622735977173, 0.0002602487802505493, 0.0002821013331413269, 0.0003039538860321045, 0.0003258064389228821, 0.00034765899181365967, 0.00036951154470443726, 0.00039136409759521484, 0.00041321665048599243, 0.00043506920337677, 0.0004569217562675476, 0.0004787743091583252, 0.0005006268620491028, 0.0005224794149398804, 0.000544331967830658, 0.0005661845207214355, 0.0005880370736122131, 0.0006098896265029907, 0.0006317421793937683, 0.0006535947322845459, 0.0006754472851753235, 0.0006972998380661011, 0.0007191523909568787, 0.0007410049438476562]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 15.0, 30.0, 63.0, 150.0, 229.0, 244.0, 165.0, 69.0, 28.0, 13.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.304213482304476e-05, -4.825156429433264e-05, -4.346099740359932e-05, -3.86704268748872e-05, -3.3879856346175075e-05, -2.908928581746295e-05, -2.429871710774023e-05, -1.950814839801751e-05, -1.4717577869305387e-05, -9.927008250087965e-06, -5.136438630870543e-06, -3.4586901165312156e-07, 4.4447006075643e-06, 9.235271136276424e-06, 1.4025839845999144e-05, 1.8816408555721864e-05, 2.3606979084433988e-05, 2.839754961314611e-05, 3.318811650387943e-05, 3.797868703259155e-05, 4.2769257561303675e-05, 4.75598280900158e-05, 5.235039861872792e-05, 5.714096550946124e-05, 6.193153967615217e-05, 6.67221102048643e-05, 7.151268073357642e-05, 7.630325126228854e-05, 8.109382179100066e-05, 8.588438504375517e-05, 9.06749555724673e-05, 9.546552610117942e-05, 0.00010025608935393393, 0.00010504665988264605, 0.00010983723041135818, 0.0001146278009400703, 0.00011941837146878242, 0.00012420893472153693, 0.00012899951252620667, 0.00013379007577896118, 0.00013858065358363092, 0.00014337121683638543, 0.00014816179464105517, 0.00015295235789380968, 0.00015774293569847941, 0.00016253349895123392, 0.00016732407675590366, 0.00017211464000865817, 0.00017690520326141268, 0.0001816957665141672, 0.00018648634431883693, 0.00019127690757159144, 0.00019606748537626117, 0.00020085804862901568, 0.00020564862643368542, 0.00021043918968643993, 0.00021522975293919444, 0.00022002031619194895, 0.0002248108939966187, 0.0002296014572493732, 0.00023439203505404294, 0.00023918259830679744, 0.00024397317611146718, 0.0002487637393642217, 0.00025355431716889143]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 4.0, 8.0, 9.0, 7.0, 11.0, 9.0, 21.0, 23.0, 21.0, 18.0, 27.0, 22.0, 36.0, 38.0, 31.0, 40.0, 41.0, 54.0, 48.0, 43.0, 54.0, 45.0, 26.0, 38.0, 50.0, 46.0, 26.0, 28.0, 29.0, 27.0, 18.0, 16.0, 18.0, 18.0, 12.0, 11.0, 6.0, 9.0, 6.0, 1.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.0279159545898438e-05, -2.928357571363449e-05, -2.8287991881370544e-05, -2.7292408049106598e-05, -2.629682421684265e-05, -2.5301240384578705e-05, -2.4305656552314758e-05, -2.3310072720050812e-05, -2.2314488887786865e-05, -2.131890505552292e-05, -2.0323321223258972e-05, -1.9327737390995026e-05, -1.833215355873108e-05, -1.7336569726467133e-05, -1.6340985894203186e-05, -1.534540206193924e-05, -1.4349818229675293e-05, -1.3354234397411346e-05, -1.23586505651474e-05, -1.1363066732883453e-05, -1.0367482900619507e-05, -9.37189906835556e-06, -8.376315236091614e-06, -7.380731403827667e-06, -6.385147571563721e-06, -5.389563739299774e-06, -4.393979907035828e-06, -3.398396074771881e-06, -2.4028122425079346e-06, -1.407228410243988e-06, -4.116445779800415e-07, 5.83939254283905e-07, 1.5795230865478516e-06, 2.575106918811798e-06, 3.5706907510757446e-06, 4.566274583339691e-06, 5.561858415603638e-06, 6.557442247867584e-06, 7.553026080131531e-06, 8.548609912395477e-06, 9.544193744659424e-06, 1.053977757692337e-05, 1.1535361409187317e-05, 1.2530945241451263e-05, 1.352652907371521e-05, 1.4522112905979156e-05, 1.5517696738243103e-05, 1.651328057050705e-05, 1.7508864402770996e-05, 1.8504448235034943e-05, 1.950003206729889e-05, 2.0495615899562836e-05, 2.1491199731826782e-05, 2.248678356409073e-05, 2.3482367396354675e-05, 2.4477951228618622e-05, 2.547353506088257e-05, 2.6469118893146515e-05, 2.746470272541046e-05, 2.8460286557674408e-05, 2.9455870389938354e-05, 3.04514542222023e-05, 3.144703805446625e-05, 3.2442621886730194e-05, 3.343820571899414e-05]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 10.0, 7.0, 12.0, 12.0, 14.0, 19.0, 11.0, 24.0, 23.0, 38.0, 48.0, 49.0, 34.0, 43.0, 54.0, 43.0, 63.0, 63.0, 57.0, 37.0, 48.0, 42.0, 40.0, 29.0, 35.0, 23.0, 25.0, 23.0, 13.0, 12.0, 7.0, 5.0, 5.0, 8.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.47265625, -4.33099365234375, -4.1893310546875, -4.04766845703125, -3.906005859375, -3.76434326171875, -3.6226806640625, -3.48101806640625, -3.33935546875, -3.19769287109375, -3.0560302734375, -2.91436767578125, -2.772705078125, -2.63104248046875, -2.4893798828125, -2.34771728515625, -2.2060546875, -2.06439208984375, -1.9227294921875, -1.78106689453125, -1.639404296875, -1.49774169921875, -1.3560791015625, -1.21441650390625, -1.07275390625, -0.93109130859375, -0.7894287109375, -0.64776611328125, -0.506103515625, -0.36444091796875, -0.2227783203125, -0.08111572265625, 0.060546875, 0.20220947265625, 0.3438720703125, 0.48553466796875, 0.627197265625, 0.76885986328125, 0.9105224609375, 1.05218505859375, 1.19384765625, 1.33551025390625, 1.4771728515625, 1.61883544921875, 1.760498046875, 1.90216064453125, 2.0438232421875, 2.18548583984375, 2.3271484375, 2.46881103515625, 2.6104736328125, 2.75213623046875, 2.893798828125, 3.03546142578125, 3.1771240234375, 3.31878662109375, 3.46044921875, 3.60211181640625, 3.7437744140625, 3.88543701171875, 4.027099609375, 4.16876220703125, 4.3104248046875, 4.45208740234375, 4.59375]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 8.0, 5.0, 4.0, 15.0, 8.0, 16.0, 14.0, 27.0, 36.0, 41.0, 68.0, 91.0, 166.0, 234.0, 484.0, 1029.0, 2487.0, 8328.0, 41038.0, 798738.0, 166975.0, 20407.0, 4903.0, 1705.0, 723.0, 396.0, 194.0, 124.0, 72.0, 58.0, 50.0, 22.0, 19.0, 11.0, 16.0, 12.0, 10.0, 2.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5859375, -13.1141357421875, -12.642333984375, -12.1705322265625, -11.69873046875, -11.2269287109375, -10.755126953125, -10.2833251953125, -9.8115234375, -9.3397216796875, -8.867919921875, -8.3961181640625, -7.92431640625, -7.4525146484375, -6.980712890625, -6.5089111328125, -6.037109375, -5.5653076171875, -5.093505859375, -4.6217041015625, -4.14990234375, -3.6781005859375, -3.206298828125, -2.7344970703125, -2.2626953125, -1.7908935546875, -1.319091796875, -0.8472900390625, -0.37548828125, 0.0963134765625, 0.568115234375, 1.0399169921875, 1.51171875, 1.9835205078125, 2.455322265625, 2.9271240234375, 3.39892578125, 3.8707275390625, 4.342529296875, 4.8143310546875, 5.2861328125, 5.7579345703125, 6.229736328125, 6.7015380859375, 7.17333984375, 7.6451416015625, 8.116943359375, 8.5887451171875, 9.060546875, 9.5323486328125, 10.004150390625, 10.4759521484375, 10.94775390625, 11.4195556640625, 11.891357421875, 12.3631591796875, 12.8349609375, 13.3067626953125, 13.778564453125, 14.2503662109375, 14.72216796875, 15.1939697265625, 15.665771484375, 16.1375732421875, 16.609375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 0.0, 4.0, 3.0, 7.0, 6.0, 15.0, 8.0, 9.0, 22.0, 14.0, 28.0, 25.0, 34.0, 19.0, 23.0, 44.0, 35.0, 33.0, 52.0, 52.0, 95.0, 191.0, 1679.0, 132.0, 84.0, 57.0, 47.0, 42.0, 38.0, 33.0, 39.0, 21.0, 31.0, 13.0, 20.0, 17.0, 12.0, 14.0, 13.0, 12.0, 8.0, 5.0, 11.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5, -13.08203125, -12.6640625, -12.24609375, -11.828125, -11.41015625, -10.9921875, -10.57421875, -10.15625, -9.73828125, -9.3203125, -8.90234375, -8.484375, -8.06640625, -7.6484375, -7.23046875, -6.8125, -6.39453125, -5.9765625, -5.55859375, -5.140625, -4.72265625, -4.3046875, -3.88671875, -3.46875, -3.05078125, -2.6328125, -2.21484375, -1.796875, -1.37890625, -0.9609375, -0.54296875, -0.125, 0.29296875, 0.7109375, 1.12890625, 1.546875, 1.96484375, 2.3828125, 2.80078125, 3.21875, 3.63671875, 4.0546875, 4.47265625, 4.890625, 5.30859375, 5.7265625, 6.14453125, 6.5625, 6.98046875, 7.3984375, 7.81640625, 8.234375, 8.65234375, 9.0703125, 9.48828125, 9.90625, 10.32421875, 10.7421875, 11.16015625, 11.578125, 11.99609375, 12.4140625, 12.83203125, 13.25]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 6.0, 8.0, 8.0, 10.0, 8.0, 14.0, 10.0, 18.0, 22.0, 19.0, 37.0, 50.0, 70.0, 94.0, 128.0, 205.0, 338.0, 943.0, 3496.0, 19726.0, 223352.0, 2811749.0, 72684.0, 9216.0, 2017.0, 616.0, 266.0, 166.0, 104.0, 75.0, 50.0, 40.0, 33.0, 30.0, 22.0, 21.0, 11.0, 12.0, 12.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-26.46875, -25.673828125, -24.87890625, -24.083984375, -23.2890625, -22.494140625, -21.69921875, -20.904296875, -20.109375, -19.314453125, -18.51953125, -17.724609375, -16.9296875, -16.134765625, -15.33984375, -14.544921875, -13.75, -12.955078125, -12.16015625, -11.365234375, -10.5703125, -9.775390625, -8.98046875, -8.185546875, -7.390625, -6.595703125, -5.80078125, -5.005859375, -4.2109375, -3.416015625, -2.62109375, -1.826171875, -1.03125, -0.236328125, 0.55859375, 1.353515625, 2.1484375, 2.943359375, 3.73828125, 4.533203125, 5.328125, 6.123046875, 6.91796875, 7.712890625, 8.5078125, 9.302734375, 10.09765625, 10.892578125, 11.6875, 12.482421875, 13.27734375, 14.072265625, 14.8671875, 15.662109375, 16.45703125, 17.251953125, 18.046875, 18.841796875, 19.63671875, 20.431640625, 21.2265625, 22.021484375, 22.81640625, 23.611328125, 24.40625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [2.0, 44.0, 320.0, 533.0, 116.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.23528480529785, -13.414440155029297, -7.593595504760742, -1.7727508544921875, 4.048093795776367, 9.868938446044922, 15.689783096313477, 21.5106258392334, 27.331472396850586, 33.15231704711914, 38.97315979003906, 44.79400634765625, 50.61485290527344, 56.43569564819336, 62.25653839111328, 68.07738494873047, 73.89823150634766, 79.71907806396484, 85.5399169921875, 91.36076354980469, 97.18161010742188, 103.00245666503906, 108.82330322265625, 114.6441421508789, 120.4649887084961, 126.28583526611328, 132.10667419433594, 137.92752075195312, 143.7483673095703, 149.5692138671875, 155.3900604248047, 161.21090698242188, 167.03173828125, 172.8525848388672, 178.67343139648438, 184.49427795410156, 190.31512451171875, 196.13595581054688, 201.95680236816406, 207.77764892578125, 213.59849548339844, 219.41934204101562, 225.2401885986328, 231.06103515625, 236.88186645507812, 242.7027130126953, 248.5235595703125, 254.3444061279297, 260.1652526855469, 265.986083984375, 271.80694580078125, 277.6277770996094, 283.4486389160156, 289.26947021484375, 295.09033203125, 300.9111633300781, 306.73199462890625, 312.5528259277344, 318.3736877441406, 324.19451904296875, 330.015380859375, 335.8362121582031, 341.6570739746094, 347.4779052734375, 353.29876708984375]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 8.0, 6.0, 10.0, 3.0, 15.0, 13.0, 15.0, 12.0, 15.0, 15.0, 25.0, 28.0, 20.0, 20.0, 26.0, 27.0, 28.0, 32.0, 32.0, 34.0, 35.0, 47.0, 39.0, 33.0, 46.0, 32.0, 38.0, 33.0, 40.0, 33.0, 25.0, 30.0, 26.0, 26.0, 22.0, 17.0, 15.0, 17.0, 12.0, 7.0, 10.0, 3.0, 6.0, 4.0, 6.0, 3.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-33.14991760253906, -32.12135696411133, -31.092798233032227, -30.064239501953125, -29.03567886352539, -28.007118225097656, -26.978559494018555, -25.950000762939453, -24.92144012451172, -23.892879486083984, -22.864320755004883, -21.83576202392578, -20.807201385498047, -19.778640747070312, -18.75008201599121, -17.72152328491211, -16.692962646484375, -15.664402961730957, -14.635843276977539, -13.607283592224121, -12.578723907470703, -11.550164222717285, -10.521604537963867, -9.49304485321045, -8.464485168457031, -7.435925483703613, -6.407365798950195, -5.378806114196777, -4.350246429443359, -3.3216867446899414, -2.2931270599365234, -1.2645673751831055, -0.2360076904296875, 0.7925519943237305, 1.8211116790771484, 2.8496713638305664, 3.8782310485839844, 4.906790733337402, 5.93535041809082, 6.963910102844238, 7.992469787597656, 9.021029472351074, 10.049589157104492, 11.07814884185791, 12.106708526611328, 13.135268211364746, 14.163827896118164, 15.192387580871582, 16.220947265625, 17.249507904052734, 18.278066635131836, 19.306625366210938, 20.335186004638672, 21.363746643066406, 22.392305374145508, 23.42086410522461, 24.449424743652344, 25.477985382080078, 26.50654411315918, 27.53510284423828, 28.563663482666016, 29.59222412109375, 30.62078285217285, 31.649341583251953, 32.67790222167969]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 3.0, 16.0, 6.0, 9.0, 15.0, 14.0, 17.0, 18.0, 22.0, 29.0, 31.0, 45.0, 50.0, 48.0, 43.0, 35.0, 54.0, 67.0, 73.0, 50.0, 40.0, 59.0, 34.0, 35.0, 32.0, 34.0, 20.0, 21.0, 18.0, 17.0, 9.0, 6.0, 10.0, 5.0, 8.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.9375, -4.784912109375, -4.63232421875, -4.479736328125, -4.3271484375, -4.174560546875, -4.02197265625, -3.869384765625, -3.716796875, -3.564208984375, -3.41162109375, -3.259033203125, -3.1064453125, -2.953857421875, -2.80126953125, -2.648681640625, -2.49609375, -2.343505859375, -2.19091796875, -2.038330078125, -1.8857421875, -1.733154296875, -1.58056640625, -1.427978515625, -1.275390625, -1.122802734375, -0.97021484375, -0.817626953125, -0.6650390625, -0.512451171875, -0.35986328125, -0.207275390625, -0.0546875, 0.097900390625, 0.25048828125, 0.403076171875, 0.5556640625, 0.708251953125, 0.86083984375, 1.013427734375, 1.166015625, 1.318603515625, 1.47119140625, 1.623779296875, 1.7763671875, 1.928955078125, 2.08154296875, 2.234130859375, 2.38671875, 2.539306640625, 2.69189453125, 2.844482421875, 2.9970703125, 3.149658203125, 3.30224609375, 3.454833984375, 3.607421875, 3.760009765625, 3.91259765625, 4.065185546875, 4.2177734375, 4.370361328125, 4.52294921875, 4.675537109375, 4.828125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 7.0, 13.0, 16.0, 19.0, 18.0, 29.0, 54.0, 67.0, 103.0, 149.0, 205.0, 365.0, 592.0, 1222.0, 2686.0, 6845.0, 22918.0, 114857.0, 1381724.0, 2435739.0, 178863.0, 32382.0, 8993.0, 3184.0, 1372.0, 749.0, 368.0, 235.0, 175.0, 99.0, 74.0, 46.0, 36.0, 20.0, 12.0, 9.0, 6.0, 4.0, 8.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-15.578125, -15.1214599609375, -14.664794921875, -14.2081298828125, -13.75146484375, -13.2947998046875, -12.838134765625, -12.3814697265625, -11.9248046875, -11.4681396484375, -11.011474609375, -10.5548095703125, -10.09814453125, -9.6414794921875, -9.184814453125, -8.7281494140625, -8.271484375, -7.8148193359375, -7.358154296875, -6.9014892578125, -6.44482421875, -5.9881591796875, -5.531494140625, -5.0748291015625, -4.6181640625, -4.1614990234375, -3.704833984375, -3.2481689453125, -2.79150390625, -2.3348388671875, -1.878173828125, -1.4215087890625, -0.96484375, -0.5081787109375, -0.051513671875, 0.4051513671875, 0.86181640625, 1.3184814453125, 1.775146484375, 2.2318115234375, 2.6884765625, 3.1451416015625, 3.601806640625, 4.0584716796875, 4.51513671875, 4.9718017578125, 5.428466796875, 5.8851318359375, 6.341796875, 6.7984619140625, 7.255126953125, 7.7117919921875, 8.16845703125, 8.6251220703125, 9.081787109375, 9.5384521484375, 9.9951171875, 10.4517822265625, 10.908447265625, 11.3651123046875, 11.82177734375, 12.2784423828125, 12.735107421875, 13.1917724609375, 13.6484375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 6.0, 9.0, 5.0, 7.0, 13.0, 17.0, 29.0, 33.0, 54.0, 60.0, 91.0, 124.0, 199.0, 305.0, 492.0, 649.0, 619.0, 422.0, 279.0, 186.0, 157.0, 83.0, 53.0, 53.0, 34.0, 28.0, 15.0, 19.0, 13.0, 5.0, 4.0, 5.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0], "bins": [-15.375, -14.9990234375, -14.623046875, -14.2470703125, -13.87109375, -13.4951171875, -13.119140625, -12.7431640625, -12.3671875, -11.9912109375, -11.615234375, -11.2392578125, -10.86328125, -10.4873046875, -10.111328125, -9.7353515625, -9.359375, -8.9833984375, -8.607421875, -8.2314453125, -7.85546875, -7.4794921875, -7.103515625, -6.7275390625, -6.3515625, -5.9755859375, -5.599609375, -5.2236328125, -4.84765625, -4.4716796875, -4.095703125, -3.7197265625, -3.34375, -2.9677734375, -2.591796875, -2.2158203125, -1.83984375, -1.4638671875, -1.087890625, -0.7119140625, -0.3359375, 0.0400390625, 0.416015625, 0.7919921875, 1.16796875, 1.5439453125, 1.919921875, 2.2958984375, 2.671875, 3.0478515625, 3.423828125, 3.7998046875, 4.17578125, 4.5517578125, 4.927734375, 5.3037109375, 5.6796875, 6.0556640625, 6.431640625, 6.8076171875, 7.18359375, 7.5595703125, 7.935546875, 8.3115234375, 8.6875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 6.0, 11.0, 14.0, 35.0, 45.0, 81.0, 127.0, 212.0, 442.0, 925.0, 2168.0, 6158.0, 22615.0, 121455.0, 1385244.0, 2421325.0, 189721.0, 30884.0, 7944.0, 2693.0, 1037.0, 527.0, 247.0, 131.0, 93.0, 40.0, 21.0, 30.0, 7.0, 6.0, 9.0, 7.0, 1.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.328125, -17.59814453125, -16.8681640625, -16.13818359375, -15.408203125, -14.67822265625, -13.9482421875, -13.21826171875, -12.48828125, -11.75830078125, -11.0283203125, -10.29833984375, -9.568359375, -8.83837890625, -8.1083984375, -7.37841796875, -6.6484375, -5.91845703125, -5.1884765625, -4.45849609375, -3.728515625, -2.99853515625, -2.2685546875, -1.53857421875, -0.80859375, -0.07861328125, 0.6513671875, 1.38134765625, 2.111328125, 2.84130859375, 3.5712890625, 4.30126953125, 5.03125, 5.76123046875, 6.4912109375, 7.22119140625, 7.951171875, 8.68115234375, 9.4111328125, 10.14111328125, 10.87109375, 11.60107421875, 12.3310546875, 13.06103515625, 13.791015625, 14.52099609375, 15.2509765625, 15.98095703125, 16.7109375, 17.44091796875, 18.1708984375, 18.90087890625, 19.630859375, 20.36083984375, 21.0908203125, 21.82080078125, 22.55078125, 23.28076171875, 24.0107421875, 24.74072265625, 25.470703125, 26.20068359375, 26.9306640625, 27.66064453125, 28.390625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 13.0, 33.0, 72.0, 128.0, 198.0, 206.0, 165.0, 100.0, 48.0, 23.0, 13.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.10198974609375, -78.23880767822266, -74.37561798095703, -70.51243591308594, -66.64924621582031, -62.78606414794922, -58.92287826538086, -55.0596923828125, -51.196510314941406, -47.33332443237305, -43.47013854980469, -39.606956481933594, -35.743770599365234, -31.880584716796875, -28.017398834228516, -24.15421485900879, -20.291027069091797, -16.427841186523438, -12.564657211303711, -8.701471328735352, -4.838286399841309, -0.9751014709472656, 2.8880844116210938, 6.75126838684082, 10.61445426940918, 14.477639198303223, 18.340824127197266, 22.204010009765625, 26.067195892333984, 29.93037986755371, 33.79356384277344, 37.6567497253418, 41.519935607910156, 45.383121490478516, 49.246307373046875, 53.10948944091797, 56.97267532348633, 60.83586120605469, 64.69905090332031, 68.5622329711914, 72.4254150390625, 76.2885971069336, 80.15178680419922, 84.01496887207031, 87.87815856933594, 91.74134063720703, 95.60452270507812, 99.46771240234375, 103.33090209960938, 107.19408416748047, 111.0572738647461, 114.92045593261719, 118.78364562988281, 122.6468276977539, 126.510009765625, 130.37319946289062, 134.2363739013672, 138.0995635986328, 141.96273803710938, 145.825927734375, 149.68911743164062, 153.55230712890625, 157.4154815673828, 161.27867126464844, 165.14186096191406]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 4.0, 5.0, 11.0, 9.0, 12.0, 9.0, 16.0, 14.0, 21.0, 23.0, 37.0, 30.0, 33.0, 30.0, 51.0, 49.0, 43.0, 37.0, 42.0, 44.0, 49.0, 48.0, 35.0, 51.0, 22.0, 31.0, 41.0, 37.0, 32.0, 25.0, 20.0, 13.0, 17.0, 12.0, 10.0, 5.0, 8.0, 6.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.405067443847656, -39.14799118041992, -37.89091491699219, -36.63383865356445, -35.37676239013672, -34.119686126708984, -32.86260986328125, -31.605533599853516, -30.34845733642578, -29.091381072998047, -27.834304809570312, -26.577228546142578, -25.320152282714844, -24.06307601928711, -22.805999755859375, -21.54892349243164, -20.291847229003906, -19.034770965576172, -17.777694702148438, -16.520618438720703, -15.263542175292969, -14.006465911865234, -12.7493896484375, -11.492313385009766, -10.235237121582031, -8.978160858154297, -7.7210845947265625, -6.464008331298828, -5.206932067871094, -3.9498558044433594, -2.692779541015625, -1.4357032775878906, -0.17862701416015625, 1.0784492492675781, 2.3355255126953125, 3.592601776123047, 4.849678039550781, 6.106754302978516, 7.36383056640625, 8.620906829833984, 9.877983093261719, 11.135059356689453, 12.392135620117188, 13.649211883544922, 14.906288146972656, 16.16336441040039, 17.420440673828125, 18.67751693725586, 19.934593200683594, 21.191669464111328, 22.448745727539062, 23.705821990966797, 24.96289825439453, 26.219974517822266, 27.47705078125, 28.734127044677734, 29.99120330810547, 31.248279571533203, 32.50535583496094, 33.76243209838867, 35.019508361816406, 36.27658462524414, 37.533660888671875, 38.79073715209961, 40.047813415527344]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 13.0, 16.0, 14.0, 7.0, 14.0, 16.0, 19.0, 23.0, 28.0, 44.0, 39.0, 43.0, 38.0, 40.0, 42.0, 57.0, 50.0, 50.0, 40.0, 43.0, 45.0, 36.0, 40.0, 35.0, 22.0, 39.0, 24.0, 15.0, 22.0, 14.0, 16.0, 7.0, 8.0, 1.0, 6.0, 9.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.36328125, -4.2247314453125, -4.086181640625, -3.9476318359375, -3.80908203125, -3.6705322265625, -3.531982421875, -3.3934326171875, -3.2548828125, -3.1163330078125, -2.977783203125, -2.8392333984375, -2.70068359375, -2.5621337890625, -2.423583984375, -2.2850341796875, -2.146484375, -2.0079345703125, -1.869384765625, -1.7308349609375, -1.59228515625, -1.4537353515625, -1.315185546875, -1.1766357421875, -1.0380859375, -0.8995361328125, -0.760986328125, -0.6224365234375, -0.48388671875, -0.3453369140625, -0.206787109375, -0.0682373046875, 0.0703125, 0.2088623046875, 0.347412109375, 0.4859619140625, 0.62451171875, 0.7630615234375, 0.901611328125, 1.0401611328125, 1.1787109375, 1.3172607421875, 1.455810546875, 1.5943603515625, 1.73291015625, 1.8714599609375, 2.010009765625, 2.1485595703125, 2.287109375, 2.4256591796875, 2.564208984375, 2.7027587890625, 2.84130859375, 2.9798583984375, 3.118408203125, 3.2569580078125, 3.3955078125, 3.5340576171875, 3.672607421875, 3.8111572265625, 3.94970703125, 4.0882568359375, 4.226806640625, 4.3653564453125, 4.50390625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 3.0, 0.0, 6.0, 10.0, 24.0, 18.0, 24.0, 33.0, 69.0, 87.0, 127.0, 139.0, 202.0, 311.0, 496.0, 666.0, 981.0, 1444.0, 2193.0, 3133.0, 4710.0, 7344.0, 11070.0, 17039.0, 28089.0, 46939.0, 84986.0, 177729.0, 302649.0, 160578.0, 78640.0, 44715.0, 26631.0, 16234.0, 10546.0, 6704.0, 4332.0, 3056.0, 2011.0, 1440.0, 978.0, 676.0, 455.0, 315.0, 201.0, 163.0, 105.0, 82.0, 43.0, 42.0, 34.0, 29.0, 14.0, 4.0, 6.0, 1.0, 0.0, 3.0, 5.0, 3.0], "bins": [-0.1568603515625, -0.1520252227783203, -0.14719009399414062, -0.14235496520996094, -0.13751983642578125, -0.13268470764160156, -0.12784957885742188, -0.12301445007324219, -0.1181793212890625, -0.11334419250488281, -0.10850906372070312, -0.10367393493652344, -0.09883880615234375, -0.09400367736816406, -0.08916854858398438, -0.08433341979980469, -0.079498291015625, -0.07466316223144531, -0.06982803344726562, -0.06499290466308594, -0.06015777587890625, -0.05532264709472656, -0.050487518310546875, -0.04565238952636719, -0.0408172607421875, -0.03598213195800781, -0.031147003173828125, -0.026311874389648438, -0.02147674560546875, -0.016641616821289062, -0.011806488037109375, -0.0069713592529296875, -0.00213623046875, 0.0026988983154296875, 0.007534027099609375, 0.012369155883789062, 0.01720428466796875, 0.022039413452148438, 0.026874542236328125, 0.03170967102050781, 0.0365447998046875, 0.04137992858886719, 0.046215057373046875, 0.05105018615722656, 0.05588531494140625, 0.06072044372558594, 0.06555557250976562, 0.07039070129394531, 0.075225830078125, 0.08006095886230469, 0.08489608764648438, 0.08973121643066406, 0.09456634521484375, 0.09940147399902344, 0.10423660278320312, 0.10907173156738281, 0.1139068603515625, 0.11874198913574219, 0.12357711791992188, 0.12841224670410156, 0.13324737548828125, 0.13808250427246094, 0.14291763305664062, 0.1477527618408203, 0.152587890625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 8.0, 11.0, 7.0, 14.0, 17.0, 13.0, 18.0, 26.0, 22.0, 29.0, 22.0, 40.0, 39.0, 32.0, 51.0, 36.0, 44.0, 46.0, 1053.0, 45.0, 43.0, 37.0, 36.0, 39.0, 26.0, 33.0, 30.0, 34.0, 26.0, 15.0, 14.0, 19.0, 18.0, 17.0, 13.0, 11.0, 11.0, 9.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.392578125, -3.29278564453125, -3.1929931640625, -3.09320068359375, -2.993408203125, -2.89361572265625, -2.7938232421875, -2.69403076171875, -2.59423828125, -2.49444580078125, -2.3946533203125, -2.29486083984375, -2.195068359375, -2.09527587890625, -1.9954833984375, -1.89569091796875, -1.7958984375, -1.69610595703125, -1.5963134765625, -1.49652099609375, -1.396728515625, -1.29693603515625, -1.1971435546875, -1.09735107421875, -0.99755859375, -0.89776611328125, -0.7979736328125, -0.69818115234375, -0.598388671875, -0.49859619140625, -0.3988037109375, -0.29901123046875, -0.19921875, -0.09942626953125, 0.0003662109375, 0.10015869140625, 0.199951171875, 0.29974365234375, 0.3995361328125, 0.49932861328125, 0.59912109375, 0.69891357421875, 0.7987060546875, 0.89849853515625, 0.998291015625, 1.09808349609375, 1.1978759765625, 1.29766845703125, 1.3974609375, 1.49725341796875, 1.5970458984375, 1.69683837890625, 1.796630859375, 1.89642333984375, 1.9962158203125, 2.09600830078125, 2.19580078125, 2.29559326171875, 2.3953857421875, 2.49517822265625, 2.594970703125, 2.69476318359375, 2.7945556640625, 2.89434814453125, 2.994140625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 16.0, 19.0, 30.0, 49.0, 58.0, 87.0, 144.0, 224.0, 392.0, 574.0, 943.0, 1538.0, 2391.0, 4000.0, 6460.0, 10819.0, 17999.0, 30070.0, 52158.0, 97659.0, 219327.0, 1353054.0, 135608.0, 67844.0, 38124.0, 22626.0, 13698.0, 8061.0, 4969.0, 3177.0, 1838.0, 1178.0, 718.0, 473.0, 292.0, 164.0, 117.0, 80.0, 48.0, 25.0, 29.0, 20.0, 13.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1243896484375, -0.12075519561767578, -0.11712074279785156, -0.11348628997802734, -0.10985183715820312, -0.1062173843383789, -0.10258293151855469, -0.09894847869873047, -0.09531402587890625, -0.09167957305908203, -0.08804512023925781, -0.0844106674194336, -0.08077621459960938, -0.07714176177978516, -0.07350730895996094, -0.06987285614013672, -0.0662384033203125, -0.06260395050048828, -0.05896949768066406, -0.055335044860839844, -0.051700592041015625, -0.048066139221191406, -0.04443168640136719, -0.04079723358154297, -0.03716278076171875, -0.03352832794189453, -0.029893875122070312, -0.026259422302246094, -0.022624969482421875, -0.018990516662597656, -0.015356063842773438, -0.011721611022949219, -0.008087158203125, -0.004452705383300781, -0.0008182525634765625, 0.0028162002563476562, 0.006450653076171875, 0.010085105895996094, 0.013719558715820312, 0.01735401153564453, 0.02098846435546875, 0.02462291717529297, 0.028257369995117188, 0.031891822814941406, 0.035526275634765625, 0.039160728454589844, 0.04279518127441406, 0.04642963409423828, 0.0500640869140625, 0.05369853973388672, 0.05733299255371094, 0.060967445373535156, 0.06460189819335938, 0.0682363510131836, 0.07187080383300781, 0.07550525665283203, 0.07913970947265625, 0.08277416229248047, 0.08640861511230469, 0.0900430679321289, 0.09367752075195312, 0.09731197357177734, 0.10094642639160156, 0.10458087921142578, 0.10821533203125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 6.0, 15.0, 17.0, 17.0, 16.0, 19.0, 15.0, 30.0, 33.0, 35.0, 39.0, 58.0, 60.0, 61.0, 68.0, 61.0, 56.0, 50.0, 47.0, 55.0, 50.0, 22.0, 22.0, 15.0, 20.0, 18.0, 12.0, 13.0, 11.0, 14.0, 5.0, 3.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.365776062011719e-05, -6.189383566379547e-05, -6.0129910707473755e-05, -5.836598575115204e-05, -5.660206079483032e-05, -5.4838135838508606e-05, -5.307421088218689e-05, -5.131028592586517e-05, -4.954636096954346e-05, -4.778243601322174e-05, -4.6018511056900024e-05, -4.425458610057831e-05, -4.249066114425659e-05, -4.0726736187934875e-05, -3.896281123161316e-05, -3.719888627529144e-05, -3.5434961318969727e-05, -3.367103636264801e-05, -3.1907111406326294e-05, -3.0143186450004578e-05, -2.837926149368286e-05, -2.6615336537361145e-05, -2.485141158103943e-05, -2.3087486624717712e-05, -2.1323561668395996e-05, -1.955963671207428e-05, -1.7795711755752563e-05, -1.6031786799430847e-05, -1.4267861843109131e-05, -1.2503936886787415e-05, -1.0740011930465698e-05, -8.976086974143982e-06, -7.212162017822266e-06, -5.448237061500549e-06, -3.684312105178833e-06, -1.9203871488571167e-06, -1.564621925354004e-07, 1.607462763786316e-06, 3.3713877201080322e-06, 5.1353126764297485e-06, 6.899237632751465e-06, 8.663162589073181e-06, 1.0427087545394897e-05, 1.2191012501716614e-05, 1.395493745803833e-05, 1.5718862414360046e-05, 1.7482787370681763e-05, 1.924671232700348e-05, 2.1010637283325195e-05, 2.277456223964691e-05, 2.4538487195968628e-05, 2.6302412152290344e-05, 2.806633710861206e-05, 2.9830262064933777e-05, 3.159418702125549e-05, 3.335811197757721e-05, 3.5122036933898926e-05, 3.688596189022064e-05, 3.864988684654236e-05, 4.0413811802864075e-05, 4.217773675918579e-05, 4.394166171550751e-05, 4.5705586671829224e-05, 4.746951162815094e-05, 4.9233436584472656e-05]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 6.0, 5.0, 5.0, 7.0, 12.0, 12.0, 15.0, 7.0, 25.0, 23.0, 29.0, 44.0, 64.0, 112.0, 221.0, 483.0, 3732.0, 189390.0, 822548.0, 29800.0, 1186.0, 328.0, 171.0, 93.0, 62.0, 22.0, 26.0, 26.0, 23.0, 16.0, 10.0, 16.0, 13.0, 7.0, 2.0, 0.0, 2.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007991790771484375, -0.000769883394241333, -0.0007405877113342285, -0.000711292028427124, -0.0006819963455200195, -0.000652700662612915, -0.0006234049797058105, -0.0005941092967987061, -0.0005648136138916016, -0.0005355179309844971, -0.0005062222480773926, -0.0004769265651702881, -0.0004476308822631836, -0.0004183351993560791, -0.0003890395164489746, -0.0003597438335418701, -0.0003304481506347656, -0.00030115246772766113, -0.00027185678482055664, -0.00024256110191345215, -0.00021326541900634766, -0.00018396973609924316, -0.00015467405319213867, -0.00012537837028503418, -9.608268737792969e-05, -6.67870044708252e-05, -3.74913215637207e-05, -8.195638656616211e-06, 2.110004425048828e-05, 5.0395727157592773e-05, 7.969141006469727e-05, 0.00010898709297180176, 0.00013828277587890625, 0.00016757845878601074, 0.00019687414169311523, 0.00022616982460021973, 0.0002554655075073242, 0.0002847611904144287, 0.0003140568733215332, 0.0003433525562286377, 0.0003726482391357422, 0.0004019439220428467, 0.00043123960494995117, 0.00046053528785705566, 0.0004898309707641602, 0.0005191266536712646, 0.0005484223365783691, 0.0005777180194854736, 0.0006070137023925781, 0.0006363093852996826, 0.0006656050682067871, 0.0006949007511138916, 0.0007241964340209961, 0.0007534921169281006, 0.0007827877998352051, 0.0008120834827423096, 0.0008413791656494141, 0.0008706748485565186, 0.000899970531463623, 0.0009292662143707275, 0.000958561897277832, 0.0009878575801849365, 0.001017153263092041, 0.0010464489459991455, 0.00107574462890625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 16.0, 44.0, 99.0, 231.0, 269.0, 197.0, 99.0, 36.0, 15.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3341970012988895e-05, -3.8189984479686245e-05, -3.3037998946383595e-05, -2.788600977510214e-05, -2.273402424179949e-05, -1.758203870849684e-05, -1.2430049537215382e-05, -7.278064003912732e-06, -2.126078470610082e-06, 3.0259079721872695e-06, 8.177894414984621e-06, 1.3329881767276675e-05, 1.8481867300579324e-05, 2.3633852833881974e-05, 2.878584200516343e-05, 3.393782753846608e-05, 3.908981307176873e-05, 4.424179860507138e-05, 4.939378413837403e-05, 5.454577330965549e-05, 5.969775884295814e-05, 6.484974437626079e-05, 7.000173354754224e-05, 7.515371544286609e-05, 8.030570461414754e-05, 8.5457693785429e-05, 9.060967568075284e-05, 9.57616648520343e-05, 0.00010091364674735814, 0.0001060656359186396, 0.00011121762508992106, 0.00011636961426120251, 0.00012152158888056874, 0.0001266735780518502, 0.00013182556722313166, 0.00013697755639441311, 0.00014212953101377934, 0.0001472815201850608, 0.00015243350935634226, 0.0001575854985276237, 0.00016273747314698994, 0.0001678894623182714, 0.00017304145148955286, 0.0001781934406608343, 0.00018334541528020054, 0.000188497404451482, 0.00019364939362276345, 0.0001988013827940449, 0.00020395337196532637, 0.00020910536113660783, 0.00021425735030788928, 0.0002194093249272555, 0.00022456131409853697, 0.00022971330326981843, 0.00023486529244109988, 0.00024001728161238134, 0.0002451692707836628, 0.00025032125995494425, 0.0002554732491262257, 0.00026062523829750717, 0.0002657772274687886, 0.0002709291875362396, 0.00027608120581135154, 0.00028123316587880254, 0.000286385155050084]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 4.0, 4.0, 5.0, 9.0, 7.0, 6.0, 6.0, 12.0, 17.0, 13.0, 22.0, 15.0, 36.0, 30.0, 37.0, 33.0, 24.0, 43.0, 39.0, 40.0, 39.0, 40.0, 50.0, 46.0, 32.0, 52.0, 27.0, 33.0, 37.0, 47.0, 30.0, 26.0, 33.0, 22.0, 14.0, 19.0, 13.0, 7.0, 12.0, 7.0, 6.0, 4.0, 1.0, 7.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.07099723815918e-05, -3.952439874410629e-05, -3.833882510662079e-05, -3.7153251469135284e-05, -3.596767783164978e-05, -3.4782104194164276e-05, -3.359653055667877e-05, -3.241095691919327e-05, -3.1225383281707764e-05, -3.003980964422226e-05, -2.8854236006736755e-05, -2.766866236925125e-05, -2.6483088731765747e-05, -2.5297515094280243e-05, -2.411194145679474e-05, -2.2926367819309235e-05, -2.174079418182373e-05, -2.0555220544338226e-05, -1.9369646906852722e-05, -1.8184073269367218e-05, -1.6998499631881714e-05, -1.581292599439621e-05, -1.4627352356910706e-05, -1.3441778719425201e-05, -1.2256205081939697e-05, -1.1070631444454193e-05, -9.885057806968689e-06, -8.699484169483185e-06, -7.513910531997681e-06, -6.3283368945121765e-06, -5.142763257026672e-06, -3.957189619541168e-06, -2.771615982055664e-06, -1.58604234457016e-06, -4.0046870708465576e-07, 7.851049304008484e-07, 1.9706785678863525e-06, 3.1562522053718567e-06, 4.341825842857361e-06, 5.527399480342865e-06, 6.712973117828369e-06, 7.898546755313873e-06, 9.084120392799377e-06, 1.0269694030284882e-05, 1.1455267667770386e-05, 1.264084130525589e-05, 1.3826414942741394e-05, 1.5011988580226898e-05, 1.6197562217712402e-05, 1.7383135855197906e-05, 1.856870949268341e-05, 1.9754283130168915e-05, 2.093985676765442e-05, 2.2125430405139923e-05, 2.3311004042625427e-05, 2.449657768011093e-05, 2.5682151317596436e-05, 2.686772495508194e-05, 2.8053298592567444e-05, 2.9238872230052948e-05, 3.0424445867538452e-05, 3.1610019505023956e-05, 3.279559314250946e-05, 3.3981166779994965e-05, 3.516674041748047e-05]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 13.0, 16.0, 14.0, 7.0, 14.0, 16.0, 19.0, 23.0, 28.0, 44.0, 39.0, 43.0, 38.0, 40.0, 42.0, 57.0, 50.0, 50.0, 40.0, 43.0, 45.0, 36.0, 40.0, 35.0, 22.0, 39.0, 24.0, 15.0, 22.0, 14.0, 16.0, 7.0, 8.0, 1.0, 6.0, 9.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.36328125, -4.2247314453125, -4.086181640625, -3.9476318359375, -3.80908203125, -3.6705322265625, -3.531982421875, -3.3934326171875, -3.2548828125, -3.1163330078125, -2.977783203125, -2.8392333984375, -2.70068359375, -2.5621337890625, -2.423583984375, -2.2850341796875, -2.146484375, -2.0079345703125, -1.869384765625, -1.7308349609375, -1.59228515625, -1.4537353515625, -1.315185546875, -1.1766357421875, -1.0380859375, -0.8995361328125, -0.760986328125, -0.6224365234375, -0.48388671875, -0.3453369140625, -0.206787109375, -0.0682373046875, 0.0703125, 0.2088623046875, 0.347412109375, 0.4859619140625, 0.62451171875, 0.7630615234375, 0.901611328125, 1.0401611328125, 1.1787109375, 1.3172607421875, 1.455810546875, 1.5943603515625, 1.73291015625, 1.8714599609375, 2.010009765625, 2.1485595703125, 2.287109375, 2.4256591796875, 2.564208984375, 2.7027587890625, 2.84130859375, 2.9798583984375, 3.118408203125, 3.2569580078125, 3.3955078125, 3.5340576171875, 3.672607421875, 3.8111572265625, 3.94970703125, 4.0882568359375, 4.226806640625, 4.3653564453125, 4.50390625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 5.0, 7.0, 8.0, 10.0, 9.0, 21.0, 16.0, 26.0, 22.0, 27.0, 37.0, 62.0, 92.0, 115.0, 200.0, 239.0, 348.0, 662.0, 1104.0, 1981.0, 4061.0, 10252.0, 35127.0, 214414.0, 691632.0, 61142.0, 15219.0, 5522.0, 2589.0, 1396.0, 788.0, 422.0, 275.0, 197.0, 128.0, 104.0, 61.0, 52.0, 28.0, 34.0, 32.0, 18.0, 14.0, 12.0, 10.0, 8.0, 8.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.4296875, -12.9847412109375, -12.539794921875, -12.0948486328125, -11.64990234375, -11.2049560546875, -10.760009765625, -10.3150634765625, -9.8701171875, -9.4251708984375, -8.980224609375, -8.5352783203125, -8.09033203125, -7.6453857421875, -7.200439453125, -6.7554931640625, -6.310546875, -5.8656005859375, -5.420654296875, -4.9757080078125, -4.53076171875, -4.0858154296875, -3.640869140625, -3.1959228515625, -2.7509765625, -2.3060302734375, -1.861083984375, -1.4161376953125, -0.97119140625, -0.5262451171875, -0.081298828125, 0.3636474609375, 0.80859375, 1.2535400390625, 1.698486328125, 2.1434326171875, 2.58837890625, 3.0333251953125, 3.478271484375, 3.9232177734375, 4.3681640625, 4.8131103515625, 5.258056640625, 5.7030029296875, 6.14794921875, 6.5928955078125, 7.037841796875, 7.4827880859375, 7.927734375, 8.3726806640625, 8.817626953125, 9.2625732421875, 9.70751953125, 10.1524658203125, 10.597412109375, 11.0423583984375, 11.4873046875, 11.9322509765625, 12.377197265625, 12.8221435546875, 13.26708984375, 13.7120361328125, 14.156982421875, 14.6019287109375, 15.046875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 0.0, 7.0, 8.0, 17.0, 14.0, 16.0, 24.0, 15.0, 28.0, 29.0, 33.0, 40.0, 49.0, 42.0, 44.0, 62.0, 86.0, 112.0, 271.0, 1546.0, 116.0, 78.0, 68.0, 57.0, 40.0, 36.0, 39.0, 26.0, 23.0, 20.0, 22.0, 17.0, 18.0, 10.0, 6.0, 6.0, 5.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.265625, -13.775390625, -13.28515625, -12.794921875, -12.3046875, -11.814453125, -11.32421875, -10.833984375, -10.34375, -9.853515625, -9.36328125, -8.873046875, -8.3828125, -7.892578125, -7.40234375, -6.912109375, -6.421875, -5.931640625, -5.44140625, -4.951171875, -4.4609375, -3.970703125, -3.48046875, -2.990234375, -2.5, -2.009765625, -1.51953125, -1.029296875, -0.5390625, -0.048828125, 0.44140625, 0.931640625, 1.421875, 1.912109375, 2.40234375, 2.892578125, 3.3828125, 3.873046875, 4.36328125, 4.853515625, 5.34375, 5.833984375, 6.32421875, 6.814453125, 7.3046875, 7.794921875, 8.28515625, 8.775390625, 9.265625, 9.755859375, 10.24609375, 10.736328125, 11.2265625, 11.716796875, 12.20703125, 12.697265625, 13.1875, 13.677734375, 14.16796875, 14.658203125, 15.1484375, 15.638671875, 16.12890625, 16.619140625, 17.109375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 5.0, 7.0, 12.0, 10.0, 10.0, 19.0, 30.0, 27.0, 47.0, 75.0, 89.0, 144.0, 238.0, 439.0, 1047.0, 3584.0, 19184.0, 226188.0, 2790082.0, 89517.0, 10759.0, 2322.0, 774.0, 339.0, 228.0, 165.0, 100.0, 69.0, 49.0, 32.0, 32.0, 22.0, 19.0, 12.0, 7.0, 6.0, 2.0, 7.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.65625, -28.766845703125, -27.87744140625, -26.988037109375, -26.0986328125, -25.209228515625, -24.31982421875, -23.430419921875, -22.541015625, -21.651611328125, -20.76220703125, -19.872802734375, -18.9833984375, -18.093994140625, -17.20458984375, -16.315185546875, -15.42578125, -14.536376953125, -13.64697265625, -12.757568359375, -11.8681640625, -10.978759765625, -10.08935546875, -9.199951171875, -8.310546875, -7.421142578125, -6.53173828125, -5.642333984375, -4.7529296875, -3.863525390625, -2.97412109375, -2.084716796875, -1.1953125, -0.305908203125, 0.58349609375, 1.472900390625, 2.3623046875, 3.251708984375, 4.14111328125, 5.030517578125, 5.919921875, 6.809326171875, 7.69873046875, 8.588134765625, 9.4775390625, 10.366943359375, 11.25634765625, 12.145751953125, 13.03515625, 13.924560546875, 14.81396484375, 15.703369140625, 16.5927734375, 17.482177734375, 18.37158203125, 19.260986328125, 20.150390625, 21.039794921875, 21.92919921875, 22.818603515625, 23.7080078125, 24.597412109375, 25.48681640625, 26.376220703125, 27.265625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 243.0, 756.0, 19.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.11857223510742, -30.582426071166992, -17.046279907226562, -3.5101356506347656, 10.026012420654297, 23.56216049194336, 37.09830093383789, 50.63444900512695, 64.17059326171875, 77.70674133300781, 91.24288940429688, 104.7790298461914, 118.31517791748047, 131.851318359375, 145.38746643066406, 158.92361450195312, 172.4597625732422, 185.99591064453125, 199.5320587158203, 213.06820678710938, 226.60433959960938, 240.1405029296875, 253.6766357421875, 267.2127685546875, 280.7489318847656, 294.2850646972656, 307.82122802734375, 321.35736083984375, 334.8935241699219, 348.4296569824219, 361.9658203125, 375.501953125, 389.0380859375, 402.57421875, 416.1103820800781, 429.6465148925781, 443.18267822265625, 456.71881103515625, 470.25494384765625, 483.7911071777344, 497.3272705078125, 510.8634033203125, 524.3995361328125, 537.9357299804688, 551.4718627929688, 565.0079956054688, 578.5441284179688, 592.080322265625, 605.616455078125, 619.152587890625, 632.688720703125, 646.2249145507812, 659.7610473632812, 673.2971801757812, 686.8333129882812, 700.3695068359375, 713.9055786132812, 727.4417114257812, 740.9778442382812, 754.5140380859375, 768.0501708984375, 781.5863037109375, 795.1224365234375, 808.6585693359375, 822.1947631835938]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 9.0, 4.0, 4.0, 11.0, 7.0, 11.0, 15.0, 10.0, 16.0, 13.0, 30.0, 17.0, 35.0, 25.0, 34.0, 24.0, 36.0, 39.0, 40.0, 40.0, 40.0, 33.0, 43.0, 36.0, 49.0, 35.0, 44.0, 45.0, 35.0, 41.0, 25.0, 20.0, 20.0, 13.0, 25.0, 15.0, 13.0, 9.0, 17.0, 10.0, 5.0, 4.0, 4.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-50.25257873535156, -48.816070556640625, -47.37956237792969, -45.94305419921875, -44.50654220581055, -43.07003402709961, -41.63352584838867, -40.197017669677734, -38.76050567626953, -37.323997497558594, -35.887489318847656, -34.45098114013672, -33.014469146728516, -31.577960968017578, -30.14145278930664, -28.704944610595703, -27.268436431884766, -25.831928253173828, -24.395418167114258, -22.95890998840332, -21.52239990234375, -20.085891723632812, -18.649383544921875, -17.212875366210938, -15.776365280151367, -14.339856147766113, -12.90334701538086, -11.466838836669922, -10.030329704284668, -8.593820571899414, -7.157312393188477, -5.720803260803223, -4.284294128417969, -2.847785234451294, -1.4112763404846191, 0.025232315063476562, 1.4617414474487305, 2.8982505798339844, 4.334758758544922, 5.771267890930176, 7.20777702331543, 8.644286155700684, 10.080795288085938, 11.517303466796875, 12.953812599182129, 14.390321731567383, 15.82682991027832, 17.26333999633789, 18.699848175048828, 20.136356353759766, 21.572866439819336, 23.009374618530273, 24.445884704589844, 25.88239288330078, 27.31890106201172, 28.755409240722656, 30.191919326782227, 31.628427505493164, 33.064937591552734, 34.50144577026367, 35.93795394897461, 37.37446594238281, 38.81097412109375, 40.24748229980469, 41.683990478515625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 7.0, 10.0, 15.0, 10.0, 10.0, 16.0, 13.0, 21.0, 18.0, 31.0, 31.0, 42.0, 34.0, 46.0, 38.0, 52.0, 48.0, 45.0, 31.0, 50.0, 42.0, 42.0, 49.0, 34.0, 30.0, 33.0, 32.0, 33.0, 26.0, 17.0, 20.0, 19.0, 7.0, 8.0, 7.0, 4.0, 5.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.47265625, -4.3291015625, -4.185546875, -4.0419921875, -3.8984375, -3.7548828125, -3.611328125, -3.4677734375, -3.32421875, -3.1806640625, -3.037109375, -2.8935546875, -2.75, -2.6064453125, -2.462890625, -2.3193359375, -2.17578125, -2.0322265625, -1.888671875, -1.7451171875, -1.6015625, -1.4580078125, -1.314453125, -1.1708984375, -1.02734375, -0.8837890625, -0.740234375, -0.5966796875, -0.453125, -0.3095703125, -0.166015625, -0.0224609375, 0.12109375, 0.2646484375, 0.408203125, 0.5517578125, 0.6953125, 0.8388671875, 0.982421875, 1.1259765625, 1.26953125, 1.4130859375, 1.556640625, 1.7001953125, 1.84375, 1.9873046875, 2.130859375, 2.2744140625, 2.41796875, 2.5615234375, 2.705078125, 2.8486328125, 2.9921875, 3.1357421875, 3.279296875, 3.4228515625, 3.56640625, 3.7099609375, 3.853515625, 3.9970703125, 4.140625, 4.2841796875, 4.427734375, 4.5712890625, 4.71484375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 9.0, 10.0, 21.0, 18.0, 33.0, 42.0, 76.0, 113.0, 187.0, 371.0, 711.0, 1617.0, 5043.0, 20948.0, 131318.0, 2349354.0, 1563243.0, 97295.0, 16763.0, 4210.0, 1433.0, 654.0, 351.0, 164.0, 94.0, 59.0, 49.0, 28.0, 26.0, 9.0, 7.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.1875, -16.66552734375, -16.1435546875, -15.62158203125, -15.099609375, -14.57763671875, -14.0556640625, -13.53369140625, -13.01171875, -12.48974609375, -11.9677734375, -11.44580078125, -10.923828125, -10.40185546875, -9.8798828125, -9.35791015625, -8.8359375, -8.31396484375, -7.7919921875, -7.27001953125, -6.748046875, -6.22607421875, -5.7041015625, -5.18212890625, -4.66015625, -4.13818359375, -3.6162109375, -3.09423828125, -2.572265625, -2.05029296875, -1.5283203125, -1.00634765625, -0.484375, 0.03759765625, 0.5595703125, 1.08154296875, 1.603515625, 2.12548828125, 2.6474609375, 3.16943359375, 3.69140625, 4.21337890625, 4.7353515625, 5.25732421875, 5.779296875, 6.30126953125, 6.8232421875, 7.34521484375, 7.8671875, 8.38916015625, 8.9111328125, 9.43310546875, 9.955078125, 10.47705078125, 10.9990234375, 11.52099609375, 12.04296875, 12.56494140625, 13.0869140625, 13.60888671875, 14.130859375, 14.65283203125, 15.1748046875, 15.69677734375, 16.21875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 6.0, 4.0, 12.0, 7.0, 18.0, 15.0, 23.0, 44.0, 46.0, 62.0, 121.0, 148.0, 240.0, 340.0, 509.0, 642.0, 528.0, 390.0, 269.0, 175.0, 134.0, 95.0, 79.0, 56.0, 28.0, 16.0, 18.0, 9.0, 13.0, 7.0, 8.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.046875, -10.6856689453125, -10.324462890625, -9.9632568359375, -9.60205078125, -9.2408447265625, -8.879638671875, -8.5184326171875, -8.1572265625, -7.7960205078125, -7.434814453125, -7.0736083984375, -6.71240234375, -6.3511962890625, -5.989990234375, -5.6287841796875, -5.267578125, -4.9063720703125, -4.545166015625, -4.1839599609375, -3.82275390625, -3.4615478515625, -3.100341796875, -2.7391357421875, -2.3779296875, -2.0167236328125, -1.655517578125, -1.2943115234375, -0.93310546875, -0.5718994140625, -0.210693359375, 0.1505126953125, 0.51171875, 0.8729248046875, 1.234130859375, 1.5953369140625, 1.95654296875, 2.3177490234375, 2.678955078125, 3.0401611328125, 3.4013671875, 3.7625732421875, 4.123779296875, 4.4849853515625, 4.84619140625, 5.2073974609375, 5.568603515625, 5.9298095703125, 6.291015625, 6.6522216796875, 7.013427734375, 7.3746337890625, 7.73583984375, 8.0970458984375, 8.458251953125, 8.8194580078125, 9.1806640625, 9.5418701171875, 9.903076171875, 10.2642822265625, 10.62548828125, 10.9866943359375, 11.347900390625, 11.7091064453125, 12.0703125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 7.0, 14.0, 22.0, 27.0, 44.0, 51.0, 117.0, 160.0, 320.0, 520.0, 1123.0, 2581.0, 7087.0, 24092.0, 100715.0, 666013.0, 2838782.0, 448648.0, 75176.0, 18740.0, 5919.0, 2118.0, 919.0, 427.0, 224.0, 136.0, 98.0, 50.0, 36.0, 27.0, 20.0, 15.0, 7.0, 7.0, 5.0, 6.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.203125, -17.62353515625, -17.0439453125, -16.46435546875, -15.884765625, -15.30517578125, -14.7255859375, -14.14599609375, -13.56640625, -12.98681640625, -12.4072265625, -11.82763671875, -11.248046875, -10.66845703125, -10.0888671875, -9.50927734375, -8.9296875, -8.35009765625, -7.7705078125, -7.19091796875, -6.611328125, -6.03173828125, -5.4521484375, -4.87255859375, -4.29296875, -3.71337890625, -3.1337890625, -2.55419921875, -1.974609375, -1.39501953125, -0.8154296875, -0.23583984375, 0.34375, 0.92333984375, 1.5029296875, 2.08251953125, 2.662109375, 3.24169921875, 3.8212890625, 4.40087890625, 4.98046875, 5.56005859375, 6.1396484375, 6.71923828125, 7.298828125, 7.87841796875, 8.4580078125, 9.03759765625, 9.6171875, 10.19677734375, 10.7763671875, 11.35595703125, 11.935546875, 12.51513671875, 13.0947265625, 13.67431640625, 14.25390625, 14.83349609375, 15.4130859375, 15.99267578125, 16.572265625, 17.15185546875, 17.7314453125, 18.31103515625, 18.890625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 13.0, 33.0, 55.0, 76.0, 105.0, 117.0, 138.0, 141.0, 109.0, 82.0, 54.0, 28.0, 31.0, 10.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.2820816040039, -90.87358856201172, -88.46509552001953, -86.05660247802734, -83.64810943603516, -81.23961639404297, -78.83112335205078, -76.42263793945312, -74.01414489746094, -71.60565185546875, -69.19715881347656, -66.78866577148438, -64.38017272949219, -61.9716796875, -59.56319046020508, -57.15469741821289, -54.74620056152344, -52.33770751953125, -49.92921447753906, -47.520721435546875, -45.11222839355469, -42.7037353515625, -40.29524612426758, -37.88675308227539, -35.4782600402832, -33.069766998291016, -30.661273956298828, -28.252782821655273, -25.844289779663086, -23.4357967376709, -21.027305603027344, -18.618812561035156, -16.21031951904297, -13.801826477050781, -11.39333438873291, -8.984842300415039, -6.576349258422852, -4.167856216430664, -1.759364128112793, 0.6491279602050781, 3.0576210021972656, 5.466113567352295, 7.874606132507324, 10.283098220825195, 12.691591262817383, 15.10008430480957, 17.508575439453125, 19.917068481445312, 22.3255615234375, 24.734054565429688, 27.142547607421875, 29.55103874206543, 31.959531784057617, 34.36802673339844, 36.77651596069336, 39.18500900268555, 41.593502044677734, 44.00199508666992, 46.41048812866211, 48.8189811706543, 51.22747039794922, 53.635963439941406, 56.044456481933594, 58.45294952392578, 60.86144256591797]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 8.0, 7.0, 3.0, 13.0, 18.0, 20.0, 22.0, 16.0, 26.0, 26.0, 28.0, 28.0, 42.0, 35.0, 43.0, 48.0, 43.0, 48.0, 35.0, 33.0, 41.0, 50.0, 37.0, 42.0, 48.0, 30.0, 30.0, 30.0, 24.0, 28.0, 17.0, 18.0, 13.0, 13.0, 8.0, 8.0, 2.0, 4.0, 0.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.360870361328125, -34.18288803100586, -33.004905700683594, -31.826923370361328, -30.648941040039062, -29.470958709716797, -28.29297637939453, -27.114994049072266, -25.93701171875, -24.759029388427734, -23.58104705810547, -22.403064727783203, -21.225082397460938, -20.047100067138672, -18.869117736816406, -17.69113540649414, -16.513151168823242, -15.335168838500977, -14.157186508178711, -12.979204177856445, -11.80122184753418, -10.623239517211914, -9.445256233215332, -8.267273902893066, -7.089291572570801, -5.911309242248535, -4.7333269119262695, -3.5553441047668457, -2.37736177444458, -1.1993794441223145, -0.021396636962890625, 1.156585693359375, 2.3345680236816406, 3.5125503540039062, 4.690532684326172, 5.868515491485596, 7.046497821807861, 8.224479675292969, 9.40246295928955, 10.580445289611816, 11.758427619934082, 12.936409950256348, 14.114392280578613, 15.292375564575195, 16.47035789489746, 17.648340225219727, 18.826322555541992, 20.004304885864258, 21.182287216186523, 22.36026954650879, 23.538251876831055, 24.71623420715332, 25.894216537475586, 27.07219886779785, 28.25018310546875, 29.428165435791016, 30.60614776611328, 31.784130096435547, 32.96211242675781, 34.14009475708008, 35.318077087402344, 36.49605941772461, 37.674041748046875, 38.85202407836914, 40.030006408691406]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 7.0, 2.0, 5.0, 8.0, 8.0, 12.0, 14.0, 16.0, 20.0, 17.0, 8.0, 25.0, 31.0, 24.0, 45.0, 34.0, 35.0, 39.0, 50.0, 41.0, 44.0, 40.0, 36.0, 38.0, 30.0, 38.0, 31.0, 43.0, 39.0, 34.0, 29.0, 22.0, 27.0, 21.0, 13.0, 15.0, 8.0, 12.0, 12.0, 3.0, 6.0, 6.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.1328125, -3.99810791015625, -3.8634033203125, -3.72869873046875, -3.593994140625, -3.45928955078125, -3.3245849609375, -3.18988037109375, -3.05517578125, -2.92047119140625, -2.7857666015625, -2.65106201171875, -2.516357421875, -2.38165283203125, -2.2469482421875, -2.11224365234375, -1.9775390625, -1.84283447265625, -1.7081298828125, -1.57342529296875, -1.438720703125, -1.30401611328125, -1.1693115234375, -1.03460693359375, -0.89990234375, -0.76519775390625, -0.6304931640625, -0.49578857421875, -0.361083984375, -0.22637939453125, -0.0916748046875, 0.04302978515625, 0.177734375, 0.31243896484375, 0.4471435546875, 0.58184814453125, 0.716552734375, 0.85125732421875, 0.9859619140625, 1.12066650390625, 1.25537109375, 1.39007568359375, 1.5247802734375, 1.65948486328125, 1.794189453125, 1.92889404296875, 2.0635986328125, 2.19830322265625, 2.3330078125, 2.46771240234375, 2.6024169921875, 2.73712158203125, 2.871826171875, 3.00653076171875, 3.1412353515625, 3.27593994140625, 3.41064453125, 3.54534912109375, 3.6800537109375, 3.81475830078125, 3.949462890625, 4.08416748046875, 4.2188720703125, 4.35357666015625, 4.48828125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 8.0, 3.0, 5.0, 9.0, 12.0, 27.0, 41.0, 52.0, 65.0, 115.0, 178.0, 236.0, 375.0, 532.0, 792.0, 1148.0, 1822.0, 2615.0, 4046.0, 6065.0, 9212.0, 14058.0, 22074.0, 35308.0, 58223.0, 102685.0, 215080.0, 265091.0, 126167.0, 68766.0, 41086.0, 25384.0, 16153.0, 10570.0, 6864.0, 4494.0, 3049.0, 2003.0, 1438.0, 845.0, 624.0, 414.0, 285.0, 194.0, 128.0, 73.0, 54.0, 43.0, 18.0, 10.0, 11.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1529541015625, -0.14804458618164062, -0.14313507080078125, -0.13822555541992188, -0.1333160400390625, -0.12840652465820312, -0.12349700927734375, -0.11858749389648438, -0.113677978515625, -0.10876846313476562, -0.10385894775390625, -0.09894943237304688, -0.0940399169921875, -0.08913040161132812, -0.08422088623046875, -0.07931137084960938, -0.07440185546875, -0.06949234008789062, -0.06458282470703125, -0.059673309326171875, -0.0547637939453125, -0.049854278564453125, -0.04494476318359375, -0.040035247802734375, -0.035125732421875, -0.030216217041015625, -0.02530670166015625, -0.020397186279296875, -0.0154876708984375, -0.010578155517578125, -0.00566864013671875, -0.000759124755859375, 0.004150390625, 0.009059906005859375, 0.01396942138671875, 0.018878936767578125, 0.0237884521484375, 0.028697967529296875, 0.03360748291015625, 0.038516998291015625, 0.043426513671875, 0.048336029052734375, 0.05324554443359375, 0.058155059814453125, 0.0630645751953125, 0.06797409057617188, 0.07288360595703125, 0.07779312133789062, 0.08270263671875, 0.08761215209960938, 0.09252166748046875, 0.09743118286132812, 0.1023406982421875, 0.10725021362304688, 0.11215972900390625, 0.11706924438476562, 0.121978759765625, 0.12688827514648438, 0.13179779052734375, 0.13670730590820312, 0.1416168212890625, 0.14652633666992188, 0.15143585205078125, 0.15634536743164062, 0.1612548828125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 4.0, 4.0, 8.0, 13.0, 11.0, 7.0, 11.0, 18.0, 21.0, 31.0, 21.0, 31.0, 27.0, 28.0, 43.0, 32.0, 32.0, 39.0, 46.0, 41.0, 1074.0, 47.0, 46.0, 41.0, 29.0, 28.0, 33.0, 32.0, 23.0, 18.0, 19.0, 22.0, 25.0, 19.0, 14.0, 17.0, 11.0, 16.0, 8.0, 6.0, 7.0, 6.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.26953125, -3.1728515625, -3.076171875, -2.9794921875, -2.8828125, -2.7861328125, -2.689453125, -2.5927734375, -2.49609375, -2.3994140625, -2.302734375, -2.2060546875, -2.109375, -2.0126953125, -1.916015625, -1.8193359375, -1.72265625, -1.6259765625, -1.529296875, -1.4326171875, -1.3359375, -1.2392578125, -1.142578125, -1.0458984375, -0.94921875, -0.8525390625, -0.755859375, -0.6591796875, -0.5625, -0.4658203125, -0.369140625, -0.2724609375, -0.17578125, -0.0791015625, 0.017578125, 0.1142578125, 0.2109375, 0.3076171875, 0.404296875, 0.5009765625, 0.59765625, 0.6943359375, 0.791015625, 0.8876953125, 0.984375, 1.0810546875, 1.177734375, 1.2744140625, 1.37109375, 1.4677734375, 1.564453125, 1.6611328125, 1.7578125, 1.8544921875, 1.951171875, 2.0478515625, 2.14453125, 2.2412109375, 2.337890625, 2.4345703125, 2.53125, 2.6279296875, 2.724609375, 2.8212890625, 2.91796875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 13.0, 19.0, 14.0, 35.0, 44.0, 81.0, 109.0, 174.0, 263.0, 397.0, 627.0, 926.0, 1522.0, 2323.0, 3760.0, 5891.0, 9434.0, 15717.0, 25457.0, 42636.0, 74903.0, 156719.0, 1376636.0, 180505.0, 81371.0, 45960.0, 27277.0, 16879.0, 10220.0, 6358.0, 3902.0, 2515.0, 1568.0, 1018.0, 635.0, 430.0, 259.0, 189.0, 113.0, 80.0, 50.0, 36.0, 28.0, 11.0, 11.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11602783203125, -0.11246585845947266, -0.10890388488769531, -0.10534191131591797, -0.10177993774414062, -0.09821796417236328, -0.09465599060058594, -0.0910940170288086, -0.08753204345703125, -0.0839700698852539, -0.08040809631347656, -0.07684612274169922, -0.07328414916992188, -0.06972217559814453, -0.06616020202636719, -0.06259822845458984, -0.0590362548828125, -0.055474281311035156, -0.05191230773925781, -0.04835033416748047, -0.044788360595703125, -0.04122638702392578, -0.03766441345214844, -0.034102439880371094, -0.03054046630859375, -0.026978492736816406, -0.023416519165039062, -0.01985454559326172, -0.016292572021484375, -0.012730598449707031, -0.009168624877929688, -0.005606651306152344, -0.002044677734375, 0.0015172958374023438, 0.0050792694091796875, 0.008641242980957031, 0.012203216552734375, 0.01576519012451172, 0.019327163696289062, 0.022889137268066406, 0.02645111083984375, 0.030013084411621094, 0.03357505798339844, 0.03713703155517578, 0.040699005126953125, 0.04426097869873047, 0.04782295227050781, 0.051384925842285156, 0.0549468994140625, 0.058508872985839844, 0.06207084655761719, 0.06563282012939453, 0.06919479370117188, 0.07275676727294922, 0.07631874084472656, 0.0798807144165039, 0.08344268798828125, 0.0870046615600586, 0.09056663513183594, 0.09412860870361328, 0.09769058227539062, 0.10125255584716797, 0.10481452941894531, 0.10837650299072266, 0.1119384765625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 5.0, 6.0, 5.0, 2.0, 6.0, 3.0, 9.0, 12.0, 11.0, 21.0, 20.0, 24.0, 26.0, 31.0, 33.0, 42.0, 39.0, 45.0, 36.0, 33.0, 44.0, 51.0, 50.0, 38.0, 43.0, 42.0, 36.0, 42.0, 43.0, 30.0, 22.0, 26.0, 17.0, 15.0, 13.0, 15.0, 14.0, 9.0, 5.0, 5.0, 8.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0], "bins": [-4.792213439941406e-05, -4.655681550502777e-05, -4.519149661064148e-05, -4.382617771625519e-05, -4.2460858821868896e-05, -4.1095539927482605e-05, -3.9730221033096313e-05, -3.836490213871002e-05, -3.699958324432373e-05, -3.563426434993744e-05, -3.426894545555115e-05, -3.2903626561164856e-05, -3.1538307666778564e-05, -3.0172988772392273e-05, -2.880766987800598e-05, -2.744235098361969e-05, -2.60770320892334e-05, -2.4711713194847107e-05, -2.3346394300460815e-05, -2.1981075406074524e-05, -2.0615756511688232e-05, -1.925043761730194e-05, -1.788511872291565e-05, -1.6519799828529358e-05, -1.5154480934143066e-05, -1.3789162039756775e-05, -1.2423843145370483e-05, -1.1058524250984192e-05, -9.6932053565979e-06, -8.327886462211609e-06, -6.962567567825317e-06, -5.597248673439026e-06, -4.231929779052734e-06, -2.866610884666443e-06, -1.5012919902801514e-06, -1.3597309589385986e-07, 1.2293457984924316e-06, 2.594664692878723e-06, 3.959983587265015e-06, 5.325302481651306e-06, 6.690621376037598e-06, 8.05594027042389e-06, 9.42125916481018e-06, 1.0786578059196472e-05, 1.2151896953582764e-05, 1.3517215847969055e-05, 1.4882534742355347e-05, 1.6247853636741638e-05, 1.761317253112793e-05, 1.897849142551422e-05, 2.0343810319900513e-05, 2.1709129214286804e-05, 2.3074448108673096e-05, 2.4439767003059387e-05, 2.580508589744568e-05, 2.717040479183197e-05, 2.8535723686218262e-05, 2.9901042580604553e-05, 3.1266361474990845e-05, 3.2631680369377136e-05, 3.399699926376343e-05, 3.536231815814972e-05, 3.672763705253601e-05, 3.80929559469223e-05, 3.9458274841308594e-05]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 7.0, 6.0, 9.0, 9.0, 9.0, 16.0, 15.0, 16.0, 30.0, 29.0, 38.0, 74.0, 99.0, 144.0, 318.0, 855.0, 7534.0, 224995.0, 764020.0, 46811.0, 2355.0, 494.0, 188.0, 109.0, 88.0, 61.0, 42.0, 39.0, 20.0, 29.0, 12.0, 14.0, 11.0, 10.0, 4.0, 2.0, 9.0, 3.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006771087646484375, -0.0006539821624755859, -0.0006308555603027344, -0.0006077289581298828, -0.0005846023559570312, -0.0005614757537841797, -0.0005383491516113281, -0.0005152225494384766, -0.000492095947265625, -0.00046896934509277344, -0.0004458427429199219, -0.0004227161407470703, -0.00039958953857421875, -0.0003764629364013672, -0.0003533363342285156, -0.00033020973205566406, -0.0003070831298828125, -0.00028395652770996094, -0.0002608299255371094, -0.0002377033233642578, -0.00021457672119140625, -0.0001914501190185547, -0.00016832351684570312, -0.00014519691467285156, -0.0001220703125, -9.894371032714844e-05, -7.581710815429688e-05, -5.269050598144531e-05, -2.956390380859375e-05, -6.4373016357421875e-06, 1.6689300537109375e-05, 3.981590270996094e-05, 6.29425048828125e-05, 8.606910705566406e-05, 0.00010919570922851562, 0.0001323223114013672, 0.00015544891357421875, 0.0001785755157470703, 0.00020170211791992188, 0.00022482872009277344, 0.000247955322265625, 0.00027108192443847656, 0.0002942085266113281, 0.0003173351287841797, 0.00034046173095703125, 0.0003635883331298828, 0.0003867149353027344, 0.00040984153747558594, 0.0004329681396484375, 0.00045609474182128906, 0.0004792213439941406, 0.0005023479461669922, 0.0005254745483398438, 0.0005486011505126953, 0.0005717277526855469, 0.0005948543548583984, 0.00061798095703125, 0.0006411075592041016, 0.0006642341613769531, 0.0006873607635498047, 0.0007104873657226562, 0.0007336139678955078, 0.0007567405700683594, 0.0007798671722412109, 0.0008029937744140625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [5.0, 78.0, 478.0, 399.0, 54.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.225445470889099e-05, -2.1058283891761675e-05, -9.862113074632362e-06, 1.3340577424969524e-06, 1.2530228559626266e-05, 2.372639937675558e-05, 3.4922570193884894e-05, 4.611874101101421e-05, 5.731491182814352e-05, 6.851108628325164e-05, 7.970725710038096e-05, 9.090342791751027e-05, 0.00010209959873463959, 0.0001132957695517689, 0.0001244919403688982, 0.00013568811118602753, 0.00014688428200315684, 0.00015808045282028615, 0.00016927662363741547, 0.00018047279445454478, 0.0001916689652716741, 0.0002028651360888034, 0.00021406130690593272, 0.00022525747772306204, 0.00023645364854019135, 0.00024764981935732067, 0.00025884597562253475, 0.0002700421609915793, 0.00028123834636062384, 0.0002924345026258379, 0.000303630658891052, 0.00031482684426009655, 0.0003260230296291411, 0.00033721921499818563, 0.0003484153712633997, 0.0003596115275286138, 0.00037080771289765835, 0.0003820038982667029, 0.000393200054531917, 0.00040439621079713106, 0.0004155923961661756, 0.00042678858153522015, 0.00043798473780043423, 0.0004491808940656483, 0.00046037707943469286, 0.0004715732648037374, 0.0004827694210689515, 0.0004939655773341656, 0.0005051617627032101, 0.0005163579480722547, 0.0005275540752336383, 0.0005387502606026828, 0.0005499464459717274, 0.0005611426313407719, 0.0005723388167098165, 0.0005835349438712001, 0.0005947311292402446, 0.0006059273146092892, 0.0006171234417706728, 0.0006283196271397173, 0.0006395158125087619, 0.0006507119978778064, 0.000661908183246851, 0.0006731043104082346, 0.0006843004957772791]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 6.0, 10.0, 10.0, 21.0, 13.0, 18.0, 19.0, 18.0, 36.0, 22.0, 29.0, 31.0, 37.0, 32.0, 46.0, 49.0, 32.0, 46.0, 45.0, 55.0, 37.0, 44.0, 32.0, 44.0, 37.0, 32.0, 39.0, 25.0, 23.0, 19.0, 21.0, 13.0, 8.0, 7.0, 6.0, 8.0, 7.0, 5.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.921985626220703e-05, -3.806035965681076e-05, -3.690086305141449e-05, -3.574136644601822e-05, -3.458186984062195e-05, -3.342237323522568e-05, -3.226287662982941e-05, -3.1103380024433136e-05, -2.9943883419036865e-05, -2.8784386813640594e-05, -2.7624890208244324e-05, -2.6465393602848053e-05, -2.5305896997451782e-05, -2.414640039205551e-05, -2.298690378665924e-05, -2.182740718126297e-05, -2.06679105758667e-05, -1.950841397047043e-05, -1.8348917365074158e-05, -1.7189420759677887e-05, -1.6029924154281616e-05, -1.4870427548885345e-05, -1.3710930943489075e-05, -1.2551434338092804e-05, -1.1391937732696533e-05, -1.0232441127300262e-05, -9.072944521903992e-06, -7.913447916507721e-06, -6.75395131111145e-06, -5.5944547057151794e-06, -4.434958100318909e-06, -3.275461494922638e-06, -2.115964889526367e-06, -9.564682841300964e-07, 2.0302832126617432e-07, 1.362524926662445e-06, 2.522021532058716e-06, 3.6815181374549866e-06, 4.841014742851257e-06, 6.000511348247528e-06, 7.160007953643799e-06, 8.31950455904007e-06, 9.47900116443634e-06, 1.0638497769832611e-05, 1.1797994375228882e-05, 1.2957490980625153e-05, 1.4116987586021423e-05, 1.5276484191417694e-05, 1.6435980796813965e-05, 1.7595477402210236e-05, 1.8754974007606506e-05, 1.9914470613002777e-05, 2.1073967218399048e-05, 2.223346382379532e-05, 2.339296042919159e-05, 2.455245703458786e-05, 2.571195363998413e-05, 2.68714502453804e-05, 2.8030946850776672e-05, 2.9190443456172943e-05, 3.0349940061569214e-05, 3.1509436666965485e-05, 3.2668933272361755e-05, 3.3828429877758026e-05, 3.49879264831543e-05]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 7.0, 2.0, 5.0, 8.0, 8.0, 12.0, 14.0, 16.0, 20.0, 17.0, 8.0, 25.0, 31.0, 24.0, 45.0, 34.0, 35.0, 39.0, 50.0, 41.0, 44.0, 40.0, 36.0, 38.0, 30.0, 38.0, 31.0, 43.0, 39.0, 34.0, 29.0, 22.0, 27.0, 21.0, 13.0, 15.0, 8.0, 12.0, 12.0, 3.0, 6.0, 6.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.1328125, -3.99810791015625, -3.8634033203125, -3.72869873046875, -3.593994140625, -3.45928955078125, -3.3245849609375, -3.18988037109375, -3.05517578125, -2.92047119140625, -2.7857666015625, -2.65106201171875, -2.516357421875, -2.38165283203125, -2.2469482421875, -2.11224365234375, -1.9775390625, -1.84283447265625, -1.7081298828125, -1.57342529296875, -1.438720703125, -1.30401611328125, -1.1693115234375, -1.03460693359375, -0.89990234375, -0.76519775390625, -0.6304931640625, -0.49578857421875, -0.361083984375, -0.22637939453125, -0.0916748046875, 0.04302978515625, 0.177734375, 0.31243896484375, 0.4471435546875, 0.58184814453125, 0.716552734375, 0.85125732421875, 0.9859619140625, 1.12066650390625, 1.25537109375, 1.39007568359375, 1.5247802734375, 1.65948486328125, 1.794189453125, 1.92889404296875, 2.0635986328125, 2.19830322265625, 2.3330078125, 2.46771240234375, 2.6024169921875, 2.73712158203125, 2.871826171875, 3.00653076171875, 3.1412353515625, 3.27593994140625, 3.41064453125, 3.54534912109375, 3.6800537109375, 3.81475830078125, 3.949462890625, 4.08416748046875, 4.2188720703125, 4.35357666015625, 4.48828125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 8.0, 9.0, 7.0, 9.0, 21.0, 16.0, 28.0, 39.0, 45.0, 74.0, 113.0, 138.0, 256.0, 371.0, 593.0, 997.0, 1845.0, 4023.0, 11298.0, 43249.0, 293803.0, 585789.0, 77136.0, 17357.0, 5588.0, 2439.0, 1230.0, 712.0, 452.0, 269.0, 181.0, 114.0, 86.0, 75.0, 42.0, 31.0, 21.0, 17.0, 9.0, 11.0, 6.0, 10.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.7578125, -9.4344482421875, -9.111083984375, -8.7877197265625, -8.46435546875, -8.1409912109375, -7.817626953125, -7.4942626953125, -7.1708984375, -6.8475341796875, -6.524169921875, -6.2008056640625, -5.87744140625, -5.5540771484375, -5.230712890625, -4.9073486328125, -4.583984375, -4.2606201171875, -3.937255859375, -3.6138916015625, -3.29052734375, -2.9671630859375, -2.643798828125, -2.3204345703125, -1.9970703125, -1.6737060546875, -1.350341796875, -1.0269775390625, -0.70361328125, -0.3802490234375, -0.056884765625, 0.2664794921875, 0.58984375, 0.9132080078125, 1.236572265625, 1.5599365234375, 1.88330078125, 2.2066650390625, 2.530029296875, 2.8533935546875, 3.1767578125, 3.5001220703125, 3.823486328125, 4.1468505859375, 4.47021484375, 4.7935791015625, 5.116943359375, 5.4403076171875, 5.763671875, 6.0870361328125, 6.410400390625, 6.7337646484375, 7.05712890625, 7.3804931640625, 7.703857421875, 8.0272216796875, 8.3505859375, 8.6739501953125, 8.997314453125, 9.3206787109375, 9.64404296875, 9.9674072265625, 10.290771484375, 10.6141357421875, 10.9375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 9.0, 11.0, 9.0, 9.0, 18.0, 16.0, 22.0, 23.0, 24.0, 34.0, 40.0, 34.0, 49.0, 65.0, 78.0, 109.0, 253.0, 1507.0, 171.0, 103.0, 73.0, 57.0, 44.0, 42.0, 36.0, 27.0, 34.0, 29.0, 15.0, 17.0, 10.0, 8.0, 9.0, 11.0, 11.0, 7.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.15625, -16.609375, -16.0625, -15.515625, -14.96875, -14.421875, -13.875, -13.328125, -12.78125, -12.234375, -11.6875, -11.140625, -10.59375, -10.046875, -9.5, -8.953125, -8.40625, -7.859375, -7.3125, -6.765625, -6.21875, -5.671875, -5.125, -4.578125, -4.03125, -3.484375, -2.9375, -2.390625, -1.84375, -1.296875, -0.75, -0.203125, 0.34375, 0.890625, 1.4375, 1.984375, 2.53125, 3.078125, 3.625, 4.171875, 4.71875, 5.265625, 5.8125, 6.359375, 6.90625, 7.453125, 8.0, 8.546875, 9.09375, 9.640625, 10.1875, 10.734375, 11.28125, 11.828125, 12.375, 12.921875, 13.46875, 14.015625, 14.5625, 15.109375, 15.65625, 16.203125, 16.75, 17.296875, 17.84375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 8.0, 13.0, 10.0, 10.0, 11.0, 16.0, 25.0, 55.0, 37.0, 56.0, 73.0, 86.0, 128.0, 230.0, 432.0, 1107.0, 3471.0, 23261.0, 739463.0, 2332194.0, 37968.0, 4522.0, 1205.0, 484.0, 257.0, 130.0, 110.0, 84.0, 55.0, 43.0, 30.0, 23.0, 16.0, 18.0, 17.0, 15.0, 7.0, 7.0, 3.0, 5.0, 2.0, 0.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-32.53125, -31.517578125, -30.50390625, -29.490234375, -28.4765625, -27.462890625, -26.44921875, -25.435546875, -24.421875, -23.408203125, -22.39453125, -21.380859375, -20.3671875, -19.353515625, -18.33984375, -17.326171875, -16.3125, -15.298828125, -14.28515625, -13.271484375, -12.2578125, -11.244140625, -10.23046875, -9.216796875, -8.203125, -7.189453125, -6.17578125, -5.162109375, -4.1484375, -3.134765625, -2.12109375, -1.107421875, -0.09375, 0.919921875, 1.93359375, 2.947265625, 3.9609375, 4.974609375, 5.98828125, 7.001953125, 8.015625, 9.029296875, 10.04296875, 11.056640625, 12.0703125, 13.083984375, 14.09765625, 15.111328125, 16.125, 17.138671875, 18.15234375, 19.166015625, 20.1796875, 21.193359375, 22.20703125, 23.220703125, 24.234375, 25.248046875, 26.26171875, 27.275390625, 28.2890625, 29.302734375, 30.31640625, 31.330078125, 32.34375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [10.0, 522.0, 479.0, 8.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.799762725830078, -10.760702133178711, 0.27835845947265625, 11.31741714477539, 22.35647964477539, 33.39554214477539, 44.43459701538086, 55.47365951538086, 66.51272583007812, 77.55178833007812, 88.59085083007812, 99.6299057006836, 110.6689682006836, 121.7080307006836, 132.74708557128906, 143.78614807128906, 154.82521057128906, 165.86427307128906, 176.90333557128906, 187.9423828125, 198.9814453125, 210.0205078125, 221.0595703125, 232.0986328125, 243.1376953125, 254.1767578125, 265.2158203125, 276.2548828125, 287.2939453125, 298.3330078125, 309.3720703125, 320.4111328125, 331.4501953125, 342.4892578125, 353.5283203125, 364.5673828125, 375.6064453125, 386.6455078125, 397.6845703125, 408.7236328125, 419.7626953125, 430.8017578125, 441.8408203125, 452.8798828125, 463.9189453125, 474.9580078125, 485.9970703125, 497.0361328125, 508.0751647949219, 519.1141967773438, 530.1532592773438, 541.1923217773438, 552.2313842773438, 563.2704467773438, 574.3095092773438, 585.3485717773438, 596.3876342773438, 607.4266967773438, 618.4657592773438, 629.5048217773438, 640.5438842773438, 651.5829467773438, 662.6220092773438, 673.6610717773438, 684.7001342773438]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 4.0, 2.0, 18.0, 9.0, 14.0, 11.0, 17.0, 18.0, 32.0, 28.0, 18.0, 21.0, 35.0, 27.0, 39.0, 33.0, 37.0, 44.0, 50.0, 30.0, 56.0, 52.0, 41.0, 32.0, 33.0, 36.0, 31.0, 30.0, 27.0, 26.0, 25.0, 18.0, 20.0, 13.0, 10.0, 17.0, 8.0, 6.0, 3.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-47.15910339355469, -45.7601318359375, -44.36116409301758, -42.96219253540039, -41.56322479248047, -40.16425323486328, -38.765281677246094, -37.36631393432617, -35.967342376708984, -34.5683708190918, -33.169403076171875, -31.770431518554688, -30.371461868286133, -28.972492218017578, -27.573522567749023, -26.17455291748047, -24.775583267211914, -23.37661361694336, -21.977643966674805, -20.57867431640625, -19.179702758789062, -17.780733108520508, -16.381763458251953, -14.982792854309082, -13.583823204040527, -12.184853553771973, -10.785882949829102, -9.386913299560547, -7.987943172454834, -6.588973045349121, -5.190003395080566, -3.7910327911376953, -2.3920631408691406, -0.9930931329727173, 0.40587687492370605, 1.8048467636108398, 3.2038168907165527, 4.602787017822266, 6.00175666809082, 7.400727272033691, 8.799696922302246, 10.1986665725708, 11.597637176513672, 12.996606826782227, 14.395576477050781, 15.794547080993652, 17.19351577758789, 18.592487335205078, 19.991456985473633, 21.390426635742188, 22.789396286010742, 24.188365936279297, 25.587337493896484, 26.98630714416504, 28.385276794433594, 29.78424835205078, 31.183216094970703, 32.58218765258789, 33.98115539550781, 35.380126953125, 36.77909469604492, 38.17806625366211, 39.57703399658203, 40.97600555419922, 42.374977111816406]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 7.0, 13.0, 10.0, 15.0, 13.0, 14.0, 24.0, 20.0, 17.0, 31.0, 25.0, 44.0, 35.0, 46.0, 52.0, 32.0, 44.0, 49.0, 39.0, 44.0, 42.0, 39.0, 31.0, 27.0, 44.0, 33.0, 37.0, 31.0, 27.0, 20.0, 19.0, 13.0, 14.0, 9.0, 6.0, 8.0, 7.0, 5.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.48828125, -4.340576171875, -4.19287109375, -4.045166015625, -3.8974609375, -3.749755859375, -3.60205078125, -3.454345703125, -3.306640625, -3.158935546875, -3.01123046875, -2.863525390625, -2.7158203125, -2.568115234375, -2.42041015625, -2.272705078125, -2.125, -1.977294921875, -1.82958984375, -1.681884765625, -1.5341796875, -1.386474609375, -1.23876953125, -1.091064453125, -0.943359375, -0.795654296875, -0.64794921875, -0.500244140625, -0.3525390625, -0.204833984375, -0.05712890625, 0.090576171875, 0.23828125, 0.385986328125, 0.53369140625, 0.681396484375, 0.8291015625, 0.976806640625, 1.12451171875, 1.272216796875, 1.419921875, 1.567626953125, 1.71533203125, 1.863037109375, 2.0107421875, 2.158447265625, 2.30615234375, 2.453857421875, 2.6015625, 2.749267578125, 2.89697265625, 3.044677734375, 3.1923828125, 3.340087890625, 3.48779296875, 3.635498046875, 3.783203125, 3.930908203125, 4.07861328125, 4.226318359375, 4.3740234375, 4.521728515625, 4.66943359375, 4.817138671875, 4.96484375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 5.0, 7.0, 6.0, 11.0, 23.0, 31.0, 34.0, 60.0, 63.0, 91.0, 137.0, 219.0, 363.0, 606.0, 1094.0, 2424.0, 6665.0, 24079.0, 136408.0, 1989108.0, 1869003.0, 128940.0, 23221.0, 6465.0, 2351.0, 1148.0, 610.0, 352.0, 235.0, 147.0, 120.0, 64.0, 53.0, 46.0, 17.0, 18.0, 17.0, 11.0, 3.0, 4.0, 6.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0], "bins": [-16.5, -16.0145263671875, -15.529052734375, -15.0435791015625, -14.55810546875, -14.0726318359375, -13.587158203125, -13.1016845703125, -12.6162109375, -12.1307373046875, -11.645263671875, -11.1597900390625, -10.67431640625, -10.1888427734375, -9.703369140625, -9.2178955078125, -8.732421875, -8.2469482421875, -7.761474609375, -7.2760009765625, -6.79052734375, -6.3050537109375, -5.819580078125, -5.3341064453125, -4.8486328125, -4.3631591796875, -3.877685546875, -3.3922119140625, -2.90673828125, -2.4212646484375, -1.935791015625, -1.4503173828125, -0.96484375, -0.4793701171875, 0.006103515625, 0.4915771484375, 0.97705078125, 1.4625244140625, 1.947998046875, 2.4334716796875, 2.9189453125, 3.4044189453125, 3.889892578125, 4.3753662109375, 4.86083984375, 5.3463134765625, 5.831787109375, 6.3172607421875, 6.802734375, 7.2882080078125, 7.773681640625, 8.2591552734375, 8.74462890625, 9.2301025390625, 9.715576171875, 10.2010498046875, 10.6865234375, 11.1719970703125, 11.657470703125, 12.1429443359375, 12.62841796875, 13.1138916015625, 13.599365234375, 14.0848388671875, 14.5703125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 6.0, 3.0, 10.0, 9.0, 18.0, 21.0, 42.0, 70.0, 97.0, 137.0, 227.0, 374.0, 641.0, 801.0, 568.0, 347.0, 238.0, 138.0, 110.0, 66.0, 47.0, 21.0, 26.0, 15.0, 10.0, 7.0, 6.0, 5.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.140625, -11.7138671875, -11.287109375, -10.8603515625, -10.43359375, -10.0068359375, -9.580078125, -9.1533203125, -8.7265625, -8.2998046875, -7.873046875, -7.4462890625, -7.01953125, -6.5927734375, -6.166015625, -5.7392578125, -5.3125, -4.8857421875, -4.458984375, -4.0322265625, -3.60546875, -3.1787109375, -2.751953125, -2.3251953125, -1.8984375, -1.4716796875, -1.044921875, -0.6181640625, -0.19140625, 0.2353515625, 0.662109375, 1.0888671875, 1.515625, 1.9423828125, 2.369140625, 2.7958984375, 3.22265625, 3.6494140625, 4.076171875, 4.5029296875, 4.9296875, 5.3564453125, 5.783203125, 6.2099609375, 6.63671875, 7.0634765625, 7.490234375, 7.9169921875, 8.34375, 8.7705078125, 9.197265625, 9.6240234375, 10.05078125, 10.4775390625, 10.904296875, 11.3310546875, 11.7578125, 12.1845703125, 12.611328125, 13.0380859375, 13.46484375, 13.8916015625, 14.318359375, 14.7451171875, 15.171875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 11.0, 6.0, 8.0, 7.0, 20.0, 39.0, 54.0, 104.0, 189.0, 391.0, 881.0, 2298.0, 8391.0, 52721.0, 862710.0, 3095471.0, 148267.0, 16667.0, 3736.0, 1275.0, 526.0, 241.0, 112.0, 61.0, 29.0, 22.0, 17.0, 5.0, 7.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.84375, -33.931884765625, -33.02001953125, -32.108154296875, -31.1962890625, -30.284423828125, -29.37255859375, -28.460693359375, -27.548828125, -26.636962890625, -25.72509765625, -24.813232421875, -23.9013671875, -22.989501953125, -22.07763671875, -21.165771484375, -20.25390625, -19.342041015625, -18.43017578125, -17.518310546875, -16.6064453125, -15.694580078125, -14.78271484375, -13.870849609375, -12.958984375, -12.047119140625, -11.13525390625, -10.223388671875, -9.3115234375, -8.399658203125, -7.48779296875, -6.575927734375, -5.6640625, -4.752197265625, -3.84033203125, -2.928466796875, -2.0166015625, -1.104736328125, -0.19287109375, 0.718994140625, 1.630859375, 2.542724609375, 3.45458984375, 4.366455078125, 5.2783203125, 6.190185546875, 7.10205078125, 8.013916015625, 8.92578125, 9.837646484375, 10.74951171875, 11.661376953125, 12.5732421875, 13.485107421875, 14.39697265625, 15.308837890625, 16.220703125, 17.132568359375, 18.04443359375, 18.956298828125, 19.8681640625, 20.780029296875, 21.69189453125, 22.603759765625, 23.515625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [2.0, 6.0, 15.0, 18.0, 35.0, 96.0, 130.0, 165.0, 175.0, 130.0, 130.0, 63.0, 33.0, 12.0, 8.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.355392456054688, -24.0870361328125, -20.818679809570312, -17.550325393676758, -14.28196907043457, -11.013612747192383, -7.745258331298828, -4.476902008056641, -1.2085456848144531, 2.059810161590576, 5.3281660079956055, 8.596521377563477, 11.864877700805664, 15.133234024047852, 18.401588439941406, 21.669944763183594, 24.93830108642578, 28.20665740966797, 31.475013732910156, 34.743370056152344, 38.01172637939453, 41.28008270263672, 44.54843521118164, 47.81679153442383, 51.085147857666016, 54.3535041809082, 57.62186050415039, 60.89021301269531, 64.1585693359375, 67.42692565917969, 70.69528198242188, 73.96363830566406, 77.23199462890625, 80.50035095214844, 83.76870727539062, 87.03706359863281, 90.305419921875, 93.57377624511719, 96.84213256835938, 100.11048889160156, 103.37884521484375, 106.64720153808594, 109.91555786132812, 113.18391418457031, 116.4522705078125, 119.72062683105469, 122.98898315429688, 126.25733947753906, 129.52569580078125, 132.79405212402344, 136.06240844726562, 139.3307647705078, 142.59912109375, 145.8674774169922, 149.13583374023438, 152.40419006347656, 155.6725311279297, 158.94088745117188, 162.20924377441406, 165.47760009765625, 168.74595642089844, 172.01431274414062, 175.2826690673828, 178.551025390625, 181.8193817138672]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 5.0, 4.0, 12.0, 7.0, 17.0, 12.0, 6.0, 21.0, 17.0, 27.0, 23.0, 36.0, 36.0, 35.0, 38.0, 48.0, 46.0, 44.0, 48.0, 55.0, 47.0, 37.0, 39.0, 32.0, 39.0, 34.0, 32.0, 32.0, 31.0, 31.0, 24.0, 18.0, 14.0, 13.0, 8.0, 7.0, 8.0, 4.0, 4.0, 2.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-42.333343505859375, -41.19486999511719, -40.056396484375, -38.91792297363281, -37.779449462890625, -36.64097595214844, -35.50250244140625, -34.36403274536133, -33.22555923461914, -32.08708572387695, -30.948612213134766, -29.810138702392578, -28.671667098999023, -27.533193588256836, -26.39472007751465, -25.25624656677246, -24.117773056030273, -22.979299545288086, -21.8408260345459, -20.702354431152344, -19.563880920410156, -18.42540740966797, -17.28693389892578, -16.148460388183594, -15.009987831115723, -13.871514320373535, -12.733041763305664, -11.594568252563477, -10.456094741821289, -9.317622184753418, -8.17914867401123, -7.040675640106201, -5.902202606201172, -4.763729572296143, -3.625256299972534, -2.486783027648926, -1.3483099937438965, -0.2098369598388672, 0.9286365509033203, 2.0671095848083496, 3.205582618713379, 4.344055652618408, 5.4825286865234375, 6.621002197265625, 7.759475231170654, 8.897948265075684, 10.036421775817871, 11.174894332885742, 12.31336784362793, 13.451841354370117, 14.590313911437988, 15.728787422180176, 16.867259979248047, 18.005733489990234, 19.144207000732422, 20.28268051147461, 21.421154022216797, 22.559627532958984, 23.698101043701172, 24.83657455444336, 25.975046157836914, 27.1135196685791, 28.25199317932129, 29.390466690063477, 30.52893829345703]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 13.0, 15.0, 15.0, 24.0, 14.0, 20.0, 27.0, 29.0, 34.0, 44.0, 32.0, 49.0, 39.0, 49.0, 51.0, 49.0, 46.0, 55.0, 44.0, 38.0, 35.0, 37.0, 26.0, 29.0, 28.0, 33.0, 26.0, 19.0, 17.0, 12.0, 11.0, 9.0, 6.0, 4.0, 1.0, 5.0, 4.0, 0.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.28948974609375, -4.1297607421875, -3.97003173828125, -3.810302734375, -3.65057373046875, -3.4908447265625, -3.33111572265625, -3.17138671875, -3.01165771484375, -2.8519287109375, -2.69219970703125, -2.532470703125, -2.37274169921875, -2.2130126953125, -2.05328369140625, -1.8935546875, -1.73382568359375, -1.5740966796875, -1.41436767578125, -1.254638671875, -1.09490966796875, -0.9351806640625, -0.77545166015625, -0.61572265625, -0.45599365234375, -0.2962646484375, -0.13653564453125, 0.023193359375, 0.18292236328125, 0.3426513671875, 0.50238037109375, 0.662109375, 0.82183837890625, 0.9815673828125, 1.14129638671875, 1.301025390625, 1.46075439453125, 1.6204833984375, 1.78021240234375, 1.93994140625, 2.09967041015625, 2.2593994140625, 2.41912841796875, 2.578857421875, 2.73858642578125, 2.8983154296875, 3.05804443359375, 3.2177734375, 3.37750244140625, 3.5372314453125, 3.69696044921875, 3.856689453125, 4.01641845703125, 4.1761474609375, 4.33587646484375, 4.49560546875, 4.65533447265625, 4.8150634765625, 4.97479248046875, 5.134521484375, 5.29425048828125, 5.4539794921875, 5.61370849609375, 5.7734375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 7.0, 10.0, 7.0, 17.0, 24.0, 39.0, 56.0, 84.0, 115.0, 178.0, 234.0, 397.0, 505.0, 821.0, 1313.0, 1983.0, 2945.0, 4402.0, 6827.0, 10695.0, 17071.0, 28016.0, 48060.0, 87986.0, 197711.0, 318661.0, 145463.0, 70661.0, 39941.0, 23580.0, 14344.0, 9179.0, 5884.0, 3860.0, 2431.0, 1668.0, 1127.0, 739.0, 480.0, 330.0, 234.0, 129.0, 102.0, 73.0, 47.0, 37.0, 27.0, 22.0, 7.0, 9.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.179443359375, -0.17371559143066406, -0.16798782348632812, -0.1622600555419922, -0.15653228759765625, -0.1508045196533203, -0.14507675170898438, -0.13934898376464844, -0.1336212158203125, -0.12789344787597656, -0.12216567993164062, -0.11643791198730469, -0.11071014404296875, -0.10498237609863281, -0.09925460815429688, -0.09352684020996094, -0.087799072265625, -0.08207130432128906, -0.07634353637695312, -0.07061576843261719, -0.06488800048828125, -0.05916023254394531, -0.053432464599609375, -0.04770469665527344, -0.0419769287109375, -0.03624916076660156, -0.030521392822265625, -0.024793624877929688, -0.01906585693359375, -0.013338088989257812, -0.007610321044921875, -0.0018825531005859375, 0.00384521484375, 0.009572982788085938, 0.015300750732421875, 0.021028518676757812, 0.02675628662109375, 0.03248405456542969, 0.038211822509765625, 0.04393959045410156, 0.0496673583984375, 0.05539512634277344, 0.061122894287109375, 0.06685066223144531, 0.07257843017578125, 0.07830619812011719, 0.08403396606445312, 0.08976173400878906, 0.095489501953125, 0.10121726989746094, 0.10694503784179688, 0.11267280578613281, 0.11840057373046875, 0.12412834167480469, 0.12985610961914062, 0.13558387756347656, 0.1413116455078125, 0.14703941345214844, 0.15276718139648438, 0.1584949493408203, 0.16422271728515625, 0.1699504852294922, 0.17567825317382812, 0.18140602111816406, 0.1871337890625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 1.0, 12.0, 7.0, 12.0, 14.0, 13.0, 18.0, 14.0, 18.0, 12.0, 30.0, 27.0, 34.0, 40.0, 33.0, 43.0, 44.0, 35.0, 40.0, 57.0, 1066.0, 42.0, 40.0, 43.0, 40.0, 35.0, 34.0, 31.0, 27.0, 27.0, 25.0, 18.0, 18.0, 7.0, 17.0, 15.0, 12.0, 7.0, 6.0, 5.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0], "bins": [-3.8359375, -3.735137939453125, -3.63433837890625, -3.533538818359375, -3.4327392578125, -3.331939697265625, -3.23114013671875, -3.130340576171875, -3.029541015625, -2.928741455078125, -2.82794189453125, -2.727142333984375, -2.6263427734375, -2.525543212890625, -2.42474365234375, -2.323944091796875, -2.22314453125, -2.122344970703125, -2.02154541015625, -1.920745849609375, -1.8199462890625, -1.719146728515625, -1.61834716796875, -1.517547607421875, -1.416748046875, -1.315948486328125, -1.21514892578125, -1.114349365234375, -1.0135498046875, -0.912750244140625, -0.81195068359375, -0.711151123046875, -0.6103515625, -0.509552001953125, -0.40875244140625, -0.307952880859375, -0.2071533203125, -0.106353759765625, -0.00555419921875, 0.095245361328125, 0.196044921875, 0.296844482421875, 0.39764404296875, 0.498443603515625, 0.5992431640625, 0.700042724609375, 0.80084228515625, 0.901641845703125, 1.00244140625, 1.103240966796875, 1.20404052734375, 1.304840087890625, 1.4056396484375, 1.506439208984375, 1.60723876953125, 1.708038330078125, 1.808837890625, 1.909637451171875, 2.01043701171875, 2.111236572265625, 2.2120361328125, 2.312835693359375, 2.41363525390625, 2.514434814453125, 2.615234375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 7.0, 5.0, 13.0, 18.0, 29.0, 48.0, 70.0, 115.0, 201.0, 294.0, 487.0, 881.0, 1402.0, 2270.0, 3889.0, 6312.0, 10522.0, 18061.0, 30635.0, 54454.0, 106646.0, 254652.0, 1341012.0, 121572.0, 61052.0, 33638.0, 19726.0, 11656.0, 6957.0, 4084.0, 2516.0, 1502.0, 932.0, 598.0, 329.0, 208.0, 133.0, 74.0, 47.0, 26.0, 20.0, 11.0, 9.0, 7.0, 3.0, 8.0, 1.0, 2.0, 3.0], "bins": [-0.1365966796875, -0.13291358947753906, -0.12923049926757812, -0.1255474090576172, -0.12186431884765625, -0.11818122863769531, -0.11449813842773438, -0.11081504821777344, -0.1071319580078125, -0.10344886779785156, -0.09976577758789062, -0.09608268737792969, -0.09239959716796875, -0.08871650695800781, -0.08503341674804688, -0.08135032653808594, -0.077667236328125, -0.07398414611816406, -0.07030105590820312, -0.06661796569824219, -0.06293487548828125, -0.05925178527832031, -0.055568695068359375, -0.05188560485839844, -0.0482025146484375, -0.04451942443847656, -0.040836334228515625, -0.03715324401855469, -0.03347015380859375, -0.029787063598632812, -0.026103973388671875, -0.022420883178710938, -0.01873779296875, -0.015054702758789062, -0.011371612548828125, -0.0076885223388671875, -0.00400543212890625, -0.0003223419189453125, 0.003360748291015625, 0.0070438385009765625, 0.0107269287109375, 0.014410018920898438, 0.018093109130859375, 0.021776199340820312, 0.02545928955078125, 0.029142379760742188, 0.032825469970703125, 0.03650856018066406, 0.040191650390625, 0.04387474060058594, 0.047557830810546875, 0.05124092102050781, 0.05492401123046875, 0.05860710144042969, 0.062290191650390625, 0.06597328186035156, 0.0696563720703125, 0.07333946228027344, 0.07702255249023438, 0.08070564270019531, 0.08438873291015625, 0.08807182312011719, 0.09175491333007812, 0.09543800354003906, 0.09912109375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 7.0, 4.0, 4.0, 11.0, 9.0, 19.0, 23.0, 26.0, 27.0, 29.0, 39.0, 33.0, 53.0, 53.0, 67.0, 55.0, 51.0, 66.0, 70.0, 53.0, 43.0, 46.0, 37.0, 31.0, 21.0, 26.0, 18.0, 19.0, 17.0, 7.0, 10.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.817413330078125e-05, -5.6619755923748016e-05, -5.506537854671478e-05, -5.351100116968155e-05, -5.1956623792648315e-05, -5.040224641561508e-05, -4.884786903858185e-05, -4.7293491661548615e-05, -4.573911428451538e-05, -4.418473690748215e-05, -4.2630359530448914e-05, -4.107598215341568e-05, -3.9521604776382446e-05, -3.796722739934921e-05, -3.641285002231598e-05, -3.4858472645282745e-05, -3.330409526824951e-05, -3.174971789121628e-05, -3.0195340514183044e-05, -2.864096313714981e-05, -2.7086585760116577e-05, -2.5532208383083344e-05, -2.397783100605011e-05, -2.2423453629016876e-05, -2.0869076251983643e-05, -1.931469887495041e-05, -1.7760321497917175e-05, -1.620594412088394e-05, -1.4651566743850708e-05, -1.3097189366817474e-05, -1.154281198978424e-05, -9.988434612751007e-06, -8.434057235717773e-06, -6.87967985868454e-06, -5.325302481651306e-06, -3.7709251046180725e-06, -2.216547727584839e-06, -6.621703505516052e-07, 8.922070264816284e-07, 2.446584403514862e-06, 4.000961780548096e-06, 5.555339157581329e-06, 7.109716534614563e-06, 8.664093911647797e-06, 1.021847128868103e-05, 1.1772848665714264e-05, 1.3327226042747498e-05, 1.4881603419780731e-05, 1.6435980796813965e-05, 1.79903581738472e-05, 1.9544735550880432e-05, 2.1099112927913666e-05, 2.26534903049469e-05, 2.4207867681980133e-05, 2.5762245059013367e-05, 2.73166224360466e-05, 2.8870999813079834e-05, 3.0425377190113068e-05, 3.19797545671463e-05, 3.3534131944179535e-05, 3.508850932121277e-05, 3.6642886698246e-05, 3.8197264075279236e-05, 3.975164145231247e-05, 4.13060188293457e-05]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 5.0, 1.0, 5.0, 10.0, 4.0, 8.0, 18.0, 15.0, 19.0, 29.0, 27.0, 35.0, 48.0, 74.0, 135.0, 410.0, 1807.0, 31345.0, 701802.0, 302274.0, 8959.0, 892.0, 252.0, 110.0, 58.0, 43.0, 33.0, 24.0, 41.0, 15.0, 12.0, 7.0, 11.0, 8.0, 5.0, 5.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0007033348083496094, -0.0006780475378036499, -0.0006527602672576904, -0.000627472996711731, -0.0006021857261657715, -0.000576898455619812, -0.0005516111850738525, -0.0005263239145278931, -0.0005010366439819336, -0.0004757493734359741, -0.00045046210289001465, -0.0004251748323440552, -0.0003998875617980957, -0.00037460029125213623, -0.00034931302070617676, -0.0003240257501602173, -0.0002987384796142578, -0.00027345120906829834, -0.00024816393852233887, -0.0002228766679763794, -0.00019758939743041992, -0.00017230212688446045, -0.00014701485633850098, -0.0001217275857925415, -9.644031524658203e-05, -7.115304470062256e-05, -4.5865774154663086e-05, -2.0578503608703613e-05, 4.708766937255859e-06, 2.9996037483215332e-05, 5.5283308029174805e-05, 8.057057857513428e-05, 0.00010585784912109375, 0.00013114511966705322, 0.0001564323902130127, 0.00018171966075897217, 0.00020700693130493164, 0.0002322942018508911, 0.0002575814723968506, 0.00028286874294281006, 0.00030815601348876953, 0.000333443284034729, 0.0003587305545806885, 0.00038401782512664795, 0.0004093050956726074, 0.0004345923662185669, 0.00045987963676452637, 0.00048516690731048584, 0.0005104541778564453, 0.0005357414484024048, 0.0005610287189483643, 0.0005863159894943237, 0.0006116032600402832, 0.0006368905305862427, 0.0006621778011322021, 0.0006874650716781616, 0.0007127523422241211, 0.0007380396127700806, 0.00076332688331604, 0.0007886141538619995, 0.000813901424407959, 0.0008391886949539185, 0.0008644759654998779, 0.0008897632360458374, 0.0009150505065917969]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 10.0, 19.0, 34.0, 88.0, 156.0, 258.0, 233.0, 134.0, 50.0, 16.0, 11.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.847589687211439e-05, -3.4081738704117015e-05, -2.968758053611964e-05, -2.5293424187111668e-05, -2.0899266019114293e-05, -1.6505107851116918e-05, -1.2110951502108946e-05, -7.716793334111571e-06, -3.322635166114196e-06, 1.071522547135828e-06, 5.465680260385852e-06, 9.859837518888526e-06, 1.42539956868859e-05, 1.8648153854883276e-05, 2.3042310203891248e-05, 2.7436468371888623e-05, 3.1830626539886e-05, 3.622478470788337e-05, 4.061894287588075e-05, 4.5013097405899316e-05, 4.94072592118755e-05, 5.3801413741894066e-05, 5.819557190989144e-05, 6.258973007788882e-05, 6.6983891883865e-05, 7.137804641388357e-05, 7.577220821985975e-05, 8.016636274987832e-05, 8.45605245558545e-05, 8.895467908587307e-05, 9.334883361589164e-05, 9.774299542186782e-05, 0.00010213714267592877, 0.00010653129720594734, 0.00011092545901192352, 0.00011531961354194209, 0.00011971377534791827, 0.00012410792987793684, 0.0001285020844079554, 0.00013289623893797398, 0.00013729040801990777, 0.00014168456254992634, 0.0001460787170799449, 0.0001504728861618787, 0.00015486704069189727, 0.00015926119522191584, 0.0001636553497519344, 0.00016804950428195298, 0.00017244365881197155, 0.0001768378133419901, 0.00018123196787200868, 0.00018562613695394248, 0.00019002029148396105, 0.00019441444601397961, 0.00019880860054399818, 0.00020320276962593198, 0.00020759692415595055, 0.00021199107868596911, 0.00021638523321598768, 0.00022077940229792148, 0.00022517355682794005, 0.00022956771135795861, 0.00023396186588797718, 0.00023835603496991098, 0.00024275018949992955]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 6.0, 11.0, 19.0, 17.0, 15.0, 24.0, 23.0, 23.0, 18.0, 29.0, 35.0, 39.0, 28.0, 19.0, 55.0, 48.0, 40.0, 40.0, 51.0, 39.0, 34.0, 26.0, 34.0, 37.0, 30.0, 30.0, 27.0, 26.0, 30.0, 26.0, 12.0, 15.0, 7.0, 13.0, 12.0, 11.0, 9.0, 5.0, 4.0, 1.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5212764739990234e-05, -2.442300319671631e-05, -2.3633241653442383e-05, -2.2843480110168457e-05, -2.205371856689453e-05, -2.1263957023620605e-05, -2.047419548034668e-05, -1.9684433937072754e-05, -1.8894672393798828e-05, -1.8104910850524902e-05, -1.7315149307250977e-05, -1.652538776397705e-05, -1.5735626220703125e-05, -1.49458646774292e-05, -1.4156103134155273e-05, -1.3366341590881348e-05, -1.2576580047607422e-05, -1.1786818504333496e-05, -1.099705696105957e-05, -1.0207295417785645e-05, -9.417533874511719e-06, -8.627772331237793e-06, -7.838010787963867e-06, -7.048249244689941e-06, -6.258487701416016e-06, -5.46872615814209e-06, -4.678964614868164e-06, -3.889203071594238e-06, -3.0994415283203125e-06, -2.3096799850463867e-06, -1.519918441772461e-06, -7.301568984985352e-07, 5.960464477539063e-08, 8.493661880493164e-07, 1.6391277313232422e-06, 2.428889274597168e-06, 3.2186508178710938e-06, 4.0084123611450195e-06, 4.798173904418945e-06, 5.587935447692871e-06, 6.377696990966797e-06, 7.167458534240723e-06, 7.957220077514648e-06, 8.746981620788574e-06, 9.5367431640625e-06, 1.0326504707336426e-05, 1.1116266250610352e-05, 1.1906027793884277e-05, 1.2695789337158203e-05, 1.3485550880432129e-05, 1.4275312423706055e-05, 1.506507396697998e-05, 1.5854835510253906e-05, 1.6644597053527832e-05, 1.7434358596801758e-05, 1.8224120140075684e-05, 1.901388168334961e-05, 1.9803643226623535e-05, 2.059340476989746e-05, 2.1383166313171387e-05, 2.2172927856445312e-05, 2.2962689399719238e-05, 2.3752450942993164e-05, 2.454221248626709e-05, 2.5331974029541016e-05]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 13.0, 15.0, 15.0, 24.0, 14.0, 20.0, 27.0, 29.0, 34.0, 44.0, 32.0, 49.0, 39.0, 49.0, 51.0, 49.0, 46.0, 55.0, 44.0, 38.0, 35.0, 37.0, 26.0, 29.0, 28.0, 33.0, 26.0, 19.0, 17.0, 12.0, 11.0, 9.0, 6.0, 4.0, 1.0, 5.0, 4.0, 0.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.28948974609375, -4.1297607421875, -3.97003173828125, -3.810302734375, -3.65057373046875, -3.4908447265625, -3.33111572265625, -3.17138671875, -3.01165771484375, -2.8519287109375, -2.69219970703125, -2.532470703125, -2.37274169921875, -2.2130126953125, -2.05328369140625, -1.8935546875, -1.73382568359375, -1.5740966796875, -1.41436767578125, -1.254638671875, -1.09490966796875, -0.9351806640625, -0.77545166015625, -0.61572265625, -0.45599365234375, -0.2962646484375, -0.13653564453125, 0.023193359375, 0.18292236328125, 0.3426513671875, 0.50238037109375, 0.662109375, 0.82183837890625, 0.9815673828125, 1.14129638671875, 1.301025390625, 1.46075439453125, 1.6204833984375, 1.78021240234375, 1.93994140625, 2.09967041015625, 2.2593994140625, 2.41912841796875, 2.578857421875, 2.73858642578125, 2.8983154296875, 3.05804443359375, 3.2177734375, 3.37750244140625, 3.5372314453125, 3.69696044921875, 3.856689453125, 4.01641845703125, 4.1761474609375, 4.33587646484375, 4.49560546875, 4.65533447265625, 4.8150634765625, 4.97479248046875, 5.134521484375, 5.29425048828125, 5.4539794921875, 5.61370849609375, 5.7734375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 8.0, 8.0, 15.0, 32.0, 42.0, 61.0, 87.0, 137.0, 261.0, 493.0, 889.0, 1781.0, 3720.0, 8184.0, 20411.0, 55810.0, 242920.0, 578874.0, 85191.0, 28612.0, 11416.0, 4787.0, 2283.0, 1096.0, 580.0, 326.0, 171.0, 134.0, 79.0, 36.0, 33.0, 20.0, 15.0, 11.0, 2.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.5809326171875, -8.286865234375, -7.9927978515625, -7.69873046875, -7.4046630859375, -7.110595703125, -6.8165283203125, -6.5224609375, -6.2283935546875, -5.934326171875, -5.6402587890625, -5.34619140625, -5.0521240234375, -4.758056640625, -4.4639892578125, -4.169921875, -3.8758544921875, -3.581787109375, -3.2877197265625, -2.99365234375, -2.6995849609375, -2.405517578125, -2.1114501953125, -1.8173828125, -1.5233154296875, -1.229248046875, -0.9351806640625, -0.64111328125, -0.3470458984375, -0.052978515625, 0.2410888671875, 0.53515625, 0.8292236328125, 1.123291015625, 1.4173583984375, 1.71142578125, 2.0054931640625, 2.299560546875, 2.5936279296875, 2.8876953125, 3.1817626953125, 3.475830078125, 3.7698974609375, 4.06396484375, 4.3580322265625, 4.652099609375, 4.9461669921875, 5.240234375, 5.5343017578125, 5.828369140625, 6.1224365234375, 6.41650390625, 6.7105712890625, 7.004638671875, 7.2987060546875, 7.5927734375, 7.8868408203125, 8.180908203125, 8.4749755859375, 8.76904296875, 9.0631103515625, 9.357177734375, 9.6512451171875, 9.9453125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 3.0, 3.0, 2.0, 4.0, 10.0, 5.0, 7.0, 12.0, 11.0, 28.0, 21.0, 19.0, 34.0, 41.0, 40.0, 45.0, 58.0, 64.0, 105.0, 116.0, 269.0, 1542.0, 110.0, 86.0, 78.0, 60.0, 51.0, 38.0, 44.0, 22.0, 23.0, 16.0, 20.0, 17.0, 15.0, 11.0, 8.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.25, -18.700439453125, -18.15087890625, -17.601318359375, -17.0517578125, -16.502197265625, -15.95263671875, -15.403076171875, -14.853515625, -14.303955078125, -13.75439453125, -13.204833984375, -12.6552734375, -12.105712890625, -11.55615234375, -11.006591796875, -10.45703125, -9.907470703125, -9.35791015625, -8.808349609375, -8.2587890625, -7.709228515625, -7.15966796875, -6.610107421875, -6.060546875, -5.510986328125, -4.96142578125, -4.411865234375, -3.8623046875, -3.312744140625, -2.76318359375, -2.213623046875, -1.6640625, -1.114501953125, -0.56494140625, -0.015380859375, 0.5341796875, 1.083740234375, 1.63330078125, 2.182861328125, 2.732421875, 3.281982421875, 3.83154296875, 4.381103515625, 4.9306640625, 5.480224609375, 6.02978515625, 6.579345703125, 7.12890625, 7.678466796875, 8.22802734375, 8.777587890625, 9.3271484375, 9.876708984375, 10.42626953125, 10.975830078125, 11.525390625, 12.074951171875, 12.62451171875, 13.174072265625, 13.7236328125, 14.273193359375, 14.82275390625, 15.372314453125, 15.921875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 1.0, 7.0, 8.0, 15.0, 11.0, 13.0, 27.0, 28.0, 38.0, 59.0, 76.0, 116.0, 162.0, 311.0, 730.0, 3116.0, 36942.0, 2732105.0, 356503.0, 12536.0, 1598.0, 529.0, 267.0, 133.0, 91.0, 73.0, 58.0, 39.0, 33.0, 22.0, 12.0, 5.0, 10.0, 8.0, 7.0, 7.0, 2.0, 1.0, 1.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.9375, -34.73193359375, -33.5263671875, -32.32080078125, -31.115234375, -29.90966796875, -28.7041015625, -27.49853515625, -26.29296875, -25.08740234375, -23.8818359375, -22.67626953125, -21.470703125, -20.26513671875, -19.0595703125, -17.85400390625, -16.6484375, -15.44287109375, -14.2373046875, -13.03173828125, -11.826171875, -10.62060546875, -9.4150390625, -8.20947265625, -7.00390625, -5.79833984375, -4.5927734375, -3.38720703125, -2.181640625, -0.97607421875, 0.2294921875, 1.43505859375, 2.640625, 3.84619140625, 5.0517578125, 6.25732421875, 7.462890625, 8.66845703125, 9.8740234375, 11.07958984375, 12.28515625, 13.49072265625, 14.6962890625, 15.90185546875, 17.107421875, 18.31298828125, 19.5185546875, 20.72412109375, 21.9296875, 23.13525390625, 24.3408203125, 25.54638671875, 26.751953125, 27.95751953125, 29.1630859375, 30.36865234375, 31.57421875, 32.77978515625, 33.9853515625, 35.19091796875, 36.396484375, 37.60205078125, 38.8076171875, 40.01318359375, 41.21875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 8.0, 49.0, 252.0, 460.0, 210.0, 35.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.912212371826172, -21.15459442138672, -16.3969783782959, -11.639361381530762, -6.881744384765625, -2.124126434326172, 2.6334896087646484, 7.391105651855469, 12.148723602294922, 16.906341552734375, 21.663957595825195, 26.421573638916016, 31.17919158935547, 35.93680953979492, 40.694427490234375, 45.45204162597656, 50.209659576416016, 54.96727752685547, 59.724891662597656, 64.48251342773438, 69.24012756347656, 73.99774169921875, 78.75536346435547, 83.51297760009766, 88.27059936523438, 93.02821350097656, 97.78583526611328, 102.54344940185547, 107.30107116699219, 112.05868530273438, 116.81629943847656, 121.57391357421875, 126.33154296875, 131.0891571044922, 135.84677124023438, 140.60440063476562, 145.3620147705078, 150.11962890625, 154.8772430419922, 159.63485717773438, 164.39248657226562, 169.1501007080078, 173.90771484375, 178.66534423828125, 183.42295837402344, 188.18057250976562, 192.9381866455078, 197.69580078125, 202.4534149169922, 207.21102905273438, 211.96864318847656, 216.7262725830078, 221.48388671875, 226.2415008544922, 230.99911499023438, 235.75672912597656, 240.51434326171875, 245.27195739746094, 250.02957153320312, 254.78720092773438, 259.5447998046875, 264.30242919921875, 269.06005859375, 273.8176574707031, 278.5752868652344]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 8.0, 3.0, 12.0, 9.0, 11.0, 12.0, 12.0, 24.0, 21.0, 27.0, 22.0, 22.0, 29.0, 34.0, 39.0, 40.0, 44.0, 39.0, 32.0, 52.0, 34.0, 39.0, 39.0, 45.0, 35.0, 37.0, 27.0, 28.0, 25.0, 28.0, 25.0, 24.0, 18.0, 16.0, 7.0, 7.0, 13.0, 11.0, 12.0, 9.0, 6.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-41.16782760620117, -39.84314727783203, -38.518463134765625, -37.193782806396484, -35.869102478027344, -34.54441833496094, -33.2197380065918, -31.895055770874023, -30.57037353515625, -29.245691299438477, -27.921009063720703, -26.596328735351562, -25.27164649963379, -23.946964263916016, -22.622283935546875, -21.2976016998291, -19.972919464111328, -18.648237228393555, -17.32355499267578, -15.99887466430664, -14.674192428588867, -13.349510192871094, -12.024828910827637, -10.70014762878418, -9.375465393066406, -8.050783157348633, -6.726101875305176, -5.4014201164245605, -4.076738357543945, -2.75205659866333, -1.4273748397827148, -0.10269355773925781, 1.22198486328125, 2.5466666221618652, 3.8713483810424805, 5.196030139923096, 6.520711898803711, 7.845393657684326, 9.170075416564941, 10.494756698608398, 11.819438934326172, 13.144121170043945, 14.468802452087402, 15.79348373413086, 17.118165969848633, 18.442848205566406, 19.767528533935547, 21.09221076965332, 22.416893005371094, 23.741575241088867, 25.06625747680664, 26.39093780517578, 27.715620040893555, 29.040302276611328, 30.36498260498047, 31.689664840698242, 33.014347076416016, 34.339027404785156, 35.66371154785156, 36.9883918762207, 38.313072204589844, 39.63775634765625, 40.96243667602539, 42.28711700439453, 43.61180114746094]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 6.0, 13.0, 9.0, 16.0, 24.0, 24.0, 18.0, 28.0, 24.0, 41.0, 40.0, 41.0, 44.0, 44.0, 44.0, 41.0, 46.0, 52.0, 45.0, 40.0, 42.0, 38.0, 32.0, 30.0, 27.0, 37.0, 27.0, 22.0, 14.0, 28.0, 12.0, 7.0, 5.0, 14.0, 5.0, 3.0, 5.0, 2.0, 6.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.38385009765625, -4.2208251953125, -4.05780029296875, -3.894775390625, -3.73175048828125, -3.5687255859375, -3.40570068359375, -3.24267578125, -3.07965087890625, -2.9166259765625, -2.75360107421875, -2.590576171875, -2.42755126953125, -2.2645263671875, -2.10150146484375, -1.9384765625, -1.77545166015625, -1.6124267578125, -1.44940185546875, -1.286376953125, -1.12335205078125, -0.9603271484375, -0.79730224609375, -0.63427734375, -0.47125244140625, -0.3082275390625, -0.14520263671875, 0.017822265625, 0.18084716796875, 0.3438720703125, 0.50689697265625, 0.669921875, 0.83294677734375, 0.9959716796875, 1.15899658203125, 1.322021484375, 1.48504638671875, 1.6480712890625, 1.81109619140625, 1.97412109375, 2.13714599609375, 2.3001708984375, 2.46319580078125, 2.626220703125, 2.78924560546875, 2.9522705078125, 3.11529541015625, 3.2783203125, 3.44134521484375, 3.6043701171875, 3.76739501953125, 3.930419921875, 4.09344482421875, 4.2564697265625, 4.41949462890625, 4.58251953125, 4.74554443359375, 4.9085693359375, 5.07159423828125, 5.234619140625, 5.39764404296875, 5.5606689453125, 5.72369384765625, 5.88671875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 11.0, 6.0, 16.0, 32.0, 36.0, 57.0, 86.0, 154.0, 255.0, 526.0, 1178.0, 3119.0, 9427.0, 42049.0, 354452.0, 3159282.0, 548661.0, 56511.0, 11826.0, 3645.0, 1477.0, 633.0, 342.0, 194.0, 96.0, 57.0, 42.0, 36.0, 20.0, 11.0, 13.0, 7.0, 7.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-17.4375, -16.918212890625, -16.39892578125, -15.879638671875, -15.3603515625, -14.841064453125, -14.32177734375, -13.802490234375, -13.283203125, -12.763916015625, -12.24462890625, -11.725341796875, -11.2060546875, -10.686767578125, -10.16748046875, -9.648193359375, -9.12890625, -8.609619140625, -8.09033203125, -7.571044921875, -7.0517578125, -6.532470703125, -6.01318359375, -5.493896484375, -4.974609375, -4.455322265625, -3.93603515625, -3.416748046875, -2.8974609375, -2.378173828125, -1.85888671875, -1.339599609375, -0.8203125, -0.301025390625, 0.21826171875, 0.737548828125, 1.2568359375, 1.776123046875, 2.29541015625, 2.814697265625, 3.333984375, 3.853271484375, 4.37255859375, 4.891845703125, 5.4111328125, 5.930419921875, 6.44970703125, 6.968994140625, 7.48828125, 8.007568359375, 8.52685546875, 9.046142578125, 9.5654296875, 10.084716796875, 10.60400390625, 11.123291015625, 11.642578125, 12.161865234375, 12.68115234375, 13.200439453125, 13.7197265625, 14.239013671875, 14.75830078125, 15.277587890625, 15.796875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 8.0, 14.0, 25.0, 21.0, 37.0, 47.0, 51.0, 87.0, 118.0, 156.0, 227.0, 313.0, 427.0, 550.0, 548.0, 400.0, 272.0, 186.0, 147.0, 105.0, 92.0, 62.0, 41.0, 30.0, 23.0, 19.0, 15.0, 7.0, 6.0, 5.0, 3.0, 7.0, 1.0, 1.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3046875, -9.9715576171875, -9.638427734375, -9.3052978515625, -8.97216796875, -8.6390380859375, -8.305908203125, -7.9727783203125, -7.6396484375, -7.3065185546875, -6.973388671875, -6.6402587890625, -6.30712890625, -5.9739990234375, -5.640869140625, -5.3077392578125, -4.974609375, -4.6414794921875, -4.308349609375, -3.9752197265625, -3.64208984375, -3.3089599609375, -2.975830078125, -2.6427001953125, -2.3095703125, -1.9764404296875, -1.643310546875, -1.3101806640625, -0.97705078125, -0.6439208984375, -0.310791015625, 0.0223388671875, 0.35546875, 0.6885986328125, 1.021728515625, 1.3548583984375, 1.68798828125, 2.0211181640625, 2.354248046875, 2.6873779296875, 3.0205078125, 3.3536376953125, 3.686767578125, 4.0198974609375, 4.35302734375, 4.6861572265625, 5.019287109375, 5.3524169921875, 5.685546875, 6.0186767578125, 6.351806640625, 6.6849365234375, 7.01806640625, 7.3511962890625, 7.684326171875, 8.0174560546875, 8.3505859375, 8.6837158203125, 9.016845703125, 9.3499755859375, 9.68310546875, 10.0162353515625, 10.349365234375, 10.6824951171875, 11.015625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 4.0, 3.0, 1.0, 5.0, 9.0, 8.0, 11.0, 14.0, 18.0, 26.0, 33.0, 43.0, 102.0, 118.0, 215.0, 410.0, 1164.0, 4262.0, 26937.0, 356218.0, 3467679.0, 306452.0, 24526.0, 3936.0, 1059.0, 456.0, 217.0, 118.0, 68.0, 57.0, 34.0, 24.0, 20.0, 8.0, 8.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.515625, -28.547119140625, -27.57861328125, -26.610107421875, -25.6416015625, -24.673095703125, -23.70458984375, -22.736083984375, -21.767578125, -20.799072265625, -19.83056640625, -18.862060546875, -17.8935546875, -16.925048828125, -15.95654296875, -14.988037109375, -14.01953125, -13.051025390625, -12.08251953125, -11.114013671875, -10.1455078125, -9.177001953125, -8.20849609375, -7.239990234375, -6.271484375, -5.302978515625, -4.33447265625, -3.365966796875, -2.3974609375, -1.428955078125, -0.46044921875, 0.508056640625, 1.4765625, 2.445068359375, 3.41357421875, 4.382080078125, 5.3505859375, 6.319091796875, 7.28759765625, 8.256103515625, 9.224609375, 10.193115234375, 11.16162109375, 12.130126953125, 13.0986328125, 14.067138671875, 15.03564453125, 16.004150390625, 16.97265625, 17.941162109375, 18.90966796875, 19.878173828125, 20.8466796875, 21.815185546875, 22.78369140625, 23.752197265625, 24.720703125, 25.689208984375, 26.65771484375, 27.626220703125, 28.5947265625, 29.563232421875, 30.53173828125, 31.500244140625, 32.46875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 16.0, 39.0, 67.0, 127.0, 178.0, 188.0, 168.0, 102.0, 66.0, 32.0, 13.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.212127685546875, -53.722389221191406, -50.23265075683594, -46.74291229248047, -43.253173828125, -39.76343536376953, -36.27370071411133, -32.78396224975586, -29.29422378540039, -25.804485321044922, -22.314746856689453, -18.825010299682617, -15.335271835327148, -11.84553337097168, -8.355796813964844, -4.866058349609375, -1.3763198852539062, 2.1134181022644043, 5.603156089782715, 9.092893600463867, 12.582632064819336, 16.072370529174805, 19.56210708618164, 23.05184555053711, 26.541584014892578, 30.031322479248047, 33.521060943603516, 37.01079559326172, 40.50053405761719, 43.990272521972656, 47.480010986328125, 50.969749450683594, 54.45948791503906, 57.94922637939453, 61.43896484375, 64.92870330810547, 68.41844177246094, 71.9081802368164, 75.39791870117188, 78.88764953613281, 82.37739562988281, 85.86713409423828, 89.35687255859375, 92.84661102294922, 96.33634948730469, 99.82608795166016, 103.31582641601562, 106.80555725097656, 110.29529571533203, 113.7850341796875, 117.27477264404297, 120.76451110839844, 124.2542495727539, 127.74398803710938, 131.2337188720703, 134.7234649658203, 138.21319580078125, 141.7029266357422, 145.1926727294922, 148.68240356445312, 152.17214965820312, 155.66188049316406, 159.15162658691406, 162.641357421875, 166.131103515625]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 5.0, 8.0, 10.0, 10.0, 10.0, 17.0, 17.0, 17.0, 21.0, 23.0, 24.0, 28.0, 38.0, 38.0, 35.0, 37.0, 31.0, 40.0, 38.0, 39.0, 37.0, 40.0, 38.0, 39.0, 31.0, 29.0, 34.0, 33.0, 30.0, 26.0, 22.0, 23.0, 10.0, 15.0, 9.0, 16.0, 14.0, 7.0, 13.0, 8.0, 8.0, 9.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.246986389160156, -27.224376678466797, -26.201766967773438, -25.179157257080078, -24.15654754638672, -23.13393783569336, -22.111330032348633, -21.088720321655273, -20.066110610961914, -19.043500900268555, -18.020891189575195, -16.998281478881836, -15.975672721862793, -14.953063011169434, -13.93045425415039, -12.907844543457031, -11.885234832763672, -10.862625122070312, -9.840015411376953, -8.81740665435791, -7.794796943664551, -6.772187232971191, -5.74957799911499, -4.726968765258789, -3.7043590545654297, -2.6817495822906494, -1.6591401100158691, -0.6365306377410889, 0.3860788345336914, 1.4086885452270508, 2.431297779083252, 3.453907012939453, 4.4765167236328125, 5.499126434326172, 6.521735668182373, 7.544344902038574, 8.566954612731934, 9.589564323425293, 10.612173080444336, 11.634782791137695, 12.657392501831055, 13.680002212524414, 14.702611923217773, 15.725220680236816, 16.74782943725586, 17.77043914794922, 18.793048858642578, 19.815658569335938, 20.838268280029297, 21.860877990722656, 22.883487701416016, 23.906097412109375, 24.928707122802734, 25.951316833496094, 26.97392463684082, 27.99653434753418, 29.01914405822754, 30.0417537689209, 31.064363479614258, 32.086971282958984, 33.109580993652344, 34.1321907043457, 35.15480041503906, 36.17741012573242, 37.20001983642578]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 8.0, 10.0, 13.0, 17.0, 18.0, 14.0, 20.0, 25.0, 37.0, 49.0, 34.0, 38.0, 46.0, 44.0, 46.0, 48.0, 48.0, 44.0, 48.0, 45.0, 37.0, 54.0, 32.0, 40.0, 35.0, 21.0, 22.0, 24.0, 21.0, 14.0, 6.0, 10.0, 6.0, 2.0, 5.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0078125, -4.83251953125, -4.6572265625, -4.48193359375, -4.306640625, -4.13134765625, -3.9560546875, -3.78076171875, -3.60546875, -3.43017578125, -3.2548828125, -3.07958984375, -2.904296875, -2.72900390625, -2.5537109375, -2.37841796875, -2.203125, -2.02783203125, -1.8525390625, -1.67724609375, -1.501953125, -1.32666015625, -1.1513671875, -0.97607421875, -0.80078125, -0.62548828125, -0.4501953125, -0.27490234375, -0.099609375, 0.07568359375, 0.2509765625, 0.42626953125, 0.6015625, 0.77685546875, 0.9521484375, 1.12744140625, 1.302734375, 1.47802734375, 1.6533203125, 1.82861328125, 2.00390625, 2.17919921875, 2.3544921875, 2.52978515625, 2.705078125, 2.88037109375, 3.0556640625, 3.23095703125, 3.40625, 3.58154296875, 3.7568359375, 3.93212890625, 4.107421875, 4.28271484375, 4.4580078125, 4.63330078125, 4.80859375, 4.98388671875, 5.1591796875, 5.33447265625, 5.509765625, 5.68505859375, 5.8603515625, 6.03564453125, 6.2109375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 14.0, 16.0, 24.0, 26.0, 35.0, 59.0, 105.0, 146.0, 198.0, 300.0, 480.0, 754.0, 1155.0, 1739.0, 2644.0, 4034.0, 6275.0, 9340.0, 14454.0, 23424.0, 37426.0, 63245.0, 117009.0, 255787.0, 240895.0, 110011.0, 60016.0, 36389.0, 22185.0, 13904.0, 9245.0, 5880.0, 3903.0, 2458.0, 1701.0, 1086.0, 745.0, 484.0, 297.0, 218.0, 129.0, 107.0, 74.0, 46.0, 32.0, 14.0, 17.0, 9.0, 8.0, 2.0, 6.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.18505859375, -0.179443359375, -0.173828125, -0.168212890625, -0.16259765625, -0.156982421875, -0.1513671875, -0.145751953125, -0.14013671875, -0.134521484375, -0.12890625, -0.123291015625, -0.11767578125, -0.112060546875, -0.1064453125, -0.100830078125, -0.09521484375, -0.089599609375, -0.083984375, -0.078369140625, -0.07275390625, -0.067138671875, -0.0615234375, -0.055908203125, -0.05029296875, -0.044677734375, -0.0390625, -0.033447265625, -0.02783203125, -0.022216796875, -0.0166015625, -0.010986328125, -0.00537109375, 0.000244140625, 0.005859375, 0.011474609375, 0.01708984375, 0.022705078125, 0.0283203125, 0.033935546875, 0.03955078125, 0.045166015625, 0.05078125, 0.056396484375, 0.06201171875, 0.067626953125, 0.0732421875, 0.078857421875, 0.08447265625, 0.090087890625, 0.095703125, 0.101318359375, 0.10693359375, 0.112548828125, 0.1181640625, 0.123779296875, 0.12939453125, 0.135009765625, 0.140625, 0.146240234375, 0.15185546875, 0.157470703125, 0.1630859375, 0.168701171875, 0.17431640625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 7.0, 3.0, 9.0, 7.0, 9.0, 8.0, 17.0, 17.0, 11.0, 12.0, 18.0, 16.0, 23.0, 30.0, 31.0, 39.0, 43.0, 31.0, 41.0, 37.0, 40.0, 43.0, 1070.0, 38.0, 34.0, 38.0, 37.0, 37.0, 32.0, 36.0, 31.0, 18.0, 28.0, 18.0, 25.0, 12.0, 17.0, 6.0, 9.0, 14.0, 4.0, 12.0, 6.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-3.017578125, -2.923431396484375, -2.82928466796875, -2.735137939453125, -2.6409912109375, -2.546844482421875, -2.45269775390625, -2.358551025390625, -2.264404296875, -2.170257568359375, -2.07611083984375, -1.981964111328125, -1.8878173828125, -1.793670654296875, -1.69952392578125, -1.605377197265625, -1.51123046875, -1.417083740234375, -1.32293701171875, -1.228790283203125, -1.1346435546875, -1.040496826171875, -0.94635009765625, -0.852203369140625, -0.758056640625, -0.663909912109375, -0.56976318359375, -0.475616455078125, -0.3814697265625, -0.287322998046875, -0.19317626953125, -0.099029541015625, -0.0048828125, 0.089263916015625, 0.18341064453125, 0.277557373046875, 0.3717041015625, 0.465850830078125, 0.55999755859375, 0.654144287109375, 0.748291015625, 0.842437744140625, 0.93658447265625, 1.030731201171875, 1.1248779296875, 1.219024658203125, 1.31317138671875, 1.407318115234375, 1.50146484375, 1.595611572265625, 1.68975830078125, 1.783905029296875, 1.8780517578125, 1.972198486328125, 2.06634521484375, 2.160491943359375, 2.254638671875, 2.348785400390625, 2.44293212890625, 2.537078857421875, 2.6312255859375, 2.725372314453125, 2.81951904296875, 2.913665771484375, 3.0078125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 10.0, 11.0, 19.0, 31.0, 55.0, 76.0, 94.0, 162.0, 220.0, 327.0, 516.0, 783.0, 1155.0, 1813.0, 2755.0, 4259.0, 6873.0, 10393.0, 16771.0, 27771.0, 47806.0, 88292.0, 189562.0, 1354932.0, 156821.0, 76449.0, 42025.0, 24847.0, 15438.0, 9503.0, 5949.0, 3988.0, 2573.0, 1612.0, 1090.0, 725.0, 452.0, 327.0, 225.0, 145.0, 88.0, 70.0, 43.0, 25.0, 16.0, 11.0, 10.0, 3.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.10638427734375, -0.10299491882324219, -0.09960556030273438, -0.09621620178222656, -0.09282684326171875, -0.08943748474121094, -0.08604812622070312, -0.08265876770019531, -0.0792694091796875, -0.07588005065917969, -0.07249069213867188, -0.06910133361816406, -0.06571197509765625, -0.06232261657714844, -0.058933258056640625, -0.05554389953613281, -0.052154541015625, -0.04876518249511719, -0.045375823974609375, -0.04198646545410156, -0.03859710693359375, -0.03520774841308594, -0.031818389892578125, -0.028429031372070312, -0.0250396728515625, -0.021650314331054688, -0.018260955810546875, -0.014871597290039062, -0.01148223876953125, -0.008092880249023438, -0.004703521728515625, -0.0013141632080078125, 0.0020751953125, 0.0054645538330078125, 0.008853912353515625, 0.012243270874023438, 0.01563262939453125, 0.019021987915039062, 0.022411346435546875, 0.025800704956054688, 0.0291900634765625, 0.03257942199707031, 0.035968780517578125, 0.03935813903808594, 0.04274749755859375, 0.04613685607910156, 0.049526214599609375, 0.05291557312011719, 0.056304931640625, 0.05969429016113281, 0.06308364868164062, 0.06647300720214844, 0.06986236572265625, 0.07325172424316406, 0.07664108276367188, 0.08003044128417969, 0.0834197998046875, 0.08680915832519531, 0.09019851684570312, 0.09358787536621094, 0.09697723388671875, 0.10036659240722656, 0.10375595092773438, 0.10714530944824219, 0.11053466796875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 18.0, 7.0, 18.0, 15.0, 33.0, 39.0, 26.0, 37.0, 50.0, 37.0, 58.0, 49.0, 58.0, 50.0, 40.0, 59.0, 62.0, 45.0, 39.0, 37.0, 38.0, 25.0, 19.0, 26.0, 21.0, 12.0, 13.0, 7.0, 8.0, 14.0, 9.0, 5.0, 3.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-3.975629806518555e-05, -3.861915320158005e-05, -3.748200833797455e-05, -3.634486347436905e-05, -3.520771861076355e-05, -3.407057374715805e-05, -3.293342888355255e-05, -3.179628401994705e-05, -3.065913915634155e-05, -2.9521994292736053e-05, -2.8384849429130554e-05, -2.7247704565525055e-05, -2.6110559701919556e-05, -2.4973414838314056e-05, -2.3836269974708557e-05, -2.2699125111103058e-05, -2.156198024749756e-05, -2.042483538389206e-05, -1.928769052028656e-05, -1.815054565668106e-05, -1.701340079307556e-05, -1.5876255929470062e-05, -1.4739111065864563e-05, -1.3601966202259064e-05, -1.2464821338653564e-05, -1.1327676475048065e-05, -1.0190531611442566e-05, -9.053386747837067e-06, -7.916241884231567e-06, -6.779097020626068e-06, -5.641952157020569e-06, -4.50480729341507e-06, -3.3676624298095703e-06, -2.230517566204071e-06, -1.0933727025985718e-06, 4.377216100692749e-08, 1.1809170246124268e-06, 2.318061888217926e-06, 3.4552067518234253e-06, 4.5923516154289246e-06, 5.729496479034424e-06, 6.866641342639923e-06, 8.003786206245422e-06, 9.140931069850922e-06, 1.0278075933456421e-05, 1.141522079706192e-05, 1.255236566066742e-05, 1.3689510524272919e-05, 1.4826655387878418e-05, 1.5963800251483917e-05, 1.7100945115089417e-05, 1.8238089978694916e-05, 1.9375234842300415e-05, 2.0512379705905914e-05, 2.1649524569511414e-05, 2.2786669433116913e-05, 2.3923814296722412e-05, 2.506095916032791e-05, 2.619810402393341e-05, 2.733524888753891e-05, 2.847239375114441e-05, 2.960953861474991e-05, 3.074668347835541e-05, 3.188382834196091e-05, 3.3020973205566406e-05]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 1.0, 8.0, 6.0, 13.0, 15.0, 11.0, 13.0, 17.0, 17.0, 22.0, 20.0, 41.0, 53.0, 84.0, 139.0, 249.0, 878.0, 10655.0, 284167.0, 702358.0, 46564.0, 2272.0, 418.0, 174.0, 91.0, 51.0, 41.0, 36.0, 32.0, 23.0, 18.0, 16.0, 13.0, 11.0, 7.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006003379821777344, -0.0005804747343063354, -0.0005606114864349365, -0.0005407482385635376, -0.0005208849906921387, -0.0005010217428207397, -0.0004811584949493408, -0.0004612952470779419, -0.00044143199920654297, -0.00042156875133514404, -0.0004017055034637451, -0.0003818422555923462, -0.00036197900772094727, -0.00034211575984954834, -0.0003222525119781494, -0.0003023892641067505, -0.00028252601623535156, -0.00026266276836395264, -0.0002427995204925537, -0.00022293627262115479, -0.00020307302474975586, -0.00018320977687835693, -0.000163346529006958, -0.00014348328113555908, -0.00012362003326416016, -0.00010375678539276123, -8.38935375213623e-05, -6.403028964996338e-05, -4.416704177856445e-05, -2.4303793907165527e-05, -4.4405460357666016e-06, 1.5422701835632324e-05, 3.528594970703125e-05, 5.5149197578430176e-05, 7.50124454498291e-05, 9.487569332122803e-05, 0.00011473894119262695, 0.00013460218906402588, 0.0001544654369354248, 0.00017432868480682373, 0.00019419193267822266, 0.00021405518054962158, 0.0002339184284210205, 0.00025378167629241943, 0.00027364492416381836, 0.0002935081720352173, 0.0003133714199066162, 0.00033323466777801514, 0.00035309791564941406, 0.000372961163520813, 0.0003928244113922119, 0.00041268765926361084, 0.00043255090713500977, 0.0004524141550064087, 0.0004722774028778076, 0.0004921406507492065, 0.0005120038986206055, 0.0005318671464920044, 0.0005517303943634033, 0.0005715936422348022, 0.0005914568901062012, 0.0006113201379776001, 0.000631183385848999, 0.000651046633720398, 0.0006709098815917969]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 21.0, 111.0, 332.0, 371.0, 130.0, 35.0, 11.0], "bins": [-0.0003826766333077103, -0.00037630938459187746, -0.0003699421067722142, -0.00036357485805638134, -0.0003572076093405485, -0.00035084033152088523, -0.0003444730828050524, -0.00033810583408921957, -0.00033173858537338674, -0.0003253713366575539, -0.0003190040588378906, -0.0003126368101220578, -0.00030626956140622497, -0.0002999022835865617, -0.00029353503487072885, -0.000287167786154896, -0.00028080050833523273, -0.0002744332596193999, -0.0002680659817997366, -0.0002616987330839038, -0.00025533148436807096, -0.00024896423565223813, -0.00024259695783257484, -0.00023622970911674201, -0.00022986246040090919, -0.00022349519713316113, -0.0002171279484173283, -0.00021076068514958024, -0.0002043934364337474, -0.00019802617316599935, -0.0001916589098982513, -0.00018529166118241847, -0.00017892441246658564, -0.00017255714919883758, -0.00016618990048300475, -0.0001598226372152567, -0.00015345538849942386, -0.0001470881252316758, -0.00014072086196392775, -0.00013435361324809492, -0.00012798634998034686, -0.00012161909398855641, -0.00011525183799676597, -0.00010888457472901791, -0.00010251731873722747, -9.615006274543703e-05, -8.978280675364658e-05, -8.341555076185614e-05, -7.70482947700657e-05, -7.068103877827525e-05, -6.431378278648481e-05, -5.794652315671556e-05, -5.1579263526946306e-05, -4.521200753515586e-05, -3.884475154336542e-05, -3.247749191359617e-05, -2.611023410281632e-05, -1.9742976292036474e-05, -1.3375719390751328e-05, -7.008462489466183e-06, -6.412046786863357e-07, 5.7260531320935115e-06, 1.2093309123883955e-05, 1.8460568753653206e-05, 2.482782474544365e-05]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 8.0, 7.0, 11.0, 19.0, 19.0, 18.0, 25.0, 26.0, 27.0, 33.0, 28.0, 28.0, 42.0, 31.0, 36.0, 36.0, 36.0, 45.0, 52.0, 49.0, 51.0, 37.0, 39.0, 42.0, 38.0, 36.0, 23.0, 25.0, 29.0, 17.0, 15.0, 17.0, 9.0, 7.0, 12.0, 6.0, 6.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.895427703857422e-05, -1.8271617591381073e-05, -1.7588958144187927e-05, -1.690629869699478e-05, -1.6223639249801636e-05, -1.554097980260849e-05, -1.4858320355415344e-05, -1.4175660908222198e-05, -1.3493001461029053e-05, -1.2810342013835907e-05, -1.2127682566642761e-05, -1.1445023119449615e-05, -1.076236367225647e-05, -1.0079704225063324e-05, -9.397044777870178e-06, -8.714385330677032e-06, -8.031725883483887e-06, -7.349066436290741e-06, -6.666406989097595e-06, -5.9837475419044495e-06, -5.301088094711304e-06, -4.618428647518158e-06, -3.935769200325012e-06, -3.2531097531318665e-06, -2.5704503059387207e-06, -1.887790858745575e-06, -1.2051314115524292e-06, -5.224719643592834e-07, 1.601874828338623e-07, 8.428469300270081e-07, 1.5255063772201538e-06, 2.2081658244132996e-06, 2.8908252716064453e-06, 3.573484718799591e-06, 4.256144165992737e-06, 4.9388036131858826e-06, 5.621463060379028e-06, 6.304122507572174e-06, 6.98678195476532e-06, 7.669441401958466e-06, 8.352100849151611e-06, 9.034760296344757e-06, 9.717419743537903e-06, 1.0400079190731049e-05, 1.1082738637924194e-05, 1.176539808511734e-05, 1.2448057532310486e-05, 1.3130716979503632e-05, 1.3813376426696777e-05, 1.4496035873889923e-05, 1.5178695321083069e-05, 1.5861354768276215e-05, 1.654401421546936e-05, 1.7226673662662506e-05, 1.7909333109855652e-05, 1.8591992557048798e-05, 1.9274652004241943e-05, 1.995731145143509e-05, 2.0639970898628235e-05, 2.132263034582138e-05, 2.2005289793014526e-05, 2.2687949240207672e-05, 2.3370608687400818e-05, 2.4053268134593964e-05, 2.473592758178711e-05]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 8.0, 10.0, 13.0, 17.0, 18.0, 14.0, 20.0, 25.0, 37.0, 49.0, 34.0, 38.0, 46.0, 44.0, 46.0, 48.0, 48.0, 44.0, 48.0, 45.0, 37.0, 54.0, 32.0, 40.0, 35.0, 21.0, 22.0, 24.0, 21.0, 14.0, 6.0, 10.0, 6.0, 2.0, 5.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0078125, -4.83251953125, -4.6572265625, -4.48193359375, -4.306640625, -4.13134765625, -3.9560546875, -3.78076171875, -3.60546875, -3.43017578125, -3.2548828125, -3.07958984375, -2.904296875, -2.72900390625, -2.5537109375, -2.37841796875, -2.203125, -2.02783203125, -1.8525390625, -1.67724609375, -1.501953125, -1.32666015625, -1.1513671875, -0.97607421875, -0.80078125, -0.62548828125, -0.4501953125, -0.27490234375, -0.099609375, 0.07568359375, 0.2509765625, 0.42626953125, 0.6015625, 0.77685546875, 0.9521484375, 1.12744140625, 1.302734375, 1.47802734375, 1.6533203125, 1.82861328125, 2.00390625, 2.17919921875, 2.3544921875, 2.52978515625, 2.705078125, 2.88037109375, 3.0556640625, 3.23095703125, 3.40625, 3.58154296875, 3.7568359375, 3.93212890625, 4.107421875, 4.28271484375, 4.4580078125, 4.63330078125, 4.80859375, 4.98388671875, 5.1591796875, 5.33447265625, 5.509765625, 5.68505859375, 5.8603515625, 6.03564453125, 6.2109375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 4.0, 6.0, 5.0, 7.0, 15.0, 19.0, 17.0, 32.0, 42.0, 54.0, 59.0, 89.0, 137.0, 191.0, 367.0, 482.0, 720.0, 1198.0, 2226.0, 3986.0, 8031.0, 19506.0, 59506.0, 244702.0, 508610.0, 134699.0, 36671.0, 13344.0, 6050.0, 3174.0, 1742.0, 1022.0, 612.0, 356.0, 277.0, 180.0, 110.0, 83.0, 54.0, 42.0, 22.0, 22.0, 20.0, 18.0, 5.0, 11.0, 7.0, 6.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-8.0234375, -7.7750244140625, -7.526611328125, -7.2781982421875, -7.02978515625, -6.7813720703125, -6.532958984375, -6.2845458984375, -6.0361328125, -5.7877197265625, -5.539306640625, -5.2908935546875, -5.04248046875, -4.7940673828125, -4.545654296875, -4.2972412109375, -4.048828125, -3.8004150390625, -3.552001953125, -3.3035888671875, -3.05517578125, -2.8067626953125, -2.558349609375, -2.3099365234375, -2.0615234375, -1.8131103515625, -1.564697265625, -1.3162841796875, -1.06787109375, -0.8194580078125, -0.571044921875, -0.3226318359375, -0.07421875, 0.1741943359375, 0.422607421875, 0.6710205078125, 0.91943359375, 1.1678466796875, 1.416259765625, 1.6646728515625, 1.9130859375, 2.1614990234375, 2.409912109375, 2.6583251953125, 2.90673828125, 3.1551513671875, 3.403564453125, 3.6519775390625, 3.900390625, 4.1488037109375, 4.397216796875, 4.6456298828125, 4.89404296875, 5.1424560546875, 5.390869140625, 5.6392822265625, 5.8876953125, 6.1361083984375, 6.384521484375, 6.6329345703125, 6.88134765625, 7.1297607421875, 7.378173828125, 7.6265869140625, 7.875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 9.0, 11.0, 11.0, 13.0, 14.0, 18.0, 21.0, 25.0, 21.0, 28.0, 29.0, 28.0, 43.0, 37.0, 62.0, 68.0, 102.0, 140.0, 1406.0, 311.0, 135.0, 93.0, 61.0, 52.0, 53.0, 23.0, 28.0, 32.0, 23.0, 17.0, 19.0, 18.0, 16.0, 15.0, 9.0, 11.0, 10.0, 4.0, 9.0, 4.0, 2.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-15.9140625, -15.4583740234375, -15.002685546875, -14.5469970703125, -14.09130859375, -13.6356201171875, -13.179931640625, -12.7242431640625, -12.2685546875, -11.8128662109375, -11.357177734375, -10.9014892578125, -10.44580078125, -9.9901123046875, -9.534423828125, -9.0787353515625, -8.623046875, -8.1673583984375, -7.711669921875, -7.2559814453125, -6.80029296875, -6.3446044921875, -5.888916015625, -5.4332275390625, -4.9775390625, -4.5218505859375, -4.066162109375, -3.6104736328125, -3.15478515625, -2.6990966796875, -2.243408203125, -1.7877197265625, -1.33203125, -0.8763427734375, -0.420654296875, 0.0350341796875, 0.49072265625, 0.9464111328125, 1.402099609375, 1.8577880859375, 2.3134765625, 2.7691650390625, 3.224853515625, 3.6805419921875, 4.13623046875, 4.5919189453125, 5.047607421875, 5.5032958984375, 5.958984375, 6.4146728515625, 6.870361328125, 7.3260498046875, 7.78173828125, 8.2374267578125, 8.693115234375, 9.1488037109375, 9.6044921875, 10.0601806640625, 10.515869140625, 10.9715576171875, 11.42724609375, 11.8829345703125, 12.338623046875, 12.7943115234375, 13.25]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 2.0, 9.0, 6.0, 11.0, 11.0, 17.0, 16.0, 28.0, 35.0, 36.0, 44.0, 53.0, 71.0, 75.0, 123.0, 122.0, 209.0, 298.0, 644.0, 2321.0, 16534.0, 433589.0, 2634533.0, 49475.0, 4946.0, 1063.0, 414.0, 226.0, 162.0, 142.0, 96.0, 75.0, 67.0, 53.0, 41.0, 38.0, 23.0, 15.0, 26.0, 14.0, 11.0, 6.0, 3.0, 6.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.03125, -22.21484375, -21.3984375, -20.58203125, -19.765625, -18.94921875, -18.1328125, -17.31640625, -16.5, -15.68359375, -14.8671875, -14.05078125, -13.234375, -12.41796875, -11.6015625, -10.78515625, -9.96875, -9.15234375, -8.3359375, -7.51953125, -6.703125, -5.88671875, -5.0703125, -4.25390625, -3.4375, -2.62109375, -1.8046875, -0.98828125, -0.171875, 0.64453125, 1.4609375, 2.27734375, 3.09375, 3.91015625, 4.7265625, 5.54296875, 6.359375, 7.17578125, 7.9921875, 8.80859375, 9.625, 10.44140625, 11.2578125, 12.07421875, 12.890625, 13.70703125, 14.5234375, 15.33984375, 16.15625, 16.97265625, 17.7890625, 18.60546875, 19.421875, 20.23828125, 21.0546875, 21.87109375, 22.6875, 23.50390625, 24.3203125, 25.13671875, 25.953125, 26.76953125, 27.5859375, 28.40234375, 29.21875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 18.0, 57.0, 62.0, 122.0, 150.0, 179.0, 139.0, 122.0, 77.0, 41.0, 20.0, 9.0, 4.0, 3.0, 0.0, 1.0], "bins": [-76.39627838134766, -74.9651107788086, -73.53395080566406, -72.102783203125, -70.67162322998047, -69.2404556274414, -67.80929565429688, -66.37812805175781, -64.94696044921875, -63.51579666137695, -62.084632873535156, -60.653465270996094, -59.2223014831543, -57.7911376953125, -56.3599739074707, -54.928810119628906, -53.49764633178711, -52.06648254394531, -50.635318756103516, -49.20415496826172, -47.772987365722656, -46.34182357788086, -44.91065979003906, -43.479496002197266, -42.04833221435547, -40.61716842651367, -39.186004638671875, -37.75483703613281, -36.323673248291016, -34.89250946044922, -33.46134567260742, -32.030181884765625, -30.599010467529297, -29.1678466796875, -27.73668098449707, -26.305517196655273, -24.874351501464844, -23.443187713623047, -22.01202392578125, -20.580860137939453, -19.149696350097656, -17.71853256225586, -16.28736686706543, -14.856203079223633, -13.42503833770752, -11.993873596191406, -10.56270980834961, -9.131545066833496, -7.700379371643066, -6.269214630126953, -4.838050365447998, -3.406886100769043, -1.9757213592529297, -0.5445566177368164, 0.8866071701049805, 2.3177719116210938, 3.748936653137207, 5.18010139465332, 6.611265659332275, 8.04242992401123, 9.473594665527344, 10.904759407043457, 12.335923194885254, 13.767087936401367, 15.19825267791748]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 10.0, 9.0, 4.0, 14.0, 17.0, 7.0, 13.0, 10.0, 15.0, 22.0, 21.0, 25.0, 17.0, 30.0, 18.0, 31.0, 30.0, 44.0, 45.0, 41.0, 39.0, 32.0, 31.0, 35.0, 37.0, 36.0, 30.0, 36.0, 26.0, 21.0, 20.0, 36.0, 22.0, 23.0, 27.0, 17.0, 12.0, 14.0, 12.0, 15.0, 9.0, 10.0, 9.0, 4.0, 5.0, 4.0, 2.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-36.84569549560547, -35.63563919067383, -34.42558288574219, -33.21552276611328, -32.00546646118164, -30.79541015625, -29.58535385131836, -28.375295639038086, -27.165237426757812, -25.955181121826172, -24.7451229095459, -23.535066604614258, -22.325008392333984, -21.114952087402344, -19.904895782470703, -18.69483757019043, -17.48478126525879, -16.27472496032715, -15.064666748046875, -13.854610443115234, -12.644552230834961, -11.43449592590332, -10.224438667297363, -9.014381408691406, -7.804324150085449, -6.594266891479492, -5.384209632873535, -4.174152851104736, -2.9640955924987793, -1.7540383338928223, -0.5439815521240234, 0.6660757064819336, 1.8761329650878906, 3.0861902236938477, 4.296247482299805, 5.5063042640686035, 6.7163615226745605, 7.926418781280518, 9.136475563049316, 10.346532821655273, 11.55659008026123, 12.766647338867188, 13.976704597473145, 15.186761856079102, 16.396818161010742, 17.606876373291016, 18.816932678222656, 20.026988983154297, 21.23704719543457, 22.44710350036621, 23.657161712646484, 24.867218017578125, 26.0772762298584, 27.28733253479004, 28.497390747070312, 29.707447052001953, 30.917503356933594, 32.127559661865234, 33.337615966796875, 34.54767608642578, 35.75773239135742, 36.96778869628906, 38.1778450012207, 39.387901306152344, 40.59796142578125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 8.0, 21.0, 16.0, 13.0, 18.0, 20.0, 33.0, 41.0, 50.0, 34.0, 49.0, 41.0, 41.0, 45.0, 54.0, 54.0, 42.0, 47.0, 54.0, 44.0, 38.0, 41.0, 36.0, 24.0, 22.0, 18.0, 24.0, 11.0, 9.0, 10.0, 11.0, 2.0, 6.0, 6.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.14453125, -4.96136474609375, -4.7781982421875, -4.59503173828125, -4.411865234375, -4.22869873046875, -4.0455322265625, -3.86236572265625, -3.67919921875, -3.49603271484375, -3.3128662109375, -3.12969970703125, -2.946533203125, -2.76336669921875, -2.5802001953125, -2.39703369140625, -2.2138671875, -2.03070068359375, -1.8475341796875, -1.66436767578125, -1.481201171875, -1.29803466796875, -1.1148681640625, -0.93170166015625, -0.74853515625, -0.56536865234375, -0.3822021484375, -0.19903564453125, -0.015869140625, 0.16729736328125, 0.3504638671875, 0.53363037109375, 0.716796875, 0.89996337890625, 1.0831298828125, 1.26629638671875, 1.449462890625, 1.63262939453125, 1.8157958984375, 1.99896240234375, 2.18212890625, 2.36529541015625, 2.5484619140625, 2.73162841796875, 2.914794921875, 3.09796142578125, 3.2811279296875, 3.46429443359375, 3.6474609375, 3.83062744140625, 4.0137939453125, 4.19696044921875, 4.380126953125, 4.56329345703125, 4.7464599609375, 4.92962646484375, 5.11279296875, 5.29595947265625, 5.4791259765625, 5.66229248046875, 5.845458984375, 6.02862548828125, 6.2117919921875, 6.39495849609375, 6.578125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 4.0, 7.0, 11.0, 21.0, 26.0, 42.0, 67.0, 132.0, 219.0, 438.0, 791.0, 1926.0, 5024.0, 15389.0, 62460.0, 444948.0, 3016063.0, 548449.0, 71300.0, 17231.0, 5585.0, 2156.0, 904.0, 467.0, 236.0, 147.0, 84.0, 45.0, 37.0, 21.0, 15.0, 9.0, 3.0, 1.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.0625, -13.63037109375, -13.1982421875, -12.76611328125, -12.333984375, -11.90185546875, -11.4697265625, -11.03759765625, -10.60546875, -10.17333984375, -9.7412109375, -9.30908203125, -8.876953125, -8.44482421875, -8.0126953125, -7.58056640625, -7.1484375, -6.71630859375, -6.2841796875, -5.85205078125, -5.419921875, -4.98779296875, -4.5556640625, -4.12353515625, -3.69140625, -3.25927734375, -2.8271484375, -2.39501953125, -1.962890625, -1.53076171875, -1.0986328125, -0.66650390625, -0.234375, 0.19775390625, 0.6298828125, 1.06201171875, 1.494140625, 1.92626953125, 2.3583984375, 2.79052734375, 3.22265625, 3.65478515625, 4.0869140625, 4.51904296875, 4.951171875, 5.38330078125, 5.8154296875, 6.24755859375, 6.6796875, 7.11181640625, 7.5439453125, 7.97607421875, 8.408203125, 8.84033203125, 9.2724609375, 9.70458984375, 10.13671875, 10.56884765625, 11.0009765625, 11.43310546875, 11.865234375, 12.29736328125, 12.7294921875, 13.16162109375, 13.59375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 7.0, 8.0, 11.0, 12.0, 27.0, 30.0, 44.0, 53.0, 87.0, 93.0, 152.0, 194.0, 274.0, 388.0, 587.0, 629.0, 428.0, 297.0, 197.0, 147.0, 120.0, 74.0, 69.0, 35.0, 29.0, 18.0, 17.0, 10.0, 8.0, 5.0, 7.0, 2.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1875, -9.8795166015625, -9.571533203125, -9.2635498046875, -8.95556640625, -8.6475830078125, -8.339599609375, -8.0316162109375, -7.7236328125, -7.4156494140625, -7.107666015625, -6.7996826171875, -6.49169921875, -6.1837158203125, -5.875732421875, -5.5677490234375, -5.259765625, -4.9517822265625, -4.643798828125, -4.3358154296875, -4.02783203125, -3.7198486328125, -3.411865234375, -3.1038818359375, -2.7958984375, -2.4879150390625, -2.179931640625, -1.8719482421875, -1.56396484375, -1.2559814453125, -0.947998046875, -0.6400146484375, -0.33203125, -0.0240478515625, 0.283935546875, 0.5919189453125, 0.89990234375, 1.2078857421875, 1.515869140625, 1.8238525390625, 2.1318359375, 2.4398193359375, 2.747802734375, 3.0557861328125, 3.36376953125, 3.6717529296875, 3.979736328125, 4.2877197265625, 4.595703125, 4.9036865234375, 5.211669921875, 5.5196533203125, 5.82763671875, 6.1356201171875, 6.443603515625, 6.7515869140625, 7.0595703125, 7.3675537109375, 7.675537109375, 7.9835205078125, 8.29150390625, 8.5994873046875, 8.907470703125, 9.2154541015625, 9.5234375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 11.0, 9.0, 13.0, 25.0, 22.0, 48.0, 62.0, 78.0, 146.0, 235.0, 360.0, 833.0, 2648.0, 14156.0, 145787.0, 3061031.0, 905442.0, 53665.0, 6766.0, 1524.0, 606.0, 295.0, 175.0, 93.0, 68.0, 53.0, 36.0, 22.0, 20.0, 17.0, 11.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.75, -22.895751953125, -22.04150390625, -21.187255859375, -20.3330078125, -19.478759765625, -18.62451171875, -17.770263671875, -16.916015625, -16.061767578125, -15.20751953125, -14.353271484375, -13.4990234375, -12.644775390625, -11.79052734375, -10.936279296875, -10.08203125, -9.227783203125, -8.37353515625, -7.519287109375, -6.6650390625, -5.810791015625, -4.95654296875, -4.102294921875, -3.248046875, -2.393798828125, -1.53955078125, -0.685302734375, 0.1689453125, 1.023193359375, 1.87744140625, 2.731689453125, 3.5859375, 4.440185546875, 5.29443359375, 6.148681640625, 7.0029296875, 7.857177734375, 8.71142578125, 9.565673828125, 10.419921875, 11.274169921875, 12.12841796875, 12.982666015625, 13.8369140625, 14.691162109375, 15.54541015625, 16.399658203125, 17.25390625, 18.108154296875, 18.96240234375, 19.816650390625, 20.6708984375, 21.525146484375, 22.37939453125, 23.233642578125, 24.087890625, 24.942138671875, 25.79638671875, 26.650634765625, 27.5048828125, 28.359130859375, 29.21337890625, 30.067626953125, 30.921875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 10.0, 29.0, 35.0, 47.0, 70.0, 75.0, 100.0, 117.0, 114.0, 104.0, 71.0, 62.0, 69.0, 33.0, 26.0, 11.0, 15.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.11507034301758, -56.42194747924805, -54.72882080078125, -53.03569793701172, -51.34257507324219, -49.649452209472656, -47.956329345703125, -46.26320266723633, -44.5700798034668, -42.876956939697266, -41.18383026123047, -39.49070739746094, -37.797584533691406, -36.104461669921875, -34.411338806152344, -32.71821212768555, -31.025089263916016, -29.331966400146484, -27.63884162902832, -25.945716857910156, -24.252593994140625, -22.559471130371094, -20.86634635925293, -19.173221588134766, -17.480098724365234, -15.786974906921387, -14.093851089477539, -12.400727272033691, -10.707603454589844, -9.014479637145996, -7.321355819702148, -5.628232002258301, -3.9351119995117188, -2.241988182067871, -0.5488643646240234, 1.1442594528198242, 2.837383270263672, 4.5305070877075195, 6.223630905151367, 7.916754722595215, 9.609878540039062, 11.30300235748291, 12.996126174926758, 14.689249992370605, 16.382373809814453, 18.075496673583984, 19.76862144470215, 21.461746215820312, 23.154869079589844, 24.847991943359375, 26.54111671447754, 28.234241485595703, 29.927364349365234, 31.620487213134766, 33.31361389160156, 35.006736755371094, 36.699859619140625, 38.392982482910156, 40.08610534667969, 41.779232025146484, 43.472354888916016, 45.16547775268555, 46.858604431152344, 48.551727294921875, 50.244850158691406]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 5.0, 3.0, 6.0, 4.0, 11.0, 8.0, 11.0, 10.0, 17.0, 14.0, 18.0, 20.0, 25.0, 23.0, 21.0, 31.0, 30.0, 39.0, 25.0, 27.0, 40.0, 39.0, 24.0, 32.0, 30.0, 39.0, 47.0, 22.0, 37.0, 45.0, 27.0, 31.0, 24.0, 30.0, 23.0, 26.0, 15.0, 17.0, 22.0, 10.0, 15.0, 10.0, 12.0, 8.0, 6.0, 7.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-24.57305908203125, -23.747072219848633, -22.921085357666016, -22.09510040283203, -21.269113540649414, -20.443126678466797, -19.61713981628418, -18.791152954101562, -17.965167999267578, -17.13918113708496, -16.313194274902344, -15.487208366394043, -14.661222457885742, -13.835235595703125, -13.009248733520508, -12.18326187133789, -11.357275009155273, -10.531288146972656, -9.705302238464355, -8.879315376281738, -8.053329467773438, -7.22734260559082, -6.401355743408203, -5.575369358062744, -4.749382972717285, -3.923396587371826, -3.097409963607788, -2.27142333984375, -1.445436954498291, -0.619450569152832, 0.20653629302978516, 1.0325226783752441, 1.8585090637207031, 2.684495449066162, 3.5104820728302, 4.336468696594238, 5.162455081939697, 5.988441467285156, 6.814428329467773, 7.640414714813232, 8.466401100158691, 9.292387962341309, 10.11837387084961, 10.944360733032227, 11.770347595214844, 12.596333503723145, 13.422320365905762, 14.248306274414062, 15.07429313659668, 15.900279998779297, 16.726266860961914, 17.55225372314453, 18.378238677978516, 19.204225540161133, 20.03021240234375, 20.856199264526367, 21.682186126708984, 22.5081729888916, 23.33415985107422, 24.160144805908203, 24.98613166809082, 25.812118530273438, 26.638105392456055, 27.464092254638672, 28.290077209472656]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 20.0, 13.0, 18.0, 23.0, 20.0, 24.0, 22.0, 36.0, 35.0, 45.0, 51.0, 44.0, 43.0, 35.0, 47.0, 47.0, 54.0, 37.0, 50.0, 47.0, 37.0, 46.0, 36.0, 27.0, 30.0, 19.0, 13.0, 17.0, 12.0, 12.0, 7.0, 10.0, 6.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44140625, -5.26190185546875, -5.0823974609375, -4.90289306640625, -4.723388671875, -4.54388427734375, -4.3643798828125, -4.18487548828125, -4.00537109375, -3.82586669921875, -3.6463623046875, -3.46685791015625, -3.287353515625, -3.10784912109375, -2.9283447265625, -2.74884033203125, -2.5693359375, -2.38983154296875, -2.2103271484375, -2.03082275390625, -1.851318359375, -1.67181396484375, -1.4923095703125, -1.31280517578125, -1.13330078125, -0.95379638671875, -0.7742919921875, -0.59478759765625, -0.415283203125, -0.23577880859375, -0.0562744140625, 0.12322998046875, 0.302734375, 0.48223876953125, 0.6617431640625, 0.84124755859375, 1.020751953125, 1.20025634765625, 1.3797607421875, 1.55926513671875, 1.73876953125, 1.91827392578125, 2.0977783203125, 2.27728271484375, 2.456787109375, 2.63629150390625, 2.8157958984375, 2.99530029296875, 3.1748046875, 3.35430908203125, 3.5338134765625, 3.71331787109375, 3.892822265625, 4.07232666015625, 4.2518310546875, 4.43133544921875, 4.61083984375, 4.79034423828125, 4.9698486328125, 5.14935302734375, 5.328857421875, 5.50836181640625, 5.6878662109375, 5.86737060546875, 6.046875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 2.0, 6.0, 7.0, 13.0, 13.0, 20.0, 31.0, 41.0, 58.0, 102.0, 117.0, 151.0, 222.0, 340.0, 467.0, 708.0, 1072.0, 1497.0, 2191.0, 3340.0, 5029.0, 7599.0, 11383.0, 17506.0, 27416.0, 45723.0, 78823.0, 153309.0, 287904.0, 177948.0, 88634.0, 50322.0, 30459.0, 18967.0, 12254.0, 8153.0, 5518.0, 3503.0, 2448.0, 1614.0, 1213.0, 800.0, 511.0, 349.0, 250.0, 139.0, 108.0, 71.0, 52.0, 51.0, 32.0, 22.0, 16.0, 13.0, 13.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.176513671875, -0.1709270477294922, -0.16534042358398438, -0.15975379943847656, -0.15416717529296875, -0.14858055114746094, -0.14299392700195312, -0.1374073028564453, -0.1318206787109375, -0.1262340545654297, -0.12064743041992188, -0.11506080627441406, -0.10947418212890625, -0.10388755798339844, -0.09830093383789062, -0.09271430969238281, -0.087127685546875, -0.08154106140136719, -0.07595443725585938, -0.07036781311035156, -0.06478118896484375, -0.05919456481933594, -0.053607940673828125, -0.04802131652832031, -0.0424346923828125, -0.03684806823730469, -0.031261444091796875, -0.025674819946289062, -0.02008819580078125, -0.014501571655273438, -0.008914947509765625, -0.0033283233642578125, 0.00225830078125, 0.007844924926757812, 0.013431549072265625, 0.019018173217773438, 0.02460479736328125, 0.030191421508789062, 0.035778045654296875, 0.04136466979980469, 0.0469512939453125, 0.05253791809082031, 0.058124542236328125, 0.06371116638183594, 0.06929779052734375, 0.07488441467285156, 0.08047103881835938, 0.08605766296386719, 0.091644287109375, 0.09723091125488281, 0.10281753540039062, 0.10840415954589844, 0.11399078369140625, 0.11957740783691406, 0.12516403198242188, 0.1307506561279297, 0.1363372802734375, 0.1419239044189453, 0.14751052856445312, 0.15309715270996094, 0.15868377685546875, 0.16427040100097656, 0.16985702514648438, 0.1754436492919922, 0.1810302734375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 3.0, 6.0, 5.0, 6.0, 8.0, 12.0, 17.0, 15.0, 12.0, 16.0, 23.0, 11.0, 20.0, 25.0, 38.0, 22.0, 36.0, 28.0, 44.0, 42.0, 36.0, 1068.0, 50.0, 53.0, 38.0, 41.0, 40.0, 40.0, 40.0, 35.0, 24.0, 23.0, 28.0, 25.0, 14.0, 15.0, 15.0, 13.0, 9.0, 10.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.396484375, -3.290252685546875, -3.18402099609375, -3.077789306640625, -2.9715576171875, -2.865325927734375, -2.75909423828125, -2.652862548828125, -2.546630859375, -2.440399169921875, -2.33416748046875, -2.227935791015625, -2.1217041015625, -2.015472412109375, -1.90924072265625, -1.803009033203125, -1.69677734375, -1.590545654296875, -1.48431396484375, -1.378082275390625, -1.2718505859375, -1.165618896484375, -1.05938720703125, -0.953155517578125, -0.846923828125, -0.740692138671875, -0.63446044921875, -0.528228759765625, -0.4219970703125, -0.315765380859375, -0.20953369140625, -0.103302001953125, 0.0029296875, 0.109161376953125, 0.21539306640625, 0.321624755859375, 0.4278564453125, 0.534088134765625, 0.64031982421875, 0.746551513671875, 0.852783203125, 0.959014892578125, 1.06524658203125, 1.171478271484375, 1.2777099609375, 1.383941650390625, 1.49017333984375, 1.596405029296875, 1.70263671875, 1.808868408203125, 1.91510009765625, 2.021331787109375, 2.1275634765625, 2.233795166015625, 2.34002685546875, 2.446258544921875, 2.552490234375, 2.658721923828125, 2.76495361328125, 2.871185302734375, 2.9774169921875, 3.083648681640625, 3.18988037109375, 3.296112060546875, 3.40234375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 5.0, 9.0, 12.0, 28.0, 33.0, 63.0, 73.0, 122.0, 190.0, 289.0, 474.0, 725.0, 1130.0, 1827.0, 2921.0, 4698.0, 7386.0, 12079.0, 19800.0, 33098.0, 57146.0, 113191.0, 928723.0, 656874.0, 112983.0, 58249.0, 33108.0, 19908.0, 12112.0, 7385.0, 4559.0, 2969.0, 1784.0, 1161.0, 694.0, 473.0, 293.0, 201.0, 125.0, 87.0, 49.0, 32.0, 21.0, 20.0, 8.0, 8.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.1259765625, -0.12215900421142578, -0.11834144592285156, -0.11452388763427734, -0.11070632934570312, -0.1068887710571289, -0.10307121276855469, -0.09925365447998047, -0.09543609619140625, -0.09161853790283203, -0.08780097961425781, -0.0839834213256836, -0.08016586303710938, -0.07634830474853516, -0.07253074645996094, -0.06871318817138672, -0.0648956298828125, -0.06107807159423828, -0.05726051330566406, -0.053442955017089844, -0.049625396728515625, -0.045807838439941406, -0.04199028015136719, -0.03817272186279297, -0.03435516357421875, -0.03053760528564453, -0.026720046997070312, -0.022902488708496094, -0.019084930419921875, -0.015267372131347656, -0.011449813842773438, -0.007632255554199219, -0.003814697265625, 2.86102294921875e-06, 0.0038204193115234375, 0.007637977600097656, 0.011455535888671875, 0.015273094177246094, 0.019090652465820312, 0.02290821075439453, 0.02672576904296875, 0.03054332733154297, 0.03436088562011719, 0.038178443908691406, 0.041996002197265625, 0.045813560485839844, 0.04963111877441406, 0.05344867706298828, 0.0572662353515625, 0.06108379364013672, 0.06490135192871094, 0.06871891021728516, 0.07253646850585938, 0.0763540267944336, 0.08017158508300781, 0.08398914337158203, 0.08780670166015625, 0.09162425994873047, 0.09544181823730469, 0.0992593765258789, 0.10307693481445312, 0.10689449310302734, 0.11071205139160156, 0.11452960968017578, 0.11834716796875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 3.0, 13.0, 10.0, 8.0, 15.0, 12.0, 15.0, 19.0, 19.0, 28.0, 31.0, 28.0, 38.0, 45.0, 48.0, 34.0, 49.0, 41.0, 31.0, 39.0, 47.0, 34.0, 43.0, 41.0, 36.0, 41.0, 29.0, 27.0, 24.0, 26.0, 24.0, 18.0, 16.0, 11.0, 13.0, 9.0, 6.0, 6.0, 4.0, 2.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.202127456665039e-05, -4.076492041349411e-05, -3.950856626033783e-05, -3.825221210718155e-05, -3.699585795402527e-05, -3.573950380086899e-05, -3.448314964771271e-05, -3.322679549455643e-05, -3.1970441341400146e-05, -3.0714087188243866e-05, -2.9457733035087585e-05, -2.8201378881931305e-05, -2.6945024728775024e-05, -2.5688670575618744e-05, -2.4432316422462463e-05, -2.3175962269306183e-05, -2.1919608116149902e-05, -2.0663253962993622e-05, -1.940689980983734e-05, -1.815054565668106e-05, -1.689419150352478e-05, -1.56378373503685e-05, -1.438148319721222e-05, -1.3125129044055939e-05, -1.1868774890899658e-05, -1.0612420737743378e-05, -9.356066584587097e-06, -8.099712431430817e-06, -6.843358278274536e-06, -5.587004125118256e-06, -4.330649971961975e-06, -3.0742958188056946e-06, -1.817941665649414e-06, -5.615875124931335e-07, 6.94766640663147e-07, 1.9511207938194275e-06, 3.207474946975708e-06, 4.4638291001319885e-06, 5.720183253288269e-06, 6.9765374064445496e-06, 8.23289155960083e-06, 9.48924571275711e-06, 1.0745599865913391e-05, 1.2001954019069672e-05, 1.3258308172225952e-05, 1.4514662325382233e-05, 1.5771016478538513e-05, 1.7027370631694794e-05, 1.8283724784851074e-05, 1.9540078938007355e-05, 2.0796433091163635e-05, 2.2052787244319916e-05, 2.3309141397476196e-05, 2.4565495550632477e-05, 2.5821849703788757e-05, 2.7078203856945038e-05, 2.833455801010132e-05, 2.95909121632576e-05, 3.084726631641388e-05, 3.210362046957016e-05, 3.335997462272644e-05, 3.461632877588272e-05, 3.5872682929039e-05, 3.712903708219528e-05, 3.838539123535156e-05]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 0.0, 5.0, 2.0, 1.0, 6.0, 3.0, 3.0, 4.0, 9.0, 15.0, 10.0, 6.0, 13.0, 26.0, 22.0, 28.0, 26.0, 36.0, 48.0, 53.0, 84.0, 140.0, 221.0, 673.0, 4755.0, 153984.0, 819659.0, 64934.0, 2687.0, 507.0, 190.0, 100.0, 69.0, 39.0, 34.0, 26.0, 28.0, 22.0, 22.0, 7.0, 9.0, 12.0, 11.0, 7.0, 7.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0006852149963378906, -0.0006626620888710022, -0.0006401091814041138, -0.0006175562739372253, -0.0005950033664703369, -0.0005724504590034485, -0.0005498975515365601, -0.0005273446440696716, -0.0005047917366027832, -0.0004822388291358948, -0.00045968592166900635, -0.0004371330142021179, -0.0004145801067352295, -0.00039202719926834106, -0.00036947429180145264, -0.0003469213843345642, -0.0003243684768676758, -0.00030181556940078735, -0.0002792626619338989, -0.0002567097544670105, -0.00023415684700012207, -0.00021160393953323364, -0.00018905103206634521, -0.0001664981245994568, -0.00014394521713256836, -0.00012139230966567993, -9.88394021987915e-05, -7.628649473190308e-05, -5.373358726501465e-05, -3.118067979812622e-05, -8.627772331237793e-06, 1.3925135135650635e-05, 3.647804260253906e-05, 5.903095006942749e-05, 8.158385753631592e-05, 0.00010413676500320435, 0.00012668967247009277, 0.0001492425799369812, 0.00017179548740386963, 0.00019434839487075806, 0.00021690130233764648, 0.0002394542098045349, 0.00026200711727142334, 0.00028456002473831177, 0.0003071129322052002, 0.0003296658396720886, 0.00035221874713897705, 0.0003747716546058655, 0.0003973245620727539, 0.00041987746953964233, 0.00044243037700653076, 0.0004649832844734192, 0.0004875361919403076, 0.000510089099407196, 0.0005326420068740845, 0.0005551949143409729, 0.0005777478218078613, 0.0006003007292747498, 0.0006228536367416382, 0.0006454065442085266, 0.000667959451675415, 0.0006905123591423035, 0.0007130652666091919, 0.0007356181740760803, 0.0007581710815429688]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 22.0, 345.0, 607.0, 44.0], "bins": [-0.0008578122942708433, -0.0008440157980658114, -0.0008302193018607795, -0.0008164228056557477, -0.0008026263094507158, -0.0007888298714533448, -0.000775033375248313, -0.0007612368790432811, -0.0007474403828382492, -0.0007336438866332173, -0.0007198473904281855, -0.0007060508942231536, -0.0006922543980181217, -0.0006784579018130898, -0.000664661405608058, -0.000650864967610687, -0.0006370684131979942, -0.0006232719169929624, -0.0006094754207879305, -0.0005956789245828986, -0.0005818824283778667, -0.0005680859321728349, -0.000554289435967803, -0.000540492997970432, -0.0005266965017654002, -0.0005129000055603683, -0.0004991035093553364, -0.00048530701315030456, -0.00047151054604910314, -0.00045771404984407127, -0.0004439175536390394, -0.0004301210574340075, -0.0004163245903328061, -0.00040252809412777424, -0.00038873159792274237, -0.0003749351017177105, -0.0003611386346165091, -0.0003473421384114772, -0.00033354564220644534, -0.00031974914600141346, -0.00030595267890021205, -0.0002921561826951802, -0.0002783596864901483, -0.00026456319028511643, -0.000250766723183915, -0.00023697022697888315, -0.00022317373077385128, -0.0002093772345688194, -0.00019558073836378753, -0.00018178424215875566, -0.00016798776050563902, -0.00015419126430060714, -0.0001403947826474905, -0.00012659828644245863, -0.00011280179023742676, -9.90053013083525e-05, -8.520881237927824e-05, -7.141232345020398e-05, -5.761583088315092e-05, -4.3819338316097856e-05, -3.0022849387023598e-05, -1.622636045794934e-05, -2.4298642529174685e-06, 1.1366624676156789e-05, 2.516310996725224e-05]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 9.0, 12.0, 13.0, 12.0, 22.0, 16.0, 23.0, 31.0, 29.0, 48.0, 52.0, 51.0, 51.0, 57.0, 64.0, 47.0, 59.0, 60.0, 50.0, 41.0, 46.0, 46.0, 35.0, 29.0, 21.0, 23.0, 13.0, 13.0, 11.0, 10.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9027462005615234e-05, -2.7797184884548187e-05, -2.656690776348114e-05, -2.5336630642414093e-05, -2.4106353521347046e-05, -2.287607640028e-05, -2.164579927921295e-05, -2.0415522158145905e-05, -1.9185245037078857e-05, -1.795496791601181e-05, -1.6724690794944763e-05, -1.5494413673877716e-05, -1.4264136552810669e-05, -1.3033859431743622e-05, -1.1803582310676575e-05, -1.0573305189609528e-05, -9.34302806854248e-06, -8.112750947475433e-06, -6.882473826408386e-06, -5.652196705341339e-06, -4.421919584274292e-06, -3.191642463207245e-06, -1.9613653421401978e-06, -7.310882210731506e-07, 4.991888999938965e-07, 1.7294660210609436e-06, 2.9597431421279907e-06, 4.190020263195038e-06, 5.420297384262085e-06, 6.650574505329132e-06, 7.88085162639618e-06, 9.111128747463226e-06, 1.0341405868530273e-05, 1.157168298959732e-05, 1.2801960110664368e-05, 1.4032237231731415e-05, 1.5262514352798462e-05, 1.649279147386551e-05, 1.7723068594932556e-05, 1.8953345715999603e-05, 2.018362283706665e-05, 2.1413899958133698e-05, 2.2644177079200745e-05, 2.3874454200267792e-05, 2.510473132133484e-05, 2.6335008442401886e-05, 2.7565285563468933e-05, 2.879556268453598e-05, 3.0025839805603027e-05, 3.1256116926670074e-05, 3.248639404773712e-05, 3.371667116880417e-05, 3.4946948289871216e-05, 3.617722541093826e-05, 3.740750253200531e-05, 3.863777965307236e-05, 3.9868056774139404e-05, 4.109833389520645e-05, 4.23286110162735e-05, 4.3558888137340546e-05, 4.478916525840759e-05, 4.601944237947464e-05, 4.724971950054169e-05, 4.8479996621608734e-05, 4.971027374267578e-05]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 20.0, 13.0, 18.0, 23.0, 20.0, 24.0, 22.0, 36.0, 35.0, 45.0, 51.0, 44.0, 43.0, 35.0, 47.0, 47.0, 54.0, 37.0, 50.0, 47.0, 37.0, 46.0, 36.0, 27.0, 30.0, 19.0, 13.0, 17.0, 12.0, 12.0, 7.0, 10.0, 6.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44140625, -5.26190185546875, -5.0823974609375, -4.90289306640625, -4.723388671875, -4.54388427734375, -4.3643798828125, -4.18487548828125, -4.00537109375, -3.82586669921875, -3.6463623046875, -3.46685791015625, -3.287353515625, -3.10784912109375, -2.9283447265625, -2.74884033203125, -2.5693359375, -2.38983154296875, -2.2103271484375, -2.03082275390625, -1.851318359375, -1.67181396484375, -1.4923095703125, -1.31280517578125, -1.13330078125, -0.95379638671875, -0.7742919921875, -0.59478759765625, -0.415283203125, -0.23577880859375, -0.0562744140625, 0.12322998046875, 0.302734375, 0.48223876953125, 0.6617431640625, 0.84124755859375, 1.020751953125, 1.20025634765625, 1.3797607421875, 1.55926513671875, 1.73876953125, 1.91827392578125, 2.0977783203125, 2.27728271484375, 2.456787109375, 2.63629150390625, 2.8157958984375, 2.99530029296875, 3.1748046875, 3.35430908203125, 3.5338134765625, 3.71331787109375, 3.892822265625, 4.07232666015625, 4.2518310546875, 4.43133544921875, 4.61083984375, 4.79034423828125, 4.9698486328125, 5.14935302734375, 5.328857421875, 5.50836181640625, 5.6878662109375, 5.86737060546875, 6.046875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 10.0, 9.0, 13.0, 12.0, 15.0, 31.0, 33.0, 58.0, 62.0, 122.0, 162.0, 261.0, 426.0, 652.0, 1125.0, 1866.0, 3526.0, 7285.0, 17349.0, 54823.0, 253564.0, 532893.0, 120126.0, 31109.0, 11258.0, 5180.0, 2658.0, 1480.0, 855.0, 550.0, 345.0, 228.0, 141.0, 102.0, 66.0, 43.0, 23.0, 28.0, 21.0, 9.0, 9.0, 6.0, 5.0, 2.0, 5.0, 0.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.875, -5.6871337890625, -5.499267578125, -5.3114013671875, -5.12353515625, -4.9356689453125, -4.747802734375, -4.5599365234375, -4.3720703125, -4.1842041015625, -3.996337890625, -3.8084716796875, -3.62060546875, -3.4327392578125, -3.244873046875, -3.0570068359375, -2.869140625, -2.6812744140625, -2.493408203125, -2.3055419921875, -2.11767578125, -1.9298095703125, -1.741943359375, -1.5540771484375, -1.3662109375, -1.1783447265625, -0.990478515625, -0.8026123046875, -0.61474609375, -0.4268798828125, -0.239013671875, -0.0511474609375, 0.13671875, 0.3245849609375, 0.512451171875, 0.7003173828125, 0.88818359375, 1.0760498046875, 1.263916015625, 1.4517822265625, 1.6396484375, 1.8275146484375, 2.015380859375, 2.2032470703125, 2.39111328125, 2.5789794921875, 2.766845703125, 2.9547119140625, 3.142578125, 3.3304443359375, 3.518310546875, 3.7061767578125, 3.89404296875, 4.0819091796875, 4.269775390625, 4.4576416015625, 4.6455078125, 4.8333740234375, 5.021240234375, 5.2091064453125, 5.39697265625, 5.5848388671875, 5.772705078125, 5.9605712890625, 6.1484375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 5.0, 7.0, 8.0, 5.0, 12.0, 14.0, 21.0, 16.0, 30.0, 17.0, 35.0, 23.0, 28.0, 27.0, 34.0, 46.0, 46.0, 63.0, 94.0, 322.0, 1542.0, 156.0, 76.0, 58.0, 47.0, 41.0, 29.0, 38.0, 27.0, 45.0, 18.0, 20.0, 21.0, 13.0, 18.0, 9.0, 9.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4140625, -14.9190673828125, -14.424072265625, -13.9290771484375, -13.43408203125, -12.9390869140625, -12.444091796875, -11.9490966796875, -11.4541015625, -10.9591064453125, -10.464111328125, -9.9691162109375, -9.47412109375, -8.9791259765625, -8.484130859375, -7.9891357421875, -7.494140625, -6.9991455078125, -6.504150390625, -6.0091552734375, -5.51416015625, -5.0191650390625, -4.524169921875, -4.0291748046875, -3.5341796875, -3.0391845703125, -2.544189453125, -2.0491943359375, -1.55419921875, -1.0592041015625, -0.564208984375, -0.0692138671875, 0.42578125, 0.9207763671875, 1.415771484375, 1.9107666015625, 2.40576171875, 2.9007568359375, 3.395751953125, 3.8907470703125, 4.3857421875, 4.8807373046875, 5.375732421875, 5.8707275390625, 6.36572265625, 6.8607177734375, 7.355712890625, 7.8507080078125, 8.345703125, 8.8406982421875, 9.335693359375, 9.8306884765625, 10.32568359375, 10.8206787109375, 11.315673828125, 11.8106689453125, 12.3056640625, 12.8006591796875, 13.295654296875, 13.7906494140625, 14.28564453125, 14.7806396484375, 15.275634765625, 15.7706298828125, 16.265625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 4.0, 10.0, 10.0, 14.0, 17.0, 22.0, 47.0, 36.0, 43.0, 81.0, 94.0, 118.0, 180.0, 269.0, 505.0, 1103.0, 4401.0, 43034.0, 2862960.0, 219009.0, 10116.0, 1825.0, 649.0, 364.0, 208.0, 128.0, 99.0, 75.0, 65.0, 51.0, 29.0, 29.0, 22.0, 18.0, 17.0, 14.0, 9.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0], "bins": [-27.71875, -26.896728515625, -26.07470703125, -25.252685546875, -24.4306640625, -23.608642578125, -22.78662109375, -21.964599609375, -21.142578125, -20.320556640625, -19.49853515625, -18.676513671875, -17.8544921875, -17.032470703125, -16.21044921875, -15.388427734375, -14.56640625, -13.744384765625, -12.92236328125, -12.100341796875, -11.2783203125, -10.456298828125, -9.63427734375, -8.812255859375, -7.990234375, -7.168212890625, -6.34619140625, -5.524169921875, -4.7021484375, -3.880126953125, -3.05810546875, -2.236083984375, -1.4140625, -0.592041015625, 0.22998046875, 1.052001953125, 1.8740234375, 2.696044921875, 3.51806640625, 4.340087890625, 5.162109375, 5.984130859375, 6.80615234375, 7.628173828125, 8.4501953125, 9.272216796875, 10.09423828125, 10.916259765625, 11.73828125, 12.560302734375, 13.38232421875, 14.204345703125, 15.0263671875, 15.848388671875, 16.67041015625, 17.492431640625, 18.314453125, 19.136474609375, 19.95849609375, 20.780517578125, 21.6025390625, 22.424560546875, 23.24658203125, 24.068603515625, 24.890625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [2.0, 56.0, 831.0, 127.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.220638275146484, -13.68605899810791, -5.151479721069336, 3.383098602294922, 11.917678833007812, 20.452259063720703, 28.986835479736328, 37.52141571044922, 46.05599594116211, 54.590576171875, 63.125152587890625, 71.65972900390625, 80.1943130493164, 88.72889709472656, 97.26347351074219, 105.79804992675781, 114.33262634277344, 122.86720275878906, 131.4017791748047, 139.93637084960938, 148.470947265625, 157.00552368164062, 165.54010009765625, 174.07467651367188, 182.60926818847656, 191.1438446044922, 199.6784210205078, 208.2130126953125, 216.74758911132812, 225.28216552734375, 233.81674194335938, 242.351318359375, 250.88589477539062, 259.42047119140625, 267.9550476074219, 276.4896240234375, 285.0242004394531, 293.55877685546875, 302.0933837890625, 310.6279602050781, 319.16253662109375, 327.6971130371094, 336.231689453125, 344.7662658691406, 353.30084228515625, 361.83544921875, 370.3699951171875, 378.90460205078125, 387.43914794921875, 395.9737243652344, 404.50830078125, 413.0428771972656, 421.57745361328125, 430.112060546875, 438.6466064453125, 447.18121337890625, 455.7157897949219, 464.2503662109375, 472.7849426269531, 481.31951904296875, 489.8540954589844, 498.388671875, 506.92327880859375, 515.4578247070312, 523.992431640625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 8.0, 9.0, 9.0, 5.0, 13.0, 13.0, 16.0, 26.0, 18.0, 16.0, 30.0, 33.0, 32.0, 44.0, 35.0, 43.0, 32.0, 35.0, 48.0, 37.0, 33.0, 54.0, 41.0, 45.0, 40.0, 34.0, 33.0, 22.0, 26.0, 25.0, 29.0, 21.0, 19.0, 12.0, 9.0, 15.0, 9.0, 7.0, 4.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.14728927612305, -47.708553314208984, -46.26981735229492, -44.83108139038086, -43.39234161376953, -41.95360565185547, -40.514869689941406, -39.076133728027344, -37.63739776611328, -36.19866180419922, -34.759925842285156, -33.321189880371094, -31.8824520111084, -30.443716049194336, -29.00497817993164, -27.566242218017578, -26.127506256103516, -24.688770294189453, -23.25003433227539, -21.811296463012695, -20.372560501098633, -18.93382453918457, -17.495086669921875, -16.056350708007812, -14.61761474609375, -13.178878784179688, -11.740141868591309, -10.30140495300293, -8.862668991088867, -7.4239325523376465, -5.985196113586426, -4.546459197998047, -3.1077232360839844, -1.6689867973327637, -0.23025035858154297, 1.2084860801696777, 2.6472225189208984, 4.085958957672119, 5.52469539642334, 6.963432312011719, 8.402168273925781, 9.840904235839844, 11.279641151428223, 12.718378067016602, 14.157114028930664, 15.595849990844727, 17.034587860107422, 18.473323822021484, 19.912059783935547, 21.35079574584961, 22.789531707763672, 24.228269577026367, 25.66700553894043, 27.105741500854492, 28.544479370117188, 29.98321533203125, 31.421951293945312, 32.860687255859375, 34.29942321777344, 35.7381591796875, 37.17689514160156, 38.61563491821289, 40.05437088012695, 41.493106842041016, 42.93184280395508]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 16.0, 18.0, 17.0, 18.0, 24.0, 24.0, 32.0, 37.0, 39.0, 45.0, 41.0, 53.0, 38.0, 40.0, 44.0, 56.0, 41.0, 44.0, 45.0, 51.0, 36.0, 41.0, 33.0, 27.0, 26.0, 16.0, 12.0, 17.0, 12.0, 12.0, 11.0, 5.0, 3.0, 4.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40625, -5.2254638671875, -5.044677734375, -4.8638916015625, -4.68310546875, -4.5023193359375, -4.321533203125, -4.1407470703125, -3.9599609375, -3.7791748046875, -3.598388671875, -3.4176025390625, -3.23681640625, -3.0560302734375, -2.875244140625, -2.6944580078125, -2.513671875, -2.3328857421875, -2.152099609375, -1.9713134765625, -1.79052734375, -1.6097412109375, -1.428955078125, -1.2481689453125, -1.0673828125, -0.8865966796875, -0.705810546875, -0.5250244140625, -0.34423828125, -0.1634521484375, 0.017333984375, 0.1981201171875, 0.37890625, 0.5596923828125, 0.740478515625, 0.9212646484375, 1.10205078125, 1.2828369140625, 1.463623046875, 1.6444091796875, 1.8251953125, 2.0059814453125, 2.186767578125, 2.3675537109375, 2.54833984375, 2.7291259765625, 2.909912109375, 3.0906982421875, 3.271484375, 3.4522705078125, 3.633056640625, 3.8138427734375, 3.99462890625, 4.1754150390625, 4.356201171875, 4.5369873046875, 4.7177734375, 4.8985595703125, 5.079345703125, 5.2601318359375, 5.44091796875, 5.6217041015625, 5.802490234375, 5.9832763671875, 6.1640625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 2.0, 7.0, 5.0, 7.0, 17.0, 20.0, 25.0, 31.0, 53.0, 95.0, 163.0, 205.0, 376.0, 649.0, 1288.0, 2815.0, 7086.0, 22308.0, 89969.0, 677138.0, 2852694.0, 441134.0, 68669.0, 18283.0, 6103.0, 2491.0, 1117.0, 588.0, 312.0, 249.0, 109.0, 85.0, 51.0, 41.0, 25.0, 24.0, 14.0, 7.0, 6.0, 6.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-13.484375, -13.080810546875, -12.67724609375, -12.273681640625, -11.8701171875, -11.466552734375, -11.06298828125, -10.659423828125, -10.255859375, -9.852294921875, -9.44873046875, -9.045166015625, -8.6416015625, -8.238037109375, -7.83447265625, -7.430908203125, -7.02734375, -6.623779296875, -6.22021484375, -5.816650390625, -5.4130859375, -5.009521484375, -4.60595703125, -4.202392578125, -3.798828125, -3.395263671875, -2.99169921875, -2.588134765625, -2.1845703125, -1.781005859375, -1.37744140625, -0.973876953125, -0.5703125, -0.166748046875, 0.23681640625, 0.640380859375, 1.0439453125, 1.447509765625, 1.85107421875, 2.254638671875, 2.658203125, 3.061767578125, 3.46533203125, 3.868896484375, 4.2724609375, 4.676025390625, 5.07958984375, 5.483154296875, 5.88671875, 6.290283203125, 6.69384765625, 7.097412109375, 7.5009765625, 7.904541015625, 8.30810546875, 8.711669921875, 9.115234375, 9.518798828125, 9.92236328125, 10.325927734375, 10.7294921875, 11.133056640625, 11.53662109375, 11.940185546875, 12.34375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 10.0, 22.0, 24.0, 40.0, 74.0, 112.0, 162.0, 286.0, 484.0, 761.0, 827.0, 486.0, 294.0, 183.0, 103.0, 66.0, 48.0, 32.0, 20.0, 15.0, 14.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.375, -17.927001953125, -17.47900390625, -17.031005859375, -16.5830078125, -16.135009765625, -15.68701171875, -15.239013671875, -14.791015625, -14.343017578125, -13.89501953125, -13.447021484375, -12.9990234375, -12.551025390625, -12.10302734375, -11.655029296875, -11.20703125, -10.759033203125, -10.31103515625, -9.863037109375, -9.4150390625, -8.967041015625, -8.51904296875, -8.071044921875, -7.623046875, -7.175048828125, -6.72705078125, -6.279052734375, -5.8310546875, -5.383056640625, -4.93505859375, -4.487060546875, -4.0390625, -3.591064453125, -3.14306640625, -2.695068359375, -2.2470703125, -1.799072265625, -1.35107421875, -0.903076171875, -0.455078125, -0.007080078125, 0.44091796875, 0.888916015625, 1.3369140625, 1.784912109375, 2.23291015625, 2.680908203125, 3.12890625, 3.576904296875, 4.02490234375, 4.472900390625, 4.9208984375, 5.368896484375, 5.81689453125, 6.264892578125, 6.712890625, 7.160888671875, 7.60888671875, 8.056884765625, 8.5048828125, 8.952880859375, 9.40087890625, 9.848876953125, 10.296875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 14.0, 11.0, 24.0, 22.0, 37.0, 65.0, 118.0, 230.0, 426.0, 1019.0, 10534.0, 1297104.0, 2866377.0, 16106.0, 1205.0, 428.0, 240.0, 147.0, 71.0, 42.0, 24.0, 16.0, 6.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.75, -40.083984375, -38.41796875, -36.751953125, -35.0859375, -33.419921875, -31.75390625, -30.087890625, -28.421875, -26.755859375, -25.08984375, -23.423828125, -21.7578125, -20.091796875, -18.42578125, -16.759765625, -15.09375, -13.427734375, -11.76171875, -10.095703125, -8.4296875, -6.763671875, -5.09765625, -3.431640625, -1.765625, -0.099609375, 1.56640625, 3.232421875, 4.8984375, 6.564453125, 8.23046875, 9.896484375, 11.5625, 13.228515625, 14.89453125, 16.560546875, 18.2265625, 19.892578125, 21.55859375, 23.224609375, 24.890625, 26.556640625, 28.22265625, 29.888671875, 31.5546875, 33.220703125, 34.88671875, 36.552734375, 38.21875, 39.884765625, 41.55078125, 43.216796875, 44.8828125, 46.548828125, 48.21484375, 49.880859375, 51.546875, 53.212890625, 54.87890625, 56.544921875, 58.2109375, 59.876953125, 61.54296875, 63.208984375, 64.875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 8.0, 11.0, 35.0, 57.0, 103.0, 120.0, 163.0, 157.0, 134.0, 92.0, 63.0, 29.0, 19.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.79570007324219, -81.18170928955078, -78.56771087646484, -75.95372009277344, -73.33972930908203, -70.72573852539062, -68.11174011230469, -65.49774932861328, -62.88375473022461, -60.26976013183594, -57.65576934814453, -55.04177474975586, -52.42778015136719, -49.81378936767578, -47.19979476928711, -44.58580017089844, -41.97180938720703, -39.35781478881836, -36.74382400512695, -34.12982940673828, -31.515836715698242, -28.901844024658203, -26.28784942626953, -23.673856735229492, -21.059864044189453, -18.445871353149414, -15.831877708435059, -13.217884063720703, -10.603891372680664, -7.989898681640625, -5.3759050369262695, -2.761911392211914, -0.147918701171875, 2.4660744667053223, 5.0800676345825195, 7.694060802459717, 10.308053970336914, 12.922046661376953, 15.536040306091309, 18.150033950805664, 20.764026641845703, 23.378019332885742, 25.99201202392578, 28.606006622314453, 31.219999313354492, 33.83399200439453, 36.4479866027832, 39.061981201171875, 41.67597198486328, 44.28996658325195, 46.90395736694336, 49.51795196533203, 52.13194274902344, 54.74593734741211, 57.35993194580078, 59.97392272949219, 62.58791732788086, 65.20191192626953, 67.81590270996094, 70.42989349365234, 73.04389190673828, 75.65788269042969, 78.2718734741211, 80.88587188720703, 83.49986267089844]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 5.0, 4.0, 0.0, 14.0, 11.0, 13.0, 10.0, 15.0, 10.0, 21.0, 33.0, 20.0, 31.0, 34.0, 31.0, 45.0, 36.0, 35.0, 35.0, 39.0, 40.0, 41.0, 48.0, 48.0, 45.0, 37.0, 42.0, 35.0, 29.0, 36.0, 41.0, 26.0, 18.0, 14.0, 8.0, 14.0, 7.0, 5.0, 9.0, 8.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.581565856933594, -28.5837345123291, -27.585901260375977, -26.588069915771484, -25.590238571166992, -24.5924072265625, -23.594573974609375, -22.596742630004883, -21.59891128540039, -20.6010799407959, -19.603246688842773, -18.60541534423828, -17.60758399963379, -16.609752655029297, -15.611919403076172, -14.61408805847168, -13.616254806518555, -12.618422508239746, -11.620591163635254, -10.622758865356445, -9.624927520751953, -8.627095222473145, -7.629262924194336, -6.6314311027526855, -5.633599281311035, -4.635767459869385, -3.6379354000091553, -2.640103340148926, -1.6422715187072754, -0.644439697265625, 0.3533926010131836, 1.351224422454834, 2.3490562438964844, 3.3468880653381348, 4.344719886779785, 5.342552185058594, 6.340384006500244, 7.3382158279418945, 8.336048126220703, 9.333879470825195, 10.331711769104004, 11.329544067382812, 12.327375411987305, 13.325207710266113, 14.323040008544922, 15.320871353149414, 16.318702697753906, 17.31653594970703, 18.314367294311523, 19.312198638916016, 20.31003189086914, 21.307863235473633, 22.305694580078125, 23.30352783203125, 24.301359176635742, 25.299190521240234, 26.29702377319336, 27.29485511779785, 28.292688369750977, 29.29051971435547, 30.28835105895996, 31.286182403564453, 32.28401565551758, 33.2818489074707, 34.27967834472656]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 9.0, 11.0, 21.0, 16.0, 14.0, 22.0, 25.0, 30.0, 42.0, 45.0, 29.0, 45.0, 51.0, 52.0, 48.0, 44.0, 44.0, 49.0, 56.0, 47.0, 46.0, 42.0, 41.0, 38.0, 29.0, 23.0, 18.0, 13.0, 10.0, 7.0, 14.0, 3.0, 5.0, 5.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6953125, -6.49761962890625, -6.2999267578125, -6.10223388671875, -5.904541015625, -5.70684814453125, -5.5091552734375, -5.31146240234375, -5.11376953125, -4.91607666015625, -4.7183837890625, -4.52069091796875, -4.322998046875, -4.12530517578125, -3.9276123046875, -3.72991943359375, -3.5322265625, -3.33453369140625, -3.1368408203125, -2.93914794921875, -2.741455078125, -2.54376220703125, -2.3460693359375, -2.14837646484375, -1.95068359375, -1.75299072265625, -1.5552978515625, -1.35760498046875, -1.159912109375, -0.96221923828125, -0.7645263671875, -0.56683349609375, -0.369140625, -0.17144775390625, 0.0262451171875, 0.22393798828125, 0.421630859375, 0.61932373046875, 0.8170166015625, 1.01470947265625, 1.21240234375, 1.41009521484375, 1.6077880859375, 1.80548095703125, 2.003173828125, 2.20086669921875, 2.3985595703125, 2.59625244140625, 2.7939453125, 2.99163818359375, 3.1893310546875, 3.38702392578125, 3.584716796875, 3.78240966796875, 3.9801025390625, 4.17779541015625, 4.37548828125, 4.57318115234375, 4.7708740234375, 4.96856689453125, 5.166259765625, 5.36395263671875, 5.5616455078125, 5.75933837890625, 5.95703125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 9.0, 9.0, 16.0, 31.0, 45.0, 66.0, 112.0, 180.0, 298.0, 532.0, 1012.0, 1822.0, 3335.0, 6574.0, 12826.0, 25951.0, 53807.0, 125095.0, 355700.0, 275039.0, 97897.0, 44291.0, 21171.0, 10663.0, 5750.0, 2899.0, 1518.0, 794.0, 439.0, 251.0, 135.0, 103.0, 64.0, 45.0, 26.0, 15.0, 11.0, 9.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.301025390625, -0.29213714599609375, -0.2832489013671875, -0.27436065673828125, -0.265472412109375, -0.25658416748046875, -0.2476959228515625, -0.23880767822265625, -0.22991943359375, -0.22103118896484375, -0.2121429443359375, -0.20325469970703125, -0.194366455078125, -0.18547821044921875, -0.1765899658203125, -0.16770172119140625, -0.1588134765625, -0.14992523193359375, -0.1410369873046875, -0.13214874267578125, -0.123260498046875, -0.11437225341796875, -0.1054840087890625, -0.09659576416015625, -0.08770751953125, -0.07881927490234375, -0.0699310302734375, -0.06104278564453125, -0.052154541015625, -0.04326629638671875, -0.0343780517578125, -0.02548980712890625, -0.0166015625, -0.00771331787109375, 0.0011749267578125, 0.01006317138671875, 0.018951416015625, 0.02783966064453125, 0.0367279052734375, 0.04561614990234375, 0.05450439453125, 0.06339263916015625, 0.0722808837890625, 0.08116912841796875, 0.090057373046875, 0.09894561767578125, 0.1078338623046875, 0.11672210693359375, 0.1256103515625, 0.13449859619140625, 0.1433868408203125, 0.15227508544921875, 0.161163330078125, 0.17005157470703125, 0.1789398193359375, 0.18782806396484375, 0.19671630859375, 0.20560455322265625, 0.2144927978515625, 0.22338104248046875, 0.232269287109375, 0.24115753173828125, 0.2500457763671875, 0.25893402099609375, 0.267822265625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 10.0, 5.0, 7.0, 11.0, 9.0, 15.0, 12.0, 20.0, 20.0, 17.0, 18.0, 34.0, 29.0, 36.0, 42.0, 34.0, 53.0, 48.0, 36.0, 49.0, 1069.0, 47.0, 38.0, 44.0, 40.0, 42.0, 37.0, 31.0, 35.0, 29.0, 20.0, 14.0, 16.0, 10.0, 14.0, 10.0, 9.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.525390625, -3.4085693359375, -3.291748046875, -3.1749267578125, -3.05810546875, -2.9412841796875, -2.824462890625, -2.7076416015625, -2.5908203125, -2.4739990234375, -2.357177734375, -2.2403564453125, -2.12353515625, -2.0067138671875, -1.889892578125, -1.7730712890625, -1.65625, -1.5394287109375, -1.422607421875, -1.3057861328125, -1.18896484375, -1.0721435546875, -0.955322265625, -0.8385009765625, -0.7216796875, -0.6048583984375, -0.488037109375, -0.3712158203125, -0.25439453125, -0.1375732421875, -0.020751953125, 0.0960693359375, 0.212890625, 0.3297119140625, 0.446533203125, 0.5633544921875, 0.68017578125, 0.7969970703125, 0.913818359375, 1.0306396484375, 1.1474609375, 1.2642822265625, 1.381103515625, 1.4979248046875, 1.61474609375, 1.7315673828125, 1.848388671875, 1.9652099609375, 2.08203125, 2.1988525390625, 2.315673828125, 2.4324951171875, 2.54931640625, 2.6661376953125, 2.782958984375, 2.8997802734375, 3.0166015625, 3.1334228515625, 3.250244140625, 3.3670654296875, 3.48388671875, 3.6007080078125, 3.717529296875, 3.8343505859375, 3.951171875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 7.0, 9.0, 18.0, 23.0, 26.0, 63.0, 96.0, 135.0, 216.0, 358.0, 604.0, 964.0, 1553.0, 2667.0, 4387.0, 7272.0, 12771.0, 21779.0, 39304.0, 75192.0, 165232.0, 1385593.0, 193231.0, 84725.0, 43171.0, 23892.0, 13901.0, 8093.0, 4583.0, 2864.0, 1716.0, 1026.0, 638.0, 401.0, 221.0, 148.0, 94.0, 55.0, 35.0, 23.0, 22.0, 11.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1304931640625, -0.12622642517089844, -0.12195968627929688, -0.11769294738769531, -0.11342620849609375, -0.10915946960449219, -0.10489273071289062, -0.10062599182128906, -0.0963592529296875, -0.09209251403808594, -0.08782577514648438, -0.08355903625488281, -0.07929229736328125, -0.07502555847167969, -0.07075881958007812, -0.06649208068847656, -0.062225341796875, -0.05795860290527344, -0.053691864013671875, -0.04942512512207031, -0.04515838623046875, -0.04089164733886719, -0.036624908447265625, -0.03235816955566406, -0.0280914306640625, -0.023824691772460938, -0.019557952880859375, -0.015291213989257812, -0.01102447509765625, -0.0067577362060546875, -0.002490997314453125, 0.0017757415771484375, 0.00604248046875, 0.010309219360351562, 0.014575958251953125, 0.018842697143554688, 0.02310943603515625, 0.027376174926757812, 0.031642913818359375, 0.03590965270996094, 0.0401763916015625, 0.04444313049316406, 0.048709869384765625, 0.05297660827636719, 0.05724334716796875, 0.06151008605957031, 0.06577682495117188, 0.07004356384277344, 0.074310302734375, 0.07857704162597656, 0.08284378051757812, 0.08711051940917969, 0.09137725830078125, 0.09564399719238281, 0.09991073608398438, 0.10417747497558594, 0.1084442138671875, 0.11271095275878906, 0.11697769165039062, 0.12124443054199219, 0.12551116943359375, 0.1297779083251953, 0.13404464721679688, 0.13831138610839844, 0.142578125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 5.0, 6.0, 4.0, 9.0, 8.0, 9.0, 11.0, 18.0, 13.0, 20.0, 29.0, 38.0, 36.0, 40.0, 46.0, 45.0, 53.0, 50.0, 53.0, 55.0, 52.0, 55.0, 40.0, 35.0, 44.0, 45.0, 42.0, 26.0, 21.0, 27.0, 19.0, 14.0, 10.0, 6.0, 4.0, 7.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7954578399658203e-05, -2.6697292923927307e-05, -2.544000744819641e-05, -2.4182721972465515e-05, -2.292543649673462e-05, -2.1668151021003723e-05, -2.0410865545272827e-05, -1.915358006954193e-05, -1.7896294593811035e-05, -1.663900911808014e-05, -1.5381723642349243e-05, -1.4124438166618347e-05, -1.2867152690887451e-05, -1.1609867215156555e-05, -1.035258173942566e-05, -9.095296263694763e-06, -7.838010787963867e-06, -6.580725312232971e-06, -5.323439836502075e-06, -4.066154360771179e-06, -2.808868885040283e-06, -1.5515834093093872e-06, -2.942979335784912e-07, 9.629875421524048e-07, 2.2202730178833008e-06, 3.4775584936141968e-06, 4.734843969345093e-06, 5.992129445075989e-06, 7.249414920806885e-06, 8.50670039653778e-06, 9.763985872268677e-06, 1.1021271347999573e-05, 1.2278556823730469e-05, 1.3535842299461365e-05, 1.479312777519226e-05, 1.6050413250923157e-05, 1.7307698726654053e-05, 1.856498420238495e-05, 1.9822269678115845e-05, 2.107955515384674e-05, 2.2336840629577637e-05, 2.3594126105308533e-05, 2.485141158103943e-05, 2.6108697056770325e-05, 2.736598253250122e-05, 2.8623268008232117e-05, 2.9880553483963013e-05, 3.113783895969391e-05, 3.2395124435424805e-05, 3.36524099111557e-05, 3.49096953868866e-05, 3.616698086261749e-05, 3.742426633834839e-05, 3.8681551814079285e-05, 3.993883728981018e-05, 4.119612276554108e-05, 4.245340824127197e-05, 4.371069371700287e-05, 4.4967979192733765e-05, 4.622526466846466e-05, 4.748255014419556e-05, 4.873983561992645e-05, 4.999712109565735e-05, 5.1254406571388245e-05, 5.251169204711914e-05]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 10.0, 14.0, 13.0, 15.0, 18.0, 25.0, 26.0, 42.0, 44.0, 57.0, 100.0, 190.0, 460.0, 2700.0, 105091.0, 854117.0, 82344.0, 2315.0, 400.0, 170.0, 114.0, 66.0, 47.0, 31.0, 30.0, 15.0, 22.0, 7.0, 16.0, 11.0, 7.0, 9.0, 3.0, 5.0, 4.0, 4.0, 5.0, 1.0, 1.0], "bins": [-0.0009331703186035156, -0.0009101107716560364, -0.0008870512247085571, -0.0008639916777610779, -0.0008409321308135986, -0.0008178725838661194, -0.0007948130369186401, -0.0007717534899711609, -0.0007486939430236816, -0.0007256343960762024, -0.0007025748491287231, -0.0006795153021812439, -0.0006564557552337646, -0.0006333962082862854, -0.0006103366613388062, -0.0005872771143913269, -0.0005642175674438477, -0.0005411580204963684, -0.0005180984735488892, -0.0004950389266014099, -0.00047197937965393066, -0.0004489198327064514, -0.00042586028575897217, -0.0004028007388114929, -0.00037974119186401367, -0.0003566816449165344, -0.0003336220979690552, -0.00031056255102157593, -0.0002875030040740967, -0.00026444345712661743, -0.00024138391017913818, -0.00021832436323165894, -0.0001952648162841797, -0.00017220526933670044, -0.0001491457223892212, -0.00012608617544174194, -0.0001030266284942627, -7.996708154678345e-05, -5.69075345993042e-05, -3.384798765182495e-05, -1.0788440704345703e-05, 1.2271106243133545e-05, 3.533065319061279e-05, 5.839020013809204e-05, 8.144974708557129e-05, 0.00010450929403305054, 0.00012756884098052979, 0.00015062838792800903, 0.00017368793487548828, 0.00019674748182296753, 0.00021980702877044678, 0.00024286657571792603, 0.0002659261226654053, 0.0002889856696128845, 0.00031204521656036377, 0.000335104763507843, 0.00035816431045532227, 0.0003812238574028015, 0.00040428340435028076, 0.00042734295129776, 0.00045040249824523926, 0.0004734620451927185, 0.0004965215921401978, 0.000519581139087677, 0.0005426406860351562]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 58.0, 414.0, 485.0, 56.0, 3.0], "bins": [-0.0006435181712731719, -0.0006329793250188231, -0.0006224404205568135, -0.0006119015743024647, -0.000601362728048116, -0.0005908238817937672, -0.0005802849773317575, -0.0005697461310774088, -0.00055920728482306, -0.0005486684385687113, -0.0005381295341067016, -0.0005275906878523529, -0.0005170518415980041, -0.0005065129953436553, -0.0004959740908816457, -0.0004854352446272969, -0.0004748963692691177, -0.0004643574939109385, -0.00045381864765658975, -0.00044327977229841053, -0.0004327409260440618, -0.00042220205068588257, -0.0004116632044315338, -0.0004011243290733546, -0.0003905854537151754, -0.0003800465783569962, -0.0003695077321026474, -0.0003589688567444682, -0.00034843001049011946, -0.00033789113513194025, -0.00032735225977376103, -0.0003168134135194123, -0.0003062745672650635, -0.0002957356919068843, -0.00028519684565253556, -0.00027465797029435635, -0.0002641191240400076, -0.0002535802486818284, -0.0002430413878755644, -0.0002325025270693004, -0.00022196368081495166, -0.00021142482000868767, -0.0002008859592024237, -0.00019034708384424448, -0.00017980823758989573, -0.00016926936223171651, -0.00015873050142545253, -0.00014819164061918855, -0.00013765277981292456, -0.00012711391900666058, -0.0001165750582003966, -0.000106036190118175, -9.549732931191102e-05, -8.495846850564703e-05, -7.441960042342544e-05, -6.388073961716145e-05, -5.334187517291866e-05, -4.280301072867587e-05, -3.226414992241189e-05, -2.17252854781691e-05, -1.1186424671905115e-05, -6.47563865641132e-07, 9.891304216580465e-06, 2.043016502284445e-05, 3.096902582910843e-05]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 10.0, 13.0, 5.0, 15.0, 26.0, 20.0, 23.0, 33.0, 37.0, 35.0, 40.0, 38.0, 55.0, 46.0, 64.0, 48.0, 56.0, 39.0, 55.0, 58.0, 35.0, 47.0, 25.0, 29.0, 24.0, 20.0, 17.0, 20.0, 22.0, 7.0, 12.0, 6.0, 6.0, 6.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.568960189819336e-05, -2.481415867805481e-05, -2.393871545791626e-05, -2.306327223777771e-05, -2.218782901763916e-05, -2.131238579750061e-05, -2.043694257736206e-05, -1.956149935722351e-05, -1.868605613708496e-05, -1.781061291694641e-05, -1.693516969680786e-05, -1.605972647666931e-05, -1.5184283256530762e-05, -1.4308840036392212e-05, -1.3433396816253662e-05, -1.2557953596115112e-05, -1.1682510375976562e-05, -1.0807067155838013e-05, -9.931623935699463e-06, -9.056180715560913e-06, -8.180737495422363e-06, -7.3052942752838135e-06, -6.429851055145264e-06, -5.554407835006714e-06, -4.678964614868164e-06, -3.8035213947296143e-06, -2.9280781745910645e-06, -2.0526349544525146e-06, -1.1771917343139648e-06, -3.0174851417541504e-07, 5.736947059631348e-07, 1.4491379261016846e-06, 2.3245811462402344e-06, 3.200024366378784e-06, 4.075467586517334e-06, 4.950910806655884e-06, 5.826354026794434e-06, 6.701797246932983e-06, 7.577240467071533e-06, 8.452683687210083e-06, 9.328126907348633e-06, 1.0203570127487183e-05, 1.1079013347625732e-05, 1.1954456567764282e-05, 1.2829899787902832e-05, 1.3705343008041382e-05, 1.4580786228179932e-05, 1.545622944831848e-05, 1.633167266845703e-05, 1.720711588859558e-05, 1.808255910873413e-05, 1.895800232887268e-05, 1.983344554901123e-05, 2.070888876914978e-05, 2.158433198928833e-05, 2.245977520942688e-05, 2.333521842956543e-05, 2.421066164970398e-05, 2.508610486984253e-05, 2.596154808998108e-05, 2.683699131011963e-05, 2.771243453025818e-05, 2.858787775039673e-05, 2.946332097053528e-05, 3.0338764190673828e-05]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 9.0, 11.0, 21.0, 16.0, 14.0, 22.0, 25.0, 30.0, 42.0, 45.0, 29.0, 45.0, 51.0, 52.0, 48.0, 44.0, 44.0, 49.0, 56.0, 47.0, 46.0, 42.0, 41.0, 38.0, 29.0, 23.0, 18.0, 13.0, 10.0, 7.0, 14.0, 3.0, 5.0, 5.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6953125, -6.49761962890625, -6.2999267578125, -6.10223388671875, -5.904541015625, -5.70684814453125, -5.5091552734375, -5.31146240234375, -5.11376953125, -4.91607666015625, -4.7183837890625, -4.52069091796875, -4.322998046875, -4.12530517578125, -3.9276123046875, -3.72991943359375, -3.5322265625, -3.33453369140625, -3.1368408203125, -2.93914794921875, -2.741455078125, -2.54376220703125, -2.3460693359375, -2.14837646484375, -1.95068359375, -1.75299072265625, -1.5552978515625, -1.35760498046875, -1.159912109375, -0.96221923828125, -0.7645263671875, -0.56683349609375, -0.369140625, -0.17144775390625, 0.0262451171875, 0.22393798828125, 0.421630859375, 0.61932373046875, 0.8170166015625, 1.01470947265625, 1.21240234375, 1.41009521484375, 1.6077880859375, 1.80548095703125, 2.003173828125, 2.20086669921875, 2.3985595703125, 2.59625244140625, 2.7939453125, 2.99163818359375, 3.1893310546875, 3.38702392578125, 3.584716796875, 3.78240966796875, 3.9801025390625, 4.17779541015625, 4.37548828125, 4.57318115234375, 4.7708740234375, 4.96856689453125, 5.166259765625, 5.36395263671875, 5.5616455078125, 5.75933837890625, 5.95703125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 12.0, 10.0, 16.0, 27.0, 36.0, 67.0, 106.0, 149.0, 299.0, 541.0, 1067.0, 2078.0, 4354.0, 8965.0, 20157.0, 51823.0, 224808.0, 566434.0, 107124.0, 33374.0, 14126.0, 6536.0, 3117.0, 1562.0, 771.0, 441.0, 220.0, 116.0, 76.0, 52.0, 31.0, 24.0, 16.0, 8.0, 9.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6796875, -8.458740234375, -8.23779296875, -8.016845703125, -7.7958984375, -7.574951171875, -7.35400390625, -7.133056640625, -6.912109375, -6.691162109375, -6.47021484375, -6.249267578125, -6.0283203125, -5.807373046875, -5.58642578125, -5.365478515625, -5.14453125, -4.923583984375, -4.70263671875, -4.481689453125, -4.2607421875, -4.039794921875, -3.81884765625, -3.597900390625, -3.376953125, -3.156005859375, -2.93505859375, -2.714111328125, -2.4931640625, -2.272216796875, -2.05126953125, -1.830322265625, -1.609375, -1.388427734375, -1.16748046875, -0.946533203125, -0.7255859375, -0.504638671875, -0.28369140625, -0.062744140625, 0.158203125, 0.379150390625, 0.60009765625, 0.821044921875, 1.0419921875, 1.262939453125, 1.48388671875, 1.704833984375, 1.92578125, 2.146728515625, 2.36767578125, 2.588623046875, 2.8095703125, 3.030517578125, 3.25146484375, 3.472412109375, 3.693359375, 3.914306640625, 4.13525390625, 4.356201171875, 4.5771484375, 4.798095703125, 5.01904296875, 5.239990234375, 5.4609375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 11.0, 8.0, 11.0, 12.0, 10.0, 18.0, 22.0, 25.0, 18.0, 25.0, 25.0, 41.0, 31.0, 57.0, 48.0, 78.0, 95.0, 450.0, 1477.0, 110.0, 82.0, 54.0, 42.0, 37.0, 35.0, 32.0, 34.0, 32.0, 28.0, 25.0, 17.0, 16.0, 13.0, 13.0, 8.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.765625, -17.192626953125, -16.61962890625, -16.046630859375, -15.4736328125, -14.900634765625, -14.32763671875, -13.754638671875, -13.181640625, -12.608642578125, -12.03564453125, -11.462646484375, -10.8896484375, -10.316650390625, -9.74365234375, -9.170654296875, -8.59765625, -8.024658203125, -7.45166015625, -6.878662109375, -6.3056640625, -5.732666015625, -5.15966796875, -4.586669921875, -4.013671875, -3.440673828125, -2.86767578125, -2.294677734375, -1.7216796875, -1.148681640625, -0.57568359375, -0.002685546875, 0.5703125, 1.143310546875, 1.71630859375, 2.289306640625, 2.8623046875, 3.435302734375, 4.00830078125, 4.581298828125, 5.154296875, 5.727294921875, 6.30029296875, 6.873291015625, 7.4462890625, 8.019287109375, 8.59228515625, 9.165283203125, 9.73828125, 10.311279296875, 10.88427734375, 11.457275390625, 12.0302734375, 12.603271484375, 13.17626953125, 13.749267578125, 14.322265625, 14.895263671875, 15.46826171875, 16.041259765625, 16.6142578125, 17.187255859375, 17.76025390625, 18.333251953125, 18.90625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 15.0, 14.0, 15.0, 19.0, 29.0, 34.0, 50.0, 61.0, 73.0, 123.0, 129.0, 175.0, 275.0, 519.0, 4722.0, 735728.0, 2395531.0, 6563.0, 664.0, 262.0, 164.0, 113.0, 93.0, 78.0, 51.0, 40.0, 35.0, 27.0, 26.0, 14.0, 14.0, 9.0, 10.0, 10.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-40.6875, -39.45654296875, -38.2255859375, -36.99462890625, -35.763671875, -34.53271484375, -33.3017578125, -32.07080078125, -30.83984375, -29.60888671875, -28.3779296875, -27.14697265625, -25.916015625, -24.68505859375, -23.4541015625, -22.22314453125, -20.9921875, -19.76123046875, -18.5302734375, -17.29931640625, -16.068359375, -14.83740234375, -13.6064453125, -12.37548828125, -11.14453125, -9.91357421875, -8.6826171875, -7.45166015625, -6.220703125, -4.98974609375, -3.7587890625, -2.52783203125, -1.296875, -0.06591796875, 1.1650390625, 2.39599609375, 3.626953125, 4.85791015625, 6.0888671875, 7.31982421875, 8.55078125, 9.78173828125, 11.0126953125, 12.24365234375, 13.474609375, 14.70556640625, 15.9365234375, 17.16748046875, 18.3984375, 19.62939453125, 20.8603515625, 22.09130859375, 23.322265625, 24.55322265625, 25.7841796875, 27.01513671875, 28.24609375, 29.47705078125, 30.7080078125, 31.93896484375, 33.169921875, 34.40087890625, 35.6318359375, 36.86279296875, 38.09375]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 103.0, 862.0, 53.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.199392318725586, -15.809703826904297, -9.420015335083008, -3.0303268432617188, 3.3593616485595703, 9.74905014038086, 16.13873863220215, 22.52842903137207, 28.918115615844727, 35.307804107666016, 41.69749450683594, 48.087181091308594, 54.47686767578125, 60.86655807495117, 67.2562484741211, 73.64593505859375, 80.0356216430664, 86.42530822753906, 92.81500244140625, 99.2046890258789, 105.59437561035156, 111.98406219482422, 118.37374877929688, 124.76344299316406, 131.15313720703125, 137.54283142089844, 143.93251037597656, 150.32220458984375, 156.71188354492188, 163.10157775878906, 169.49127197265625, 175.88095092773438, 182.2706298828125, 188.6603240966797, 195.0500030517578, 201.439697265625, 207.82937622070312, 214.2190704345703, 220.6087646484375, 226.99844360351562, 233.3881378173828, 239.77783203125, 246.16751098632812, 252.5572052001953, 258.9468994140625, 265.3365783691406, 271.72625732421875, 278.115966796875, 284.5056457519531, 290.89532470703125, 297.2850341796875, 303.6747131347656, 310.06439208984375, 316.4541015625, 322.8437805175781, 329.23345947265625, 335.6231689453125, 342.0128479003906, 348.4025573730469, 354.792236328125, 361.1819152832031, 367.5716247558594, 373.9613037109375, 380.3509826660156, 386.74066162109375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 5.0, 6.0, 10.0, 8.0, 15.0, 14.0, 12.0, 15.0, 20.0, 16.0, 15.0, 28.0, 22.0, 28.0, 34.0, 30.0, 26.0, 44.0, 42.0, 50.0, 31.0, 44.0, 40.0, 47.0, 38.0, 34.0, 31.0, 26.0, 28.0, 21.0, 32.0, 31.0, 22.0, 16.0, 19.0, 16.0, 14.0, 16.0, 8.0, 13.0, 9.0, 6.0, 5.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.385005950927734, -41.04255294799805, -39.700096130371094, -38.357643127441406, -37.01518630981445, -35.672733306884766, -34.33027648925781, -32.987823486328125, -31.645368576049805, -30.302913665771484, -28.960458755493164, -27.618003845214844, -26.275550842285156, -24.933094024658203, -23.590641021728516, -22.248186111450195, -20.905731201171875, -19.563276290893555, -18.220821380615234, -16.878368377685547, -15.53591251373291, -14.19345760345459, -12.851003646850586, -11.508548736572266, -10.166093826293945, -8.823638916015625, -7.481184482574463, -6.138730049133301, -4.7962751388549805, -3.45382022857666, -2.1113662719726562, -0.7689113616943359, 0.57354736328125, 1.9160020351409912, 3.2584567070007324, 4.6009111404418945, 5.943366050720215, 7.285820960998535, 8.628274917602539, 9.97072982788086, 11.31318473815918, 12.6556396484375, 13.99809455871582, 15.340548515319824, 16.683002471923828, 18.02545928955078, 19.36791229248047, 20.71036720275879, 22.05282211303711, 23.39527702331543, 24.73773193359375, 26.080184936523438, 27.42264175415039, 28.765094757080078, 30.1075496673584, 31.45000457763672, 32.792457580566406, 34.134910583496094, 35.47736740112305, 36.819820404052734, 38.16227722167969, 39.504730224609375, 40.84718322753906, 42.189640045166016, 43.53209686279297]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 7.0, 15.0, 19.0, 17.0, 20.0, 23.0, 23.0, 28.0, 40.0, 42.0, 36.0, 50.0, 51.0, 50.0, 41.0, 46.0, 35.0, 64.0, 39.0, 48.0, 47.0, 43.0, 49.0, 27.0, 29.0, 27.0, 16.0, 8.0, 16.0, 12.0, 11.0, 4.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.52734375, -6.3280029296875, -6.128662109375, -5.9293212890625, -5.72998046875, -5.5306396484375, -5.331298828125, -5.1319580078125, -4.9326171875, -4.7332763671875, -4.533935546875, -4.3345947265625, -4.13525390625, -3.9359130859375, -3.736572265625, -3.5372314453125, -3.337890625, -3.1385498046875, -2.939208984375, -2.7398681640625, -2.54052734375, -2.3411865234375, -2.141845703125, -1.9425048828125, -1.7431640625, -1.5438232421875, -1.344482421875, -1.1451416015625, -0.94580078125, -0.7464599609375, -0.547119140625, -0.3477783203125, -0.1484375, 0.0509033203125, 0.250244140625, 0.4495849609375, 0.64892578125, 0.8482666015625, 1.047607421875, 1.2469482421875, 1.4462890625, 1.6456298828125, 1.844970703125, 2.0443115234375, 2.24365234375, 2.4429931640625, 2.642333984375, 2.8416748046875, 3.041015625, 3.2403564453125, 3.439697265625, 3.6390380859375, 3.83837890625, 4.0377197265625, 4.237060546875, 4.4364013671875, 4.6357421875, 4.8350830078125, 5.034423828125, 5.2337646484375, 5.43310546875, 5.6324462890625, 5.831787109375, 6.0311279296875, 6.23046875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 8.0, 8.0, 10.0, 13.0, 21.0, 31.0, 27.0, 50.0, 44.0, 99.0, 125.0, 182.0, 266.0, 499.0, 1027.0, 2653.0, 9213.0, 40769.0, 320663.0, 3119039.0, 618588.0, 61819.0, 12562.0, 3675.0, 1322.0, 583.0, 302.0, 195.0, 118.0, 77.0, 72.0, 61.0, 37.0, 29.0, 21.0, 20.0, 13.0, 10.0, 8.0, 2.0, 3.0, 8.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.5078125, -15.017333984375, -14.52685546875, -14.036376953125, -13.5458984375, -13.055419921875, -12.56494140625, -12.074462890625, -11.583984375, -11.093505859375, -10.60302734375, -10.112548828125, -9.6220703125, -9.131591796875, -8.64111328125, -8.150634765625, -7.66015625, -7.169677734375, -6.67919921875, -6.188720703125, -5.6982421875, -5.207763671875, -4.71728515625, -4.226806640625, -3.736328125, -3.245849609375, -2.75537109375, -2.264892578125, -1.7744140625, -1.283935546875, -0.79345703125, -0.302978515625, 0.1875, 0.677978515625, 1.16845703125, 1.658935546875, 2.1494140625, 2.639892578125, 3.13037109375, 3.620849609375, 4.111328125, 4.601806640625, 5.09228515625, 5.582763671875, 6.0732421875, 6.563720703125, 7.05419921875, 7.544677734375, 8.03515625, 8.525634765625, 9.01611328125, 9.506591796875, 9.9970703125, 10.487548828125, 10.97802734375, 11.468505859375, 11.958984375, 12.449462890625, 12.93994140625, 13.430419921875, 13.9208984375, 14.411376953125, 14.90185546875, 15.392333984375, 15.8828125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 4.0, 3.0, 12.0, 18.0, 24.0, 58.0, 80.0, 137.0, 250.0, 418.0, 822.0, 927.0, 515.0, 319.0, 191.0, 122.0, 61.0, 45.0, 26.0, 19.0, 11.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.15625, -14.669921875, -14.18359375, -13.697265625, -13.2109375, -12.724609375, -12.23828125, -11.751953125, -11.265625, -10.779296875, -10.29296875, -9.806640625, -9.3203125, -8.833984375, -8.34765625, -7.861328125, -7.375, -6.888671875, -6.40234375, -5.916015625, -5.4296875, -4.943359375, -4.45703125, -3.970703125, -3.484375, -2.998046875, -2.51171875, -2.025390625, -1.5390625, -1.052734375, -0.56640625, -0.080078125, 0.40625, 0.892578125, 1.37890625, 1.865234375, 2.3515625, 2.837890625, 3.32421875, 3.810546875, 4.296875, 4.783203125, 5.26953125, 5.755859375, 6.2421875, 6.728515625, 7.21484375, 7.701171875, 8.1875, 8.673828125, 9.16015625, 9.646484375, 10.1328125, 10.619140625, 11.10546875, 11.591796875, 12.078125, 12.564453125, 13.05078125, 13.537109375, 14.0234375, 14.509765625, 14.99609375, 15.482421875, 15.96875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 12.0, 24.0, 34.0, 52.0, 86.0, 209.0, 434.0, 1269.0, 16365.0, 3758184.0, 412050.0, 4302.0, 719.0, 255.0, 109.0, 71.0, 40.0, 21.0, 14.0, 13.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.46875, -60.50439453125, -58.5400390625, -56.57568359375, -54.611328125, -52.64697265625, -50.6826171875, -48.71826171875, -46.75390625, -44.78955078125, -42.8251953125, -40.86083984375, -38.896484375, -36.93212890625, -34.9677734375, -33.00341796875, -31.0390625, -29.07470703125, -27.1103515625, -25.14599609375, -23.181640625, -21.21728515625, -19.2529296875, -17.28857421875, -15.32421875, -13.35986328125, -11.3955078125, -9.43115234375, -7.466796875, -5.50244140625, -3.5380859375, -1.57373046875, 0.390625, 2.35498046875, 4.3193359375, 6.28369140625, 8.248046875, 10.21240234375, 12.1767578125, 14.14111328125, 16.10546875, 18.06982421875, 20.0341796875, 21.99853515625, 23.962890625, 25.92724609375, 27.8916015625, 29.85595703125, 31.8203125, 33.78466796875, 35.7490234375, 37.71337890625, 39.677734375, 41.64208984375, 43.6064453125, 45.57080078125, 47.53515625, 49.49951171875, 51.4638671875, 53.42822265625, 55.392578125, 57.35693359375, 59.3212890625, 61.28564453125, 63.25]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 8.0, 8.0, 12.0, 33.0, 47.0, 53.0, 76.0, 86.0, 104.0, 104.0, 105.0, 91.0, 81.0, 58.0, 51.0, 34.0, 18.0, 17.0, 10.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.58395767211914, -24.022319793701172, -22.46068000793457, -20.8990421295166, -19.33740234375, -17.77576446533203, -16.214126586914062, -14.652487754821777, -13.090848922729492, -11.529210090637207, -9.967571258544922, -8.405933380126953, -6.844294548034668, -5.282655715942383, -3.721017837524414, -2.159379005432129, -0.5977401733398438, 0.9638984203338623, 2.5255370140075684, 4.087175369262695, 5.6488142013549805, 7.210453033447266, 8.772090911865234, 10.33372974395752, 11.895368576049805, 13.45700740814209, 15.018646240234375, 16.580284118652344, 18.141921997070312, 19.703561782836914, 21.265199661254883, 22.826839447021484, 24.38848114013672, 25.950119018554688, 27.51175880432129, 29.073396682739258, 30.63503646850586, 32.19667434692383, 33.7583122253418, 35.319950103759766, 36.881591796875, 38.44322967529297, 40.00486755371094, 41.566505432128906, 43.12814712524414, 44.68978500366211, 46.25142288208008, 47.81306076049805, 49.374698638916016, 50.936336517333984, 52.49797439575195, 54.05961608886719, 55.621253967285156, 57.182891845703125, 58.744529724121094, 60.30616760253906, 61.86780548095703, 63.429443359375, 64.99108123779297, 66.55271911621094, 68.1143569946289, 69.67599487304688, 71.23764038085938, 72.79927825927734, 74.36091613769531]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 4.0, 5.0, 12.0, 7.0, 9.0, 16.0, 14.0, 16.0, 19.0, 21.0, 18.0, 33.0, 24.0, 28.0, 22.0, 24.0, 37.0, 32.0, 35.0, 47.0, 41.0, 31.0, 40.0, 38.0, 53.0, 28.0, 36.0, 41.0, 38.0, 22.0, 34.0, 29.0, 16.0, 13.0, 25.0, 15.0, 16.0, 8.0, 11.0, 10.0, 5.0, 11.0, 3.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0], "bins": [-32.1839599609375, -31.28742218017578, -30.39088249206543, -29.49434471130371, -28.59780502319336, -27.70126724243164, -26.804729461669922, -25.908191680908203, -25.01165199279785, -24.115114212036133, -23.21857452392578, -22.322036743164062, -21.425498962402344, -20.528959274291992, -19.632421493530273, -18.735881805419922, -17.839344024658203, -16.942806243896484, -16.046266555786133, -15.149728775024414, -14.253190040588379, -13.356651306152344, -12.460113525390625, -11.56357479095459, -10.667036056518555, -9.77049732208252, -8.873958587646484, -7.977420806884766, -7.0808820724487305, -6.184343338012695, -5.287805080413818, -4.391266822814941, -3.4947280883789062, -2.59818959236145, -1.7016510963439941, -0.8051126003265381, 0.09142589569091797, 0.9879646301269531, 1.88450288772583, 2.781041145324707, 3.677579879760742, 4.574118614196777, 5.470656871795654, 6.367195129394531, 7.263733863830566, 8.160272598266602, 9.05681037902832, 9.953349113464355, 10.84988784790039, 11.746426582336426, 12.642965316772461, 13.53950309753418, 14.436041831970215, 15.33258056640625, 16.22911834716797, 17.125656127929688, 18.02219581604004, 18.918733596801758, 19.81527328491211, 20.711811065673828, 21.608348846435547, 22.5048885345459, 23.401426315307617, 24.29796600341797, 25.194503784179688]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 11.0, 4.0, 15.0, 17.0, 18.0, 27.0, 18.0, 25.0, 16.0, 31.0, 35.0, 40.0, 36.0, 53.0, 62.0, 31.0, 46.0, 54.0, 53.0, 39.0, 35.0, 45.0, 65.0, 34.0, 36.0, 31.0, 28.0, 16.0, 17.0, 15.0, 17.0, 8.0, 7.0, 3.0, 7.0, 1.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.41015625, -6.2171630859375, -6.024169921875, -5.8311767578125, -5.63818359375, -5.4451904296875, -5.252197265625, -5.0592041015625, -4.8662109375, -4.6732177734375, -4.480224609375, -4.2872314453125, -4.09423828125, -3.9012451171875, -3.708251953125, -3.5152587890625, -3.322265625, -3.1292724609375, -2.936279296875, -2.7432861328125, -2.55029296875, -2.3572998046875, -2.164306640625, -1.9713134765625, -1.7783203125, -1.5853271484375, -1.392333984375, -1.1993408203125, -1.00634765625, -0.8133544921875, -0.620361328125, -0.4273681640625, -0.234375, -0.0413818359375, 0.151611328125, 0.3446044921875, 0.53759765625, 0.7305908203125, 0.923583984375, 1.1165771484375, 1.3095703125, 1.5025634765625, 1.695556640625, 1.8885498046875, 2.08154296875, 2.2745361328125, 2.467529296875, 2.6605224609375, 2.853515625, 3.0465087890625, 3.239501953125, 3.4324951171875, 3.62548828125, 3.8184814453125, 4.011474609375, 4.2044677734375, 4.3974609375, 4.5904541015625, 4.783447265625, 4.9764404296875, 5.16943359375, 5.3624267578125, 5.555419921875, 5.7484130859375, 5.94140625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 8.0, 4.0, 20.0, 16.0, 25.0, 21.0, 46.0, 59.0, 74.0, 105.0, 160.0, 243.0, 354.0, 564.0, 870.0, 1364.0, 2132.0, 3290.0, 5104.0, 7958.0, 12370.0, 19817.0, 32412.0, 56015.0, 103102.0, 222950.0, 279343.0, 130764.0, 67057.0, 38907.0, 23339.0, 14363.0, 9181.0, 5743.0, 3710.0, 2440.0, 1556.0, 1024.0, 679.0, 438.0, 298.0, 188.0, 150.0, 102.0, 59.0, 44.0, 29.0, 19.0, 17.0, 13.0, 5.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.19580078125, -0.18951797485351562, -0.18323516845703125, -0.17695236206054688, -0.1706695556640625, -0.16438674926757812, -0.15810394287109375, -0.15182113647460938, -0.145538330078125, -0.13925552368164062, -0.13297271728515625, -0.12668991088867188, -0.1204071044921875, -0.11412429809570312, -0.10784149169921875, -0.10155868530273438, -0.09527587890625, -0.08899307250976562, -0.08271026611328125, -0.07642745971679688, -0.0701446533203125, -0.06386184692382812, -0.05757904052734375, -0.051296234130859375, -0.045013427734375, -0.038730621337890625, -0.03244781494140625, -0.026165008544921875, -0.0198822021484375, -0.013599395751953125, -0.00731658935546875, -0.001033782958984375, 0.0052490234375, 0.011531829833984375, 0.01781463623046875, 0.024097442626953125, 0.0303802490234375, 0.036663055419921875, 0.04294586181640625, 0.049228668212890625, 0.055511474609375, 0.061794281005859375, 0.06807708740234375, 0.07435989379882812, 0.0806427001953125, 0.08692550659179688, 0.09320831298828125, 0.09949111938476562, 0.10577392578125, 0.11205673217773438, 0.11833953857421875, 0.12462234497070312, 0.1309051513671875, 0.13718795776367188, 0.14347076416015625, 0.14975357055664062, 0.156036376953125, 0.16231918334960938, 0.16860198974609375, 0.17488479614257812, 0.1811676025390625, 0.18745040893554688, 0.19373321533203125, 0.20001602172851562, 0.206298828125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 9.0, 7.0, 10.0, 9.0, 14.0, 19.0, 18.0, 13.0, 30.0, 15.0, 19.0, 23.0, 22.0, 38.0, 38.0, 24.0, 38.0, 31.0, 32.0, 43.0, 1065.0, 39.0, 47.0, 36.0, 46.0, 36.0, 36.0, 30.0, 29.0, 34.0, 33.0, 29.0, 19.0, 17.0, 10.0, 13.0, 9.0, 5.0, 8.0, 5.0, 2.0, 8.0, 4.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.048828125, -2.94244384765625, -2.8360595703125, -2.72967529296875, -2.623291015625, -2.51690673828125, -2.4105224609375, -2.30413818359375, -2.19775390625, -2.09136962890625, -1.9849853515625, -1.87860107421875, -1.772216796875, -1.66583251953125, -1.5594482421875, -1.45306396484375, -1.3466796875, -1.24029541015625, -1.1339111328125, -1.02752685546875, -0.921142578125, -0.81475830078125, -0.7083740234375, -0.60198974609375, -0.49560546875, -0.38922119140625, -0.2828369140625, -0.17645263671875, -0.070068359375, 0.03631591796875, 0.1427001953125, 0.24908447265625, 0.35546875, 0.46185302734375, 0.5682373046875, 0.67462158203125, 0.781005859375, 0.88739013671875, 0.9937744140625, 1.10015869140625, 1.20654296875, 1.31292724609375, 1.4193115234375, 1.52569580078125, 1.632080078125, 1.73846435546875, 1.8448486328125, 1.95123291015625, 2.0576171875, 2.16400146484375, 2.2703857421875, 2.37677001953125, 2.483154296875, 2.58953857421875, 2.6959228515625, 2.80230712890625, 2.90869140625, 3.01507568359375, 3.1214599609375, 3.22784423828125, 3.334228515625, 3.44061279296875, 3.5469970703125, 3.65338134765625, 3.759765625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 6.0, 6.0, 16.0, 23.0, 34.0, 33.0, 55.0, 78.0, 122.0, 204.0, 275.0, 433.0, 619.0, 955.0, 1504.0, 2331.0, 3644.0, 5687.0, 9077.0, 14692.0, 24026.0, 40341.0, 69012.0, 136226.0, 1331862.0, 216871.0, 100309.0, 54878.0, 31869.0, 19474.0, 11848.0, 7359.0, 4601.0, 3052.0, 1896.0, 1295.0, 797.0, 540.0, 375.0, 215.0, 159.0, 115.0, 68.0, 43.0, 36.0, 31.0, 11.0, 11.0, 4.0, 8.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.10986328125, -0.10604667663574219, -0.10223007202148438, -0.09841346740722656, -0.09459686279296875, -0.09078025817871094, -0.08696365356445312, -0.08314704895019531, -0.0793304443359375, -0.07551383972167969, -0.07169723510742188, -0.06788063049316406, -0.06406402587890625, -0.06024742126464844, -0.056430816650390625, -0.05261421203613281, -0.048797607421875, -0.04498100280761719, -0.041164398193359375, -0.03734779357910156, -0.03353118896484375, -0.029714584350585938, -0.025897979736328125, -0.022081375122070312, -0.0182647705078125, -0.014448165893554688, -0.010631561279296875, -0.0068149566650390625, -0.00299835205078125, 0.0008182525634765625, 0.004634857177734375, 0.008451461791992188, 0.01226806640625, 0.016084671020507812, 0.019901275634765625, 0.023717880249023438, 0.02753448486328125, 0.03135108947753906, 0.035167694091796875, 0.03898429870605469, 0.0428009033203125, 0.04661750793457031, 0.050434112548828125, 0.05425071716308594, 0.05806732177734375, 0.06188392639160156, 0.06570053100585938, 0.06951713562011719, 0.073333740234375, 0.07715034484863281, 0.08096694946289062, 0.08478355407714844, 0.08860015869140625, 0.09241676330566406, 0.09623336791992188, 0.10004997253417969, 0.1038665771484375, 0.10768318176269531, 0.11149978637695312, 0.11531639099121094, 0.11913299560546875, 0.12294960021972656, 0.12676620483398438, 0.1305828094482422, 0.1343994140625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 8.0, 5.0, 8.0, 17.0, 10.0, 20.0, 17.0, 26.0, 27.0, 35.0, 39.0, 42.0, 57.0, 64.0, 56.0, 60.0, 62.0, 54.0, 61.0, 52.0, 40.0, 37.0, 25.0, 30.0, 26.0, 14.0, 21.0, 18.0, 14.0, 8.0, 9.0, 6.0, 7.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2809715270996094e-05, -5.112495273351669e-05, -4.944019019603729e-05, -4.775542765855789e-05, -4.607066512107849e-05, -4.438590258359909e-05, -4.270114004611969e-05, -4.101637750864029e-05, -3.933161497116089e-05, -3.764685243368149e-05, -3.596208989620209e-05, -3.427732735872269e-05, -3.2592564821243286e-05, -3.0907802283763885e-05, -2.9223039746284485e-05, -2.7538277208805084e-05, -2.5853514671325684e-05, -2.4168752133846283e-05, -2.2483989596366882e-05, -2.079922705888748e-05, -1.911446452140808e-05, -1.742970198392868e-05, -1.574493944644928e-05, -1.4060176908969879e-05, -1.2375414371490479e-05, -1.0690651834011078e-05, -9.005889296531677e-06, -7.321126759052277e-06, -5.636364221572876e-06, -3.951601684093475e-06, -2.2668391466140747e-06, -5.820766091346741e-07, 1.1026859283447266e-06, 2.787448465824127e-06, 4.472211003303528e-06, 6.1569735407829285e-06, 7.841736078262329e-06, 9.52649861574173e-06, 1.121126115322113e-05, 1.2896023690700531e-05, 1.4580786228179932e-05, 1.6265548765659332e-05, 1.7950311303138733e-05, 1.9635073840618134e-05, 2.1319836378097534e-05, 2.3004598915576935e-05, 2.4689361453056335e-05, 2.6374123990535736e-05, 2.8058886528015137e-05, 2.9743649065494537e-05, 3.142841160297394e-05, 3.311317414045334e-05, 3.479793667793274e-05, 3.648269921541214e-05, 3.816746175289154e-05, 3.985222429037094e-05, 4.153698682785034e-05, 4.322174936532974e-05, 4.490651190280914e-05, 4.6591274440288544e-05, 4.8276036977767944e-05, 4.9960799515247345e-05, 5.1645562052726746e-05, 5.3330324590206146e-05, 5.501508712768555e-05]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 4.0, 3.0, 10.0, 11.0, 10.0, 20.0, 14.0, 21.0, 24.0, 32.0, 52.0, 55.0, 83.0, 169.0, 447.0, 3642.0, 321325.0, 711237.0, 10046.0, 705.0, 230.0, 112.0, 66.0, 49.0, 36.0, 30.0, 30.0, 10.0, 17.0, 13.0, 8.0, 10.0, 5.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.001094818115234375, -0.0010607391595840454, -0.0010266602039337158, -0.0009925812482833862, -0.0009585022926330566, -0.000924423336982727, -0.0008903443813323975, -0.0008562654256820679, -0.0008221864700317383, -0.0007881075143814087, -0.0007540285587310791, -0.0007199496030807495, -0.0006858706474304199, -0.0006517916917800903, -0.0006177127361297607, -0.0005836337804794312, -0.0005495548248291016, -0.000515475869178772, -0.0004813969135284424, -0.0004473179578781128, -0.0004132390022277832, -0.0003791600465774536, -0.000345081090927124, -0.00031100213527679443, -0.00027692317962646484, -0.00024284422397613525, -0.00020876526832580566, -0.00017468631267547607, -0.00014060735702514648, -0.0001065284013748169, -7.24494457244873e-05, -3.8370490074157715e-05, -4.291534423828125e-06, 2.9787421226501465e-05, 6.386637687683105e-05, 9.794533252716064e-05, 0.00013202428817749023, 0.00016610324382781982, 0.00020018219947814941, 0.000234261155128479, 0.0002683401107788086, 0.0003024190664291382, 0.0003364980220794678, 0.00037057697772979736, 0.00040465593338012695, 0.00043873488903045654, 0.00047281384468078613, 0.0005068928003311157, 0.0005409717559814453, 0.0005750507116317749, 0.0006091296672821045, 0.0006432086229324341, 0.0006772875785827637, 0.0007113665342330933, 0.0007454454898834229, 0.0007795244455337524, 0.000813603401184082, 0.0008476823568344116, 0.0008817613124847412, 0.0009158402681350708, 0.0009499192237854004, 0.00098399817943573, 0.0010180771350860596, 0.0010521560907363892, 0.0010862350463867188]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 59.0, 707.0, 237.0, 9.0], "bins": [-0.001038096728734672, -0.0010212758788838983, -0.0010044550290331244, -0.0009876341791823506, -0.0009708133875392377, -0.0009539925376884639, -0.000937171746045351, -0.0009203508961945772, -0.0009035300463438034, -0.0008867091964930296, -0.0008698883466422558, -0.0008530675549991429, -0.0008362467051483691, -0.0008194258552975953, -0.0008026050636544824, -0.0007857842138037086, -0.0007689633639529347, -0.0007521425141021609, -0.0007353216642513871, -0.0007185008726082742, -0.0007016800227575004, -0.0006848591729067266, -0.0006680383812636137, -0.0006512175314128399, -0.0006343966815620661, -0.0006175758317112923, -0.0006007549818605185, -0.0005839341902174056, -0.0005671133403666317, -0.0005502924905158579, -0.000533471698872745, -0.0005166508490219712, -0.0004998300573788583, -0.0004830092075280845, -0.00046618838678114116, -0.0004493675660341978, -0.000432546716183424, -0.0004157258663326502, -0.00039890504558570683, -0.0003820842248387635, -0.00036526337498798966, -0.00034844252513721585, -0.0003316217043902725, -0.00031480088364332914, -0.00029798003379255533, -0.0002811591839417815, -0.00026433836319483817, -0.0002475175424478948, -0.000230696692597121, -0.00021387585729826242, -0.00019705502199940383, -0.00018023418670054525, -0.00016341335140168667, -0.00014659251610282809, -0.0001297716808039695, -0.00011295084550511092, -9.613000293029472e-05, -7.930916763143614e-05, -6.248833233257756e-05, -4.5667497033718973e-05, -2.884666173486039e-05, -1.2025826436001807e-05, 4.7950088628567755e-06, 2.161584416171536e-05, 3.843667946057394e-05]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 2.0, 7.0, 8.0, 10.0, 17.0, 19.0, 17.0, 25.0, 32.0, 36.0, 46.0, 48.0, 50.0, 45.0, 41.0, 55.0, 67.0, 45.0, 46.0, 50.0, 55.0, 43.0, 38.0, 39.0, 24.0, 30.0, 13.0, 19.0, 15.0, 13.0, 8.0, 12.0, 5.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.248453140258789e-05, -3.120489418506622e-05, -2.9925256967544556e-05, -2.8645619750022888e-05, -2.736598253250122e-05, -2.6086345314979553e-05, -2.4806708097457886e-05, -2.3527070879936218e-05, -2.224743366241455e-05, -2.0967796444892883e-05, -1.9688159227371216e-05, -1.840852200984955e-05, -1.712888479232788e-05, -1.5849247574806213e-05, -1.4569610357284546e-05, -1.3289973139762878e-05, -1.2010335922241211e-05, -1.0730698704719543e-05, -9.451061487197876e-06, -8.171424269676208e-06, -6.891787052154541e-06, -5.6121498346328735e-06, -4.332512617111206e-06, -3.0528753995895386e-06, -1.773238182067871e-06, -4.936009645462036e-07, 7.860362529754639e-07, 2.0656734704971313e-06, 3.345310688018799e-06, 4.624947905540466e-06, 5.904585123062134e-06, 7.184222340583801e-06, 8.463859558105469e-06, 9.743496775627136e-06, 1.1023133993148804e-05, 1.2302771210670471e-05, 1.3582408428192139e-05, 1.4862045645713806e-05, 1.6141682863235474e-05, 1.742132008075714e-05, 1.870095729827881e-05, 1.9980594515800476e-05, 2.1260231733322144e-05, 2.253986895084381e-05, 2.381950616836548e-05, 2.5099143385887146e-05, 2.6378780603408813e-05, 2.765841782093048e-05, 2.893805503845215e-05, 3.0217692255973816e-05, 3.1497329473495483e-05, 3.277696669101715e-05, 3.405660390853882e-05, 3.5336241126060486e-05, 3.661587834358215e-05, 3.789551556110382e-05, 3.917515277862549e-05, 4.0454789996147156e-05, 4.173442721366882e-05, 4.301406443119049e-05, 4.429370164871216e-05, 4.5573338866233826e-05, 4.685297608375549e-05, 4.813261330127716e-05, 4.941225051879883e-05]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 11.0, 4.0, 15.0, 17.0, 18.0, 27.0, 18.0, 25.0, 16.0, 31.0, 35.0, 40.0, 36.0, 53.0, 62.0, 31.0, 46.0, 54.0, 53.0, 39.0, 35.0, 45.0, 65.0, 34.0, 36.0, 31.0, 28.0, 16.0, 17.0, 15.0, 17.0, 8.0, 7.0, 3.0, 7.0, 1.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.41015625, -6.2171630859375, -6.024169921875, -5.8311767578125, -5.63818359375, -5.4451904296875, -5.252197265625, -5.0592041015625, -4.8662109375, -4.6732177734375, -4.480224609375, -4.2872314453125, -4.09423828125, -3.9012451171875, -3.708251953125, -3.5152587890625, -3.322265625, -3.1292724609375, -2.936279296875, -2.7432861328125, -2.55029296875, -2.3572998046875, -2.164306640625, -1.9713134765625, -1.7783203125, -1.5853271484375, -1.392333984375, -1.1993408203125, -1.00634765625, -0.8133544921875, -0.620361328125, -0.4273681640625, -0.234375, -0.0413818359375, 0.151611328125, 0.3446044921875, 0.53759765625, 0.7305908203125, 0.923583984375, 1.1165771484375, 1.3095703125, 1.5025634765625, 1.695556640625, 1.8885498046875, 2.08154296875, 2.2745361328125, 2.467529296875, 2.6605224609375, 2.853515625, 3.0465087890625, 3.239501953125, 3.4324951171875, 3.62548828125, 3.8184814453125, 4.011474609375, 4.2044677734375, 4.3974609375, 4.5904541015625, 4.783447265625, 4.9764404296875, 5.16943359375, 5.3624267578125, 5.555419921875, 5.7484130859375, 5.94140625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 3.0, 16.0, 18.0, 19.0, 19.0, 32.0, 58.0, 90.0, 114.0, 183.0, 260.0, 415.0, 632.0, 1038.0, 1603.0, 2628.0, 4370.0, 7534.0, 13183.0, 24845.0, 52493.0, 147979.0, 474564.0, 189787.0, 62795.0, 28320.0, 14600.0, 8364.0, 4775.0, 2859.0, 1746.0, 1118.0, 720.0, 477.0, 288.0, 184.0, 149.0, 85.0, 49.0, 45.0, 30.0, 13.0, 20.0, 11.0, 9.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0], "bins": [-7.0546875, -6.8382568359375, -6.621826171875, -6.4053955078125, -6.18896484375, -5.9725341796875, -5.756103515625, -5.5396728515625, -5.3232421875, -5.1068115234375, -4.890380859375, -4.6739501953125, -4.45751953125, -4.2410888671875, -4.024658203125, -3.8082275390625, -3.591796875, -3.3753662109375, -3.158935546875, -2.9425048828125, -2.72607421875, -2.5096435546875, -2.293212890625, -2.0767822265625, -1.8603515625, -1.6439208984375, -1.427490234375, -1.2110595703125, -0.99462890625, -0.7781982421875, -0.561767578125, -0.3453369140625, -0.12890625, 0.0875244140625, 0.303955078125, 0.5203857421875, 0.73681640625, 0.9532470703125, 1.169677734375, 1.3861083984375, 1.6025390625, 1.8189697265625, 2.035400390625, 2.2518310546875, 2.46826171875, 2.6846923828125, 2.901123046875, 3.1175537109375, 3.333984375, 3.5504150390625, 3.766845703125, 3.9832763671875, 4.19970703125, 4.4161376953125, 4.632568359375, 4.8489990234375, 5.0654296875, 5.2818603515625, 5.498291015625, 5.7147216796875, 5.93115234375, 6.1475830078125, 6.364013671875, 6.5804443359375, 6.796875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 3.0, 3.0, 5.0, 12.0, 10.0, 14.0, 15.0, 25.0, 16.0, 33.0, 35.0, 36.0, 26.0, 41.0, 43.0, 48.0, 66.0, 91.0, 217.0, 1598.0, 194.0, 77.0, 53.0, 56.0, 58.0, 34.0, 39.0, 33.0, 34.0, 24.0, 18.0, 21.0, 18.0, 5.0, 6.0, 12.0, 8.0, 10.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9765625, -15.4342041015625, -14.891845703125, -14.3494873046875, -13.80712890625, -13.2647705078125, -12.722412109375, -12.1800537109375, -11.6376953125, -11.0953369140625, -10.552978515625, -10.0106201171875, -9.46826171875, -8.9259033203125, -8.383544921875, -7.8411865234375, -7.298828125, -6.7564697265625, -6.214111328125, -5.6717529296875, -5.12939453125, -4.5870361328125, -4.044677734375, -3.5023193359375, -2.9599609375, -2.4176025390625, -1.875244140625, -1.3328857421875, -0.79052734375, -0.2481689453125, 0.294189453125, 0.8365478515625, 1.37890625, 1.9212646484375, 2.463623046875, 3.0059814453125, 3.54833984375, 4.0906982421875, 4.633056640625, 5.1754150390625, 5.7177734375, 6.2601318359375, 6.802490234375, 7.3448486328125, 7.88720703125, 8.4295654296875, 8.971923828125, 9.5142822265625, 10.056640625, 10.5989990234375, 11.141357421875, 11.6837158203125, 12.22607421875, 12.7684326171875, 13.310791015625, 13.8531494140625, 14.3955078125, 14.9378662109375, 15.480224609375, 16.0225830078125, 16.56494140625, 17.1072998046875, 17.649658203125, 18.1920166015625, 18.734375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 2.0, 5.0, 8.0, 9.0, 17.0, 19.0, 21.0, 27.0, 38.0, 46.0, 61.0, 103.0, 132.0, 179.0, 279.0, 731.0, 2669.0, 18577.0, 402439.0, 2669565.0, 43405.0, 5174.0, 1043.0, 390.0, 203.0, 146.0, 96.0, 83.0, 62.0, 47.0, 38.0, 13.0, 22.0, 19.0, 9.0, 5.0, 4.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.21875, -30.24853515625, -29.2783203125, -28.30810546875, -27.337890625, -26.36767578125, -25.3974609375, -24.42724609375, -23.45703125, -22.48681640625, -21.5166015625, -20.54638671875, -19.576171875, -18.60595703125, -17.6357421875, -16.66552734375, -15.6953125, -14.72509765625, -13.7548828125, -12.78466796875, -11.814453125, -10.84423828125, -9.8740234375, -8.90380859375, -7.93359375, -6.96337890625, -5.9931640625, -5.02294921875, -4.052734375, -3.08251953125, -2.1123046875, -1.14208984375, -0.171875, 0.79833984375, 1.7685546875, 2.73876953125, 3.708984375, 4.67919921875, 5.6494140625, 6.61962890625, 7.58984375, 8.56005859375, 9.5302734375, 10.50048828125, 11.470703125, 12.44091796875, 13.4111328125, 14.38134765625, 15.3515625, 16.32177734375, 17.2919921875, 18.26220703125, 19.232421875, 20.20263671875, 21.1728515625, 22.14306640625, 23.11328125, 24.08349609375, 25.0537109375, 26.02392578125, 26.994140625, 27.96435546875, 28.9345703125, 29.90478515625, 30.875]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [574.0, 442.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.160618782043457, -0.012415885925292969, 14.135787010192871, 28.283992767333984, 42.432193756103516, 56.58039474487305, 70.72859954833984, 84.87680053710938, 99.0250015258789, 113.17320251464844, 127.3214111328125, 141.4696044921875, 155.61781311035156, 169.76602172851562, 183.91421508789062, 198.0624237060547, 212.21063232421875, 226.3588409423828, 240.5070343017578, 254.65524291992188, 268.8034362792969, 282.95166015625, 297.099853515625, 311.248046875, 325.396240234375, 339.54443359375, 353.6926574707031, 367.8408508300781, 381.9890441894531, 396.13726806640625, 410.28546142578125, 424.43365478515625, 438.58184814453125, 452.73004150390625, 466.8782653808594, 481.0264587402344, 495.1746520996094, 509.3228759765625, 523.4710693359375, 537.6192626953125, 551.7674560546875, 565.9156494140625, 580.0638427734375, 594.2120361328125, 608.3602905273438, 622.5084838867188, 636.6566772460938, 650.8048706054688, 664.953125, 679.101318359375, 693.24951171875, 707.397705078125, 721.5459594726562, 735.6941528320312, 749.8423461914062, 763.9905395507812, 778.1387329101562, 792.2869262695312, 806.4351196289062, 820.5833740234375, 834.7315673828125, 848.8797607421875, 863.0279541015625, 877.1761474609375, 891.3243408203125]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 5.0, 2.0, 1.0, 5.0, 5.0, 7.0, 8.0, 10.0, 10.0, 9.0, 11.0, 14.0, 19.0, 18.0, 22.0, 35.0, 29.0, 38.0, 36.0, 39.0, 33.0, 34.0, 41.0, 37.0, 38.0, 38.0, 46.0, 45.0, 39.0, 25.0, 39.0, 35.0, 31.0, 32.0, 29.0, 24.0, 21.0, 14.0, 13.0, 12.0, 6.0, 16.0, 11.0, 5.0, 8.0, 2.0, 2.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.54676818847656, -42.063377380371094, -40.579986572265625, -39.096595764160156, -37.61320495605469, -36.12981414794922, -34.64642333984375, -33.16303253173828, -31.679643630981445, -30.196252822875977, -28.712862014770508, -27.229473114013672, -25.746082305908203, -24.262691497802734, -22.779300689697266, -21.295909881591797, -19.812519073486328, -18.32912826538086, -16.84573745727539, -15.362347602844238, -13.87895679473877, -12.3955659866333, -10.912176132202148, -9.42878532409668, -7.945394515991211, -6.462003707885742, -4.978613376617432, -3.495223045349121, -2.0118322372436523, -0.5284414291381836, 0.9549484252929688, 2.4383392333984375, 3.921733856201172, 5.405124664306641, 6.888514995574951, 8.371905326843262, 9.85529613494873, 11.3386869430542, 12.822076797485352, 14.30546760559082, 15.788858413696289, 17.272249221801758, 18.755640029907227, 20.239028930664062, 21.72241973876953, 23.205810546875, 24.68920135498047, 26.172592163085938, 27.655982971191406, 29.139373779296875, 30.622764587402344, 32.10615539550781, 33.58954620361328, 35.07293701171875, 36.55632781982422, 38.03971862792969, 39.523109436035156, 41.006500244140625, 42.489891052246094, 43.97328186035156, 45.45667266845703, 46.9400634765625, 48.42345428466797, 49.90684509277344, 51.39023208618164]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 10.0, 5.0, 4.0, 17.0, 12.0, 23.0, 28.0, 18.0, 17.0, 23.0, 29.0, 27.0, 36.0, 42.0, 45.0, 51.0, 40.0, 36.0, 45.0, 56.0, 47.0, 44.0, 34.0, 49.0, 41.0, 31.0, 39.0, 30.0, 21.0, 25.0, 17.0, 15.0, 15.0, 7.0, 7.0, 4.0, 1.0, 2.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.82421875, -5.63446044921875, -5.4447021484375, -5.25494384765625, -5.065185546875, -4.87542724609375, -4.6856689453125, -4.49591064453125, -4.30615234375, -4.11639404296875, -3.9266357421875, -3.73687744140625, -3.547119140625, -3.35736083984375, -3.1676025390625, -2.97784423828125, -2.7880859375, -2.59832763671875, -2.4085693359375, -2.21881103515625, -2.029052734375, -1.83929443359375, -1.6495361328125, -1.45977783203125, -1.27001953125, -1.08026123046875, -0.8905029296875, -0.70074462890625, -0.510986328125, -0.32122802734375, -0.1314697265625, 0.05828857421875, 0.248046875, 0.43780517578125, 0.6275634765625, 0.81732177734375, 1.007080078125, 1.19683837890625, 1.3865966796875, 1.57635498046875, 1.76611328125, 1.95587158203125, 2.1456298828125, 2.33538818359375, 2.525146484375, 2.71490478515625, 2.9046630859375, 3.09442138671875, 3.2841796875, 3.47393798828125, 3.6636962890625, 3.85345458984375, 4.043212890625, 4.23297119140625, 4.4227294921875, 4.61248779296875, 4.80224609375, 4.99200439453125, 5.1817626953125, 5.37152099609375, 5.561279296875, 5.75103759765625, 5.9407958984375, 6.13055419921875, 6.3203125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 9.0, 8.0, 14.0, 19.0, 19.0, 32.0, 39.0, 41.0, 73.0, 127.0, 180.0, 391.0, 776.0, 1708.0, 3727.0, 9705.0, 28538.0, 118618.0, 1085742.0, 2609576.0, 260456.0, 49050.0, 15028.0, 5533.0, 2434.0, 1106.0, 516.0, 293.0, 184.0, 120.0, 63.0, 39.0, 24.0, 15.0, 13.0, 19.0, 7.0, 5.0, 7.0, 9.0, 4.0, 1.0, 2.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.859375, -12.4337158203125, -12.008056640625, -11.5823974609375, -11.15673828125, -10.7310791015625, -10.305419921875, -9.8797607421875, -9.4541015625, -9.0284423828125, -8.602783203125, -8.1771240234375, -7.75146484375, -7.3258056640625, -6.900146484375, -6.4744873046875, -6.048828125, -5.6231689453125, -5.197509765625, -4.7718505859375, -4.34619140625, -3.9205322265625, -3.494873046875, -3.0692138671875, -2.6435546875, -2.2178955078125, -1.792236328125, -1.3665771484375, -0.94091796875, -0.5152587890625, -0.089599609375, 0.3360595703125, 0.76171875, 1.1873779296875, 1.613037109375, 2.0386962890625, 2.46435546875, 2.8900146484375, 3.315673828125, 3.7413330078125, 4.1669921875, 4.5926513671875, 5.018310546875, 5.4439697265625, 5.86962890625, 6.2952880859375, 6.720947265625, 7.1466064453125, 7.572265625, 7.9979248046875, 8.423583984375, 8.8492431640625, 9.27490234375, 9.7005615234375, 10.126220703125, 10.5518798828125, 10.9775390625, 11.4031982421875, 11.828857421875, 12.2545166015625, 12.68017578125, 13.1058349609375, 13.531494140625, 13.9571533203125, 14.3828125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 1.0, 5.0, 6.0, 6.0, 8.0, 11.0, 21.0, 25.0, 46.0, 60.0, 74.0, 107.0, 162.0, 248.0, 419.0, 642.0, 701.0, 504.0, 328.0, 196.0, 128.0, 99.0, 85.0, 56.0, 39.0, 24.0, 18.0, 12.0, 12.0, 7.0, 7.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7109375, -7.3646240234375, -7.018310546875, -6.6719970703125, -6.32568359375, -5.9793701171875, -5.633056640625, -5.2867431640625, -4.9404296875, -4.5941162109375, -4.247802734375, -3.9014892578125, -3.55517578125, -3.2088623046875, -2.862548828125, -2.5162353515625, -2.169921875, -1.8236083984375, -1.477294921875, -1.1309814453125, -0.78466796875, -0.4383544921875, -0.092041015625, 0.2542724609375, 0.6005859375, 0.9468994140625, 1.293212890625, 1.6395263671875, 1.98583984375, 2.3321533203125, 2.678466796875, 3.0247802734375, 3.37109375, 3.7174072265625, 4.063720703125, 4.4100341796875, 4.75634765625, 5.1026611328125, 5.448974609375, 5.7952880859375, 6.1416015625, 6.4879150390625, 6.834228515625, 7.1805419921875, 7.52685546875, 7.8731689453125, 8.219482421875, 8.5657958984375, 8.912109375, 9.2584228515625, 9.604736328125, 9.9510498046875, 10.29736328125, 10.6436767578125, 10.989990234375, 11.3363037109375, 11.6826171875, 12.0289306640625, 12.375244140625, 12.7215576171875, 13.06787109375, 13.4141845703125, 13.760498046875, 14.1068115234375, 14.453125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 9.0, 14.0, 25.0, 22.0, 49.0, 50.0, 101.0, 108.0, 176.0, 378.0, 1234.0, 13285.0, 1184023.0, 2971085.0, 21091.0, 1606.0, 417.0, 203.0, 119.0, 73.0, 55.0, 46.0, 31.0, 16.0, 13.0, 7.0, 8.0, 4.0, 2.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-66.5625, -64.9013671875, -63.240234375, -61.5791015625, -59.91796875, -58.2568359375, -56.595703125, -54.9345703125, -53.2734375, -51.6123046875, -49.951171875, -48.2900390625, -46.62890625, -44.9677734375, -43.306640625, -41.6455078125, -39.984375, -38.3232421875, -36.662109375, -35.0009765625, -33.33984375, -31.6787109375, -30.017578125, -28.3564453125, -26.6953125, -25.0341796875, -23.373046875, -21.7119140625, -20.05078125, -18.3896484375, -16.728515625, -15.0673828125, -13.40625, -11.7451171875, -10.083984375, -8.4228515625, -6.76171875, -5.1005859375, -3.439453125, -1.7783203125, -0.1171875, 1.5439453125, 3.205078125, 4.8662109375, 6.52734375, 8.1884765625, 9.849609375, 11.5107421875, 13.171875, 14.8330078125, 16.494140625, 18.1552734375, 19.81640625, 21.4775390625, 23.138671875, 24.7998046875, 26.4609375, 28.1220703125, 29.783203125, 31.4443359375, 33.10546875, 34.7666015625, 36.427734375, 38.0888671875, 39.75]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 8.0, 16.0, 17.0, 18.0, 33.0, 43.0, 64.0, 59.0, 80.0, 74.0, 83.0, 76.0, 77.0, 67.0, 65.0, 54.0, 54.0, 22.0, 24.0, 16.0, 14.0, 6.0, 6.0, 7.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.069292068481445, -24.909761428833008, -23.750228881835938, -22.5906982421875, -21.431167602539062, -20.271636962890625, -19.112104415893555, -17.952573776245117, -16.793041229248047, -15.633509635925293, -14.473978996276855, -13.314447402954102, -12.154916763305664, -10.99538516998291, -9.835853576660156, -8.676322937011719, -7.516792297363281, -6.3572611808776855, -5.19773006439209, -4.038198471069336, -2.8786673545837402, -1.7191362380981445, -0.5596046447753906, 0.5999259948730469, 1.7594575881958008, 2.9189887046813965, 4.078519821166992, 5.238051414489746, 6.397582530975342, 7.5571136474609375, 8.716645240783691, 9.876175880432129, 11.035709381103516, 12.19524097442627, 13.354771614074707, 14.514303207397461, 15.673833847045898, 16.83336639404297, 17.992897033691406, 19.152427673339844, 20.31195831298828, 21.47148895263672, 22.63102149963379, 23.790552139282227, 24.950082778930664, 26.109615325927734, 27.269145965576172, 28.42867660522461, 29.58820915222168, 30.747739791870117, 31.907272338867188, 33.066802978515625, 34.22633361816406, 35.3858642578125, 36.54539489746094, 37.704925537109375, 38.86445999145508, 40.023990631103516, 41.18352127075195, 42.343055725097656, 43.502586364746094, 44.66211700439453, 45.82164764404297, 46.981178283691406, 48.140708923339844]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 7.0, 6.0, 7.0, 12.0, 8.0, 12.0, 17.0, 15.0, 19.0, 20.0, 26.0, 40.0, 36.0, 31.0, 36.0, 38.0, 40.0, 53.0, 33.0, 41.0, 37.0, 32.0, 47.0, 38.0, 29.0, 33.0, 35.0, 28.0, 15.0, 22.0, 28.0, 16.0, 23.0, 15.0, 17.0, 19.0, 14.0, 9.0, 11.0, 8.0, 3.0, 4.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.185523986816406, -32.191131591796875, -31.196735382080078, -30.202341079711914, -29.20794677734375, -28.213552474975586, -27.219158172607422, -26.22476577758789, -25.230369567871094, -24.23597526550293, -23.241580963134766, -22.2471866607666, -21.252792358398438, -20.258398056030273, -19.26400375366211, -18.269611358642578, -17.275217056274414, -16.28082275390625, -15.286428451538086, -14.292034149169922, -13.297639846801758, -12.303245544433594, -11.308852195739746, -10.314457893371582, -9.320063591003418, -8.325669288635254, -7.33127498626709, -6.336881160736084, -5.34248685836792, -4.348092555999756, -3.35369873046875, -2.359304428100586, -1.3649101257324219, -0.37051594257354736, 0.6238782405853271, 1.618272304534912, 2.612666606903076, 3.6070609092712402, 4.601454734802246, 5.59584903717041, 6.590243339538574, 7.584637641906738, 8.579031944274902, 9.57342529296875, 10.567819595336914, 11.562213897705078, 12.556608200073242, 13.551002502441406, 14.54539680480957, 15.539791107177734, 16.5341854095459, 17.528579711914062, 18.522974014282227, 19.51736831665039, 20.511760711669922, 21.50615692138672, 22.50054931640625, 23.494943618774414, 24.489337921142578, 25.483732223510742, 26.478126525878906, 27.47252082824707, 28.466915130615234, 29.461307525634766, 30.455703735351562]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 3.0, 5.0, 5.0, 8.0, 18.0, 19.0, 26.0, 25.0, 37.0, 24.0, 21.0, 35.0, 29.0, 54.0, 40.0, 46.0, 56.0, 52.0, 45.0, 58.0, 40.0, 53.0, 45.0, 43.0, 37.0, 26.0, 24.0, 26.0, 26.0, 16.0, 18.0, 7.0, 10.0, 12.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9609375, -5.75567626953125, -5.5504150390625, -5.34515380859375, -5.139892578125, -4.93463134765625, -4.7293701171875, -4.52410888671875, -4.31884765625, -4.11358642578125, -3.9083251953125, -3.70306396484375, -3.497802734375, -3.29254150390625, -3.0872802734375, -2.88201904296875, -2.6767578125, -2.47149658203125, -2.2662353515625, -2.06097412109375, -1.855712890625, -1.65045166015625, -1.4451904296875, -1.23992919921875, -1.03466796875, -0.82940673828125, -0.6241455078125, -0.41888427734375, -0.213623046875, -0.00836181640625, 0.1968994140625, 0.40216064453125, 0.607421875, 0.81268310546875, 1.0179443359375, 1.22320556640625, 1.428466796875, 1.63372802734375, 1.8389892578125, 2.04425048828125, 2.24951171875, 2.45477294921875, 2.6600341796875, 2.86529541015625, 3.070556640625, 3.27581787109375, 3.4810791015625, 3.68634033203125, 3.8916015625, 4.09686279296875, 4.3021240234375, 4.50738525390625, 4.712646484375, 4.91790771484375, 5.1231689453125, 5.32843017578125, 5.53369140625, 5.73895263671875, 5.9442138671875, 6.14947509765625, 6.354736328125, 6.55999755859375, 6.7652587890625, 6.97052001953125, 7.17578125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 5.0, 2.0, 4.0, 7.0, 10.0, 10.0, 15.0, 37.0, 38.0, 57.0, 84.0, 147.0, 215.0, 342.0, 526.0, 873.0, 1371.0, 2401.0, 4000.0, 6682.0, 11968.0, 20550.0, 36957.0, 69461.0, 147133.0, 344529.0, 206650.0, 88648.0, 45498.0, 25144.0, 14722.0, 8423.0, 4811.0, 2794.0, 1676.0, 1015.0, 623.0, 417.0, 240.0, 151.0, 109.0, 66.0, 56.0, 31.0, 18.0, 12.0, 14.0, 9.0, 4.0, 2.0, 8.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2254638671875, -0.2178668975830078, -0.21026992797851562, -0.20267295837402344, -0.19507598876953125, -0.18747901916503906, -0.17988204956054688, -0.1722850799560547, -0.1646881103515625, -0.1570911407470703, -0.14949417114257812, -0.14189720153808594, -0.13430023193359375, -0.12670326232910156, -0.11910629272460938, -0.11150932312011719, -0.103912353515625, -0.09631538391113281, -0.08871841430664062, -0.08112144470214844, -0.07352447509765625, -0.06592750549316406, -0.058330535888671875, -0.05073356628417969, -0.0431365966796875, -0.03553962707519531, -0.027942657470703125, -0.020345687866210938, -0.01274871826171875, -0.0051517486572265625, 0.002445220947265625, 0.010042190551757812, 0.01763916015625, 0.025236129760742188, 0.032833099365234375, 0.04043006896972656, 0.04802703857421875, 0.05562400817871094, 0.06322097778320312, 0.07081794738769531, 0.0784149169921875, 0.08601188659667969, 0.09360885620117188, 0.10120582580566406, 0.10880279541015625, 0.11639976501464844, 0.12399673461914062, 0.1315937042236328, 0.139190673828125, 0.1467876434326172, 0.15438461303710938, 0.16198158264160156, 0.16957855224609375, 0.17717552185058594, 0.18477249145507812, 0.1923694610595703, 0.1999664306640625, 0.2075634002685547, 0.21516036987304688, 0.22275733947753906, 0.23035430908203125, 0.23795127868652344, 0.24554824829101562, 0.2531452178955078, 0.2607421875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 7.0, 6.0, 8.0, 14.0, 16.0, 21.0, 18.0, 24.0, 25.0, 25.0, 30.0, 17.0, 38.0, 28.0, 38.0, 39.0, 29.0, 41.0, 42.0, 1068.0, 39.0, 40.0, 44.0, 32.0, 33.0, 36.0, 31.0, 15.0, 35.0, 33.0, 21.0, 24.0, 14.0, 14.0, 12.0, 12.0, 10.0, 11.0, 5.0, 4.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.701171875, -3.5859375, -3.470703125, -3.35546875, -3.240234375, -3.125, -3.009765625, -2.89453125, -2.779296875, -2.6640625, -2.548828125, -2.43359375, -2.318359375, -2.203125, -2.087890625, -1.97265625, -1.857421875, -1.7421875, -1.626953125, -1.51171875, -1.396484375, -1.28125, -1.166015625, -1.05078125, -0.935546875, -0.8203125, -0.705078125, -0.58984375, -0.474609375, -0.359375, -0.244140625, -0.12890625, -0.013671875, 0.1015625, 0.216796875, 0.33203125, 0.447265625, 0.5625, 0.677734375, 0.79296875, 0.908203125, 1.0234375, 1.138671875, 1.25390625, 1.369140625, 1.484375, 1.599609375, 1.71484375, 1.830078125, 1.9453125, 2.060546875, 2.17578125, 2.291015625, 2.40625, 2.521484375, 2.63671875, 2.751953125, 2.8671875, 2.982421875, 3.09765625, 3.212890625, 3.328125, 3.443359375, 3.55859375, 3.673828125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 8.0, 14.0, 25.0, 30.0, 52.0, 78.0, 133.0, 200.0, 301.0, 447.0, 757.0, 1103.0, 1737.0, 2756.0, 4438.0, 7434.0, 11731.0, 19602.0, 32392.0, 55331.0, 102932.0, 233014.0, 1333315.0, 127369.0, 65556.0, 37734.0, 22767.0, 13719.0, 8332.0, 5095.0, 3189.0, 2020.0, 1254.0, 813.0, 515.0, 318.0, 213.0, 134.0, 86.0, 62.0, 48.0, 29.0, 12.0, 12.0, 7.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13671875, -0.13246536254882812, -0.12821197509765625, -0.12395858764648438, -0.1197052001953125, -0.11545181274414062, -0.11119842529296875, -0.10694503784179688, -0.102691650390625, -0.09843826293945312, -0.09418487548828125, -0.08993148803710938, -0.0856781005859375, -0.08142471313476562, -0.07717132568359375, -0.07291793823242188, -0.06866455078125, -0.06441116333007812, -0.06015777587890625, -0.055904388427734375, -0.0516510009765625, -0.047397613525390625, -0.04314422607421875, -0.038890838623046875, -0.034637451171875, -0.030384063720703125, -0.02613067626953125, -0.021877288818359375, -0.0176239013671875, -0.013370513916015625, -0.00911712646484375, -0.004863739013671875, -0.0006103515625, 0.003643035888671875, 0.00789642333984375, 0.012149810791015625, 0.0164031982421875, 0.020656585693359375, 0.02490997314453125, 0.029163360595703125, 0.033416748046875, 0.037670135498046875, 0.04192352294921875, 0.046176910400390625, 0.0504302978515625, 0.054683685302734375, 0.05893707275390625, 0.06319046020507812, 0.06744384765625, 0.07169723510742188, 0.07595062255859375, 0.08020401000976562, 0.0844573974609375, 0.08871078491210938, 0.09296417236328125, 0.09721755981445312, 0.101470947265625, 0.10572433471679688, 0.10997772216796875, 0.11423110961914062, 0.1184844970703125, 0.12273788452148438, 0.12699127197265625, 0.13124465942382812, 0.135498046875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 4.0, 3.0, 8.0, 7.0, 11.0, 16.0, 28.0, 20.0, 23.0, 26.0, 19.0, 28.0, 39.0, 22.0, 36.0, 38.0, 41.0, 37.0, 46.0, 62.0, 51.0, 34.0, 39.0, 41.0, 33.0, 37.0, 34.0, 27.0, 36.0, 22.0, 15.0, 16.0, 12.0, 14.0, 15.0, 8.0, 13.0, 7.0, 3.0, 4.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-3.999471664428711e-05, -3.8691796362400055e-05, -3.7388876080513e-05, -3.6085955798625946e-05, -3.478303551673889e-05, -3.348011523485184e-05, -3.217719495296478e-05, -3.087427467107773e-05, -2.9571354389190674e-05, -2.826843410730362e-05, -2.6965513825416565e-05, -2.566259354352951e-05, -2.4359673261642456e-05, -2.30567529797554e-05, -2.1753832697868347e-05, -2.0450912415981293e-05, -1.9147992134094238e-05, -1.7845071852207184e-05, -1.654215157032013e-05, -1.5239231288433075e-05, -1.393631100654602e-05, -1.2633390724658966e-05, -1.1330470442771912e-05, -1.0027550160884857e-05, -8.724629878997803e-06, -7.421709597110748e-06, -6.118789315223694e-06, -4.815869033336639e-06, -3.512948751449585e-06, -2.2100284695625305e-06, -9.071081876754761e-07, 3.9581209421157837e-07, 1.6987323760986328e-06, 3.0016526579856873e-06, 4.304572939872742e-06, 5.607493221759796e-06, 6.910413503646851e-06, 8.213333785533905e-06, 9.51625406742096e-06, 1.0819174349308014e-05, 1.2122094631195068e-05, 1.3425014913082123e-05, 1.4727935194969177e-05, 1.603085547685623e-05, 1.7333775758743286e-05, 1.863669604063034e-05, 1.9939616322517395e-05, 2.124253660440445e-05, 2.2545456886291504e-05, 2.384837716817856e-05, 2.5151297450065613e-05, 2.6454217731952667e-05, 2.775713801383972e-05, 2.9060058295726776e-05, 3.036297857761383e-05, 3.1665898859500885e-05, 3.296881914138794e-05, 3.4271739423274994e-05, 3.557465970516205e-05, 3.68775799870491e-05, 3.818050026893616e-05, 3.948342055082321e-05, 4.0786340832710266e-05, 4.208926111459732e-05, 4.3392181396484375e-05]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 7.0, 8.0, 10.0, 11.0, 16.0, 18.0, 17.0, 18.0, 39.0, 38.0, 41.0, 70.0, 86.0, 155.0, 328.0, 1371.0, 49279.0, 918038.0, 76309.0, 1727.0, 397.0, 155.0, 85.0, 61.0, 46.0, 26.0, 31.0, 26.0, 25.0, 15.0, 23.0, 15.0, 8.0, 6.0, 13.0, 6.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008473396301269531, -0.0008196011185646057, -0.0007918626070022583, -0.0007641240954399109, -0.0007363855838775635, -0.0007086470723152161, -0.0006809085607528687, -0.0006531700491905212, -0.0006254315376281738, -0.0005976930260658264, -0.000569954514503479, -0.0005422160029411316, -0.0005144774913787842, -0.00048673897981643677, -0.00045900046825408936, -0.00043126195669174194, -0.00040352344512939453, -0.0003757849335670471, -0.0003480464220046997, -0.0003203079104423523, -0.0002925693988800049, -0.00026483088731765747, -0.00023709237575531006, -0.00020935386419296265, -0.00018161535263061523, -0.00015387684106826782, -0.0001261383295059204, -9.8399817943573e-05, -7.066130638122559e-05, -4.2922794818878174e-05, -1.5184283256530762e-05, 1.255422830581665e-05, 4.029273986816406e-05, 6.803125143051147e-05, 9.576976299285889e-05, 0.0001235082745552063, 0.0001512467861175537, 0.00017898529767990112, 0.00020672380924224854, 0.00023446232080459595, 0.00026220083236694336, 0.00028993934392929077, 0.0003176778554916382, 0.0003454163670539856, 0.000373154878616333, 0.0004008933901786804, 0.00042863190174102783, 0.00045637041330337524, 0.00048410892486572266, 0.0005118474364280701, 0.0005395859479904175, 0.0005673244595527649, 0.0005950629711151123, 0.0006228014826774597, 0.0006505399942398071, 0.0006782785058021545, 0.000706017017364502, 0.0007337555289268494, 0.0007614940404891968, 0.0007892325520515442, 0.0008169710636138916, 0.000844709575176239, 0.0008724480867385864, 0.0009001865983009338, 0.0009279251098632812]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 44.0, 670.0, 294.0, 8.0, 2.0], "bins": [-0.0008232136606238782, -0.0008096713572740555, -0.0007961291121318936, -0.0007825868087820709, -0.000769044563639909, -0.0007555022602900863, -0.0007419599569402635, -0.0007284177117981017, -0.0007148754084482789, -0.0007013331050984561, -0.0006877908599562943, -0.0006742485566064715, -0.0006607063114643097, -0.0006471640081144869, -0.0006336217047646642, -0.0006200794596225023, -0.0006065371562726796, -0.0005929948529228568, -0.000579452607780695, -0.0005659103044308722, -0.0005523680592887104, -0.0005388257559388876, -0.0005252834525890648, -0.000511741207446903, -0.0004981989040970802, -0.00048465662985108793, -0.0004711143556050956, -0.00045757205225527287, -0.00044402977800928056, -0.00043048750376328826, -0.00041694522951729596, -0.00040340295527130365, -0.00038986068102531135, -0.00037631840677931905, -0.00036277613253332675, -0.000349233829183504, -0.0003356915549375117, -0.0003221492806915194, -0.0003086070064455271, -0.0002950647030957043, -0.000281522428849712, -0.0002679801546037197, -0.0002544378803577274, -0.00024089559155981988, -0.00022735330276191235, -0.00021381102851592004, -0.00020026875426992774, -0.0001867264654720202, -0.0001731841912260279, -0.0001596419169800356, -0.00014609962818212807, -0.00013255735393613577, -0.00011901506513822824, -0.00010547279089223593, -9.193050937028602e-05, -7.83882278483361e-05, -6.484594632638618e-05, -5.1303664804436266e-05, -3.776138328248635e-05, -2.421910539851524e-05, -1.0676823876565322e-05, 2.8654540074057877e-06, 1.6407735529355705e-05, 2.9950017051305622e-05, 4.349229857325554e-05]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 1.0, 8.0, 9.0, 12.0, 14.0, 16.0, 9.0, 18.0, 28.0, 22.0, 25.0, 33.0, 37.0, 32.0, 39.0, 48.0, 58.0, 42.0, 49.0, 49.0, 32.0, 42.0, 49.0, 42.0, 34.0, 37.0, 32.0, 31.0, 21.0, 16.0, 24.0, 20.0, 14.0, 15.0, 13.0, 6.0, 4.0, 11.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6404857635498047e-05, -2.5389716029167175e-05, -2.4374574422836304e-05, -2.3359432816505432e-05, -2.234429121017456e-05, -2.132914960384369e-05, -2.0314007997512817e-05, -1.9298866391181946e-05, -1.8283724784851074e-05, -1.7268583178520203e-05, -1.625344157218933e-05, -1.523829996585846e-05, -1.4223158359527588e-05, -1.3208016753196716e-05, -1.2192875146865845e-05, -1.1177733540534973e-05, -1.0162591934204102e-05, -9.14745032787323e-06, -8.132308721542358e-06, -7.117167115211487e-06, -6.102025508880615e-06, -5.086883902549744e-06, -4.071742296218872e-06, -3.0566006898880005e-06, -2.041459083557129e-06, -1.0263174772262573e-06, -1.1175870895385742e-08, 1.0039657354354858e-06, 2.0191073417663574e-06, 3.034248948097229e-06, 4.049390554428101e-06, 5.064532160758972e-06, 6.079673767089844e-06, 7.094815373420715e-06, 8.109956979751587e-06, 9.125098586082458e-06, 1.014024019241333e-05, 1.1155381798744202e-05, 1.2170523405075073e-05, 1.3185665011405945e-05, 1.4200806617736816e-05, 1.5215948224067688e-05, 1.623108983039856e-05, 1.724623143672943e-05, 1.8261373043060303e-05, 1.9276514649391174e-05, 2.0291656255722046e-05, 2.1306797862052917e-05, 2.232193946838379e-05, 2.333708107471466e-05, 2.4352222681045532e-05, 2.5367364287376404e-05, 2.6382505893707275e-05, 2.7397647500038147e-05, 2.841278910636902e-05, 2.942793071269989e-05, 3.0443072319030762e-05, 3.145821392536163e-05, 3.2473355531692505e-05, 3.3488497138023376e-05, 3.450363874435425e-05, 3.551878035068512e-05, 3.653392195701599e-05, 3.754906356334686e-05, 3.8564205169677734e-05]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 3.0, 5.0, 5.0, 8.0, 18.0, 19.0, 26.0, 25.0, 37.0, 24.0, 21.0, 35.0, 29.0, 54.0, 40.0, 46.0, 56.0, 52.0, 45.0, 58.0, 40.0, 53.0, 45.0, 43.0, 37.0, 26.0, 24.0, 26.0, 26.0, 16.0, 18.0, 7.0, 10.0, 12.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9609375, -5.75567626953125, -5.5504150390625, -5.34515380859375, -5.139892578125, -4.93463134765625, -4.7293701171875, -4.52410888671875, -4.31884765625, -4.11358642578125, -3.9083251953125, -3.70306396484375, -3.497802734375, -3.29254150390625, -3.0872802734375, -2.88201904296875, -2.6767578125, -2.47149658203125, -2.2662353515625, -2.06097412109375, -1.855712890625, -1.65045166015625, -1.4451904296875, -1.23992919921875, -1.03466796875, -0.82940673828125, -0.6241455078125, -0.41888427734375, -0.213623046875, -0.00836181640625, 0.1968994140625, 0.40216064453125, 0.607421875, 0.81268310546875, 1.0179443359375, 1.22320556640625, 1.428466796875, 1.63372802734375, 1.8389892578125, 2.04425048828125, 2.24951171875, 2.45477294921875, 2.6600341796875, 2.86529541015625, 3.070556640625, 3.27581787109375, 3.4810791015625, 3.68634033203125, 3.8916015625, 4.09686279296875, 4.3021240234375, 4.50738525390625, 4.712646484375, 4.91790771484375, 5.1231689453125, 5.32843017578125, 5.53369140625, 5.73895263671875, 5.9442138671875, 6.14947509765625, 6.354736328125, 6.55999755859375, 6.7652587890625, 6.97052001953125, 7.17578125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 10.0, 6.0, 7.0, 15.0, 16.0, 26.0, 29.0, 61.0, 94.0, 137.0, 206.0, 312.0, 572.0, 947.0, 1672.0, 3156.0, 6304.0, 12954.0, 27927.0, 70615.0, 294583.0, 467539.0, 94738.0, 35093.0, 15562.0, 7557.0, 3767.0, 2007.0, 1064.0, 551.0, 372.0, 228.0, 153.0, 82.0, 68.0, 48.0, 18.0, 20.0, 17.0, 6.0, 12.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.87890625, -7.62579345703125, -7.3726806640625, -7.11956787109375, -6.866455078125, -6.61334228515625, -6.3602294921875, -6.10711669921875, -5.85400390625, -5.60089111328125, -5.3477783203125, -5.09466552734375, -4.841552734375, -4.58843994140625, -4.3353271484375, -4.08221435546875, -3.8291015625, -3.57598876953125, -3.3228759765625, -3.06976318359375, -2.816650390625, -2.56353759765625, -2.3104248046875, -2.05731201171875, -1.80419921875, -1.55108642578125, -1.2979736328125, -1.04486083984375, -0.791748046875, -0.53863525390625, -0.2855224609375, -0.03240966796875, 0.220703125, 0.47381591796875, 0.7269287109375, 0.98004150390625, 1.233154296875, 1.48626708984375, 1.7393798828125, 1.99249267578125, 2.24560546875, 2.49871826171875, 2.7518310546875, 3.00494384765625, 3.258056640625, 3.51116943359375, 3.7642822265625, 4.01739501953125, 4.2705078125, 4.52362060546875, 4.7767333984375, 5.02984619140625, 5.282958984375, 5.53607177734375, 5.7891845703125, 6.04229736328125, 6.29541015625, 6.54852294921875, 6.8016357421875, 7.05474853515625, 7.307861328125, 7.56097412109375, 7.8140869140625, 8.06719970703125, 8.3203125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 5.0, 6.0, 7.0, 14.0, 11.0, 7.0, 14.0, 18.0, 16.0, 23.0, 30.0, 31.0, 33.0, 34.0, 46.0, 50.0, 59.0, 62.0, 103.0, 168.0, 1547.0, 191.0, 90.0, 60.0, 50.0, 44.0, 40.0, 32.0, 42.0, 26.0, 28.0, 35.0, 21.0, 18.0, 14.0, 23.0, 9.0, 7.0, 8.0, 3.0, 9.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.75, -15.2509765625, -14.751953125, -14.2529296875, -13.75390625, -13.2548828125, -12.755859375, -12.2568359375, -11.7578125, -11.2587890625, -10.759765625, -10.2607421875, -9.76171875, -9.2626953125, -8.763671875, -8.2646484375, -7.765625, -7.2666015625, -6.767578125, -6.2685546875, -5.76953125, -5.2705078125, -4.771484375, -4.2724609375, -3.7734375, -3.2744140625, -2.775390625, -2.2763671875, -1.77734375, -1.2783203125, -0.779296875, -0.2802734375, 0.21875, 0.7177734375, 1.216796875, 1.7158203125, 2.21484375, 2.7138671875, 3.212890625, 3.7119140625, 4.2109375, 4.7099609375, 5.208984375, 5.7080078125, 6.20703125, 6.7060546875, 7.205078125, 7.7041015625, 8.203125, 8.7021484375, 9.201171875, 9.7001953125, 10.19921875, 10.6982421875, 11.197265625, 11.6962890625, 12.1953125, 12.6943359375, 13.193359375, 13.6923828125, 14.19140625, 14.6904296875, 15.189453125, 15.6884765625, 16.1875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 7.0, 9.0, 3.0, 7.0, 4.0, 13.0, 17.0, 26.0, 32.0, 24.0, 37.0, 44.0, 61.0, 90.0, 160.0, 249.0, 467.0, 1195.0, 4681.0, 34134.0, 1949709.0, 1118518.0, 29754.0, 4143.0, 1115.0, 457.0, 248.0, 150.0, 91.0, 51.0, 46.0, 29.0, 31.0, 14.0, 19.0, 13.0, 7.0, 16.0, 13.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-33.53125, -32.51416015625, -31.4970703125, -30.47998046875, -29.462890625, -28.44580078125, -27.4287109375, -26.41162109375, -25.39453125, -24.37744140625, -23.3603515625, -22.34326171875, -21.326171875, -20.30908203125, -19.2919921875, -18.27490234375, -17.2578125, -16.24072265625, -15.2236328125, -14.20654296875, -13.189453125, -12.17236328125, -11.1552734375, -10.13818359375, -9.12109375, -8.10400390625, -7.0869140625, -6.06982421875, -5.052734375, -4.03564453125, -3.0185546875, -2.00146484375, -0.984375, 0.03271484375, 1.0498046875, 2.06689453125, 3.083984375, 4.10107421875, 5.1181640625, 6.13525390625, 7.15234375, 8.16943359375, 9.1865234375, 10.20361328125, 11.220703125, 12.23779296875, 13.2548828125, 14.27197265625, 15.2890625, 16.30615234375, 17.3232421875, 18.34033203125, 19.357421875, 20.37451171875, 21.3916015625, 22.40869140625, 23.42578125, 24.44287109375, 25.4599609375, 26.47705078125, 27.494140625, 28.51123046875, 29.5283203125, 30.54541015625, 31.5625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 45.0, 262.0, 470.0, 198.0, 31.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.696006774902344, -39.95793914794922, -35.21986770629883, -30.481800079345703, -25.743730545043945, -21.005661010742188, -16.267593383789062, -11.529521942138672, -6.791454315185547, -2.0533852577209473, 2.6846837997436523, 7.422752380371094, 12.160821914672852, 16.89889144897461, 21.636959075927734, 26.375030517578125, 31.11309814453125, 35.851165771484375, 40.589237213134766, 45.32730484008789, 50.06537628173828, 54.803443908691406, 59.54151153564453, 64.27958679199219, 69.01765441894531, 73.75572204589844, 78.49378967285156, 83.23185729980469, 87.96993255615234, 92.70800018310547, 97.4460678100586, 102.18414306640625, 106.92219543457031, 111.66026306152344, 116.39833068847656, 121.13639831542969, 125.87447357177734, 130.612548828125, 135.35061645507812, 140.08868408203125, 144.82675170898438, 149.5648193359375, 154.30288696289062, 159.04095458984375, 163.77902221679688, 168.51708984375, 173.25515747070312, 177.9932403564453, 182.73129272460938, 187.4693603515625, 192.20742797851562, 196.94549560546875, 201.68356323242188, 206.421630859375, 211.15969848632812, 215.8977813720703, 220.63584899902344, 225.37391662597656, 230.1119842529297, 234.8500518798828, 239.58811950683594, 244.32620239257812, 249.06427001953125, 253.80233764648438, 258.5404052734375]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 4.0, 3.0, 12.0, 4.0, 9.0, 19.0, 12.0, 17.0, 26.0, 16.0, 18.0, 34.0, 16.0, 22.0, 29.0, 40.0, 34.0, 40.0, 35.0, 39.0, 31.0, 31.0, 43.0, 44.0, 47.0, 31.0, 38.0, 37.0, 29.0, 36.0, 29.0, 24.0, 21.0, 22.0, 16.0, 14.0, 13.0, 5.0, 8.0, 9.0, 5.0, 11.0, 5.0, 6.0, 6.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-47.423702239990234, -46.028743743896484, -44.6337890625, -43.23883056640625, -41.8438720703125, -40.44891357421875, -39.053958892822266, -37.659000396728516, -36.26404571533203, -34.86908721923828, -33.4741325378418, -32.07917404174805, -30.684215545654297, -29.28925895690918, -27.894302368164062, -26.499343872070312, -25.104385375976562, -23.709428787231445, -22.314470291137695, -20.919513702392578, -19.524555206298828, -18.12959861755371, -16.734642028808594, -15.33968448638916, -13.944726943969727, -12.549769401550293, -11.15481185913086, -9.759855270385742, -8.364897727966309, -6.969940185546875, -5.574983596801758, -4.180026054382324, -2.7850723266601562, -1.3901150226593018, 0.004842281341552734, 1.3997993469238281, 2.7947568893432617, 4.189714431762695, 5.5846710205078125, 6.979628562927246, 8.37458610534668, 9.769543647766113, 11.164501190185547, 12.559457778930664, 13.954415321350098, 15.349372863769531, 16.74432945251465, 18.139286041259766, 19.534244537353516, 20.929201126098633, 22.324159622192383, 23.7191162109375, 25.11407470703125, 26.509031295776367, 27.903987884521484, 29.298946380615234, 30.69390296936035, 32.08885955810547, 33.48381805419922, 34.87877655029297, 36.27373123168945, 37.6686897277832, 39.06364440917969, 40.45860290527344, 41.85356140136719]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 13.0, 10.0, 11.0, 19.0, 21.0, 24.0, 28.0, 26.0, 20.0, 21.0, 33.0, 40.0, 32.0, 41.0, 41.0, 51.0, 58.0, 39.0, 43.0, 44.0, 34.0, 50.0, 48.0, 40.0, 31.0, 35.0, 14.0, 23.0, 21.0, 12.0, 16.0, 17.0, 13.0, 9.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.36328125, -5.1676025390625, -4.971923828125, -4.7762451171875, -4.58056640625, -4.3848876953125, -4.189208984375, -3.9935302734375, -3.7978515625, -3.6021728515625, -3.406494140625, -3.2108154296875, -3.01513671875, -2.8194580078125, -2.623779296875, -2.4281005859375, -2.232421875, -2.0367431640625, -1.841064453125, -1.6453857421875, -1.44970703125, -1.2540283203125, -1.058349609375, -0.8626708984375, -0.6669921875, -0.4713134765625, -0.275634765625, -0.0799560546875, 0.11572265625, 0.3114013671875, 0.507080078125, 0.7027587890625, 0.8984375, 1.0941162109375, 1.289794921875, 1.4854736328125, 1.68115234375, 1.8768310546875, 2.072509765625, 2.2681884765625, 2.4638671875, 2.6595458984375, 2.855224609375, 3.0509033203125, 3.24658203125, 3.4422607421875, 3.637939453125, 3.8336181640625, 4.029296875, 4.2249755859375, 4.420654296875, 4.6163330078125, 4.81201171875, 5.0076904296875, 5.203369140625, 5.3990478515625, 5.5947265625, 5.7904052734375, 5.986083984375, 6.1817626953125, 6.37744140625, 6.5731201171875, 6.768798828125, 6.9644775390625, 7.16015625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 3.0, 5.0, 4.0, 15.0, 22.0, 19.0, 31.0, 47.0, 66.0, 118.0, 185.0, 314.0, 659.0, 1438.0, 3670.0, 10012.0, 33119.0, 141522.0, 1105203.0, 2479573.0, 329356.0, 61210.0, 17317.0, 5825.0, 2278.0, 1012.0, 511.0, 289.0, 148.0, 96.0, 72.0, 42.0, 34.0, 21.0, 15.0, 11.0, 6.0, 11.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.96875, -13.521484375, -13.07421875, -12.626953125, -12.1796875, -11.732421875, -11.28515625, -10.837890625, -10.390625, -9.943359375, -9.49609375, -9.048828125, -8.6015625, -8.154296875, -7.70703125, -7.259765625, -6.8125, -6.365234375, -5.91796875, -5.470703125, -5.0234375, -4.576171875, -4.12890625, -3.681640625, -3.234375, -2.787109375, -2.33984375, -1.892578125, -1.4453125, -0.998046875, -0.55078125, -0.103515625, 0.34375, 0.791015625, 1.23828125, 1.685546875, 2.1328125, 2.580078125, 3.02734375, 3.474609375, 3.921875, 4.369140625, 4.81640625, 5.263671875, 5.7109375, 6.158203125, 6.60546875, 7.052734375, 7.5, 7.947265625, 8.39453125, 8.841796875, 9.2890625, 9.736328125, 10.18359375, 10.630859375, 11.078125, 11.525390625, 11.97265625, 12.419921875, 12.8671875, 13.314453125, 13.76171875, 14.208984375, 14.65625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 13.0, 19.0, 18.0, 16.0, 32.0, 49.0, 66.0, 91.0, 124.0, 134.0, 204.0, 280.0, 408.0, 540.0, 519.0, 411.0, 293.0, 228.0, 147.0, 115.0, 74.0, 70.0, 50.0, 52.0, 25.0, 19.0, 8.0, 17.0, 12.0, 4.0, 7.0, 9.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-10.828125, -10.518798828125, -10.20947265625, -9.900146484375, -9.5908203125, -9.281494140625, -8.97216796875, -8.662841796875, -8.353515625, -8.044189453125, -7.73486328125, -7.425537109375, -7.1162109375, -6.806884765625, -6.49755859375, -6.188232421875, -5.87890625, -5.569580078125, -5.26025390625, -4.950927734375, -4.6416015625, -4.332275390625, -4.02294921875, -3.713623046875, -3.404296875, -3.094970703125, -2.78564453125, -2.476318359375, -2.1669921875, -1.857666015625, -1.54833984375, -1.239013671875, -0.9296875, -0.620361328125, -0.31103515625, -0.001708984375, 0.3076171875, 0.616943359375, 0.92626953125, 1.235595703125, 1.544921875, 1.854248046875, 2.16357421875, 2.472900390625, 2.7822265625, 3.091552734375, 3.40087890625, 3.710205078125, 4.01953125, 4.328857421875, 4.63818359375, 4.947509765625, 5.2568359375, 5.566162109375, 5.87548828125, 6.184814453125, 6.494140625, 6.803466796875, 7.11279296875, 7.422119140625, 7.7314453125, 8.040771484375, 8.35009765625, 8.659423828125, 8.96875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 4.0, 5.0, 9.0, 10.0, 7.0, 8.0, 31.0, 30.0, 44.0, 73.0, 98.0, 152.0, 226.0, 376.0, 945.0, 3978.0, 36400.0, 991730.0, 3065506.0, 85090.0, 6937.0, 1342.0, 517.0, 262.0, 180.0, 105.0, 66.0, 45.0, 28.0, 23.0, 20.0, 8.0, 13.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-39.0625, -37.951171875, -36.83984375, -35.728515625, -34.6171875, -33.505859375, -32.39453125, -31.283203125, -30.171875, -29.060546875, -27.94921875, -26.837890625, -25.7265625, -24.615234375, -23.50390625, -22.392578125, -21.28125, -20.169921875, -19.05859375, -17.947265625, -16.8359375, -15.724609375, -14.61328125, -13.501953125, -12.390625, -11.279296875, -10.16796875, -9.056640625, -7.9453125, -6.833984375, -5.72265625, -4.611328125, -3.5, -2.388671875, -1.27734375, -0.166015625, 0.9453125, 2.056640625, 3.16796875, 4.279296875, 5.390625, 6.501953125, 7.61328125, 8.724609375, 9.8359375, 10.947265625, 12.05859375, 13.169921875, 14.28125, 15.392578125, 16.50390625, 17.615234375, 18.7265625, 19.837890625, 20.94921875, 22.060546875, 23.171875, 24.283203125, 25.39453125, 26.505859375, 27.6171875, 28.728515625, 29.83984375, 30.951171875, 32.0625]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 14.0, 40.0, 101.0, 152.0, 282.0, 197.0, 135.0, 53.0, 31.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.33702087402344, -94.77400207519531, -91.21097564697266, -87.64795684814453, -84.08493041992188, -80.52191162109375, -76.95889282226562, -73.3958740234375, -69.83284759521484, -66.26982879638672, -62.70680236816406, -59.14378356933594, -55.58076095581055, -52.017738342285156, -48.45471954345703, -44.89169692993164, -41.32867431640625, -37.76565170288086, -34.20262908935547, -30.639610290527344, -27.076587677001953, -23.513565063476562, -19.950544357299805, -16.387523651123047, -12.824501037597656, -9.261479377746582, -5.698457717895508, -2.1354360580444336, 1.4275856018066406, 4.990608215332031, 8.553628921508789, 12.116649627685547, 15.679672241210938, 19.242694854736328, 22.805715560913086, 26.368736267089844, 29.931758880615234, 33.494781494140625, 37.05780029296875, 40.62082290649414, 44.18384552001953, 47.74686813354492, 51.30989074707031, 54.87290954589844, 58.43593215942383, 61.99895477294922, 65.56197357177734, 69.125, 72.68801879882812, 76.25103759765625, 79.8140640258789, 83.37708282470703, 86.94010925292969, 90.50312805175781, 94.06614685058594, 97.62916564941406, 101.19219207763672, 104.75521087646484, 108.3182373046875, 111.88125610351562, 115.44427490234375, 119.0073013305664, 122.57032012939453, 126.13334655761719, 129.6963653564453]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 6.0, 10.0, 8.0, 11.0, 12.0, 18.0, 15.0, 24.0, 26.0, 23.0, 20.0, 32.0, 38.0, 37.0, 41.0, 20.0, 41.0, 46.0, 45.0, 49.0, 48.0, 38.0, 34.0, 36.0, 41.0, 28.0, 39.0, 26.0, 20.0, 25.0, 24.0, 22.0, 16.0, 19.0, 10.0, 7.0, 11.0, 7.0, 6.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0], "bins": [-35.319610595703125, -34.29916000366211, -33.278709411621094, -32.258262634277344, -31.237812042236328, -30.217361450195312, -29.19691276550293, -28.176464080810547, -27.15601348876953, -26.135562896728516, -25.115114212036133, -24.09466552734375, -23.074214935302734, -22.05376434326172, -21.033315658569336, -20.012866973876953, -18.992416381835938, -17.971965789794922, -16.95151710510254, -15.93106746673584, -14.91061782836914, -13.890168190002441, -12.869718551635742, -11.849268913269043, -10.828819274902344, -9.808369636535645, -8.787919998168945, -7.767470359802246, -6.747020721435547, -5.726571083068848, -4.706121444702148, -3.685671806335449, -2.6652259826660156, -1.6447763442993164, -0.6243267059326172, 0.39612293243408203, 1.4165725708007812, 2.4370222091674805, 3.4574718475341797, 4.477921485900879, 5.498371124267578, 6.518820762634277, 7.539270401000977, 8.559720039367676, 9.580169677734375, 10.600619316101074, 11.621068954467773, 12.641518592834473, 13.661968231201172, 14.682417869567871, 15.70286750793457, 16.723316192626953, 17.74376678466797, 18.764217376708984, 19.784666061401367, 20.80511474609375, 21.825565338134766, 22.84601593017578, 23.866464614868164, 24.886913299560547, 25.907363891601562, 26.927814483642578, 27.94826316833496, 28.968711853027344, 29.98916244506836]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 10.0, 7.0, 13.0, 14.0, 23.0, 19.0, 18.0, 22.0, 30.0, 23.0, 37.0, 31.0, 26.0, 32.0, 45.0, 52.0, 43.0, 52.0, 45.0, 41.0, 41.0, 42.0, 41.0, 42.0, 37.0, 25.0, 40.0, 19.0, 18.0, 23.0, 17.0, 15.0, 17.0, 8.0, 8.0, 7.0, 8.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.4296875, -5.23675537109375, -5.0438232421875, -4.85089111328125, -4.657958984375, -4.46502685546875, -4.2720947265625, -4.07916259765625, -3.88623046875, -3.69329833984375, -3.5003662109375, -3.30743408203125, -3.114501953125, -2.92156982421875, -2.7286376953125, -2.53570556640625, -2.3427734375, -2.14984130859375, -1.9569091796875, -1.76397705078125, -1.571044921875, -1.37811279296875, -1.1851806640625, -0.99224853515625, -0.79931640625, -0.60638427734375, -0.4134521484375, -0.22052001953125, -0.027587890625, 0.16534423828125, 0.3582763671875, 0.55120849609375, 0.744140625, 0.93707275390625, 1.1300048828125, 1.32293701171875, 1.515869140625, 1.70880126953125, 1.9017333984375, 2.09466552734375, 2.28759765625, 2.48052978515625, 2.6734619140625, 2.86639404296875, 3.059326171875, 3.25225830078125, 3.4451904296875, 3.63812255859375, 3.8310546875, 4.02398681640625, 4.2169189453125, 4.40985107421875, 4.602783203125, 4.79571533203125, 4.9886474609375, 5.18157958984375, 5.37451171875, 5.56744384765625, 5.7603759765625, 5.95330810546875, 6.146240234375, 6.33917236328125, 6.5321044921875, 6.72503662109375, 6.91796875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 7.0, 3.0, 6.0, 5.0, 15.0, 27.0, 31.0, 51.0, 66.0, 96.0, 119.0, 187.0, 286.0, 439.0, 673.0, 1087.0, 1650.0, 2581.0, 3904.0, 5964.0, 9315.0, 14110.0, 22431.0, 35531.0, 58344.0, 105823.0, 239030.0, 263185.0, 116101.0, 62805.0, 37825.0, 23643.0, 15304.0, 9777.0, 6360.0, 4152.0, 2733.0, 1644.0, 1147.0, 678.0, 459.0, 300.0, 215.0, 143.0, 90.0, 56.0, 51.0, 28.0, 22.0, 25.0, 15.0, 7.0, 7.0, 2.0, 7.0, 2.0, 0.0, 2.0], "bins": [-0.2100830078125, -0.20372962951660156, -0.19737625122070312, -0.1910228729248047, -0.18466949462890625, -0.1783161163330078, -0.17196273803710938, -0.16560935974121094, -0.1592559814453125, -0.15290260314941406, -0.14654922485351562, -0.1401958465576172, -0.13384246826171875, -0.1274890899658203, -0.12113571166992188, -0.11478233337402344, -0.108428955078125, -0.10207557678222656, -0.09572219848632812, -0.08936882019042969, -0.08301544189453125, -0.07666206359863281, -0.07030868530273438, -0.06395530700683594, -0.0576019287109375, -0.05124855041503906, -0.044895172119140625, -0.03854179382324219, -0.03218841552734375, -0.025835037231445312, -0.019481658935546875, -0.013128280639648438, -0.00677490234375, -0.0004215240478515625, 0.005931854248046875, 0.012285232543945312, 0.01863861083984375, 0.024991989135742188, 0.031345367431640625, 0.03769874572753906, 0.0440521240234375, 0.05040550231933594, 0.056758880615234375, 0.06311225891113281, 0.06946563720703125, 0.07581901550292969, 0.08217239379882812, 0.08852577209472656, 0.094879150390625, 0.10123252868652344, 0.10758590698242188, 0.11393928527832031, 0.12029266357421875, 0.1266460418701172, 0.13299942016601562, 0.13935279846191406, 0.1457061767578125, 0.15205955505371094, 0.15841293334960938, 0.1647663116455078, 0.17111968994140625, 0.1774730682373047, 0.18382644653320312, 0.19017982482910156, 0.196533203125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 5.0, 10.0, 7.0, 11.0, 8.0, 13.0, 14.0, 23.0, 15.0, 26.0, 25.0, 23.0, 28.0, 21.0, 31.0, 28.0, 35.0, 36.0, 39.0, 35.0, 46.0, 1076.0, 41.0, 39.0, 33.0, 33.0, 39.0, 22.0, 33.0, 32.0, 29.0, 20.0, 18.0, 31.0, 16.0, 18.0, 15.0, 13.0, 13.0, 5.0, 6.0, 3.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.88671875, -3.766082763671875, -3.64544677734375, -3.524810791015625, -3.4041748046875, -3.283538818359375, -3.16290283203125, -3.042266845703125, -2.921630859375, -2.800994873046875, -2.68035888671875, -2.559722900390625, -2.4390869140625, -2.318450927734375, -2.19781494140625, -2.077178955078125, -1.95654296875, -1.835906982421875, -1.71527099609375, -1.594635009765625, -1.4739990234375, -1.353363037109375, -1.23272705078125, -1.112091064453125, -0.991455078125, -0.870819091796875, -0.75018310546875, -0.629547119140625, -0.5089111328125, -0.388275146484375, -0.26763916015625, -0.147003173828125, -0.0263671875, 0.094268798828125, 0.21490478515625, 0.335540771484375, 0.4561767578125, 0.576812744140625, 0.69744873046875, 0.818084716796875, 0.938720703125, 1.059356689453125, 1.17999267578125, 1.300628662109375, 1.4212646484375, 1.541900634765625, 1.66253662109375, 1.783172607421875, 1.90380859375, 2.024444580078125, 2.14508056640625, 2.265716552734375, 2.3863525390625, 2.506988525390625, 2.62762451171875, 2.748260498046875, 2.868896484375, 2.989532470703125, 3.11016845703125, 3.230804443359375, 3.3514404296875, 3.472076416015625, 3.59271240234375, 3.713348388671875, 3.833984375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 10.0, 15.0, 25.0, 36.0, 70.0, 63.0, 140.0, 218.0, 330.0, 489.0, 827.0, 1295.0, 2098.0, 3396.0, 5356.0, 8880.0, 14409.0, 23675.0, 38553.0, 65439.0, 124524.0, 1329420.0, 231153.0, 102731.0, 56466.0, 33784.0, 20606.0, 12660.0, 7706.0, 4803.0, 2962.0, 1840.0, 1132.0, 720.0, 469.0, 294.0, 206.0, 120.0, 67.0, 56.0, 31.0, 15.0, 13.0, 9.0, 5.0, 9.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1436767578125, -0.13930511474609375, -0.1349334716796875, -0.13056182861328125, -0.126190185546875, -0.12181854248046875, -0.1174468994140625, -0.11307525634765625, -0.10870361328125, -0.10433197021484375, -0.0999603271484375, -0.09558868408203125, -0.091217041015625, -0.08684539794921875, -0.0824737548828125, -0.07810211181640625, -0.07373046875, -0.06935882568359375, -0.0649871826171875, -0.06061553955078125, -0.056243896484375, -0.05187225341796875, -0.0475006103515625, -0.04312896728515625, -0.03875732421875, -0.03438568115234375, -0.0300140380859375, -0.02564239501953125, -0.021270751953125, -0.01689910888671875, -0.0125274658203125, -0.00815582275390625, -0.0037841796875, 0.00058746337890625, 0.0049591064453125, 0.00933074951171875, 0.013702392578125, 0.01807403564453125, 0.0224456787109375, 0.02681732177734375, 0.03118896484375, 0.03556060791015625, 0.0399322509765625, 0.04430389404296875, 0.048675537109375, 0.05304718017578125, 0.0574188232421875, 0.06179046630859375, 0.066162109375, 0.07053375244140625, 0.0749053955078125, 0.07927703857421875, 0.083648681640625, 0.08802032470703125, 0.0923919677734375, 0.09676361083984375, 0.10113525390625, 0.10550689697265625, 0.1098785400390625, 0.11425018310546875, 0.118621826171875, 0.12299346923828125, 0.1273651123046875, 0.13173675537109375, 0.1361083984375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 6.0, 5.0, 11.0, 4.0, 7.0, 14.0, 12.0, 14.0, 18.0, 22.0, 33.0, 31.0, 40.0, 35.0, 57.0, 51.0, 56.0, 50.0, 44.0, 49.0, 48.0, 47.0, 53.0, 35.0, 50.0, 37.0, 26.0, 27.0, 12.0, 17.0, 8.0, 13.0, 16.0, 6.0, 14.0, 6.0, 4.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.225969314575195e-05, -4.070345312356949e-05, -3.9147213101387024e-05, -3.759097307920456e-05, -3.6034733057022095e-05, -3.447849303483963e-05, -3.2922253012657166e-05, -3.13660129904747e-05, -2.9809772968292236e-05, -2.8253532946109772e-05, -2.6697292923927307e-05, -2.5141052901744843e-05, -2.3584812879562378e-05, -2.2028572857379913e-05, -2.047233283519745e-05, -1.8916092813014984e-05, -1.735985279083252e-05, -1.5803612768650055e-05, -1.424737274646759e-05, -1.2691132724285126e-05, -1.1134892702102661e-05, -9.578652679920197e-06, -8.022412657737732e-06, -6.466172635555267e-06, -4.909932613372803e-06, -3.353692591190338e-06, -1.7974525690078735e-06, -2.4121254682540894e-07, 1.3150274753570557e-06, 2.8712674975395203e-06, 4.427507519721985e-06, 5.9837475419044495e-06, 7.539987564086914e-06, 9.096227586269379e-06, 1.0652467608451843e-05, 1.2208707630634308e-05, 1.3764947652816772e-05, 1.5321187674999237e-05, 1.68774276971817e-05, 1.8433667719364166e-05, 1.998990774154663e-05, 2.1546147763729095e-05, 2.310238778591156e-05, 2.4658627808094025e-05, 2.621486783027649e-05, 2.7771107852458954e-05, 2.932734787464142e-05, 3.088358789682388e-05, 3.243982791900635e-05, 3.399606794118881e-05, 3.555230796337128e-05, 3.710854798555374e-05, 3.8664788007736206e-05, 4.022102802991867e-05, 4.1777268052101135e-05, 4.33335080742836e-05, 4.4889748096466064e-05, 4.644598811864853e-05, 4.8002228140830994e-05, 4.955846816301346e-05, 5.111470818519592e-05, 5.267094820737839e-05, 5.422718822956085e-05, 5.578342825174332e-05, 5.733966827392578e-05]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 5.0, 5.0, 7.0, 12.0, 12.0, 12.0, 7.0, 9.0, 19.0, 19.0, 24.0, 28.0, 49.0, 59.0, 92.0, 183.0, 360.0, 2174.0, 259703.0, 777016.0, 7486.0, 565.0, 260.0, 109.0, 88.0, 53.0, 43.0, 23.0, 25.0, 23.0, 21.0, 14.0, 3.0, 8.0, 13.0, 5.0, 9.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0], "bins": [-0.001285552978515625, -0.0012527257204055786, -0.0012198984622955322, -0.0011870712041854858, -0.0011542439460754395, -0.001121416687965393, -0.0010885894298553467, -0.0010557621717453003, -0.001022934913635254, -0.0009901076555252075, -0.0009572803974151611, -0.0009244531393051147, -0.0008916258811950684, -0.000858798623085022, -0.0008259713649749756, -0.0007931441068649292, -0.0007603168487548828, -0.0007274895906448364, -0.00069466233253479, -0.0006618350744247437, -0.0006290078163146973, -0.0005961805582046509, -0.0005633533000946045, -0.0005305260419845581, -0.0004976987838745117, -0.00046487152576446533, -0.00043204426765441895, -0.00039921700954437256, -0.00036638975143432617, -0.0003335624933242798, -0.0003007352352142334, -0.000267907977104187, -0.00023508071899414062, -0.00020225346088409424, -0.00016942620277404785, -0.00013659894466400146, -0.00010377168655395508, -7.094442844390869e-05, -3.8117170333862305e-05, -5.289912223815918e-06, 2.753734588623047e-05, 6.0364603996276855e-05, 9.319186210632324e-05, 0.00012601912021636963, 0.00015884637832641602, 0.0001916736364364624, 0.0002245008945465088, 0.0002573281526565552, 0.00029015541076660156, 0.00032298266887664795, 0.00035580992698669434, 0.0003886371850967407, 0.0004214644432067871, 0.0004542917013168335, 0.0004871189594268799, 0.0005199462175369263, 0.0005527734756469727, 0.000585600733757019, 0.0006184279918670654, 0.0006512552499771118, 0.0006840825080871582, 0.0007169097661972046, 0.000749737024307251, 0.0007825642824172974, 0.0008153915405273438]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 11.0, 24.0, 82.0, 234.0, 344.0, 214.0, 76.0, 26.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002615794073790312, -0.0002567744813859463, -0.00025196955539286137, -0.000247164600295946, -0.0002423596743028611, -0.0002375547483097762, -0.00023274982231669128, -0.00022794489632360637, -0.00022313995577860624, -0.00021833502978552133, -0.0002135300892405212, -0.00020872516324743629, -0.00020392023725435138, -0.00019911529670935124, -0.00019431037071626633, -0.0001895054301712662, -0.0001847005041781813, -0.00017989557818509638, -0.00017509063764009625, -0.00017028571164701134, -0.0001654807711020112, -0.0001606758451089263, -0.0001558709191158414, -0.00015106599312275648, -0.00014626105257775635, -0.00014145612658467144, -0.0001366511860396713, -0.0001318462600465864, -0.0001270413340535015, -0.00012223639350850135, -0.00011743146751541644, -0.00011262653424637392, -0.0001078216009773314, -0.00010301666770828888, -9.821173443924636e-05, -9.340680844616145e-05, -8.860187517711893e-05, -8.37969419080764e-05, -7.89920159149915e-05, -7.418708264594898e-05, -6.938214937690645e-05, -6.457721610786393e-05, -5.977228647680022e-05, -5.4967356845736504e-05, -5.016242357669398e-05, -4.535749030765146e-05, -4.0552560676587746e-05, -3.574763104552403e-05, -3.0942701414460316e-05, -2.6137769964407198e-05, -2.133283851435408e-05, -1.6527907064300962e-05, -1.1722975614247844e-05, -6.9180441641947255e-06, -2.1131127141416073e-06, 2.6918169169221073e-06, 7.496750185964629e-06, 1.2301681636017747e-05, 1.7106613086070865e-05, 2.1911544536123984e-05, 2.6716475986177102e-05, 3.1521405617240816e-05, 3.632633888628334e-05, 4.113126851734705e-05, 4.5936201786389574e-05]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 2.0, 11.0, 12.0, 10.0, 9.0, 18.0, 14.0, 17.0, 21.0, 41.0, 29.0, 29.0, 39.0, 39.0, 38.0, 41.0, 37.0, 42.0, 46.0, 37.0, 45.0, 46.0, 42.0, 42.0, 36.0, 34.0, 32.0, 32.0, 23.0, 24.0, 24.0, 18.0, 16.0, 12.0, 5.0, 10.0, 7.0, 7.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.664327621459961e-05, -2.568308264017105e-05, -2.4722889065742493e-05, -2.3762695491313934e-05, -2.2802501916885376e-05, -2.1842308342456818e-05, -2.088211476802826e-05, -1.99219211935997e-05, -1.8961727619171143e-05, -1.8001534044742584e-05, -1.7041340470314026e-05, -1.6081146895885468e-05, -1.512095332145691e-05, -1.416075974702835e-05, -1.3200566172599792e-05, -1.2240372598171234e-05, -1.1280179023742676e-05, -1.0319985449314117e-05, -9.359791874885559e-06, -8.399598300457e-06, -7.439404726028442e-06, -6.479211151599884e-06, -5.519017577171326e-06, -4.558824002742767e-06, -3.598630428314209e-06, -2.6384368538856506e-06, -1.6782432794570923e-06, -7.180497050285339e-07, 2.421438694000244e-07, 1.2023374438285828e-06, 2.162531018257141e-06, 3.1227245926856995e-06, 4.082918167114258e-06, 5.043111741542816e-06, 6.0033053159713745e-06, 6.963498890399933e-06, 7.923692464828491e-06, 8.88388603925705e-06, 9.844079613685608e-06, 1.0804273188114166e-05, 1.1764466762542725e-05, 1.2724660336971283e-05, 1.3684853911399841e-05, 1.46450474858284e-05, 1.5605241060256958e-05, 1.6565434634685516e-05, 1.7525628209114075e-05, 1.8485821783542633e-05, 1.944601535797119e-05, 2.040620893239975e-05, 2.1366402506828308e-05, 2.2326596081256866e-05, 2.3286789655685425e-05, 2.4246983230113983e-05, 2.520717680454254e-05, 2.61673703789711e-05, 2.7127563953399658e-05, 2.8087757527828217e-05, 2.9047951102256775e-05, 3.0008144676685333e-05, 3.096833825111389e-05, 3.192853182554245e-05, 3.288872539997101e-05, 3.384891897439957e-05, 3.4809112548828125e-05]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 10.0, 7.0, 13.0, 14.0, 23.0, 19.0, 18.0, 22.0, 30.0, 23.0, 37.0, 31.0, 26.0, 32.0, 45.0, 52.0, 43.0, 52.0, 45.0, 41.0, 41.0, 42.0, 41.0, 42.0, 37.0, 25.0, 40.0, 19.0, 18.0, 23.0, 17.0, 15.0, 17.0, 8.0, 8.0, 7.0, 8.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.4296875, -5.23675537109375, -5.0438232421875, -4.85089111328125, -4.657958984375, -4.46502685546875, -4.2720947265625, -4.07916259765625, -3.88623046875, -3.69329833984375, -3.5003662109375, -3.30743408203125, -3.114501953125, -2.92156982421875, -2.7286376953125, -2.53570556640625, -2.3427734375, -2.14984130859375, -1.9569091796875, -1.76397705078125, -1.571044921875, -1.37811279296875, -1.1851806640625, -0.99224853515625, -0.79931640625, -0.60638427734375, -0.4134521484375, -0.22052001953125, -0.027587890625, 0.16534423828125, 0.3582763671875, 0.55120849609375, 0.744140625, 0.93707275390625, 1.1300048828125, 1.32293701171875, 1.515869140625, 1.70880126953125, 1.9017333984375, 2.09466552734375, 2.28759765625, 2.48052978515625, 2.6734619140625, 2.86639404296875, 3.059326171875, 3.25225830078125, 3.4451904296875, 3.63812255859375, 3.8310546875, 4.02398681640625, 4.2169189453125, 4.40985107421875, 4.602783203125, 4.79571533203125, 4.9886474609375, 5.18157958984375, 5.37451171875, 5.56744384765625, 5.7603759765625, 5.95330810546875, 6.146240234375, 6.33917236328125, 6.5321044921875, 6.72503662109375, 6.91796875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 11.0, 19.0, 17.0, 30.0, 52.0, 75.0, 141.0, 200.0, 345.0, 550.0, 1069.0, 1801.0, 3208.0, 5818.0, 10762.0, 21900.0, 47235.0, 114491.0, 337005.0, 310039.0, 105959.0, 44110.0, 20613.0, 10302.0, 5497.0, 3049.0, 1735.0, 1024.0, 600.0, 362.0, 172.0, 136.0, 80.0, 40.0, 41.0, 17.0, 13.0, 8.0, 8.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.71875, -8.427734375, -8.13671875, -7.845703125, -7.5546875, -7.263671875, -6.97265625, -6.681640625, -6.390625, -6.099609375, -5.80859375, -5.517578125, -5.2265625, -4.935546875, -4.64453125, -4.353515625, -4.0625, -3.771484375, -3.48046875, -3.189453125, -2.8984375, -2.607421875, -2.31640625, -2.025390625, -1.734375, -1.443359375, -1.15234375, -0.861328125, -0.5703125, -0.279296875, 0.01171875, 0.302734375, 0.59375, 0.884765625, 1.17578125, 1.466796875, 1.7578125, 2.048828125, 2.33984375, 2.630859375, 2.921875, 3.212890625, 3.50390625, 3.794921875, 4.0859375, 4.376953125, 4.66796875, 4.958984375, 5.25, 5.541015625, 5.83203125, 6.123046875, 6.4140625, 6.705078125, 6.99609375, 7.287109375, 7.578125, 7.869140625, 8.16015625, 8.451171875, 8.7421875, 9.033203125, 9.32421875, 9.615234375, 9.90625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 7.0, 1.0, 3.0, 10.0, 7.0, 13.0, 9.0, 12.0, 18.0, 22.0, 14.0, 22.0, 27.0, 35.0, 40.0, 33.0, 57.0, 76.0, 93.0, 135.0, 293.0, 1328.0, 195.0, 121.0, 81.0, 62.0, 53.0, 43.0, 33.0, 33.0, 34.0, 19.0, 25.0, 17.0, 14.0, 11.0, 9.0, 10.0, 6.0, 6.0, 8.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4140625, -14.8858642578125, -14.357666015625, -13.8294677734375, -13.30126953125, -12.7730712890625, -12.244873046875, -11.7166748046875, -11.1884765625, -10.6602783203125, -10.132080078125, -9.6038818359375, -9.07568359375, -8.5474853515625, -8.019287109375, -7.4910888671875, -6.962890625, -6.4346923828125, -5.906494140625, -5.3782958984375, -4.85009765625, -4.3218994140625, -3.793701171875, -3.2655029296875, -2.7373046875, -2.2091064453125, -1.680908203125, -1.1527099609375, -0.62451171875, -0.0963134765625, 0.431884765625, 0.9600830078125, 1.48828125, 2.0164794921875, 2.544677734375, 3.0728759765625, 3.60107421875, 4.1292724609375, 4.657470703125, 5.1856689453125, 5.7138671875, 6.2420654296875, 6.770263671875, 7.2984619140625, 7.82666015625, 8.3548583984375, 8.883056640625, 9.4112548828125, 9.939453125, 10.4676513671875, 10.995849609375, 11.5240478515625, 12.05224609375, 12.5804443359375, 13.108642578125, 13.6368408203125, 14.1650390625, 14.6932373046875, 15.221435546875, 15.7496337890625, 16.27783203125, 16.8060302734375, 17.334228515625, 17.8624267578125, 18.390625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 11.0, 7.0, 9.0, 8.0, 18.0, 19.0, 38.0, 32.0, 44.0, 101.0, 111.0, 189.0, 378.0, 602.0, 1264.0, 3251.0, 10519.0, 46742.0, 328392.0, 2394440.0, 300277.0, 43420.0, 10002.0, 3155.0, 1171.0, 577.0, 334.0, 192.0, 108.0, 81.0, 49.0, 44.0, 24.0, 17.0, 18.0, 12.0, 12.0, 11.0, 5.0, 5.0, 6.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 3.0], "bins": [-22.21875, -21.592529296875, -20.96630859375, -20.340087890625, -19.7138671875, -19.087646484375, -18.46142578125, -17.835205078125, -17.208984375, -16.582763671875, -15.95654296875, -15.330322265625, -14.7041015625, -14.077880859375, -13.45166015625, -12.825439453125, -12.19921875, -11.572998046875, -10.94677734375, -10.320556640625, -9.6943359375, -9.068115234375, -8.44189453125, -7.815673828125, -7.189453125, -6.563232421875, -5.93701171875, -5.310791015625, -4.6845703125, -4.058349609375, -3.43212890625, -2.805908203125, -2.1796875, -1.553466796875, -0.92724609375, -0.301025390625, 0.3251953125, 0.951416015625, 1.57763671875, 2.203857421875, 2.830078125, 3.456298828125, 4.08251953125, 4.708740234375, 5.3349609375, 5.961181640625, 6.58740234375, 7.213623046875, 7.83984375, 8.466064453125, 9.09228515625, 9.718505859375, 10.3447265625, 10.970947265625, 11.59716796875, 12.223388671875, 12.849609375, 13.475830078125, 14.10205078125, 14.728271484375, 15.3544921875, 15.980712890625, 16.60693359375, 17.233154296875, 17.859375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [8.0, 235.0, 659.0, 109.0, 8.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.266681671142578, -12.285698890686035, -3.304716110229492, 5.676265716552734, 14.657249450683594, 23.638233184814453, 32.61921310424805, 41.600196838378906, 50.581180572509766, 59.562164306640625, 68.54314422607422, 77.52412414550781, 86.50511169433594, 95.48609924316406, 104.46707153320312, 113.44805908203125, 122.42904663085938, 131.4100341796875, 140.39100646972656, 149.3719940185547, 158.3529815673828, 167.33395385742188, 176.31494140625, 185.29592895507812, 194.2769012451172, 203.2578887939453, 212.23886108398438, 221.2198486328125, 230.20083618164062, 239.18182373046875, 248.1627960205078, 257.1437683105469, 266.1247863769531, 275.10577392578125, 284.0867614746094, 293.0677490234375, 302.0487060546875, 311.0296936035156, 320.01068115234375, 328.9916687011719, 337.97265625, 346.9536437988281, 355.93463134765625, 364.91558837890625, 373.8965759277344, 382.8775634765625, 391.8585510253906, 400.83953857421875, 409.82049560546875, 418.8014831542969, 427.782470703125, 436.763427734375, 445.7444152832031, 454.72540283203125, 463.7063903808594, 472.6873779296875, 481.6683654785156, 490.64935302734375, 499.6303405761719, 508.611328125, 517.59228515625, 526.5733032226562, 535.5542602539062, 544.5352172851562, 553.5162353515625]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 6.0, 2.0, 7.0, 4.0, 4.0, 5.0, 10.0, 14.0, 17.0, 25.0, 19.0, 33.0, 27.0, 39.0, 36.0, 36.0, 51.0, 44.0, 36.0, 56.0, 40.0, 42.0, 46.0, 45.0, 39.0, 45.0, 37.0, 42.0, 28.0, 26.0, 26.0, 21.0, 16.0, 15.0, 11.0, 15.0, 15.0, 5.0, 7.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.654327392578125, -45.12055206298828, -43.58677673339844, -42.053001403808594, -40.519229888916016, -38.98545455932617, -37.45167922973633, -35.917903900146484, -34.38412857055664, -32.8503532409668, -31.316579818725586, -29.782804489135742, -28.2490291595459, -26.715255737304688, -25.181480407714844, -23.647705078125, -22.11393165588379, -20.580156326293945, -19.046382904052734, -17.51260757446289, -15.978832244873047, -14.44505786895752, -12.911283493041992, -11.377508163452148, -9.843733787536621, -8.309959411621094, -6.77618408203125, -5.242409706115723, -3.708634853363037, -2.1748600006103516, -0.6410856246948242, 0.8926897048950195, 2.426464080810547, 3.9602389335632324, 5.494013786315918, 7.027788162231445, 8.561563491821289, 10.095337867736816, 11.629112243652344, 13.162887573242188, 14.696661949157715, 16.230436325073242, 17.764211654663086, 19.297985076904297, 20.83176040649414, 22.365535736083984, 23.899311065673828, 25.433086395263672, 26.966859817504883, 28.500635147094727, 30.034408569335938, 31.56818389892578, 33.101959228515625, 34.63573455810547, 36.16950988769531, 37.703285217285156, 39.237056732177734, 40.77083206176758, 42.30460739135742, 43.83837890625, 45.372154235839844, 46.90592956542969, 48.43970489501953, 49.973480224609375, 51.50725555419922]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 3.0, 7.0, 4.0, 10.0, 13.0, 18.0, 18.0, 15.0, 23.0, 32.0, 18.0, 39.0, 28.0, 39.0, 31.0, 17.0, 49.0, 35.0, 51.0, 33.0, 38.0, 52.0, 46.0, 41.0, 42.0, 39.0, 36.0, 28.0, 25.0, 31.0, 21.0, 30.0, 17.0, 10.0, 14.0, 12.0, 9.0, 10.0, 5.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.43359375, -5.24163818359375, -5.0496826171875, -4.85772705078125, -4.665771484375, -4.47381591796875, -4.2818603515625, -4.08990478515625, -3.89794921875, -3.70599365234375, -3.5140380859375, -3.32208251953125, -3.130126953125, -2.93817138671875, -2.7462158203125, -2.55426025390625, -2.3623046875, -2.17034912109375, -1.9783935546875, -1.78643798828125, -1.594482421875, -1.40252685546875, -1.2105712890625, -1.01861572265625, -0.82666015625, -0.63470458984375, -0.4427490234375, -0.25079345703125, -0.058837890625, 0.13311767578125, 0.3250732421875, 0.51702880859375, 0.708984375, 0.90093994140625, 1.0928955078125, 1.28485107421875, 1.476806640625, 1.66876220703125, 1.8607177734375, 2.05267333984375, 2.24462890625, 2.43658447265625, 2.6285400390625, 2.82049560546875, 3.012451171875, 3.20440673828125, 3.3963623046875, 3.58831787109375, 3.7802734375, 3.97222900390625, 4.1641845703125, 4.35614013671875, 4.548095703125, 4.74005126953125, 4.9320068359375, 5.12396240234375, 5.31591796875, 5.50787353515625, 5.6998291015625, 5.89178466796875, 6.083740234375, 6.27569580078125, 6.4676513671875, 6.65960693359375, 6.8515625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 9.0, 12.0, 11.0, 21.0, 40.0, 53.0, 74.0, 128.0, 188.0, 331.0, 593.0, 1020.0, 1842.0, 3488.0, 7367.0, 17299.0, 47944.0, 166699.0, 1088243.0, 2378135.0, 351307.0, 80456.0, 27354.0, 10951.0, 4921.0, 2483.0, 1326.0, 753.0, 438.0, 251.0, 176.0, 120.0, 73.0, 43.0, 34.0, 29.0, 25.0, 12.0, 7.0, 7.0, 5.0, 0.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.46875, -10.097900390625, -9.72705078125, -9.356201171875, -8.9853515625, -8.614501953125, -8.24365234375, -7.872802734375, -7.501953125, -7.131103515625, -6.76025390625, -6.389404296875, -6.0185546875, -5.647705078125, -5.27685546875, -4.906005859375, -4.53515625, -4.164306640625, -3.79345703125, -3.422607421875, -3.0517578125, -2.680908203125, -2.31005859375, -1.939208984375, -1.568359375, -1.197509765625, -0.82666015625, -0.455810546875, -0.0849609375, 0.285888671875, 0.65673828125, 1.027587890625, 1.3984375, 1.769287109375, 2.14013671875, 2.510986328125, 2.8818359375, 3.252685546875, 3.62353515625, 3.994384765625, 4.365234375, 4.736083984375, 5.10693359375, 5.477783203125, 5.8486328125, 6.219482421875, 6.59033203125, 6.961181640625, 7.33203125, 7.702880859375, 8.07373046875, 8.444580078125, 8.8154296875, 9.186279296875, 9.55712890625, 9.927978515625, 10.298828125, 10.669677734375, 11.04052734375, 11.411376953125, 11.7822265625, 12.153076171875, 12.52392578125, 12.894775390625, 13.265625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 13.0, 13.0, 13.0, 20.0, 36.0, 47.0, 60.0, 92.0, 119.0, 183.0, 247.0, 368.0, 568.0, 692.0, 486.0, 357.0, 207.0, 140.0, 106.0, 77.0, 57.0, 44.0, 20.0, 21.0, 20.0, 18.0, 12.0, 8.0, 4.0, 7.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.5859375, -12.2296142578125, -11.873291015625, -11.5169677734375, -11.16064453125, -10.8043212890625, -10.447998046875, -10.0916748046875, -9.7353515625, -9.3790283203125, -9.022705078125, -8.6663818359375, -8.31005859375, -7.9537353515625, -7.597412109375, -7.2410888671875, -6.884765625, -6.5284423828125, -6.172119140625, -5.8157958984375, -5.45947265625, -5.1031494140625, -4.746826171875, -4.3905029296875, -4.0341796875, -3.6778564453125, -3.321533203125, -2.9652099609375, -2.60888671875, -2.2525634765625, -1.896240234375, -1.5399169921875, -1.18359375, -0.8272705078125, -0.470947265625, -0.1146240234375, 0.24169921875, 0.5980224609375, 0.954345703125, 1.3106689453125, 1.6669921875, 2.0233154296875, 2.379638671875, 2.7359619140625, 3.09228515625, 3.4486083984375, 3.804931640625, 4.1612548828125, 4.517578125, 4.8739013671875, 5.230224609375, 5.5865478515625, 5.94287109375, 6.2991943359375, 6.655517578125, 7.0118408203125, 7.3681640625, 7.7244873046875, 8.080810546875, 8.4371337890625, 8.79345703125, 9.1497802734375, 9.506103515625, 9.8624267578125, 10.21875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 6.0, 8.0, 9.0, 17.0, 21.0, 29.0, 21.0, 48.0, 68.0, 100.0, 184.0, 270.0, 471.0, 1021.0, 2808.0, 10903.0, 69510.0, 1245209.0, 2730438.0, 111842.0, 15060.0, 3601.0, 1211.0, 554.0, 310.0, 180.0, 135.0, 65.0, 47.0, 44.0, 28.0, 17.0, 14.0, 5.0, 6.0, 7.0, 6.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.875, -29.88232421875, -28.8896484375, -27.89697265625, -26.904296875, -25.91162109375, -24.9189453125, -23.92626953125, -22.93359375, -21.94091796875, -20.9482421875, -19.95556640625, -18.962890625, -17.97021484375, -16.9775390625, -15.98486328125, -14.9921875, -13.99951171875, -13.0068359375, -12.01416015625, -11.021484375, -10.02880859375, -9.0361328125, -8.04345703125, -7.05078125, -6.05810546875, -5.0654296875, -4.07275390625, -3.080078125, -2.08740234375, -1.0947265625, -0.10205078125, 0.890625, 1.88330078125, 2.8759765625, 3.86865234375, 4.861328125, 5.85400390625, 6.8466796875, 7.83935546875, 8.83203125, 9.82470703125, 10.8173828125, 11.81005859375, 12.802734375, 13.79541015625, 14.7880859375, 15.78076171875, 16.7734375, 17.76611328125, 18.7587890625, 19.75146484375, 20.744140625, 21.73681640625, 22.7294921875, 23.72216796875, 24.71484375, 25.70751953125, 26.7001953125, 27.69287109375, 28.685546875, 29.67822265625, 30.6708984375, 31.66357421875, 32.65625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 7.0, 8.0, 20.0, 26.0, 42.0, 57.0, 87.0, 100.0, 114.0, 111.0, 95.0, 94.0, 66.0, 56.0, 47.0, 34.0, 19.0, 14.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.049339294433594, -50.26707458496094, -48.484806060791016, -46.702537536621094, -44.92027282714844, -43.13800811767578, -41.35573959350586, -39.57347106933594, -37.79120635986328, -36.008941650390625, -34.2266731262207, -32.44440460205078, -30.662139892578125, -28.879873275756836, -27.097606658935547, -25.315340042114258, -23.53307342529297, -21.75080680847168, -19.96854019165039, -18.1862735748291, -16.404006958007812, -14.621740341186523, -12.839473724365234, -11.057207107543945, -9.274940490722656, -7.492673873901367, -5.710407257080078, -3.928140640258789, -2.1458740234375, -0.36360740661621094, 1.4186592102050781, 3.200925827026367, 4.983188629150391, 6.76545524597168, 8.547721862792969, 10.329988479614258, 12.112255096435547, 13.894521713256836, 15.676788330078125, 17.459054946899414, 19.241321563720703, 21.023588180541992, 22.80585479736328, 24.58812141418457, 26.37038803100586, 28.15265464782715, 29.934921264648438, 31.717187881469727, 33.499454498291016, 35.28172302246094, 37.063987731933594, 38.84625244140625, 40.62852096557617, 42.410789489746094, 44.19305419921875, 45.975318908691406, 47.75758743286133, 49.53985595703125, 51.322120666503906, 53.10438537597656, 54.886653900146484, 56.668922424316406, 58.45118713378906, 60.23345184326172, 62.01572036743164]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 6.0, 6.0, 5.0, 8.0, 7.0, 8.0, 7.0, 11.0, 15.0, 20.0, 23.0, 24.0, 21.0, 26.0, 31.0, 30.0, 34.0, 29.0, 30.0, 32.0, 35.0, 45.0, 40.0, 40.0, 52.0, 39.0, 38.0, 36.0, 34.0, 27.0, 32.0, 26.0, 30.0, 25.0, 30.0, 18.0, 18.0, 24.0, 9.0, 6.0, 6.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.224472045898438, -28.254533767700195, -27.284595489501953, -26.31465721130371, -25.34471893310547, -24.374780654907227, -23.404842376708984, -22.434904098510742, -21.4649658203125, -20.495027542114258, -19.525089263916016, -18.555150985717773, -17.58521270751953, -16.61527442932129, -15.645336151123047, -14.675397872924805, -13.705459594726562, -12.73552131652832, -11.765583038330078, -10.795644760131836, -9.825706481933594, -8.855768203735352, -7.885829925537109, -6.915891647338867, -5.945953369140625, -4.976015090942383, -4.006076812744141, -3.0361385345458984, -2.0662002563476562, -1.096261978149414, -0.12632369995117188, 0.8436145782470703, 1.8135528564453125, 2.7834911346435547, 3.753429412841797, 4.723367691040039, 5.693305969238281, 6.663244247436523, 7.633182525634766, 8.603120803833008, 9.57305908203125, 10.542997360229492, 11.512935638427734, 12.482873916625977, 13.452812194824219, 14.422750473022461, 15.392688751220703, 16.362627029418945, 17.332565307617188, 18.30250358581543, 19.272441864013672, 20.242380142211914, 21.212318420410156, 22.1822566986084, 23.15219497680664, 24.122133255004883, 25.092071533203125, 26.062009811401367, 27.03194808959961, 28.00188636779785, 28.971824645996094, 29.941762924194336, 30.911701202392578, 31.88163948059082, 32.85157775878906]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 0.0, 5.0, 4.0, 4.0, 3.0, 3.0, 6.0, 10.0, 19.0, 15.0, 23.0, 23.0, 24.0, 33.0, 20.0, 23.0, 25.0, 41.0, 36.0, 31.0, 37.0, 37.0, 37.0, 39.0, 39.0, 43.0, 46.0, 33.0, 39.0, 35.0, 35.0, 29.0, 33.0, 27.0, 22.0, 23.0, 17.0, 11.0, 18.0, 18.0, 8.0, 11.0, 5.0, 10.0, 2.0, 2.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.2578125, -5.07037353515625, -4.8829345703125, -4.69549560546875, -4.508056640625, -4.32061767578125, -4.1331787109375, -3.94573974609375, -3.75830078125, -3.57086181640625, -3.3834228515625, -3.19598388671875, -3.008544921875, -2.82110595703125, -2.6336669921875, -2.44622802734375, -2.2587890625, -2.07135009765625, -1.8839111328125, -1.69647216796875, -1.509033203125, -1.32159423828125, -1.1341552734375, -0.94671630859375, -0.75927734375, -0.57183837890625, -0.3843994140625, -0.19696044921875, -0.009521484375, 0.17791748046875, 0.3653564453125, 0.55279541015625, 0.740234375, 0.92767333984375, 1.1151123046875, 1.30255126953125, 1.489990234375, 1.67742919921875, 1.8648681640625, 2.05230712890625, 2.23974609375, 2.42718505859375, 2.6146240234375, 2.80206298828125, 2.989501953125, 3.17694091796875, 3.3643798828125, 3.55181884765625, 3.7392578125, 3.92669677734375, 4.1141357421875, 4.30157470703125, 4.489013671875, 4.67645263671875, 4.8638916015625, 5.05133056640625, 5.23876953125, 5.42620849609375, 5.6136474609375, 5.80108642578125, 5.988525390625, 6.17596435546875, 6.3634033203125, 6.55084228515625, 6.73828125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 0.0, 6.0, 5.0, 8.0, 15.0, 16.0, 32.0, 44.0, 69.0, 70.0, 136.0, 210.0, 313.0, 457.0, 739.0, 1063.0, 1671.0, 2559.0, 4021.0, 6148.0, 9967.0, 15950.0, 26346.0, 42854.0, 74810.0, 145971.0, 304855.0, 189906.0, 89230.0, 50894.0, 30107.0, 18416.0, 11470.0, 7206.0, 4618.0, 2890.0, 1848.0, 1249.0, 817.0, 560.0, 306.0, 247.0, 157.0, 91.0, 71.0, 56.0, 27.0, 23.0, 17.0, 10.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.208740234375, -0.20170021057128906, -0.19466018676757812, -0.1876201629638672, -0.18058013916015625, -0.1735401153564453, -0.16650009155273438, -0.15946006774902344, -0.1524200439453125, -0.14538002014160156, -0.13833999633789062, -0.1312999725341797, -0.12425994873046875, -0.11721992492675781, -0.11017990112304688, -0.10313987731933594, -0.096099853515625, -0.08905982971191406, -0.08201980590820312, -0.07497978210449219, -0.06793975830078125, -0.06089973449707031, -0.053859710693359375, -0.04681968688964844, -0.0397796630859375, -0.03273963928222656, -0.025699615478515625, -0.018659591674804688, -0.01161956787109375, -0.0045795440673828125, 0.002460479736328125, 0.009500503540039062, 0.01654052734375, 0.023580551147460938, 0.030620574951171875, 0.03766059875488281, 0.04470062255859375, 0.05174064636230469, 0.058780670166015625, 0.06582069396972656, 0.0728607177734375, 0.07990074157714844, 0.08694076538085938, 0.09398078918457031, 0.10102081298828125, 0.10806083679199219, 0.11510086059570312, 0.12214088439941406, 0.129180908203125, 0.13622093200683594, 0.14326095581054688, 0.1503009796142578, 0.15734100341796875, 0.1643810272216797, 0.17142105102539062, 0.17846107482910156, 0.1855010986328125, 0.19254112243652344, 0.19958114624023438, 0.2066211700439453, 0.21366119384765625, 0.2207012176513672, 0.22774124145507812, 0.23478126525878906, 0.2418212890625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 3.0, 5.0, 4.0, 12.0, 17.0, 9.0, 10.0, 9.0, 20.0, 11.0, 19.0, 18.0, 28.0, 29.0, 34.0, 33.0, 23.0, 43.0, 47.0, 38.0, 39.0, 1070.0, 43.0, 50.0, 46.0, 30.0, 37.0, 42.0, 40.0, 31.0, 29.0, 32.0, 19.0, 17.0, 9.0, 16.0, 9.0, 11.0, 7.0, 12.0, 5.0, 4.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.390625, -4.256591796875, -4.12255859375, -3.988525390625, -3.8544921875, -3.720458984375, -3.58642578125, -3.452392578125, -3.318359375, -3.184326171875, -3.05029296875, -2.916259765625, -2.7822265625, -2.648193359375, -2.51416015625, -2.380126953125, -2.24609375, -2.112060546875, -1.97802734375, -1.843994140625, -1.7099609375, -1.575927734375, -1.44189453125, -1.307861328125, -1.173828125, -1.039794921875, -0.90576171875, -0.771728515625, -0.6376953125, -0.503662109375, -0.36962890625, -0.235595703125, -0.1015625, 0.032470703125, 0.16650390625, 0.300537109375, 0.4345703125, 0.568603515625, 0.70263671875, 0.836669921875, 0.970703125, 1.104736328125, 1.23876953125, 1.372802734375, 1.5068359375, 1.640869140625, 1.77490234375, 1.908935546875, 2.04296875, 2.177001953125, 2.31103515625, 2.445068359375, 2.5791015625, 2.713134765625, 2.84716796875, 2.981201171875, 3.115234375, 3.249267578125, 3.38330078125, 3.517333984375, 3.6513671875, 3.785400390625, 3.91943359375, 4.053466796875, 4.1875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 2.0, 8.0, 13.0, 23.0, 34.0, 44.0, 60.0, 110.0, 164.0, 226.0, 392.0, 582.0, 863.0, 1437.0, 2193.0, 3319.0, 5393.0, 8502.0, 13968.0, 23009.0, 39773.0, 72502.0, 151884.0, 1370721.0, 196925.0, 88658.0, 47159.0, 26432.0, 16147.0, 9860.0, 6045.0, 3837.0, 2399.0, 1607.0, 1013.0, 634.0, 412.0, 287.0, 164.0, 113.0, 74.0, 59.0, 28.0, 17.0, 11.0, 15.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.168701171875, -0.1638317108154297, -0.15896224975585938, -0.15409278869628906, -0.14922332763671875, -0.14435386657714844, -0.13948440551757812, -0.1346149444580078, -0.1297454833984375, -0.12487602233886719, -0.12000656127929688, -0.11513710021972656, -0.11026763916015625, -0.10539817810058594, -0.10052871704101562, -0.09565925598144531, -0.090789794921875, -0.08592033386230469, -0.08105087280273438, -0.07618141174316406, -0.07131195068359375, -0.06644248962402344, -0.061573028564453125, -0.05670356750488281, -0.0518341064453125, -0.04696464538574219, -0.042095184326171875, -0.03722572326660156, -0.03235626220703125, -0.027486801147460938, -0.022617340087890625, -0.017747879028320312, -0.01287841796875, -0.008008956909179688, -0.003139495849609375, 0.0017299652099609375, 0.00659942626953125, 0.011468887329101562, 0.016338348388671875, 0.021207809448242188, 0.0260772705078125, 0.030946731567382812, 0.035816192626953125, 0.04068565368652344, 0.04555511474609375, 0.05042457580566406, 0.055294036865234375, 0.06016349792480469, 0.065032958984375, 0.06990242004394531, 0.07477188110351562, 0.07964134216308594, 0.08451080322265625, 0.08938026428222656, 0.09424972534179688, 0.09911918640136719, 0.1039886474609375, 0.10885810852050781, 0.11372756958007812, 0.11859703063964844, 0.12346649169921875, 0.12833595275878906, 0.13320541381835938, 0.1380748748779297, 0.1429443359375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 5.0, 6.0, 7.0, 18.0, 16.0, 13.0, 26.0, 24.0, 32.0, 29.0, 29.0, 53.0, 39.0, 40.0, 43.0, 55.0, 46.0, 54.0, 47.0, 56.0, 47.0, 38.0, 32.0, 34.0, 31.0, 24.0, 30.0, 23.0, 15.0, 13.0, 12.0, 8.0, 8.0, 6.0, 5.0, 5.0, 8.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.2869319915771484e-05, -5.1233917474746704e-05, -4.9598515033721924e-05, -4.7963112592697144e-05, -4.632771015167236e-05, -4.469230771064758e-05, -4.30569052696228e-05, -4.142150282859802e-05, -3.978610038757324e-05, -3.815069794654846e-05, -3.651529550552368e-05, -3.48798930644989e-05, -3.324449062347412e-05, -3.160908818244934e-05, -2.997368574142456e-05, -2.833828330039978e-05, -2.6702880859375e-05, -2.506747841835022e-05, -2.343207597732544e-05, -2.179667353630066e-05, -2.016127109527588e-05, -1.85258686542511e-05, -1.689046621322632e-05, -1.5255063772201538e-05, -1.3619661331176758e-05, -1.1984258890151978e-05, -1.0348856449127197e-05, -8.713454008102417e-06, -7.078051567077637e-06, -5.4426491260528564e-06, -3.807246685028076e-06, -2.171844244003296e-06, -5.364418029785156e-07, 1.0989606380462646e-06, 2.734363079071045e-06, 4.369765520095825e-06, 6.0051679611206055e-06, 7.640570402145386e-06, 9.275972843170166e-06, 1.0911375284194946e-05, 1.2546777725219727e-05, 1.4182180166244507e-05, 1.5817582607269287e-05, 1.7452985048294067e-05, 1.9088387489318848e-05, 2.0723789930343628e-05, 2.2359192371368408e-05, 2.399459481239319e-05, 2.562999725341797e-05, 2.726539969444275e-05, 2.890080213546753e-05, 3.053620457649231e-05, 3.217160701751709e-05, 3.380700945854187e-05, 3.544241189956665e-05, 3.707781434059143e-05, 3.871321678161621e-05, 4.034861922264099e-05, 4.198402166366577e-05, 4.361942410469055e-05, 4.525482654571533e-05, 4.689022898674011e-05, 4.852563142776489e-05, 5.016103386878967e-05, 5.179643630981445e-05]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 4.0, 5.0, 3.0, 9.0, 8.0, 15.0, 8.0, 21.0, 36.0, 24.0, 34.0, 58.0, 54.0, 85.0, 154.0, 337.0, 1856.0, 299612.0, 740652.0, 4455.0, 447.0, 213.0, 105.0, 75.0, 59.0, 43.0, 33.0, 30.0, 27.0, 15.0, 14.0, 14.0, 9.0, 4.0, 9.0, 5.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.00118255615234375, -0.0011457353830337524, -0.0011089146137237549, -0.0010720938444137573, -0.0010352730751037598, -0.0009984523057937622, -0.0009616315364837646, -0.0009248107671737671, -0.0008879899978637695, -0.000851169228553772, -0.0008143484592437744, -0.0007775276899337769, -0.0007407069206237793, -0.0007038861513137817, -0.0006670653820037842, -0.0006302446126937866, -0.0005934238433837891, -0.0005566030740737915, -0.0005197823047637939, -0.0004829615354537964, -0.00044614076614379883, -0.00040931999683380127, -0.0003724992275238037, -0.00033567845821380615, -0.0002988576889038086, -0.00026203691959381104, -0.00022521615028381348, -0.00018839538097381592, -0.00015157461166381836, -0.0001147538423538208, -7.793307304382324e-05, -4.1112303733825684e-05, -4.291534423828125e-06, 3.2529234886169434e-05, 6.935000419616699e-05, 0.00010617077350616455, 0.0001429915428161621, 0.00017981231212615967, 0.00021663308143615723, 0.0002534538507461548, 0.00029027462005615234, 0.0003270953893661499, 0.00036391615867614746, 0.000400736927986145, 0.0004375576972961426, 0.00047437846660614014, 0.0005111992359161377, 0.0005480200052261353, 0.0005848407745361328, 0.0006216615438461304, 0.0006584823131561279, 0.0006953030824661255, 0.000732123851776123, 0.0007689446210861206, 0.0008057653903961182, 0.0008425861597061157, 0.0008794069290161133, 0.0009162276983261108, 0.0009530484676361084, 0.000989869236946106, 0.0010266900062561035, 0.001063510775566101, 0.0011003315448760986, 0.0011371523141860962, 0.0011739730834960938]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 19.0, 334.0, 607.0, 55.0, 2.0], "bins": [-0.0007627009763382375, -0.0007502383668906987, -0.0007377757574431598, -0.000725313147995621, -0.0007128505385480821, -0.0007003879291005433, -0.0006879253196530044, -0.0006754627102054656, -0.0006630001007579267, -0.0006505374913103878, -0.000638074881862849, -0.0006256122724153101, -0.0006131496629677713, -0.0006006870535202324, -0.0005882244440726936, -0.0005757618346251547, -0.0005632992251776159, -0.000550836615730077, -0.0005383740062825382, -0.0005259113968349993, -0.0005134487873874605, -0.0005009861779399216, -0.0004885235684923828, -0.0004760609590448439, -0.0004635983204934746, -0.00045113571104593575, -0.0004386731015983969, -0.00042621049215085804, -0.0004137478827033192, -0.00040128527325578034, -0.0003888226638082415, -0.00037636005436070263, -0.00036389747401699424, -0.0003514348645694554, -0.00033897225512191653, -0.0003265096456743777, -0.00031404703622683883, -0.0003015844267793, -0.0002891218173317611, -0.00027665920788422227, -0.00026419656933285296, -0.0002517339598853141, -0.00023927135043777525, -0.0002268087409902364, -0.00021434613154269755, -0.0002018835220951587, -0.00018942091264761984, -0.000176958303200081, -0.00016449569375254214, -0.00015203308430500329, -0.00013957047485746443, -0.00012710786540992558, -0.00011464525596238673, -0.00010218263923889026, -8.972002979135141e-05, -7.725742034381256e-05, -6.479481817223132e-05, -5.2332208724692464e-05, -3.986959927715361e-05, -2.740698619163595e-05, -1.4944376744097099e-05, -2.481763658579439e-06, 9.980845788959414e-06, 2.2443455236498266e-05, 3.4906068322015926e-05]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 5.0, 7.0, 5.0, 12.0, 10.0, 12.0, 18.0, 17.0, 22.0, 8.0, 25.0, 35.0, 33.0, 40.0, 45.0, 45.0, 44.0, 44.0, 41.0, 56.0, 51.0, 45.0, 50.0, 35.0, 34.0, 35.0, 32.0, 33.0, 27.0, 22.0, 19.0, 22.0, 16.0, 9.0, 12.0, 15.0, 7.0, 7.0, 2.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.24249267578125e-05, -3.1334348022937775e-05, -3.024376928806305e-05, -2.9153190553188324e-05, -2.80626118183136e-05, -2.6972033083438873e-05, -2.5881454348564148e-05, -2.4790875613689423e-05, -2.3700296878814697e-05, -2.2609718143939972e-05, -2.1519139409065247e-05, -2.042856067419052e-05, -1.9337981939315796e-05, -1.824740320444107e-05, -1.7156824469566345e-05, -1.606624573469162e-05, -1.4975666999816895e-05, -1.388508826494217e-05, -1.2794509530067444e-05, -1.1703930795192719e-05, -1.0613352060317993e-05, -9.522773325443268e-06, -8.432194590568542e-06, -7.341615855693817e-06, -6.251037120819092e-06, -5.1604583859443665e-06, -4.069879651069641e-06, -2.9793009161949158e-06, -1.8887221813201904e-06, -7.981434464454651e-07, 2.9243528842926025e-07, 1.3830140233039856e-06, 2.473592758178711e-06, 3.5641714930534363e-06, 4.654750227928162e-06, 5.745328962802887e-06, 6.835907697677612e-06, 7.926486432552338e-06, 9.017065167427063e-06, 1.0107643902301788e-05, 1.1198222637176514e-05, 1.2288801372051239e-05, 1.3379380106925964e-05, 1.446995884180069e-05, 1.5560537576675415e-05, 1.665111631155014e-05, 1.7741695046424866e-05, 1.883227378129959e-05, 1.9922852516174316e-05, 2.1013431251049042e-05, 2.2104009985923767e-05, 2.3194588720798492e-05, 2.4285167455673218e-05, 2.5375746190547943e-05, 2.646632492542267e-05, 2.7556903660297394e-05, 2.864748239517212e-05, 2.9738061130046844e-05, 3.082863986492157e-05, 3.1919218599796295e-05, 3.300979733467102e-05, 3.4100376069545746e-05, 3.519095480442047e-05, 3.6281533539295197e-05, 3.737211227416992e-05]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 0.0, 5.0, 4.0, 4.0, 3.0, 3.0, 6.0, 10.0, 19.0, 15.0, 23.0, 23.0, 24.0, 33.0, 20.0, 23.0, 25.0, 41.0, 36.0, 31.0, 37.0, 37.0, 37.0, 39.0, 39.0, 43.0, 46.0, 33.0, 39.0, 35.0, 35.0, 29.0, 33.0, 27.0, 22.0, 23.0, 17.0, 11.0, 18.0, 18.0, 8.0, 11.0, 5.0, 10.0, 2.0, 2.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.2578125, -5.07037353515625, -4.8829345703125, -4.69549560546875, -4.508056640625, -4.32061767578125, -4.1331787109375, -3.94573974609375, -3.75830078125, -3.57086181640625, -3.3834228515625, -3.19598388671875, -3.008544921875, -2.82110595703125, -2.6336669921875, -2.44622802734375, -2.2587890625, -2.07135009765625, -1.8839111328125, -1.69647216796875, -1.509033203125, -1.32159423828125, -1.1341552734375, -0.94671630859375, -0.75927734375, -0.57183837890625, -0.3843994140625, -0.19696044921875, -0.009521484375, 0.17791748046875, 0.3653564453125, 0.55279541015625, 0.740234375, 0.92767333984375, 1.1151123046875, 1.30255126953125, 1.489990234375, 1.67742919921875, 1.8648681640625, 2.05230712890625, 2.23974609375, 2.42718505859375, 2.6146240234375, 2.80206298828125, 2.989501953125, 3.17694091796875, 3.3643798828125, 3.55181884765625, 3.7392578125, 3.92669677734375, 4.1141357421875, 4.30157470703125, 4.489013671875, 4.67645263671875, 4.8638916015625, 5.05133056640625, 5.23876953125, 5.42620849609375, 5.6136474609375, 5.80108642578125, 5.988525390625, 6.17596435546875, 6.3634033203125, 6.55084228515625, 6.73828125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 8.0, 8.0, 9.0, 13.0, 18.0, 17.0, 33.0, 39.0, 54.0, 76.0, 110.0, 166.0, 261.0, 368.0, 555.0, 772.0, 1172.0, 1785.0, 2892.0, 4721.0, 7981.0, 13964.0, 25811.0, 50440.0, 108201.0, 327890.0, 295337.0, 100258.0, 47561.0, 24384.0, 13505.0, 7536.0, 4455.0, 2893.0, 1754.0, 1169.0, 740.0, 492.0, 344.0, 233.0, 164.0, 109.0, 91.0, 56.0, 24.0, 31.0, 19.0, 12.0, 9.0, 15.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-8.140625, -7.8594970703125, -7.578369140625, -7.2972412109375, -7.01611328125, -6.7349853515625, -6.453857421875, -6.1727294921875, -5.8916015625, -5.6104736328125, -5.329345703125, -5.0482177734375, -4.76708984375, -4.4859619140625, -4.204833984375, -3.9237060546875, -3.642578125, -3.3614501953125, -3.080322265625, -2.7991943359375, -2.51806640625, -2.2369384765625, -1.955810546875, -1.6746826171875, -1.3935546875, -1.1124267578125, -0.831298828125, -0.5501708984375, -0.26904296875, 0.0120849609375, 0.293212890625, 0.5743408203125, 0.85546875, 1.1365966796875, 1.417724609375, 1.6988525390625, 1.97998046875, 2.2611083984375, 2.542236328125, 2.8233642578125, 3.1044921875, 3.3856201171875, 3.666748046875, 3.9478759765625, 4.22900390625, 4.5101318359375, 4.791259765625, 5.0723876953125, 5.353515625, 5.6346435546875, 5.915771484375, 6.1968994140625, 6.47802734375, 6.7591552734375, 7.040283203125, 7.3214111328125, 7.6025390625, 7.8836669921875, 8.164794921875, 8.4459228515625, 8.72705078125, 9.0081787109375, 9.289306640625, 9.5704345703125, 9.8515625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 6.0, 5.0, 1.0, 7.0, 10.0, 12.0, 14.0, 25.0, 21.0, 23.0, 35.0, 41.0, 34.0, 58.0, 70.0, 75.0, 104.0, 352.0, 1528.0, 190.0, 82.0, 70.0, 40.0, 55.0, 39.0, 42.0, 25.0, 24.0, 21.0, 15.0, 14.0, 5.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.40625, -19.656494140625, -18.90673828125, -18.156982421875, -17.4072265625, -16.657470703125, -15.90771484375, -15.157958984375, -14.408203125, -13.658447265625, -12.90869140625, -12.158935546875, -11.4091796875, -10.659423828125, -9.90966796875, -9.159912109375, -8.41015625, -7.660400390625, -6.91064453125, -6.160888671875, -5.4111328125, -4.661376953125, -3.91162109375, -3.161865234375, -2.412109375, -1.662353515625, -0.91259765625, -0.162841796875, 0.5869140625, 1.336669921875, 2.08642578125, 2.836181640625, 3.5859375, 4.335693359375, 5.08544921875, 5.835205078125, 6.5849609375, 7.334716796875, 8.08447265625, 8.834228515625, 9.583984375, 10.333740234375, 11.08349609375, 11.833251953125, 12.5830078125, 13.332763671875, 14.08251953125, 14.832275390625, 15.58203125, 16.331787109375, 17.08154296875, 17.831298828125, 18.5810546875, 19.330810546875, 20.08056640625, 20.830322265625, 21.580078125, 22.329833984375, 23.07958984375, 23.829345703125, 24.5791015625, 25.328857421875, 26.07861328125, 26.828369140625, 27.578125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 9.0, 3.0, 7.0, 11.0, 26.0, 19.0, 29.0, 43.0, 57.0, 86.0, 156.0, 315.0, 885.0, 3637.0, 22046.0, 271274.0, 2696200.0, 133002.0, 13977.0, 2526.0, 715.0, 239.0, 111.0, 106.0, 65.0, 41.0, 35.0, 22.0, 16.0, 14.0, 11.0, 6.0, 6.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.75, -33.7392578125, -32.728515625, -31.7177734375, -30.70703125, -29.6962890625, -28.685546875, -27.6748046875, -26.6640625, -25.6533203125, -24.642578125, -23.6318359375, -22.62109375, -21.6103515625, -20.599609375, -19.5888671875, -18.578125, -17.5673828125, -16.556640625, -15.5458984375, -14.53515625, -13.5244140625, -12.513671875, -11.5029296875, -10.4921875, -9.4814453125, -8.470703125, -7.4599609375, -6.44921875, -5.4384765625, -4.427734375, -3.4169921875, -2.40625, -1.3955078125, -0.384765625, 0.6259765625, 1.63671875, 2.6474609375, 3.658203125, 4.6689453125, 5.6796875, 6.6904296875, 7.701171875, 8.7119140625, 9.72265625, 10.7333984375, 11.744140625, 12.7548828125, 13.765625, 14.7763671875, 15.787109375, 16.7978515625, 17.80859375, 18.8193359375, 19.830078125, 20.8408203125, 21.8515625, 22.8623046875, 23.873046875, 24.8837890625, 25.89453125, 26.9052734375, 27.916015625, 28.9267578125, 29.9375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 22.0, 31.0, 44.0, 83.0, 117.0, 171.0, 145.0, 130.0, 100.0, 68.0, 40.0, 26.0, 10.0, 7.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.14958190917969, -41.562477111816406, -39.975372314453125, -38.388267517089844, -36.80116271972656, -35.21405792236328, -33.626953125, -32.03984832763672, -30.45274543762207, -28.86564064025879, -27.278535842895508, -25.69143295288086, -24.104328155517578, -22.517223358154297, -20.930118560791016, -19.343013763427734, -17.755908966064453, -16.168804168701172, -14.58169937133789, -12.994595527648926, -11.407490730285645, -9.820385932922363, -8.233282089233398, -6.646177291870117, -5.059072494506836, -3.471967935562134, -1.8848633766174316, -0.2977590560913086, 1.2893457412719727, 2.876450538635254, 4.463554382324219, 6.0506591796875, 7.637767791748047, 9.224872589111328, 10.81197738647461, 12.399081230163574, 13.986186027526855, 15.573290824890137, 17.1603946685791, 18.747499465942383, 20.334604263305664, 21.921709060668945, 23.508813858032227, 25.095916748046875, 26.683021545410156, 28.270126342773438, 29.85723114013672, 31.4443359375, 33.03144073486328, 34.61854553222656, 36.205650329589844, 37.792755126953125, 39.379859924316406, 40.96696472167969, 42.55406951904297, 44.14117431640625, 45.72827911376953, 47.31538391113281, 48.902488708496094, 50.489593505859375, 52.076698303222656, 53.66380310058594, 55.25090789794922, 56.8380126953125, 58.425113677978516]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 0.0, 7.0, 5.0, 3.0, 3.0, 9.0, 5.0, 10.0, 7.0, 4.0, 11.0, 16.0, 21.0, 21.0, 28.0, 23.0, 27.0, 26.0, 40.0, 42.0, 47.0, 51.0, 44.0, 41.0, 57.0, 45.0, 32.0, 37.0, 32.0, 27.0, 39.0, 34.0, 32.0, 21.0, 24.0, 12.0, 31.0, 18.0, 13.0, 17.0, 13.0, 4.0, 5.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.379905700683594, -43.79947280883789, -42.21903991699219, -40.638607025146484, -39.05817413330078, -37.47774124145508, -35.897308349609375, -34.316871643066406, -32.73644256591797, -31.156009674072266, -29.575576782226562, -27.99514389038086, -26.414710998535156, -24.834278106689453, -23.253843307495117, -21.673410415649414, -20.092975616455078, -18.512542724609375, -16.932109832763672, -15.351675987243652, -13.77124309539795, -12.190810203552246, -10.610376358032227, -9.029943466186523, -7.44951057434082, -5.869077682495117, -4.288644313812256, -2.7082109451293945, -1.1277780532836914, 0.4526548385620117, 2.0330886840820312, 3.6135215759277344, 5.193950653076172, 6.774383544921875, 8.354816436767578, 9.935250282287598, 11.5156831741333, 13.096116065979004, 14.676549911499023, 16.256982803344727, 17.83741569519043, 19.417848587036133, 20.998281478881836, 22.578716278076172, 24.159149169921875, 25.739582061767578, 27.32001495361328, 28.900447845458984, 30.480880737304688, 32.06131362915039, 33.641746520996094, 35.2221794128418, 36.8026123046875, 38.3830451965332, 39.963478088378906, 41.543914794921875, 43.12434387207031, 44.704776763916016, 46.28520965576172, 47.86564254760742, 49.446075439453125, 51.02650833129883, 52.60694122314453, 54.1873779296875, 55.7678108215332]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 5.0, 2.0, 7.0, 6.0, 10.0, 13.0, 9.0, 23.0, 19.0, 24.0, 31.0, 17.0, 22.0, 29.0, 36.0, 30.0, 28.0, 36.0, 47.0, 36.0, 36.0, 41.0, 38.0, 44.0, 43.0, 40.0, 40.0, 27.0, 27.0, 34.0, 26.0, 32.0, 22.0, 27.0, 15.0, 7.0, 9.0, 16.0, 14.0, 10.0, 7.0, 3.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.44921875, -5.260009765625, -5.07080078125, -4.881591796875, -4.6923828125, -4.503173828125, -4.31396484375, -4.124755859375, -3.935546875, -3.746337890625, -3.55712890625, -3.367919921875, -3.1787109375, -2.989501953125, -2.80029296875, -2.611083984375, -2.421875, -2.232666015625, -2.04345703125, -1.854248046875, -1.6650390625, -1.475830078125, -1.28662109375, -1.097412109375, -0.908203125, -0.718994140625, -0.52978515625, -0.340576171875, -0.1513671875, 0.037841796875, 0.22705078125, 0.416259765625, 0.60546875, 0.794677734375, 0.98388671875, 1.173095703125, 1.3623046875, 1.551513671875, 1.74072265625, 1.929931640625, 2.119140625, 2.308349609375, 2.49755859375, 2.686767578125, 2.8759765625, 3.065185546875, 3.25439453125, 3.443603515625, 3.6328125, 3.822021484375, 4.01123046875, 4.200439453125, 4.3896484375, 4.578857421875, 4.76806640625, 4.957275390625, 5.146484375, 5.335693359375, 5.52490234375, 5.714111328125, 5.9033203125, 6.092529296875, 6.28173828125, 6.470947265625, 6.66015625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 11.0, 16.0, 15.0, 25.0, 38.0, 63.0, 85.0, 163.0, 234.0, 439.0, 815.0, 1418.0, 3012.0, 6802.0, 16768.0, 47568.0, 173548.0, 1195427.0, 2320913.0, 310676.0, 73974.0, 24724.0, 9354.0, 3984.0, 1946.0, 927.0, 477.0, 337.0, 166.0, 120.0, 88.0, 48.0, 19.0, 26.0, 15.0, 11.0, 10.0, 8.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4453125, -13.9820556640625, -13.518798828125, -13.0555419921875, -12.59228515625, -12.1290283203125, -11.665771484375, -11.2025146484375, -10.7392578125, -10.2760009765625, -9.812744140625, -9.3494873046875, -8.88623046875, -8.4229736328125, -7.959716796875, -7.4964599609375, -7.033203125, -6.5699462890625, -6.106689453125, -5.6434326171875, -5.18017578125, -4.7169189453125, -4.253662109375, -3.7904052734375, -3.3271484375, -2.8638916015625, -2.400634765625, -1.9373779296875, -1.47412109375, -1.0108642578125, -0.547607421875, -0.0843505859375, 0.37890625, 0.8421630859375, 1.305419921875, 1.7686767578125, 2.23193359375, 2.6951904296875, 3.158447265625, 3.6217041015625, 4.0849609375, 4.5482177734375, 5.011474609375, 5.4747314453125, 5.93798828125, 6.4012451171875, 6.864501953125, 7.3277587890625, 7.791015625, 8.2542724609375, 8.717529296875, 9.1807861328125, 9.64404296875, 10.1072998046875, 10.570556640625, 11.0338134765625, 11.4970703125, 11.9603271484375, 12.423583984375, 12.8868408203125, 13.35009765625, 13.8133544921875, 14.276611328125, 14.7398681640625, 15.203125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 10.0, 18.0, 17.0, 24.0, 41.0, 49.0, 77.0, 89.0, 171.0, 255.0, 350.0, 526.0, 685.0, 558.0, 360.0, 258.0, 180.0, 121.0, 69.0, 55.0, 46.0, 33.0, 28.0, 13.0, 17.0, 5.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.9765625, -13.572265625, -13.16796875, -12.763671875, -12.359375, -11.955078125, -11.55078125, -11.146484375, -10.7421875, -10.337890625, -9.93359375, -9.529296875, -9.125, -8.720703125, -8.31640625, -7.912109375, -7.5078125, -7.103515625, -6.69921875, -6.294921875, -5.890625, -5.486328125, -5.08203125, -4.677734375, -4.2734375, -3.869140625, -3.46484375, -3.060546875, -2.65625, -2.251953125, -1.84765625, -1.443359375, -1.0390625, -0.634765625, -0.23046875, 0.173828125, 0.578125, 0.982421875, 1.38671875, 1.791015625, 2.1953125, 2.599609375, 3.00390625, 3.408203125, 3.8125, 4.216796875, 4.62109375, 5.025390625, 5.4296875, 5.833984375, 6.23828125, 6.642578125, 7.046875, 7.451171875, 7.85546875, 8.259765625, 8.6640625, 9.068359375, 9.47265625, 9.876953125, 10.28125, 10.685546875, 11.08984375, 11.494140625, 11.8984375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 7.0, 9.0, 14.0, 23.0, 25.0, 40.0, 100.0, 132.0, 258.0, 520.0, 1384.0, 4404.0, 22311.0, 193966.0, 3230392.0, 675253.0, 53498.0, 8270.0, 2113.0, 761.0, 367.0, 180.0, 96.0, 70.0, 34.0, 21.0, 15.0, 10.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.6875, -28.65380859375, -27.6201171875, -26.58642578125, -25.552734375, -24.51904296875, -23.4853515625, -22.45166015625, -21.41796875, -20.38427734375, -19.3505859375, -18.31689453125, -17.283203125, -16.24951171875, -15.2158203125, -14.18212890625, -13.1484375, -12.11474609375, -11.0810546875, -10.04736328125, -9.013671875, -7.97998046875, -6.9462890625, -5.91259765625, -4.87890625, -3.84521484375, -2.8115234375, -1.77783203125, -0.744140625, 0.28955078125, 1.3232421875, 2.35693359375, 3.390625, 4.42431640625, 5.4580078125, 6.49169921875, 7.525390625, 8.55908203125, 9.5927734375, 10.62646484375, 11.66015625, 12.69384765625, 13.7275390625, 14.76123046875, 15.794921875, 16.82861328125, 17.8623046875, 18.89599609375, 19.9296875, 20.96337890625, 21.9970703125, 23.03076171875, 24.064453125, 25.09814453125, 26.1318359375, 27.16552734375, 28.19921875, 29.23291015625, 30.2666015625, 31.30029296875, 32.333984375, 33.36767578125, 34.4013671875, 35.43505859375, 36.46875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 20.0, 58.0, 101.0, 162.0, 222.0, 217.0, 138.0, 63.0, 19.0, 12.0], "bins": [-218.2934112548828, -214.56678771972656, -210.8401641845703, -207.11354064941406, -203.3869171142578, -199.66029357910156, -195.9336700439453, -192.20704650878906, -188.4804229736328, -184.75379943847656, -181.0271759033203, -177.30055236816406, -173.5739288330078, -169.84730529785156, -166.1206817626953, -162.39405822753906, -158.6674346923828, -154.94081115722656, -151.2141876220703, -147.48756408691406, -143.7609405517578, -140.03431701660156, -136.3076934814453, -132.58106994628906, -128.8544464111328, -125.12782287597656, -121.40119934082031, -117.67457580566406, -113.94795227050781, -110.22132873535156, -106.49470520019531, -102.76808166503906, -99.04144287109375, -95.3148193359375, -91.58819580078125, -87.861572265625, -84.13494873046875, -80.4083251953125, -76.68170166015625, -72.955078125, -69.22845458984375, -65.5018310546875, -61.77520751953125, -58.048583984375, -54.32196044921875, -50.5953369140625, -46.86871337890625, -43.14208984375, -39.41546630859375, -35.6888427734375, -31.96221923828125, -28.235595703125, -24.50897216796875, -20.782346725463867, -17.055723190307617, -13.329099655151367, -9.602474212646484, -5.875850677490234, -2.149226665496826, 1.577397346496582, 5.304020881652832, 9.030645370483398, 12.757268905639648, 16.4838924407959, 20.21051597595215]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 0.0, 6.0, 4.0, 2.0, 3.0, 6.0, 8.0, 8.0, 18.0, 13.0, 14.0, 24.0, 17.0, 21.0, 19.0, 23.0, 35.0, 25.0, 31.0, 42.0, 37.0, 44.0, 53.0, 45.0, 45.0, 41.0, 52.0, 43.0, 39.0, 36.0, 36.0, 25.0, 32.0, 23.0, 21.0, 13.0, 15.0, 14.0, 10.0, 14.0, 6.0, 13.0, 8.0, 3.0, 7.0, 2.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-35.807167053222656, -34.7009391784668, -33.59470748901367, -32.48847961425781, -31.382247924804688, -30.276018142700195, -29.169788360595703, -28.063560485839844, -26.95732879638672, -25.851099014282227, -24.744869232177734, -23.638639450073242, -22.53240966796875, -21.426179885864258, -20.319950103759766, -19.213722229003906, -18.107492446899414, -17.001262664794922, -15.89503288269043, -14.788803100585938, -13.682573318481445, -12.576343536376953, -11.470114707946777, -10.363884925842285, -9.257655143737793, -8.1514253616333, -7.045195579528809, -5.938966274261475, -4.832736492156982, -3.7265067100524902, -2.6202774047851562, -1.514047622680664, -0.4078178405761719, 0.6984118223190308, 1.8046414852142334, 2.9108710289001465, 4.017100811004639, 5.123330593109131, 6.229559898376465, 7.335789680480957, 8.44201946258545, 9.548249244689941, 10.654479026794434, 11.76070785522461, 12.866937637329102, 13.973167419433594, 15.079397201538086, 16.185626983642578, 17.29185676574707, 18.398086547851562, 19.504316329956055, 20.610546112060547, 21.71677589416504, 22.82300567626953, 23.92923355102539, 25.035465240478516, 26.141693115234375, 27.247922897338867, 28.35415267944336, 29.46038246154785, 30.566612243652344, 31.672842025756836, 32.77907180786133, 33.88529968261719, 34.99153137207031]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 9.0, 7.0, 15.0, 15.0, 14.0, 11.0, 16.0, 19.0, 23.0, 25.0, 27.0, 23.0, 34.0, 35.0, 26.0, 34.0, 38.0, 36.0, 40.0, 46.0, 42.0, 32.0, 45.0, 28.0, 36.0, 44.0, 29.0, 27.0, 35.0, 19.0, 22.0, 23.0, 25.0, 11.0, 13.0, 16.0, 9.0, 9.0, 10.0, 5.0, 4.0, 8.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.31640625, -5.1279296875, -4.939453125, -4.7509765625, -4.5625, -4.3740234375, -4.185546875, -3.9970703125, -3.80859375, -3.6201171875, -3.431640625, -3.2431640625, -3.0546875, -2.8662109375, -2.677734375, -2.4892578125, -2.30078125, -2.1123046875, -1.923828125, -1.7353515625, -1.546875, -1.3583984375, -1.169921875, -0.9814453125, -0.79296875, -0.6044921875, -0.416015625, -0.2275390625, -0.0390625, 0.1494140625, 0.337890625, 0.5263671875, 0.71484375, 0.9033203125, 1.091796875, 1.2802734375, 1.46875, 1.6572265625, 1.845703125, 2.0341796875, 2.22265625, 2.4111328125, 2.599609375, 2.7880859375, 2.9765625, 3.1650390625, 3.353515625, 3.5419921875, 3.73046875, 3.9189453125, 4.107421875, 4.2958984375, 4.484375, 4.6728515625, 4.861328125, 5.0498046875, 5.23828125, 5.4267578125, 5.615234375, 5.8037109375, 5.9921875, 6.1806640625, 6.369140625, 6.5576171875, 6.74609375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 8.0, 15.0, 26.0, 32.0, 45.0, 60.0, 76.0, 154.0, 183.0, 315.0, 442.0, 619.0, 933.0, 1347.0, 2019.0, 2893.0, 4281.0, 6506.0, 9490.0, 14367.0, 21497.0, 33335.0, 53327.0, 94287.0, 200397.0, 276131.0, 133993.0, 69998.0, 41471.0, 26887.0, 17498.0, 11701.0, 7843.0, 5225.0, 3578.0, 2404.0, 1625.0, 1121.0, 798.0, 486.0, 361.0, 251.0, 169.0, 108.0, 94.0, 58.0, 30.0, 27.0, 13.0, 11.0, 12.0, 3.0, 5.0, 3.0, 4.0], "bins": [-0.214599609375, -0.20833396911621094, -0.20206832885742188, -0.1958026885986328, -0.18953704833984375, -0.1832714080810547, -0.17700576782226562, -0.17074012756347656, -0.1644744873046875, -0.15820884704589844, -0.15194320678710938, -0.1456775665283203, -0.13941192626953125, -0.1331462860107422, -0.12688064575195312, -0.12061500549316406, -0.114349365234375, -0.10808372497558594, -0.10181808471679688, -0.09555244445800781, -0.08928680419921875, -0.08302116394042969, -0.07675552368164062, -0.07048988342285156, -0.0642242431640625, -0.05795860290527344, -0.051692962646484375, -0.04542732238769531, -0.03916168212890625, -0.03289604187011719, -0.026630401611328125, -0.020364761352539062, -0.01409912109375, -0.007833480834960938, -0.001567840576171875, 0.0046977996826171875, 0.01096343994140625, 0.017229080200195312, 0.023494720458984375, 0.029760360717773438, 0.0360260009765625, 0.04229164123535156, 0.048557281494140625, 0.05482292175292969, 0.06108856201171875, 0.06735420227050781, 0.07361984252929688, 0.07988548278808594, 0.086151123046875, 0.09241676330566406, 0.09868240356445312, 0.10494804382324219, 0.11121368408203125, 0.11747932434082031, 0.12374496459960938, 0.13001060485839844, 0.1362762451171875, 0.14254188537597656, 0.14880752563476562, 0.1550731658935547, 0.16133880615234375, 0.1676044464111328, 0.17387008666992188, 0.18013572692871094, 0.1864013671875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 6.0, 9.0, 8.0, 12.0, 6.0, 13.0, 17.0, 16.0, 20.0, 20.0, 30.0, 34.0, 36.0, 24.0, 34.0, 32.0, 30.0, 36.0, 41.0, 32.0, 1057.0, 39.0, 41.0, 38.0, 41.0, 36.0, 47.0, 24.0, 29.0, 24.0, 28.0, 22.0, 22.0, 17.0, 20.0, 18.0, 14.0, 7.0, 2.0, 8.0, 4.0, 11.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.09765625, -3.970703125, -3.84375, -3.716796875, -3.58984375, -3.462890625, -3.3359375, -3.208984375, -3.08203125, -2.955078125, -2.828125, -2.701171875, -2.57421875, -2.447265625, -2.3203125, -2.193359375, -2.06640625, -1.939453125, -1.8125, -1.685546875, -1.55859375, -1.431640625, -1.3046875, -1.177734375, -1.05078125, -0.923828125, -0.796875, -0.669921875, -0.54296875, -0.416015625, -0.2890625, -0.162109375, -0.03515625, 0.091796875, 0.21875, 0.345703125, 0.47265625, 0.599609375, 0.7265625, 0.853515625, 0.98046875, 1.107421875, 1.234375, 1.361328125, 1.48828125, 1.615234375, 1.7421875, 1.869140625, 1.99609375, 2.123046875, 2.25, 2.376953125, 2.50390625, 2.630859375, 2.7578125, 2.884765625, 3.01171875, 3.138671875, 3.265625, 3.392578125, 3.51953125, 3.646484375, 3.7734375, 3.900390625, 4.02734375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 13.0, 19.0, 21.0, 32.0, 54.0, 75.0, 106.0, 180.0, 273.0, 380.0, 577.0, 868.0, 1267.0, 2083.0, 2963.0, 4737.0, 7473.0, 11573.0, 18551.0, 30282.0, 51008.0, 90144.0, 182335.0, 1330315.0, 159265.0, 80853.0, 46468.0, 27882.0, 17106.0, 10708.0, 6880.0, 4310.0, 2865.0, 1813.0, 1213.0, 829.0, 521.0, 355.0, 249.0, 160.0, 108.0, 64.0, 48.0, 40.0, 23.0, 13.0, 14.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1451416015625, -0.14066314697265625, -0.1361846923828125, -0.13170623779296875, -0.127227783203125, -0.12274932861328125, -0.1182708740234375, -0.11379241943359375, -0.10931396484375, -0.10483551025390625, -0.1003570556640625, -0.09587860107421875, -0.091400146484375, -0.08692169189453125, -0.0824432373046875, -0.07796478271484375, -0.073486328125, -0.06900787353515625, -0.0645294189453125, -0.06005096435546875, -0.055572509765625, -0.05109405517578125, -0.0466156005859375, -0.04213714599609375, -0.03765869140625, -0.03318023681640625, -0.0287017822265625, -0.02422332763671875, -0.019744873046875, -0.01526641845703125, -0.0107879638671875, -0.00630950927734375, -0.0018310546875, 0.00264739990234375, 0.0071258544921875, 0.01160430908203125, 0.016082763671875, 0.02056121826171875, 0.0250396728515625, 0.02951812744140625, 0.03399658203125, 0.03847503662109375, 0.0429534912109375, 0.04743194580078125, 0.051910400390625, 0.05638885498046875, 0.0608673095703125, 0.06534576416015625, 0.06982421875, 0.07430267333984375, 0.0787811279296875, 0.08325958251953125, 0.087738037109375, 0.09221649169921875, 0.0966949462890625, 0.10117340087890625, 0.10565185546875, 0.11013031005859375, 0.1146087646484375, 0.11908721923828125, 0.123565673828125, 0.12804412841796875, 0.1325225830078125, 0.13700103759765625, 0.1414794921875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 7.0, 3.0, 8.0, 10.0, 14.0, 13.0, 24.0, 12.0, 30.0, 19.0, 46.0, 36.0, 24.0, 53.0, 42.0, 56.0, 59.0, 49.0, 50.0, 47.0, 44.0, 50.0, 39.0, 35.0, 34.0, 31.0, 26.0, 27.0, 25.0, 9.0, 19.0, 14.0, 8.0, 5.0, 8.0, 7.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.488229751586914e-05, -4.3081119656562805e-05, -4.127994179725647e-05, -3.9478763937950134e-05, -3.76775860786438e-05, -3.587640821933746e-05, -3.407523036003113e-05, -3.227405250072479e-05, -3.0472874641418457e-05, -2.867169678211212e-05, -2.6870518922805786e-05, -2.506934106349945e-05, -2.3268163204193115e-05, -2.146698534488678e-05, -1.9665807485580444e-05, -1.786462962627411e-05, -1.6063451766967773e-05, -1.4262273907661438e-05, -1.2461096048355103e-05, -1.0659918189048767e-05, -8.858740329742432e-06, -7.057562470436096e-06, -5.256384611129761e-06, -3.4552067518234253e-06, -1.6540288925170898e-06, 1.471489667892456e-07, 1.948326826095581e-06, 3.7495046854019165e-06, 5.550682544708252e-06, 7.351860404014587e-06, 9.153038263320923e-06, 1.0954216122627258e-05, 1.2755393981933594e-05, 1.455657184123993e-05, 1.6357749700546265e-05, 1.81589275598526e-05, 1.9960105419158936e-05, 2.176128327846527e-05, 2.3562461137771606e-05, 2.5363638997077942e-05, 2.7164816856384277e-05, 2.8965994715690613e-05, 3.076717257499695e-05, 3.2568350434303284e-05, 3.436952829360962e-05, 3.6170706152915955e-05, 3.797188401222229e-05, 3.9773061871528625e-05, 4.157423973083496e-05, 4.3375417590141296e-05, 4.517659544944763e-05, 4.697777330875397e-05, 4.87789511680603e-05, 5.058012902736664e-05, 5.2381306886672974e-05, 5.418248474597931e-05, 5.5983662605285645e-05, 5.778484046459198e-05, 5.9586018323898315e-05, 6.138719618320465e-05, 6.318837404251099e-05, 6.498955190181732e-05, 6.679072976112366e-05, 6.859190762042999e-05, 7.039308547973633e-05]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 6.0, 8.0, 12.0, 8.0, 15.0, 19.0, 23.0, 26.0, 33.0, 52.0, 47.0, 83.0, 123.0, 224.0, 535.0, 5574.0, 596546.0, 439872.0, 4214.0, 519.0, 186.0, 113.0, 73.0, 62.0, 51.0, 35.0, 19.0, 20.0, 18.0, 14.0, 8.0, 3.0, 7.0, 5.0, 1.0, 5.0, 0.0, 1.0, 1.0], "bins": [-0.001674652099609375, -0.001634739339351654, -0.001594826579093933, -0.0015549138188362122, -0.0015150010585784912, -0.0014750882983207703, -0.0014351755380630493, -0.0013952627778053284, -0.0013553500175476074, -0.0013154372572898865, -0.0012755244970321655, -0.0012356117367744446, -0.0011956989765167236, -0.0011557862162590027, -0.0011158734560012817, -0.0010759606957435608, -0.0010360479354858398, -0.000996135175228119, -0.000956222414970398, -0.000916309654712677, -0.0008763968944549561, -0.0008364841341972351, -0.0007965713739395142, -0.0007566586136817932, -0.0007167458534240723, -0.0006768330931663513, -0.0006369203329086304, -0.0005970075726509094, -0.0005570948123931885, -0.0005171820521354675, -0.0004772692918777466, -0.00043735653162002563, -0.0003974437713623047, -0.00035753101110458374, -0.0003176182508468628, -0.00027770549058914185, -0.0002377927303314209, -0.00019787997007369995, -0.000157967209815979, -0.00011805444955825806, -7.814168930053711e-05, -3.822892904281616e-05, 1.6838312149047852e-06, 4.159659147262573e-05, 8.150935173034668e-05, 0.00012142211198806763, 0.00016133487224578857, 0.00020124763250350952, 0.00024116039276123047, 0.0002810731530189514, 0.00032098591327667236, 0.0003608986735343933, 0.00040081143379211426, 0.0004407241940498352, 0.00048063695430755615, 0.0005205497145652771, 0.000560462474822998, 0.000600375235080719, 0.0006402879953384399, 0.0006802007555961609, 0.0007201135158538818, 0.0007600262761116028, 0.0007999390363693237, 0.0008398517966270447, 0.0008797645568847656]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 31.0, 116.0, 266.0, 330.0, 169.0, 59.0, 27.0, 9.0, 0.0, 2.0], "bins": [-0.0003462833119556308, -0.00034024176420643926, -0.0003342002455610782, -0.00032815869781188667, -0.00032211715006269515, -0.0003160756314173341, -0.00031003408366814256, -0.00030399253591895103, -0.00029795101727358997, -0.00029190946952439845, -0.0002858679508790374, -0.00027982640312984586, -0.00027378485538065434, -0.00026774333673529327, -0.00026170178898610175, -0.0002556602412369102, -0.00024961872259154916, -0.00024357718939427286, -0.00023753564164508134, -0.00023149410844780505, -0.00022545257525052875, -0.00021941104205325246, -0.00021336949430406094, -0.00020732796110678464, -0.0002012863988056779, -0.0001952448656084016, -0.00018920331785921007, -0.00018316178466193378, -0.00017712025146465749, -0.0001710787182673812, -0.00016503717051818967, -0.00015899563732091337, -0.00015295410412363708, -0.00014691257092636079, -0.00014087102317716926, -0.00013482948997989297, -0.00012878795678261667, -0.00012274642358534038, -0.00011670487583614886, -0.00011066334263887256, -0.00010462180216563866, -9.858026169240475e-05, -9.253872849512845e-05, -8.649718802189454e-05, -8.045564754866064e-05, -7.441411435138434e-05, -6.837257387815043e-05, -6.233103340491652e-05, -5.628950020764023e-05, -5.024796337238513e-05, -4.420642653713003e-05, -3.816488606389612e-05, -3.212334922864102e-05, -2.6081812393385917e-05, -2.004027192015201e-05, -1.3998735084896907e-05, -7.957198249641806e-06, -1.915660504892003e-06, 4.1258772398578e-06, 1.0167415894102305e-05, 1.6208952729357406e-05, 2.2250489564612508e-05, 2.8292030037846416e-05, 3.433356687310152e-05, 4.037510370835662e-05]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 8.0, 3.0, 3.0, 2.0, 5.0, 14.0, 2.0, 15.0, 9.0, 12.0, 10.0, 17.0, 23.0, 15.0, 19.0, 30.0, 39.0, 35.0, 29.0, 32.0, 32.0, 34.0, 48.0, 34.0, 32.0, 33.0, 39.0, 47.0, 42.0, 38.0, 23.0, 27.0, 36.0, 30.0, 24.0, 21.0, 27.0, 30.0, 15.0, 12.0, 13.0, 7.0, 15.0, 12.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.123283386230469e-05, -3.0227936804294586e-05, -2.9223039746284485e-05, -2.8218142688274384e-05, -2.7213245630264282e-05, -2.620834857225418e-05, -2.520345151424408e-05, -2.4198554456233978e-05, -2.3193657398223877e-05, -2.2188760340213776e-05, -2.1183863282203674e-05, -2.0178966224193573e-05, -1.917406916618347e-05, -1.816917210817337e-05, -1.716427505016327e-05, -1.6159377992153168e-05, -1.5154480934143066e-05, -1.4149583876132965e-05, -1.3144686818122864e-05, -1.2139789760112762e-05, -1.1134892702102661e-05, -1.012999564409256e-05, -9.125098586082458e-06, -8.120201528072357e-06, -7.115304470062256e-06, -6.1104074120521545e-06, -5.105510354042053e-06, -4.100613296031952e-06, -3.0957162380218506e-06, -2.0908191800117493e-06, -1.085922122001648e-06, -8.102506399154663e-08, 9.238719940185547e-07, 1.928769052028656e-06, 2.9336661100387573e-06, 3.938563168048859e-06, 4.94346022605896e-06, 5.948357284069061e-06, 6.953254342079163e-06, 7.958151400089264e-06, 8.963048458099365e-06, 9.967945516109467e-06, 1.0972842574119568e-05, 1.197773963212967e-05, 1.298263669013977e-05, 1.3987533748149872e-05, 1.4992430806159973e-05, 1.5997327864170074e-05, 1.7002224922180176e-05, 1.8007121980190277e-05, 1.901201903820038e-05, 2.001691609621048e-05, 2.102181315422058e-05, 2.2026710212230682e-05, 2.3031607270240784e-05, 2.4036504328250885e-05, 2.5041401386260986e-05, 2.6046298444271088e-05, 2.705119550228119e-05, 2.805609256029129e-05, 2.906098961830139e-05, 3.0065886676311493e-05, 3.1070783734321594e-05, 3.2075680792331696e-05, 3.30805778503418e-05]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 9.0, 7.0, 15.0, 15.0, 14.0, 11.0, 16.0, 19.0, 23.0, 25.0, 27.0, 23.0, 34.0, 35.0, 26.0, 34.0, 38.0, 36.0, 40.0, 46.0, 42.0, 32.0, 45.0, 28.0, 36.0, 44.0, 29.0, 27.0, 35.0, 19.0, 22.0, 23.0, 25.0, 11.0, 13.0, 16.0, 9.0, 9.0, 10.0, 5.0, 4.0, 8.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.31640625, -5.1279296875, -4.939453125, -4.7509765625, -4.5625, -4.3740234375, -4.185546875, -3.9970703125, -3.80859375, -3.6201171875, -3.431640625, -3.2431640625, -3.0546875, -2.8662109375, -2.677734375, -2.4892578125, -2.30078125, -2.1123046875, -1.923828125, -1.7353515625, -1.546875, -1.3583984375, -1.169921875, -0.9814453125, -0.79296875, -0.6044921875, -0.416015625, -0.2275390625, -0.0390625, 0.1494140625, 0.337890625, 0.5263671875, 0.71484375, 0.9033203125, 1.091796875, 1.2802734375, 1.46875, 1.6572265625, 1.845703125, 2.0341796875, 2.22265625, 2.4111328125, 2.599609375, 2.7880859375, 2.9765625, 3.1650390625, 3.353515625, 3.5419921875, 3.73046875, 3.9189453125, 4.107421875, 4.2958984375, 4.484375, 4.6728515625, 4.861328125, 5.0498046875, 5.23828125, 5.4267578125, 5.615234375, 5.8037109375, 5.9921875, 6.1806640625, 6.369140625, 6.5576171875, 6.74609375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 11.0, 10.0, 24.0, 31.0, 47.0, 59.0, 82.0, 146.0, 192.0, 348.0, 511.0, 812.0, 1390.0, 2547.0, 4562.0, 8250.0, 15384.0, 29496.0, 60762.0, 166926.0, 490329.0, 149346.0, 56381.0, 28167.0, 14545.0, 7897.0, 4276.0, 2478.0, 1369.0, 806.0, 486.0, 273.0, 190.0, 135.0, 87.0, 69.0, 44.0, 21.0, 23.0, 14.0, 6.0, 7.0, 4.0, 7.0, 2.0, 0.0, 1.0], "bins": [-13.4609375, -13.1015625, -12.7421875, -12.3828125, -12.0234375, -11.6640625, -11.3046875, -10.9453125, -10.5859375, -10.2265625, -9.8671875, -9.5078125, -9.1484375, -8.7890625, -8.4296875, -8.0703125, -7.7109375, -7.3515625, -6.9921875, -6.6328125, -6.2734375, -5.9140625, -5.5546875, -5.1953125, -4.8359375, -4.4765625, -4.1171875, -3.7578125, -3.3984375, -3.0390625, -2.6796875, -2.3203125, -1.9609375, -1.6015625, -1.2421875, -0.8828125, -0.5234375, -0.1640625, 0.1953125, 0.5546875, 0.9140625, 1.2734375, 1.6328125, 1.9921875, 2.3515625, 2.7109375, 3.0703125, 3.4296875, 3.7890625, 4.1484375, 4.5078125, 4.8671875, 5.2265625, 5.5859375, 5.9453125, 6.3046875, 6.6640625, 7.0234375, 7.3828125, 7.7421875, 8.1015625, 8.4609375, 8.8203125, 9.1796875, 9.5390625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 5.0, 4.0, 1.0, 4.0, 2.0, 5.0, 8.0, 12.0, 8.0, 15.0, 11.0, 13.0, 14.0, 19.0, 25.0, 30.0, 26.0, 29.0, 40.0, 39.0, 49.0, 58.0, 87.0, 119.0, 220.0, 1452.0, 175.0, 118.0, 70.0, 61.0, 43.0, 39.0, 43.0, 27.0, 26.0, 23.0, 23.0, 22.0, 17.0, 13.0, 8.0, 9.0, 16.0, 10.0, 6.0, 4.0, 6.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.9765625, -14.4493408203125, -13.922119140625, -13.3948974609375, -12.86767578125, -12.3404541015625, -11.813232421875, -11.2860107421875, -10.7587890625, -10.2315673828125, -9.704345703125, -9.1771240234375, -8.64990234375, -8.1226806640625, -7.595458984375, -7.0682373046875, -6.541015625, -6.0137939453125, -5.486572265625, -4.9593505859375, -4.43212890625, -3.9049072265625, -3.377685546875, -2.8504638671875, -2.3232421875, -1.7960205078125, -1.268798828125, -0.7415771484375, -0.21435546875, 0.3128662109375, 0.840087890625, 1.3673095703125, 1.89453125, 2.4217529296875, 2.948974609375, 3.4761962890625, 4.00341796875, 4.5306396484375, 5.057861328125, 5.5850830078125, 6.1123046875, 6.6395263671875, 7.166748046875, 7.6939697265625, 8.22119140625, 8.7484130859375, 9.275634765625, 9.8028564453125, 10.330078125, 10.8572998046875, 11.384521484375, 11.9117431640625, 12.43896484375, 12.9661865234375, 13.493408203125, 14.0206298828125, 14.5478515625, 15.0750732421875, 15.602294921875, 16.1295166015625, 16.65673828125, 17.1839599609375, 17.711181640625, 18.2384033203125, 18.765625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 12.0, 2.0, 13.0, 6.0, 14.0, 14.0, 26.0, 30.0, 35.0, 50.0, 75.0, 100.0, 189.0, 321.0, 718.0, 1665.0, 4831.0, 16433.0, 69603.0, 628206.0, 2244087.0, 139200.0, 28051.0, 7522.0, 2428.0, 985.0, 424.0, 225.0, 130.0, 80.0, 49.0, 41.0, 27.0, 34.0, 18.0, 19.0, 12.0, 9.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-24.25, -23.47265625, -22.6953125, -21.91796875, -21.140625, -20.36328125, -19.5859375, -18.80859375, -18.03125, -17.25390625, -16.4765625, -15.69921875, -14.921875, -14.14453125, -13.3671875, -12.58984375, -11.8125, -11.03515625, -10.2578125, -9.48046875, -8.703125, -7.92578125, -7.1484375, -6.37109375, -5.59375, -4.81640625, -4.0390625, -3.26171875, -2.484375, -1.70703125, -0.9296875, -0.15234375, 0.625, 1.40234375, 2.1796875, 2.95703125, 3.734375, 4.51171875, 5.2890625, 6.06640625, 6.84375, 7.62109375, 8.3984375, 9.17578125, 9.953125, 10.73046875, 11.5078125, 12.28515625, 13.0625, 13.83984375, 14.6171875, 15.39453125, 16.171875, 16.94921875, 17.7265625, 18.50390625, 19.28125, 20.05859375, 20.8359375, 21.61328125, 22.390625, 23.16796875, 23.9453125, 24.72265625, 25.5]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 7.0, 7.0, 21.0, 15.0, 25.0, 42.0, 59.0, 75.0, 94.0, 92.0, 98.0, 102.0, 96.0, 69.0, 61.0, 41.0, 28.0, 26.0, 15.0, 15.0, 6.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.96511459350586, -46.81098556518555, -45.656856536865234, -44.50272750854492, -43.34859848022461, -42.1944694519043, -41.040340423583984, -39.886207580566406, -38.732078552246094, -37.57794952392578, -36.42382049560547, -35.269691467285156, -34.115562438964844, -32.96143341064453, -31.807302474975586, -30.653173446655273, -29.499046325683594, -28.34491729736328, -27.19078826904297, -26.036659240722656, -24.882530212402344, -23.72840118408203, -22.574270248413086, -21.420141220092773, -20.26601219177246, -19.11188316345215, -17.957754135131836, -16.803625106811523, -15.649495124816895, -14.495366096496582, -13.341236114501953, -12.18710708618164, -11.032976150512695, -9.878847122192383, -8.72471809387207, -7.570588111877441, -6.416459083557129, -5.262330055236816, -4.108200550079346, -2.954071044921875, -1.7999420166015625, -0.6458127498626709, 0.5083165168762207, 1.6624457836151123, 2.816575050354004, 3.9707040786743164, 5.124833583831787, 6.278963088989258, 7.43309211730957, 8.587221145629883, 9.741350173950195, 10.895480155944824, 12.049609184265137, 13.20373821258545, 14.357868194580078, 15.51199722290039, 16.666126251220703, 17.820255279541016, 18.974384307861328, 20.12851333618164, 21.282642364501953, 22.436771392822266, 23.59090232849121, 24.745031356811523, 25.899160385131836]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 2.0, 9.0, 6.0, 14.0, 9.0, 9.0, 13.0, 16.0, 23.0, 19.0, 21.0, 32.0, 38.0, 38.0, 38.0, 46.0, 28.0, 48.0, 45.0, 28.0, 41.0, 31.0, 36.0, 45.0, 46.0, 37.0, 43.0, 28.0, 30.0, 21.0, 21.0, 29.0, 18.0, 18.0, 20.0, 11.0, 9.0, 12.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-57.57184600830078, -55.94717025756836, -54.32249069213867, -52.69781494140625, -51.07313919067383, -49.448463439941406, -47.82378387451172, -46.1991081237793, -44.574432373046875, -42.94975662231445, -41.325077056884766, -39.700401306152344, -38.07572555541992, -36.4510498046875, -34.82637023925781, -33.20169448852539, -31.577014923095703, -29.95233726501465, -28.327661514282227, -26.702983856201172, -25.07830810546875, -23.453630447387695, -21.82895278930664, -20.20427703857422, -18.579599380493164, -16.95492172241211, -15.330245971679688, -13.705568313598633, -12.080891609191895, -10.456214904785156, -8.831537246704102, -7.206860542297363, -5.582180023193359, -3.957503080368042, -2.3328261375427246, -0.7081489562988281, 0.9165277481079102, 2.5412044525146484, 4.165882110595703, 5.790558815002441, 7.41523551940918, 9.039912223815918, 10.664588928222656, 12.289266586303711, 13.91394329071045, 15.538619995117188, 17.163297653198242, 18.787975311279297, 20.41265106201172, 22.037328720092773, 23.662004470825195, 25.28668212890625, 26.911357879638672, 28.536035537719727, 30.16071319580078, 31.785388946533203, 33.410064697265625, 35.03474044799805, 36.659420013427734, 38.284095764160156, 39.90877151489258, 41.533447265625, 43.15812683105469, 44.78280258178711, 46.4074821472168]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 4.0, 5.0, 1.0, 2.0, 6.0, 7.0, 13.0, 8.0, 10.0, 15.0, 21.0, 23.0, 19.0, 21.0, 26.0, 20.0, 29.0, 33.0, 28.0, 38.0, 31.0, 36.0, 35.0, 26.0, 42.0, 38.0, 33.0, 48.0, 32.0, 38.0, 26.0, 37.0, 28.0, 37.0, 23.0, 21.0, 19.0, 12.0, 18.0, 20.0, 8.0, 13.0, 17.0, 9.0, 6.0, 4.0, 10.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.5831298828125, -5.396728515625, -5.2103271484375, -5.02392578125, -4.8375244140625, -4.651123046875, -4.4647216796875, -4.2783203125, -4.0919189453125, -3.905517578125, -3.7191162109375, -3.53271484375, -3.3463134765625, -3.159912109375, -2.9735107421875, -2.787109375, -2.6007080078125, -2.414306640625, -2.2279052734375, -2.04150390625, -1.8551025390625, -1.668701171875, -1.4822998046875, -1.2958984375, -1.1094970703125, -0.923095703125, -0.7366943359375, -0.55029296875, -0.3638916015625, -0.177490234375, 0.0089111328125, 0.1953125, 0.3817138671875, 0.568115234375, 0.7545166015625, 0.94091796875, 1.1273193359375, 1.313720703125, 1.5001220703125, 1.6865234375, 1.8729248046875, 2.059326171875, 2.2457275390625, 2.43212890625, 2.6185302734375, 2.804931640625, 2.9913330078125, 3.177734375, 3.3641357421875, 3.550537109375, 3.7369384765625, 3.92333984375, 4.1097412109375, 4.296142578125, 4.4825439453125, 4.6689453125, 4.8553466796875, 5.041748046875, 5.2281494140625, 5.41455078125, 5.6009521484375, 5.787353515625, 5.9737548828125, 6.16015625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 4.0, 5.0, 3.0, 0.0, 6.0, 11.0, 24.0, 29.0, 41.0, 60.0, 79.0, 113.0, 176.0, 266.0, 380.0, 579.0, 889.0, 1327.0, 2187.0, 3607.0, 6066.0, 10934.0, 20320.0, 41541.0, 98172.0, 303813.0, 1300935.0, 1745760.0, 426051.0, 124050.0, 50946.0, 24526.0, 12871.0, 7165.0, 4210.0, 2501.0, 1611.0, 1062.0, 645.0, 446.0, 277.0, 181.0, 141.0, 90.0, 60.0, 34.0, 27.0, 27.0, 13.0, 7.0, 4.0, 12.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0], "bins": [-9.4296875, -9.14501953125, -8.8603515625, -8.57568359375, -8.291015625, -8.00634765625, -7.7216796875, -7.43701171875, -7.15234375, -6.86767578125, -6.5830078125, -6.29833984375, -6.013671875, -5.72900390625, -5.4443359375, -5.15966796875, -4.875, -4.59033203125, -4.3056640625, -4.02099609375, -3.736328125, -3.45166015625, -3.1669921875, -2.88232421875, -2.59765625, -2.31298828125, -2.0283203125, -1.74365234375, -1.458984375, -1.17431640625, -0.8896484375, -0.60498046875, -0.3203125, -0.03564453125, 0.2490234375, 0.53369140625, 0.818359375, 1.10302734375, 1.3876953125, 1.67236328125, 1.95703125, 2.24169921875, 2.5263671875, 2.81103515625, 3.095703125, 3.38037109375, 3.6650390625, 3.94970703125, 4.234375, 4.51904296875, 4.8037109375, 5.08837890625, 5.373046875, 5.65771484375, 5.9423828125, 6.22705078125, 6.51171875, 6.79638671875, 7.0810546875, 7.36572265625, 7.650390625, 7.93505859375, 8.2197265625, 8.50439453125, 8.7890625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 8.0, 8.0, 8.0, 11.0, 16.0, 23.0, 31.0, 48.0, 71.0, 75.0, 92.0, 145.0, 177.0, 258.0, 432.0, 650.0, 600.0, 448.0, 286.0, 179.0, 150.0, 99.0, 66.0, 53.0, 32.0, 27.0, 19.0, 8.0, 16.0, 7.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.359375, -11.9847412109375, -11.610107421875, -11.2354736328125, -10.86083984375, -10.4862060546875, -10.111572265625, -9.7369384765625, -9.3623046875, -8.9876708984375, -8.613037109375, -8.2384033203125, -7.86376953125, -7.4891357421875, -7.114501953125, -6.7398681640625, -6.365234375, -5.9906005859375, -5.615966796875, -5.2413330078125, -4.86669921875, -4.4920654296875, -4.117431640625, -3.7427978515625, -3.3681640625, -2.9935302734375, -2.618896484375, -2.2442626953125, -1.86962890625, -1.4949951171875, -1.120361328125, -0.7457275390625, -0.37109375, 0.0035400390625, 0.378173828125, 0.7528076171875, 1.12744140625, 1.5020751953125, 1.876708984375, 2.2513427734375, 2.6259765625, 3.0006103515625, 3.375244140625, 3.7498779296875, 4.12451171875, 4.4991455078125, 4.873779296875, 5.2484130859375, 5.623046875, 5.9976806640625, 6.372314453125, 6.7469482421875, 7.12158203125, 7.4962158203125, 7.870849609375, 8.2454833984375, 8.6201171875, 8.9947509765625, 9.369384765625, 9.7440185546875, 10.11865234375, 10.4932861328125, 10.867919921875, 11.2425537109375, 11.6171875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 7.0, 6.0, 11.0, 21.0, 24.0, 31.0, 85.0, 113.0, 197.0, 394.0, 1018.0, 3080.0, 13432.0, 88986.0, 1531169.0, 2419669.0, 114139.0, 16066.0, 3646.0, 1160.0, 432.0, 212.0, 125.0, 77.0, 43.0, 46.0, 23.0, 15.0, 14.0, 15.0, 6.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.234375, -28.228271484375, -27.22216796875, -26.216064453125, -25.2099609375, -24.203857421875, -23.19775390625, -22.191650390625, -21.185546875, -20.179443359375, -19.17333984375, -18.167236328125, -17.1611328125, -16.155029296875, -15.14892578125, -14.142822265625, -13.13671875, -12.130615234375, -11.12451171875, -10.118408203125, -9.1123046875, -8.106201171875, -7.10009765625, -6.093994140625, -5.087890625, -4.081787109375, -3.07568359375, -2.069580078125, -1.0634765625, -0.057373046875, 0.94873046875, 1.954833984375, 2.9609375, 3.967041015625, 4.97314453125, 5.979248046875, 6.9853515625, 7.991455078125, 8.99755859375, 10.003662109375, 11.009765625, 12.015869140625, 13.02197265625, 14.028076171875, 15.0341796875, 16.040283203125, 17.04638671875, 18.052490234375, 19.05859375, 20.064697265625, 21.07080078125, 22.076904296875, 23.0830078125, 24.089111328125, 25.09521484375, 26.101318359375, 27.107421875, 28.113525390625, 29.11962890625, 30.125732421875, 31.1318359375, 32.137939453125, 33.14404296875, 34.150146484375, 35.15625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 10.0, 27.0, 35.0, 68.0, 121.0, 151.0, 163.0, 139.0, 92.0, 85.0, 54.0, 32.0, 16.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.89708709716797, -92.38953399658203, -89.88197326660156, -87.37442016601562, -84.86686706542969, -82.35930633544922, -79.85175323486328, -77.34419250488281, -74.83663940429688, -72.32908630371094, -69.82152557373047, -67.31397247314453, -64.80641174316406, -62.298858642578125, -59.79130554199219, -57.283748626708984, -54.77619171142578, -52.26863479614258, -49.761077880859375, -47.25352478027344, -44.745967864990234, -42.23841094970703, -39.730857849121094, -37.22330093383789, -34.71574401855469, -32.208187103271484, -29.700632095336914, -27.193077087402344, -24.68552017211914, -22.177963256835938, -19.670408248901367, -17.162853240966797, -14.655303955078125, -12.147747993469238, -9.640192031860352, -7.132636070251465, -4.625080108642578, -2.1175241470336914, 0.3900318145751953, 2.8975868225097656, 5.405143737792969, 7.9126996994018555, 10.420255661010742, 12.927811622619629, 15.435367584228516, 17.94292449951172, 20.45047950744629, 22.95803451538086, 25.465591430664062, 27.973148345947266, 30.480703353881836, 32.988258361816406, 35.49581527709961, 38.00337219238281, 40.51092529296875, 43.01848220825195, 45.526039123535156, 48.03359603881836, 50.54115295410156, 53.0487060546875, 55.5562629699707, 58.063819885253906, 60.571372985839844, 63.07892990112305, 65.58648681640625]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 2.0, 6.0, 1.0, 12.0, 16.0, 10.0, 11.0, 16.0, 8.0, 19.0, 21.0, 21.0, 31.0, 26.0, 32.0, 37.0, 29.0, 33.0, 38.0, 33.0, 44.0, 40.0, 35.0, 56.0, 33.0, 22.0, 34.0, 39.0, 28.0, 30.0, 38.0, 21.0, 24.0, 18.0, 18.0, 19.0, 18.0, 21.0, 6.0, 13.0, 9.0, 8.0, 6.0, 3.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-35.9652099609375, -34.81837844848633, -33.671546936035156, -32.52471160888672, -31.377880096435547, -30.231048583984375, -29.08421516418457, -27.937381744384766, -26.790550231933594, -25.643718719482422, -24.496885299682617, -23.350051879882812, -22.20322036743164, -21.05638885498047, -19.909555435180664, -18.76272201538086, -17.615890502929688, -16.469058990478516, -15.322225570678711, -14.175393104553223, -13.028560638427734, -11.881728172302246, -10.734895706176758, -9.58806324005127, -8.441230773925781, -7.294398307800293, -6.147565841674805, -5.000733375549316, -3.853900909423828, -2.70706844329834, -1.5602359771728516, -0.4134035110473633, 0.733428955078125, 1.8802614212036133, 3.0270938873291016, 4.17392635345459, 5.320758819580078, 6.467591285705566, 7.614423751831055, 8.761256217956543, 9.908088684082031, 11.05492115020752, 12.201753616333008, 13.348586082458496, 14.495418548583984, 15.642251014709473, 16.78908348083496, 17.935916900634766, 19.082748413085938, 20.22957992553711, 21.376413345336914, 22.52324676513672, 23.67007827758789, 24.816909790039062, 25.963743209838867, 27.110576629638672, 28.257408142089844, 29.404239654541016, 30.55107307434082, 31.697906494140625, 32.8447380065918, 33.99156951904297, 35.138404846191406, 36.28523635864258, 37.43206787109375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 6.0, 4.0, 8.0, 9.0, 10.0, 15.0, 19.0, 23.0, 27.0, 26.0, 21.0, 43.0, 38.0, 31.0, 34.0, 42.0, 39.0, 40.0, 45.0, 40.0, 45.0, 49.0, 42.0, 45.0, 35.0, 24.0, 30.0, 34.0, 34.0, 23.0, 26.0, 17.0, 10.0, 17.0, 9.0, 9.0, 8.0, 3.0, 5.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.63671875, -7.4132080078125, -7.189697265625, -6.9661865234375, -6.74267578125, -6.5191650390625, -6.295654296875, -6.0721435546875, -5.8486328125, -5.6251220703125, -5.401611328125, -5.1781005859375, -4.95458984375, -4.7310791015625, -4.507568359375, -4.2840576171875, -4.060546875, -3.8370361328125, -3.613525390625, -3.3900146484375, -3.16650390625, -2.9429931640625, -2.719482421875, -2.4959716796875, -2.2724609375, -2.0489501953125, -1.825439453125, -1.6019287109375, -1.37841796875, -1.1549072265625, -0.931396484375, -0.7078857421875, -0.484375, -0.2608642578125, -0.037353515625, 0.1861572265625, 0.40966796875, 0.6331787109375, 0.856689453125, 1.0802001953125, 1.3037109375, 1.5272216796875, 1.750732421875, 1.9742431640625, 2.19775390625, 2.4212646484375, 2.644775390625, 2.8682861328125, 3.091796875, 3.3153076171875, 3.538818359375, 3.7623291015625, 3.98583984375, 4.2093505859375, 4.432861328125, 4.6563720703125, 4.8798828125, 5.1033935546875, 5.326904296875, 5.5504150390625, 5.77392578125, 5.9974365234375, 6.220947265625, 6.4444580078125, 6.66796875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 15.0, 10.0, 7.0, 18.0, 26.0, 45.0, 77.0, 110.0, 120.0, 204.0, 292.0, 471.0, 655.0, 950.0, 1454.0, 2295.0, 3546.0, 5384.0, 8525.0, 13944.0, 22662.0, 38719.0, 70989.0, 148424.0, 322628.0, 200610.0, 88161.0, 47003.0, 26759.0, 16444.0, 10006.0, 6281.0, 3920.0, 2644.0, 1722.0, 1122.0, 721.0, 492.0, 313.0, 275.0, 173.0, 118.0, 78.0, 45.0, 23.0, 22.0, 24.0, 9.0, 12.0, 8.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.262939453125, -0.2551288604736328, -0.24731826782226562, -0.23950767517089844, -0.23169708251953125, -0.22388648986816406, -0.21607589721679688, -0.2082653045654297, -0.2004547119140625, -0.1926441192626953, -0.18483352661132812, -0.17702293395996094, -0.16921234130859375, -0.16140174865722656, -0.15359115600585938, -0.1457805633544922, -0.137969970703125, -0.1301593780517578, -0.12234878540039062, -0.11453819274902344, -0.10672760009765625, -0.09891700744628906, -0.09110641479492188, -0.08329582214355469, -0.0754852294921875, -0.06767463684082031, -0.059864044189453125, -0.05205345153808594, -0.04424285888671875, -0.03643226623535156, -0.028621673583984375, -0.020811080932617188, -0.01300048828125, -0.0051898956298828125, 0.002620697021484375, 0.010431289672851562, 0.01824188232421875, 0.026052474975585938, 0.033863067626953125, 0.04167366027832031, 0.0494842529296875, 0.05729484558105469, 0.06510543823242188, 0.07291603088378906, 0.08072662353515625, 0.08853721618652344, 0.09634780883789062, 0.10415840148925781, 0.111968994140625, 0.11977958679199219, 0.12759017944335938, 0.13540077209472656, 0.14321136474609375, 0.15102195739746094, 0.15883255004882812, 0.1666431427001953, 0.1744537353515625, 0.1822643280029297, 0.19007492065429688, 0.19788551330566406, 0.20569610595703125, 0.21350669860839844, 0.22131729125976562, 0.2291278839111328, 0.2369384765625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 7.0, 2.0, 1.0, 4.0, 1.0, 2.0, 9.0, 6.0, 10.0, 5.0, 10.0, 5.0, 13.0, 12.0, 16.0, 18.0, 21.0, 9.0, 14.0, 17.0, 31.0, 26.0, 34.0, 38.0, 39.0, 35.0, 37.0, 44.0, 49.0, 1056.0, 34.0, 33.0, 28.0, 33.0, 25.0, 30.0, 39.0, 36.0, 19.0, 21.0, 20.0, 18.0, 18.0, 9.0, 15.0, 16.0, 11.0, 14.0, 9.0, 6.0, 10.0, 5.0, 6.0, 4.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.23046875, -4.09588623046875, -3.9613037109375, -3.82672119140625, -3.692138671875, -3.55755615234375, -3.4229736328125, -3.28839111328125, -3.15380859375, -3.01922607421875, -2.8846435546875, -2.75006103515625, -2.615478515625, -2.48089599609375, -2.3463134765625, -2.21173095703125, -2.0771484375, -1.94256591796875, -1.8079833984375, -1.67340087890625, -1.538818359375, -1.40423583984375, -1.2696533203125, -1.13507080078125, -1.00048828125, -0.86590576171875, -0.7313232421875, -0.59674072265625, -0.462158203125, -0.32757568359375, -0.1929931640625, -0.05841064453125, 0.076171875, 0.21075439453125, 0.3453369140625, 0.47991943359375, 0.614501953125, 0.74908447265625, 0.8836669921875, 1.01824951171875, 1.15283203125, 1.28741455078125, 1.4219970703125, 1.55657958984375, 1.691162109375, 1.82574462890625, 1.9603271484375, 2.09490966796875, 2.2294921875, 2.36407470703125, 2.4986572265625, 2.63323974609375, 2.767822265625, 2.90240478515625, 3.0369873046875, 3.17156982421875, 3.30615234375, 3.44073486328125, 3.5753173828125, 3.70989990234375, 3.844482421875, 3.97906494140625, 4.1136474609375, 4.24822998046875, 4.3828125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 5.0, 1.0, 4.0, 3.0, 6.0, 16.0, 25.0, 22.0, 33.0, 45.0, 95.0, 150.0, 210.0, 307.0, 457.0, 668.0, 1004.0, 1515.0, 2150.0, 3197.0, 4749.0, 7188.0, 10604.0, 15794.0, 24037.0, 38520.0, 65894.0, 122053.0, 1297617.0, 227464.0, 109466.0, 59878.0, 35577.0, 23099.0, 14835.0, 9859.0, 6729.0, 4551.0, 3020.0, 2060.0, 1358.0, 935.0, 652.0, 452.0, 275.0, 170.0, 135.0, 96.0, 62.0, 36.0, 22.0, 15.0, 11.0, 3.0, 9.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1514892578125, -0.1467437744140625, -0.141998291015625, -0.1372528076171875, -0.13250732421875, -0.1277618408203125, -0.123016357421875, -0.1182708740234375, -0.113525390625, -0.1087799072265625, -0.104034423828125, -0.0992889404296875, -0.09454345703125, -0.0897979736328125, -0.085052490234375, -0.0803070068359375, -0.0755615234375, -0.0708160400390625, -0.066070556640625, -0.0613250732421875, -0.05657958984375, -0.0518341064453125, -0.047088623046875, -0.0423431396484375, -0.03759765625, -0.0328521728515625, -0.028106689453125, -0.0233612060546875, -0.01861572265625, -0.0138702392578125, -0.009124755859375, -0.0043792724609375, 0.0003662109375, 0.0051116943359375, 0.009857177734375, 0.0146026611328125, 0.01934814453125, 0.0240936279296875, 0.028839111328125, 0.0335845947265625, 0.038330078125, 0.0430755615234375, 0.047821044921875, 0.0525665283203125, 0.05731201171875, 0.0620574951171875, 0.066802978515625, 0.0715484619140625, 0.0762939453125, 0.0810394287109375, 0.085784912109375, 0.0905303955078125, 0.09527587890625, 0.1000213623046875, 0.104766845703125, 0.1095123291015625, 0.1142578125, 0.1190032958984375, 0.123748779296875, 0.1284942626953125, 0.13323974609375, 0.1379852294921875, 0.142730712890625, 0.1474761962890625, 0.1522216796875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 8.0, 10.0, 11.0, 7.0, 6.0, 13.0, 17.0, 22.0, 25.0, 28.0, 26.0, 42.0, 43.0, 44.0, 49.0, 59.0, 50.0, 64.0, 56.0, 50.0, 61.0, 53.0, 43.0, 36.0, 34.0, 33.0, 21.0, 22.0, 13.0, 14.0, 8.0, 7.0, 5.0, 4.0, 4.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.003545761108398e-05, -6.7858025431633e-05, -6.568059325218201e-05, -6.350316107273102e-05, -6.132572889328003e-05, -5.914829671382904e-05, -5.697086453437805e-05, -5.479343235492706e-05, -5.2616000175476074e-05, -5.0438567996025085e-05, -4.82611358165741e-05, -4.608370363712311e-05, -4.390627145767212e-05, -4.172883927822113e-05, -3.955140709877014e-05, -3.737397491931915e-05, -3.5196542739868164e-05, -3.3019110560417175e-05, -3.0841678380966187e-05, -2.8664246201515198e-05, -2.648681402206421e-05, -2.430938184261322e-05, -2.213194966316223e-05, -1.9954517483711243e-05, -1.7777085304260254e-05, -1.5599653124809265e-05, -1.3422220945358276e-05, -1.1244788765907288e-05, -9.067356586456299e-06, -6.88992440700531e-06, -4.712492227554321e-06, -2.5350600481033325e-06, -3.5762786865234375e-07, 1.819804310798645e-06, 3.997236490249634e-06, 6.1746686697006226e-06, 8.352100849151611e-06, 1.05295330286026e-05, 1.2706965208053589e-05, 1.4884397387504578e-05, 1.7061829566955566e-05, 1.9239261746406555e-05, 2.1416693925857544e-05, 2.3594126105308533e-05, 2.577155828475952e-05, 2.794899046421051e-05, 3.01264226436615e-05, 3.230385482311249e-05, 3.4481287002563477e-05, 3.6658719182014465e-05, 3.8836151361465454e-05, 4.101358354091644e-05, 4.319101572036743e-05, 4.536844789981842e-05, 4.754588007926941e-05, 4.97233122587204e-05, 5.190074443817139e-05, 5.4078176617622375e-05, 5.6255608797073364e-05, 5.843304097652435e-05, 6.061047315597534e-05, 6.278790533542633e-05, 6.496533751487732e-05, 6.714276969432831e-05, 6.93202018737793e-05]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 4.0, 5.0, 8.0, 3.0, 7.0, 10.0, 12.0, 14.0, 27.0, 24.0, 40.0, 47.0, 55.0, 57.0, 131.0, 209.0, 428.0, 2539.0, 712881.0, 329694.0, 1444.0, 356.0, 198.0, 81.0, 60.0, 42.0, 29.0, 26.0, 28.0, 20.0, 21.0, 9.0, 8.0, 9.0, 10.0, 8.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0016145706176757812, -0.001566961407661438, -0.0015193521976470947, -0.0014717429876327515, -0.0014241337776184082, -0.001376524567604065, -0.0013289153575897217, -0.0012813061475753784, -0.0012336969375610352, -0.001186087727546692, -0.0011384785175323486, -0.0010908693075180054, -0.0010432600975036621, -0.0009956508874893188, -0.0009480416774749756, -0.0009004324674606323, -0.0008528232574462891, -0.0008052140474319458, -0.0007576048374176025, -0.0007099956274032593, -0.000662386417388916, -0.0006147772073745728, -0.0005671679973602295, -0.0005195587873458862, -0.00047194957733154297, -0.0004243403673171997, -0.00037673115730285645, -0.0003291219472885132, -0.0002815127372741699, -0.00023390352725982666, -0.0001862943172454834, -0.00013868510723114014, -9.107589721679688e-05, -4.346668720245361e-05, 4.1425228118896484e-06, 5.175173282623291e-05, 9.936094284057617e-05, 0.00014697015285491943, 0.0001945793628692627, 0.00024218857288360596, 0.0002897977828979492, 0.0003374069929122925, 0.00038501620292663574, 0.000432625412940979, 0.00048023462295532227, 0.0005278438329696655, 0.0005754530429840088, 0.000623062252998352, 0.0006706714630126953, 0.0007182806730270386, 0.0007658898830413818, 0.0008134990930557251, 0.0008611083030700684, 0.0009087175130844116, 0.0009563267230987549, 0.0010039359331130981, 0.0010515451431274414, 0.0010991543531417847, 0.001146763563156128, 0.0011943727731704712, 0.0012419819831848145, 0.0012895911931991577, 0.001337200403213501, 0.0013848096132278442, 0.0014324188232421875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 46.0, 300.0, 522.0, 135.0, 11.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005373908788897097, -0.0005276696756482124, -0.0005179484724067152, -0.0005082272691652179, -0.0004985061241313815, -0.0004887849208898842, -0.00047906371764838696, -0.0004693425144068897, -0.0004596213111653924, -0.0004499001079238951, -0.00044017890468239784, -0.000430457730544731, -0.00042073652730323374, -0.00041101532406173646, -0.00040129414992406964, -0.00039157294668257236, -0.0003818517434410751, -0.0003721305401995778, -0.00036240933695808053, -0.0003526881628204137, -0.00034296695957891643, -0.00033324575633741915, -0.00032352458219975233, -0.00031380337895825505, -0.0003040821757167578, -0.0002943609724752605, -0.0002846397692337632, -0.0002749185950960964, -0.0002651973918545991, -0.00025547618861310184, -0.000245755014475435, -0.00023603381123393774, -0.00022631263709627092, -0.00021659143385477364, -0.0002068702451651916, -0.00019714905647560954, -0.00018742785323411226, -0.00017770664999261498, -0.00016798546130303293, -0.00015826427261345088, -0.0001485430693719536, -0.00013882186613045633, -0.00012910067744087428, -0.00011937948147533461, -0.00010965828550979495, -9.993708954425529e-05, -9.021589357871562e-05, -8.049469761317596e-05, -7.077349437167868e-05, -6.105229840613902e-05, -5.133110244059935e-05, -4.160990647505969e-05, -3.1888710509520024e-05, -2.216751454398036e-05, -1.2446318578440696e-05, -2.725122612901032e-06, 6.996073352638632e-06, 1.6717269318178296e-05, 2.643846528371796e-05, 3.6159661249257624e-05, 4.588085721479729e-05, 5.560205318033695e-05, 6.532324914587662e-05, 7.504444511141628e-05, 8.476564107695594e-05]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 9.0, 3.0, 7.0, 6.0, 10.0, 7.0, 11.0, 10.0, 10.0, 11.0, 17.0, 14.0, 26.0, 25.0, 36.0, 30.0, 32.0, 41.0, 51.0, 42.0, 36.0, 34.0, 44.0, 37.0, 40.0, 43.0, 41.0, 49.0, 38.0, 31.0, 28.0, 18.0, 32.0, 26.0, 21.0, 20.0, 17.0, 13.0, 5.0, 7.0, 3.0, 7.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6835670471191406e-05, -3.565941005945206e-05, -3.448314964771271e-05, -3.330688923597336e-05, -3.213062882423401e-05, -3.095436841249466e-05, -2.977810800075531e-05, -2.860184758901596e-05, -2.742558717727661e-05, -2.6249326765537262e-05, -2.5073066353797913e-05, -2.3896805942058563e-05, -2.2720545530319214e-05, -2.1544285118579865e-05, -2.0368024706840515e-05, -1.9191764295101166e-05, -1.8015503883361816e-05, -1.6839243471622467e-05, -1.5662983059883118e-05, -1.4486722648143768e-05, -1.3310462236404419e-05, -1.213420182466507e-05, -1.095794141292572e-05, -9.781681001186371e-06, -8.605420589447021e-06, -7.429160177707672e-06, -6.252899765968323e-06, -5.076639354228973e-06, -3.900378942489624e-06, -2.7241185307502747e-06, -1.5478581190109253e-06, -3.7159770727157593e-07, 8.046627044677734e-07, 1.980923116207123e-06, 3.157183527946472e-06, 4.3334439396858215e-06, 5.509704351425171e-06, 6.68596476316452e-06, 7.86222517490387e-06, 9.038485586643219e-06, 1.0214745998382568e-05, 1.1391006410121918e-05, 1.2567266821861267e-05, 1.3743527233600616e-05, 1.4919787645339966e-05, 1.6096048057079315e-05, 1.7272308468818665e-05, 1.8448568880558014e-05, 1.9624829292297363e-05, 2.0801089704036713e-05, 2.1977350115776062e-05, 2.315361052751541e-05, 2.432987093925476e-05, 2.550613135099411e-05, 2.668239176273346e-05, 2.785865217447281e-05, 2.9034912586212158e-05, 3.0211172997951508e-05, 3.138743340969086e-05, 3.2563693821430206e-05, 3.3739954233169556e-05, 3.4916214644908905e-05, 3.6092475056648254e-05, 3.7268735468387604e-05, 3.844499588012695e-05]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 6.0, 4.0, 8.0, 9.0, 10.0, 15.0, 19.0, 23.0, 27.0, 26.0, 21.0, 43.0, 38.0, 31.0, 34.0, 42.0, 39.0, 40.0, 45.0, 40.0, 45.0, 49.0, 42.0, 45.0, 35.0, 24.0, 30.0, 34.0, 34.0, 23.0, 26.0, 17.0, 10.0, 17.0, 9.0, 9.0, 8.0, 3.0, 5.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.63671875, -7.4132080078125, -7.189697265625, -6.9661865234375, -6.74267578125, -6.5191650390625, -6.295654296875, -6.0721435546875, -5.8486328125, -5.6251220703125, -5.401611328125, -5.1781005859375, -4.95458984375, -4.7310791015625, -4.507568359375, -4.2840576171875, -4.060546875, -3.8370361328125, -3.613525390625, -3.3900146484375, -3.16650390625, -2.9429931640625, -2.719482421875, -2.4959716796875, -2.2724609375, -2.0489501953125, -1.825439453125, -1.6019287109375, -1.37841796875, -1.1549072265625, -0.931396484375, -0.7078857421875, -0.484375, -0.2608642578125, -0.037353515625, 0.1861572265625, 0.40966796875, 0.6331787109375, 0.856689453125, 1.0802001953125, 1.3037109375, 1.5272216796875, 1.750732421875, 1.9742431640625, 2.19775390625, 2.4212646484375, 2.644775390625, 2.8682861328125, 3.091796875, 3.3153076171875, 3.538818359375, 3.7623291015625, 3.98583984375, 4.2093505859375, 4.432861328125, 4.6563720703125, 4.8798828125, 5.1033935546875, 5.326904296875, 5.5504150390625, 5.77392578125, 5.9974365234375, 6.220947265625, 6.4444580078125, 6.66796875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 5.0, 8.0, 19.0, 22.0, 28.0, 41.0, 48.0, 68.0, 113.0, 151.0, 262.0, 402.0, 585.0, 962.0, 1475.0, 2414.0, 3771.0, 6272.0, 10268.0, 17498.0, 30147.0, 54146.0, 102209.0, 195024.0, 259322.0, 165801.0, 86185.0, 46280.0, 26268.0, 15129.0, 9021.0, 5453.0, 3287.0, 2024.0, 1326.0, 859.0, 594.0, 364.0, 216.0, 174.0, 93.0, 71.0, 53.0, 39.0, 25.0, 12.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.046875, -8.7757568359375, -8.504638671875, -8.2335205078125, -7.96240234375, -7.6912841796875, -7.420166015625, -7.1490478515625, -6.8779296875, -6.6068115234375, -6.335693359375, -6.0645751953125, -5.79345703125, -5.5223388671875, -5.251220703125, -4.9801025390625, -4.708984375, -4.4378662109375, -4.166748046875, -3.8956298828125, -3.62451171875, -3.3533935546875, -3.082275390625, -2.8111572265625, -2.5400390625, -2.2689208984375, -1.997802734375, -1.7266845703125, -1.45556640625, -1.1844482421875, -0.913330078125, -0.6422119140625, -0.37109375, -0.0999755859375, 0.171142578125, 0.4422607421875, 0.71337890625, 0.9844970703125, 1.255615234375, 1.5267333984375, 1.7978515625, 2.0689697265625, 2.340087890625, 2.6112060546875, 2.88232421875, 3.1534423828125, 3.424560546875, 3.6956787109375, 3.966796875, 4.2379150390625, 4.509033203125, 4.7801513671875, 5.05126953125, 5.3223876953125, 5.593505859375, 5.8646240234375, 6.1357421875, 6.4068603515625, 6.677978515625, 6.9490966796875, 7.22021484375, 7.4913330078125, 7.762451171875, 8.0335693359375, 8.3046875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 3.0, 9.0, 6.0, 7.0, 10.0, 11.0, 11.0, 23.0, 13.0, 18.0, 30.0, 40.0, 39.0, 40.0, 55.0, 61.0, 82.0, 149.0, 219.0, 1329.0, 230.0, 151.0, 85.0, 68.0, 45.0, 50.0, 46.0, 35.0, 29.0, 28.0, 18.0, 20.0, 15.0, 17.0, 8.0, 5.0, 10.0, 8.0, 11.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0, -17.43017578125, -16.8603515625, -16.29052734375, -15.720703125, -15.15087890625, -14.5810546875, -14.01123046875, -13.44140625, -12.87158203125, -12.3017578125, -11.73193359375, -11.162109375, -10.59228515625, -10.0224609375, -9.45263671875, -8.8828125, -8.31298828125, -7.7431640625, -7.17333984375, -6.603515625, -6.03369140625, -5.4638671875, -4.89404296875, -4.32421875, -3.75439453125, -3.1845703125, -2.61474609375, -2.044921875, -1.47509765625, -0.9052734375, -0.33544921875, 0.234375, 0.80419921875, 1.3740234375, 1.94384765625, 2.513671875, 3.08349609375, 3.6533203125, 4.22314453125, 4.79296875, 5.36279296875, 5.9326171875, 6.50244140625, 7.072265625, 7.64208984375, 8.2119140625, 8.78173828125, 9.3515625, 9.92138671875, 10.4912109375, 11.06103515625, 11.630859375, 12.20068359375, 12.7705078125, 13.34033203125, 13.91015625, 14.47998046875, 15.0498046875, 15.61962890625, 16.189453125, 16.75927734375, 17.3291015625, 17.89892578125, 18.46875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 15.0, 12.0, 15.0, 31.0, 32.0, 36.0, 60.0, 82.0, 174.0, 332.0, 704.0, 1517.0, 3610.0, 9476.0, 27499.0, 93658.0, 554221.0, 2009286.0, 341705.0, 68983.0, 21281.0, 7517.0, 2842.0, 1290.0, 584.0, 288.0, 144.0, 78.0, 54.0, 38.0, 31.0, 31.0, 18.0, 9.0, 9.0, 6.0, 7.0, 5.0, 2.0, 2.0, 0.0, 4.0, 5.0, 2.0], "bins": [-21.125, -20.5599365234375, -19.994873046875, -19.4298095703125, -18.86474609375, -18.2996826171875, -17.734619140625, -17.1695556640625, -16.6044921875, -16.0394287109375, -15.474365234375, -14.9093017578125, -14.34423828125, -13.7791748046875, -13.214111328125, -12.6490478515625, -12.083984375, -11.5189208984375, -10.953857421875, -10.3887939453125, -9.82373046875, -9.2586669921875, -8.693603515625, -8.1285400390625, -7.5634765625, -6.9984130859375, -6.433349609375, -5.8682861328125, -5.30322265625, -4.7381591796875, -4.173095703125, -3.6080322265625, -3.04296875, -2.4779052734375, -1.912841796875, -1.3477783203125, -0.78271484375, -0.2176513671875, 0.347412109375, 0.9124755859375, 1.4775390625, 2.0426025390625, 2.607666015625, 3.1727294921875, 3.73779296875, 4.3028564453125, 4.867919921875, 5.4329833984375, 5.998046875, 6.5631103515625, 7.128173828125, 7.6932373046875, 8.25830078125, 8.8233642578125, 9.388427734375, 9.9534912109375, 10.5185546875, 11.0836181640625, 11.648681640625, 12.2137451171875, 12.77880859375, 13.3438720703125, 13.908935546875, 14.4739990234375, 15.0390625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 23.0, 36.0, 83.0, 140.0, 211.0, 195.0, 140.0, 85.0, 48.0, 22.0, 9.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.17153549194336, -41.76957702636719, -38.36761474609375, -34.96565246582031, -31.56369400024414, -28.161733627319336, -24.75977325439453, -21.357812881469727, -17.955852508544922, -14.553892135620117, -11.151931762695312, -7.749971389770508, -4.348011016845703, -0.9460506439208984, 2.4559097290039062, 5.857870101928711, 9.259830474853516, 12.66179084777832, 16.063751220703125, 19.46571159362793, 22.867671966552734, 26.26963233947754, 29.671592712402344, 33.07355499267578, 36.47551345825195, 39.877471923828125, 43.27943420410156, 46.681396484375, 50.08335494995117, 53.485313415527344, 56.88727569580078, 60.28923797607422, 63.691192626953125, 67.09315490722656, 70.4951171875, 73.8970718383789, 77.29903411865234, 80.70099639892578, 84.10295104980469, 87.50491333007812, 90.90687561035156, 94.308837890625, 97.71080017089844, 101.11275482177734, 104.51471710205078, 107.91667938232422, 111.31863403320312, 114.72059631347656, 118.12255859375, 121.52452087402344, 124.92648315429688, 128.3284454345703, 131.73040771484375, 135.13235473632812, 138.53431701660156, 141.936279296875, 145.33824157714844, 148.74020385742188, 152.1421661376953, 155.54412841796875, 158.94607543945312, 162.34803771972656, 165.75, 169.15196228027344, 172.55392456054688]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 5.0, 7.0, 4.0, 4.0, 7.0, 11.0, 8.0, 10.0, 12.0, 8.0, 17.0, 16.0, 24.0, 18.0, 26.0, 27.0, 34.0, 26.0, 39.0, 30.0, 41.0, 34.0, 39.0, 36.0, 47.0, 42.0, 42.0, 33.0, 32.0, 33.0, 43.0, 40.0, 23.0, 28.0, 23.0, 25.0, 25.0, 16.0, 14.0, 9.0, 12.0, 9.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-54.364418029785156, -52.8651123046875, -51.36580276489258, -49.86649703979492, -48.367191314697266, -46.86788558959961, -45.36857604980469, -43.86927032470703, -42.369964599609375, -40.87065887451172, -39.3713493347168, -37.87204360961914, -36.372737884521484, -34.87343215942383, -33.374122619628906, -31.87481689453125, -30.37550926208496, -28.876201629638672, -27.376895904541016, -25.877588272094727, -24.37828254699707, -22.87897491455078, -21.379669189453125, -19.880361557006836, -18.381053924560547, -16.881746292114258, -15.382440567016602, -13.883132934570312, -12.383827209472656, -10.884519577026367, -9.385212898254395, -7.885906219482422, -6.386600494384766, -4.887293815612793, -3.387986898422241, -1.8886799812316895, -0.3893733024597168, 1.1099333763122559, 2.6092405319213867, 4.108547210693359, 5.607853889465332, 7.107160568237305, 8.606467247009277, 10.10577392578125, 11.605081558227539, 13.104387283325195, 14.603694915771484, 16.10300064086914, 17.60230827331543, 19.10161590576172, 20.600921630859375, 22.100229263305664, 23.59953498840332, 25.09884262084961, 26.598148345947266, 28.097455978393555, 29.596763610839844, 31.096071243286133, 32.59537887573242, 34.09468460083008, 35.593990325927734, 37.09329605102539, 38.59260559082031, 40.09191131591797, 41.591217041015625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 7.0, 8.0, 6.0, 6.0, 12.0, 18.0, 15.0, 18.0, 22.0, 23.0, 26.0, 33.0, 38.0, 45.0, 44.0, 43.0, 42.0, 55.0, 42.0, 44.0, 35.0, 44.0, 35.0, 50.0, 46.0, 32.0, 39.0, 25.0, 25.0, 25.0, 23.0, 13.0, 15.0, 13.0, 4.0, 8.0, 8.0, 8.0, 6.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.8046875, -8.552978515625, -8.30126953125, -8.049560546875, -7.7978515625, -7.546142578125, -7.29443359375, -7.042724609375, -6.791015625, -6.539306640625, -6.28759765625, -6.035888671875, -5.7841796875, -5.532470703125, -5.28076171875, -5.029052734375, -4.77734375, -4.525634765625, -4.27392578125, -4.022216796875, -3.7705078125, -3.518798828125, -3.26708984375, -3.015380859375, -2.763671875, -2.511962890625, -2.26025390625, -2.008544921875, -1.7568359375, -1.505126953125, -1.25341796875, -1.001708984375, -0.75, -0.498291015625, -0.24658203125, 0.005126953125, 0.2568359375, 0.508544921875, 0.76025390625, 1.011962890625, 1.263671875, 1.515380859375, 1.76708984375, 2.018798828125, 2.2705078125, 2.522216796875, 2.77392578125, 3.025634765625, 3.27734375, 3.529052734375, 3.78076171875, 4.032470703125, 4.2841796875, 4.535888671875, 4.78759765625, 5.039306640625, 5.291015625, 5.542724609375, 5.79443359375, 6.046142578125, 6.2978515625, 6.549560546875, 6.80126953125, 7.052978515625, 7.3046875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 8.0, 13.0, 18.0, 19.0, 26.0, 46.0, 70.0, 88.0, 148.0, 248.0, 465.0, 829.0, 1570.0, 3143.0, 6497.0, 14203.0, 33535.0, 91593.0, 348818.0, 2202948.0, 1181129.0, 201690.0, 62137.0, 24357.0, 10648.0, 4862.0, 2408.0, 1150.0, 648.0, 352.0, 226.0, 132.0, 69.0, 55.0, 39.0, 32.0, 31.0, 9.0, 4.0, 10.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.9140625, -14.4595947265625, -14.005126953125, -13.5506591796875, -13.09619140625, -12.6417236328125, -12.187255859375, -11.7327880859375, -11.2783203125, -10.8238525390625, -10.369384765625, -9.9149169921875, -9.46044921875, -9.0059814453125, -8.551513671875, -8.0970458984375, -7.642578125, -7.1881103515625, -6.733642578125, -6.2791748046875, -5.82470703125, -5.3702392578125, -4.915771484375, -4.4613037109375, -4.0068359375, -3.5523681640625, -3.097900390625, -2.6434326171875, -2.18896484375, -1.7344970703125, -1.280029296875, -0.8255615234375, -0.37109375, 0.0833740234375, 0.537841796875, 0.9923095703125, 1.44677734375, 1.9012451171875, 2.355712890625, 2.8101806640625, 3.2646484375, 3.7191162109375, 4.173583984375, 4.6280517578125, 5.08251953125, 5.5369873046875, 5.991455078125, 6.4459228515625, 6.900390625, 7.3548583984375, 7.809326171875, 8.2637939453125, 8.71826171875, 9.1727294921875, 9.627197265625, 10.0816650390625, 10.5361328125, 10.9906005859375, 11.445068359375, 11.8995361328125, 12.35400390625, 12.8084716796875, 13.262939453125, 13.7174072265625, 14.171875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 7.0, 9.0, 9.0, 17.0, 15.0, 28.0, 37.0, 54.0, 45.0, 91.0, 111.0, 154.0, 240.0, 350.0, 529.0, 616.0, 550.0, 328.0, 207.0, 150.0, 119.0, 78.0, 78.0, 47.0, 43.0, 31.0, 30.0, 16.0, 18.0, 12.0, 6.0, 9.0, 5.0, 3.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-14.3515625, -13.9688720703125, -13.586181640625, -13.2034912109375, -12.82080078125, -12.4381103515625, -12.055419921875, -11.6727294921875, -11.2900390625, -10.9073486328125, -10.524658203125, -10.1419677734375, -9.75927734375, -9.3765869140625, -8.993896484375, -8.6112060546875, -8.228515625, -7.8458251953125, -7.463134765625, -7.0804443359375, -6.69775390625, -6.3150634765625, -5.932373046875, -5.5496826171875, -5.1669921875, -4.7843017578125, -4.401611328125, -4.0189208984375, -3.63623046875, -3.2535400390625, -2.870849609375, -2.4881591796875, -2.10546875, -1.7227783203125, -1.340087890625, -0.9573974609375, -0.57470703125, -0.1920166015625, 0.190673828125, 0.5733642578125, 0.9560546875, 1.3387451171875, 1.721435546875, 2.1041259765625, 2.48681640625, 2.8695068359375, 3.252197265625, 3.6348876953125, 4.017578125, 4.4002685546875, 4.782958984375, 5.1656494140625, 5.54833984375, 5.9310302734375, 6.313720703125, 6.6964111328125, 7.0791015625, 7.4617919921875, 7.844482421875, 8.2271728515625, 8.60986328125, 8.9925537109375, 9.375244140625, 9.7579345703125, 10.140625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 8.0, 11.0, 15.0, 15.0, 32.0, 44.0, 87.0, 149.0, 253.0, 474.0, 1010.0, 2222.0, 5108.0, 13772.0, 43993.0, 183175.0, 1470719.0, 2162596.0, 230208.0, 53366.0, 16401.0, 5902.0, 2404.0, 1101.0, 555.0, 301.0, 142.0, 83.0, 45.0, 30.0, 22.0, 14.0, 7.0, 3.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.265625, -16.54833984375, -15.8310546875, -15.11376953125, -14.396484375, -13.67919921875, -12.9619140625, -12.24462890625, -11.52734375, -10.81005859375, -10.0927734375, -9.37548828125, -8.658203125, -7.94091796875, -7.2236328125, -6.50634765625, -5.7890625, -5.07177734375, -4.3544921875, -3.63720703125, -2.919921875, -2.20263671875, -1.4853515625, -0.76806640625, -0.05078125, 0.66650390625, 1.3837890625, 2.10107421875, 2.818359375, 3.53564453125, 4.2529296875, 4.97021484375, 5.6875, 6.40478515625, 7.1220703125, 7.83935546875, 8.556640625, 9.27392578125, 9.9912109375, 10.70849609375, 11.42578125, 12.14306640625, 12.8603515625, 13.57763671875, 14.294921875, 15.01220703125, 15.7294921875, 16.44677734375, 17.1640625, 17.88134765625, 18.5986328125, 19.31591796875, 20.033203125, 20.75048828125, 21.4677734375, 22.18505859375, 22.90234375, 23.61962890625, 24.3369140625, 25.05419921875, 25.771484375, 26.48876953125, 27.2060546875, 27.92333984375, 28.640625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 9.0, 12.0, 23.0, 22.0, 36.0, 58.0, 59.0, 50.0, 75.0, 112.0, 99.0, 74.0, 82.0, 87.0, 51.0, 41.0, 37.0, 29.0, 16.0, 15.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.692049026489258, -27.03499984741211, -25.377948760986328, -23.720897674560547, -22.0638484954834, -20.40679931640625, -18.74974822998047, -17.092697143554688, -15.435647964477539, -13.778597831726074, -12.12154769897461, -10.464497566223145, -8.80744743347168, -7.150397300720215, -5.49334716796875, -3.836297035217285, -2.1792469024658203, -0.5221967697143555, 1.1348533630371094, 2.791903495788574, 4.448953628540039, 6.106003761291504, 7.763053894042969, 9.420104026794434, 11.077154159545898, 12.734204292297363, 14.391254425048828, 16.04830551147461, 17.705354690551758, 19.362403869628906, 21.019454956054688, 22.67650604248047, 24.33355712890625, 25.99060821533203, 27.64765739440918, 29.304706573486328, 30.96175765991211, 32.61880874633789, 34.275856018066406, 35.93290710449219, 37.58995819091797, 39.24700927734375, 40.90406036376953, 42.56110763549805, 44.21815872192383, 45.87520980834961, 47.532257080078125, 49.189308166503906, 50.84635925292969, 52.50341033935547, 54.16046142578125, 55.817508697509766, 57.47455978393555, 59.13161087036133, 60.788658142089844, 62.445709228515625, 64.1027603149414, 65.75981140136719, 67.41686248779297, 69.07391357421875, 70.73095703125, 72.38800811767578, 74.04505920410156, 75.70211029052734, 77.35916137695312]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1.0, 2.0, 7.0, 9.0, 5.0, 5.0, 9.0, 11.0, 13.0, 13.0, 23.0, 26.0, 20.0, 21.0, 23.0, 31.0, 37.0, 32.0, 35.0, 36.0, 42.0, 40.0, 38.0, 54.0, 34.0, 50.0, 30.0, 37.0, 37.0, 31.0, 24.0, 28.0, 24.0, 35.0, 13.0, 21.0, 19.0, 18.0, 13.0, 8.0, 19.0, 5.0, 8.0, 8.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-43.9974365234375, -42.66325759887695, -41.329078674316406, -39.994895935058594, -38.66071701049805, -37.3265380859375, -35.99235916137695, -34.658180236816406, -33.323997497558594, -31.989818572998047, -30.655637741088867, -29.32145881652832, -27.98727798461914, -26.653099060058594, -25.318920135498047, -23.9847412109375, -22.650562286376953, -21.316383361816406, -19.982202529907227, -18.64802360534668, -17.3138427734375, -15.979663848876953, -14.645484924316406, -13.311305046081543, -11.97712516784668, -10.642945289611816, -9.308765411376953, -7.974586486816406, -6.640406608581543, -5.30622673034668, -3.972047805786133, -2.6378679275512695, -1.3036880493164062, 0.03049159049987793, 1.364671230316162, 2.698850631713867, 4.0330305099487305, 5.367210388183594, 6.701389312744141, 8.035569190979004, 9.369749069213867, 10.70392894744873, 12.038108825683594, 13.37228775024414, 14.706467628479004, 16.040647506713867, 17.374826431274414, 18.709007263183594, 20.04318618774414, 21.377365112304688, 22.711545944213867, 24.045724868774414, 25.379905700683594, 26.71408462524414, 28.048263549804688, 29.382442474365234, 30.716623306274414, 32.050804138183594, 33.38498306274414, 34.71916198730469, 36.053340911865234, 37.38751983642578, 38.721702575683594, 40.05588150024414, 41.39006042480469]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 4.0, 9.0, 4.0, 12.0, 18.0, 17.0, 18.0, 16.0, 26.0, 23.0, 22.0, 27.0, 21.0, 29.0, 45.0, 46.0, 37.0, 31.0, 49.0, 40.0, 32.0, 39.0, 31.0, 48.0, 37.0, 33.0, 39.0, 34.0, 29.0, 20.0, 15.0, 25.0, 14.0, 18.0, 14.0, 11.0, 5.0, 15.0, 12.0, 6.0, 3.0, 6.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0], "bins": [-7.87109375, -7.6510009765625, -7.430908203125, -7.2108154296875, -6.99072265625, -6.7706298828125, -6.550537109375, -6.3304443359375, -6.1103515625, -5.8902587890625, -5.670166015625, -5.4500732421875, -5.22998046875, -5.0098876953125, -4.789794921875, -4.5697021484375, -4.349609375, -4.1295166015625, -3.909423828125, -3.6893310546875, -3.46923828125, -3.2491455078125, -3.029052734375, -2.8089599609375, -2.5888671875, -2.3687744140625, -2.148681640625, -1.9285888671875, -1.70849609375, -1.4884033203125, -1.268310546875, -1.0482177734375, -0.828125, -0.6080322265625, -0.387939453125, -0.1678466796875, 0.05224609375, 0.2723388671875, 0.492431640625, 0.7125244140625, 0.9326171875, 1.1527099609375, 1.372802734375, 1.5928955078125, 1.81298828125, 2.0330810546875, 2.253173828125, 2.4732666015625, 2.693359375, 2.9134521484375, 3.133544921875, 3.3536376953125, 3.57373046875, 3.7938232421875, 4.013916015625, 4.2340087890625, 4.4541015625, 4.6741943359375, 4.894287109375, 5.1143798828125, 5.33447265625, 5.5545654296875, 5.774658203125, 5.9947509765625, 6.21484375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 2.0, 4.0, 5.0, 11.0, 14.0, 18.0, 28.0, 47.0, 70.0, 103.0, 178.0, 237.0, 377.0, 583.0, 920.0, 1464.0, 2268.0, 3516.0, 5710.0, 9024.0, 14905.0, 25265.0, 44085.0, 85910.0, 195849.0, 322873.0, 163084.0, 74325.0, 39176.0, 22462.0, 13675.0, 8219.0, 5235.0, 3196.0, 2037.0, 1250.0, 866.0, 523.0, 346.0, 224.0, 152.0, 114.0, 64.0, 48.0, 26.0, 25.0, 18.0, 10.0, 7.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.251220703125, -0.24237442016601562, -0.23352813720703125, -0.22468185424804688, -0.2158355712890625, -0.20698928833007812, -0.19814300537109375, -0.18929672241210938, -0.180450439453125, -0.17160415649414062, -0.16275787353515625, -0.15391159057617188, -0.1450653076171875, -0.13621902465820312, -0.12737274169921875, -0.11852645874023438, -0.10968017578125, -0.10083389282226562, -0.09198760986328125, -0.08314132690429688, -0.0742950439453125, -0.06544876098632812, -0.05660247802734375, -0.047756195068359375, -0.038909912109375, -0.030063629150390625, -0.02121734619140625, -0.012371063232421875, -0.0035247802734375, 0.005321502685546875, 0.01416778564453125, 0.023014068603515625, 0.0318603515625, 0.040706634521484375, 0.04955291748046875, 0.058399200439453125, 0.0672454833984375, 0.07609176635742188, 0.08493804931640625, 0.09378433227539062, 0.102630615234375, 0.11147689819335938, 0.12032318115234375, 0.12916946411132812, 0.1380157470703125, 0.14686203002929688, 0.15570831298828125, 0.16455459594726562, 0.17340087890625, 0.18224716186523438, 0.19109344482421875, 0.19993972778320312, 0.2087860107421875, 0.21763229370117188, 0.22647857666015625, 0.23532485961914062, 0.244171142578125, 0.2530174255371094, 0.26186370849609375, 0.2707099914550781, 0.2795562744140625, 0.2884025573730469, 0.29724884033203125, 0.3060951232910156, 0.31494140625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 3.0, 8.0, 8.0, 11.0, 13.0, 12.0, 14.0, 15.0, 22.0, 25.0, 30.0, 28.0, 32.0, 34.0, 36.0, 30.0, 36.0, 33.0, 34.0, 45.0, 1065.0, 41.0, 36.0, 33.0, 35.0, 39.0, 40.0, 27.0, 28.0, 34.0, 28.0, 23.0, 17.0, 18.0, 20.0, 10.0, 16.0, 6.0, 6.0, 6.0, 8.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9296875, -4.7691650390625, -4.608642578125, -4.4481201171875, -4.28759765625, -4.1270751953125, -3.966552734375, -3.8060302734375, -3.6455078125, -3.4849853515625, -3.324462890625, -3.1639404296875, -3.00341796875, -2.8428955078125, -2.682373046875, -2.5218505859375, -2.361328125, -2.2008056640625, -2.040283203125, -1.8797607421875, -1.71923828125, -1.5587158203125, -1.398193359375, -1.2376708984375, -1.0771484375, -0.9166259765625, -0.756103515625, -0.5955810546875, -0.43505859375, -0.2745361328125, -0.114013671875, 0.0465087890625, 0.20703125, 0.3675537109375, 0.528076171875, 0.6885986328125, 0.84912109375, 1.0096435546875, 1.170166015625, 1.3306884765625, 1.4912109375, 1.6517333984375, 1.812255859375, 1.9727783203125, 2.13330078125, 2.2938232421875, 2.454345703125, 2.6148681640625, 2.775390625, 2.9359130859375, 3.096435546875, 3.2569580078125, 3.41748046875, 3.5780029296875, 3.738525390625, 3.8990478515625, 4.0595703125, 4.2200927734375, 4.380615234375, 4.5411376953125, 4.70166015625, 4.8621826171875, 5.022705078125, 5.1832275390625, 5.34375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 11.0, 13.0, 18.0, 34.0, 58.0, 79.0, 131.0, 212.0, 300.0, 443.0, 707.0, 1067.0, 1638.0, 2648.0, 4129.0, 6581.0, 10825.0, 17460.0, 28806.0, 48697.0, 86936.0, 178170.0, 1339075.0, 167540.0, 82809.0, 46827.0, 27644.0, 16779.0, 10061.0, 6320.0, 4050.0, 2481.0, 1617.0, 1029.0, 687.0, 427.0, 271.0, 200.0, 118.0, 71.0, 55.0, 41.0, 23.0, 15.0, 6.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1739501953125, -0.16823959350585938, -0.16252899169921875, -0.15681838989257812, -0.1511077880859375, -0.14539718627929688, -0.13968658447265625, -0.13397598266601562, -0.128265380859375, -0.12255477905273438, -0.11684417724609375, -0.11113357543945312, -0.1054229736328125, -0.09971237182617188, -0.09400177001953125, -0.08829116821289062, -0.08258056640625, -0.07686996459960938, -0.07115936279296875, -0.06544876098632812, -0.0597381591796875, -0.054027557373046875, -0.04831695556640625, -0.042606353759765625, -0.036895751953125, -0.031185150146484375, -0.02547454833984375, -0.019763946533203125, -0.0140533447265625, -0.008342742919921875, -0.00263214111328125, 0.003078460693359375, 0.0087890625, 0.014499664306640625, 0.02021026611328125, 0.025920867919921875, 0.0316314697265625, 0.037342071533203125, 0.04305267333984375, 0.048763275146484375, 0.054473876953125, 0.060184478759765625, 0.06589508056640625, 0.07160568237304688, 0.0773162841796875, 0.08302688598632812, 0.08873748779296875, 0.09444808959960938, 0.10015869140625, 0.10586929321289062, 0.11157989501953125, 0.11729049682617188, 0.1230010986328125, 0.12871170043945312, 0.13442230224609375, 0.14013290405273438, 0.145843505859375, 0.15155410766601562, 0.15726470947265625, 0.16297531127929688, 0.1686859130859375, 0.17439651489257812, 0.18010711669921875, 0.18581771850585938, 0.1915283203125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 8.0, 11.0, 9.0, 12.0, 19.0, 10.0, 21.0, 12.0, 32.0, 31.0, 31.0, 25.0, 39.0, 44.0, 39.0, 47.0, 56.0, 49.0, 57.0, 40.0, 40.0, 39.0, 44.0, 34.0, 28.0, 33.0, 19.0, 25.0, 28.0, 19.0, 17.0, 17.0, 11.0, 11.0, 11.0, 11.0, 3.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-7.027387619018555e-05, -6.82976096868515e-05, -6.632134318351746e-05, -6.434507668018341e-05, -6.236881017684937e-05, -6.039254367351532e-05, -5.8416277170181274e-05, -5.644001066684723e-05, -5.4463744163513184e-05, -5.248747766017914e-05, -5.051121115684509e-05, -4.853494465351105e-05, -4.6558678150177e-05, -4.4582411646842957e-05, -4.260614514350891e-05, -4.0629878640174866e-05, -3.865361213684082e-05, -3.6677345633506775e-05, -3.470107913017273e-05, -3.2724812626838684e-05, -3.074854612350464e-05, -2.8772279620170593e-05, -2.6796013116836548e-05, -2.4819746613502502e-05, -2.2843480110168457e-05, -2.086721360683441e-05, -1.8890947103500366e-05, -1.691468060016632e-05, -1.4938414096832275e-05, -1.296214759349823e-05, -1.0985881090164185e-05, -9.00961458683014e-06, -7.033348083496094e-06, -5.057081580162048e-06, -3.080815076828003e-06, -1.1045485734939575e-06, 8.717179298400879e-07, 2.8479844331741333e-06, 4.824250936508179e-06, 6.800517439842224e-06, 8.77678394317627e-06, 1.0753050446510315e-05, 1.272931694984436e-05, 1.4705583453178406e-05, 1.668184995651245e-05, 1.8658116459846497e-05, 2.0634382963180542e-05, 2.2610649466514587e-05, 2.4586915969848633e-05, 2.6563182473182678e-05, 2.8539448976516724e-05, 3.051571547985077e-05, 3.2491981983184814e-05, 3.446824848651886e-05, 3.6444514989852905e-05, 3.842078149318695e-05, 4.0397047996520996e-05, 4.237331449985504e-05, 4.434958100318909e-05, 4.632584750652313e-05, 4.830211400985718e-05, 5.027838051319122e-05, 5.225464701652527e-05, 5.4230913519859314e-05, 5.620718002319336e-05]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 6.0, 6.0, 9.0, 10.0, 12.0, 18.0, 19.0, 17.0, 31.0, 28.0, 36.0, 44.0, 71.0, 108.0, 180.0, 361.0, 1071.0, 46895.0, 974337.0, 23466.0, 877.0, 293.0, 192.0, 117.0, 72.0, 48.0, 40.0, 40.0, 26.0, 27.0, 12.0, 12.0, 18.0, 7.0, 8.0, 16.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013151168823242188, -0.0012704432010650635, -0.0012257695198059082, -0.001181095838546753, -0.0011364221572875977, -0.0010917484760284424, -0.0010470747947692871, -0.0010024011135101318, -0.0009577274322509766, -0.0009130537509918213, -0.000868380069732666, -0.0008237063884735107, -0.0007790327072143555, -0.0007343590259552002, -0.0006896853446960449, -0.0006450116634368896, -0.0006003379821777344, -0.0005556643009185791, -0.0005109906196594238, -0.00046631693840026855, -0.0004216432571411133, -0.000376969575881958, -0.00033229589462280273, -0.00028762221336364746, -0.0002429485321044922, -0.00019827485084533691, -0.00015360116958618164, -0.00010892748832702637, -6.42538070678711e-05, -1.958012580871582e-05, 2.5093555450439453e-05, 6.976723670959473e-05, 0.00011444091796875, 0.00015911459922790527, 0.00020378828048706055, 0.0002484619617462158, 0.0002931356430053711, 0.00033780932426452637, 0.00038248300552368164, 0.0004271566867828369, 0.0004718303680419922, 0.0005165040493011475, 0.0005611777305603027, 0.000605851411819458, 0.0006505250930786133, 0.0006951987743377686, 0.0007398724555969238, 0.0007845461368560791, 0.0008292198181152344, 0.0008738934993743896, 0.0009185671806335449, 0.0009632408618927002, 0.0010079145431518555, 0.0010525882244110107, 0.001097261905670166, 0.0011419355869293213, 0.0011866092681884766, 0.0012312829494476318, 0.0012759566307067871, 0.0013206303119659424, 0.0013653039932250977, 0.001409977674484253, 0.0014546513557434082, 0.0014993250370025635, 0.0015439987182617188]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 10.0, 38.0, 120.0, 298.0, 321.0, 156.0, 47.0, 11.0, 10.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.975300569436513e-05, -3.3293083106400445e-05, -2.683316051843576e-05, -2.0373237930471078e-05, -1.3913315342506394e-05, -7.45339275454171e-06, -9.934701665770262e-07, 5.4664524213876575e-06, 1.1926375009352341e-05, 1.8386297597317025e-05, 2.484622018528171e-05, 3.130614277324639e-05, 3.7766065361211076e-05, 4.422598794917576e-05, 5.0685910537140444e-05, 5.714583312510513e-05, 6.3605752075091e-05, 7.006567466305569e-05, 7.652559725102037e-05, 8.298551983898506e-05, 8.944544242694974e-05, 9.590536501491442e-05, 0.00010236528760287911, 0.00010882521019084379, 0.00011528513277880847, 0.00012174505536677316, 0.00012820497795473784, 0.00013466490781866014, 0.0001411248231306672, 0.00014758473844267428, 0.00015404466830659658, 0.00016050459817051888, 0.00016696451348252594, 0.00017342442879453301, 0.0001798843586584553, 0.0001863442885223776, 0.00019280420383438468, 0.00019926411914639175, 0.00020572404901031405, 0.00021218397887423635, 0.00021864389418624341, 0.00022510380949825048, 0.00023156373936217278, 0.00023802366922609508, 0.00024448358453810215, 0.0002509434998501092, 0.0002574034151621163, 0.0002638633595779538, 0.0002703232748899609, 0.00027678319020196795, 0.0002832431346178055, 0.00028970304992981255, 0.0002961629652418196, 0.0003026228805538267, 0.00030908279586583376, 0.0003155427402816713, 0.00032200265559367836, 0.0003284625709056854, 0.00033492251532152295, 0.00034138243063353, 0.0003478423459455371, 0.00035430226125754416, 0.00036076217656955123, 0.00036722212098538876, 0.0003736820362973958]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 7.0, 7.0, 3.0, 7.0, 4.0, 6.0, 7.0, 11.0, 6.0, 14.0, 19.0, 22.0, 14.0, 21.0, 24.0, 26.0, 32.0, 27.0, 24.0, 32.0, 36.0, 38.0, 37.0, 24.0, 39.0, 41.0, 35.0, 34.0, 32.0, 21.0, 29.0, 32.0, 27.0, 26.0, 19.0, 24.0, 34.0, 27.0, 20.0, 11.0, 13.0, 13.0, 15.0, 11.0, 12.0, 10.0, 10.0, 3.0, 6.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1948089599609375e-05, -3.0836090445518494e-05, -2.9724091291427612e-05, -2.861209213733673e-05, -2.750009298324585e-05, -2.6388093829154968e-05, -2.5276094675064087e-05, -2.4164095520973206e-05, -2.3052096366882324e-05, -2.1940097212791443e-05, -2.082809805870056e-05, -1.971609890460968e-05, -1.86040997505188e-05, -1.7492100596427917e-05, -1.6380101442337036e-05, -1.5268102288246155e-05, -1.4156103134155273e-05, -1.3044103980064392e-05, -1.193210482597351e-05, -1.082010567188263e-05, -9.708106517791748e-06, -8.596107363700867e-06, -7.484108209609985e-06, -6.372109055519104e-06, -5.260109901428223e-06, -4.148110747337341e-06, -3.03611159324646e-06, -1.9241124391555786e-06, -8.121132850646973e-07, 2.998858690261841e-07, 1.4118850231170654e-06, 2.5238841772079468e-06, 3.635883331298828e-06, 4.7478824853897095e-06, 5.859881639480591e-06, 6.971880793571472e-06, 8.083879947662354e-06, 9.195879101753235e-06, 1.0307878255844116e-05, 1.1419877409934998e-05, 1.2531876564025879e-05, 1.364387571811676e-05, 1.4755874872207642e-05, 1.5867874026298523e-05, 1.6979873180389404e-05, 1.8091872334480286e-05, 1.9203871488571167e-05, 2.031587064266205e-05, 2.142786979675293e-05, 2.253986895084381e-05, 2.3651868104934692e-05, 2.4763867259025574e-05, 2.5875866413116455e-05, 2.6987865567207336e-05, 2.8099864721298218e-05, 2.92118638753891e-05, 3.032386302947998e-05, 3.143586218357086e-05, 3.254786133766174e-05, 3.3659860491752625e-05, 3.4771859645843506e-05, 3.588385879993439e-05, 3.699585795402527e-05, 3.810785710811615e-05, 3.921985626220703e-05]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 4.0, 9.0, 4.0, 12.0, 18.0, 17.0, 18.0, 16.0, 26.0, 23.0, 22.0, 27.0, 21.0, 29.0, 45.0, 46.0, 37.0, 31.0, 49.0, 40.0, 32.0, 39.0, 31.0, 48.0, 37.0, 33.0, 39.0, 34.0, 29.0, 20.0, 15.0, 25.0, 14.0, 18.0, 14.0, 11.0, 5.0, 15.0, 12.0, 6.0, 3.0, 6.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0], "bins": [-7.87109375, -7.6510009765625, -7.430908203125, -7.2108154296875, -6.99072265625, -6.7706298828125, -6.550537109375, -6.3304443359375, -6.1103515625, -5.8902587890625, -5.670166015625, -5.4500732421875, -5.22998046875, -5.0098876953125, -4.789794921875, -4.5697021484375, -4.349609375, -4.1295166015625, -3.909423828125, -3.6893310546875, -3.46923828125, -3.2491455078125, -3.029052734375, -2.8089599609375, -2.5888671875, -2.3687744140625, -2.148681640625, -1.9285888671875, -1.70849609375, -1.4884033203125, -1.268310546875, -1.0482177734375, -0.828125, -0.6080322265625, -0.387939453125, -0.1678466796875, 0.05224609375, 0.2723388671875, 0.492431640625, 0.7125244140625, 0.9326171875, 1.1527099609375, 1.372802734375, 1.5928955078125, 1.81298828125, 2.0330810546875, 2.253173828125, 2.4732666015625, 2.693359375, 2.9134521484375, 3.133544921875, 3.3536376953125, 3.57373046875, 3.7938232421875, 4.013916015625, 4.2340087890625, 4.4541015625, 4.6741943359375, 4.894287109375, 5.1143798828125, 5.33447265625, 5.5545654296875, 5.774658203125, 5.9947509765625, 6.21484375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 10.0, 22.0, 16.0, 37.0, 48.0, 72.0, 109.0, 154.0, 218.0, 374.0, 550.0, 827.0, 1227.0, 2037.0, 3353.0, 5429.0, 9182.0, 14835.0, 24523.0, 40723.0, 71037.0, 136257.0, 279249.0, 215459.0, 102574.0, 56007.0, 32868.0, 19626.0, 12125.0, 7376.0, 4507.0, 2882.0, 1733.0, 1081.0, 671.0, 394.0, 306.0, 186.0, 124.0, 102.0, 67.0, 37.0, 38.0, 21.0, 25.0, 14.0, 9.0, 5.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0], "bins": [-9.671875, -9.376953125, -9.08203125, -8.787109375, -8.4921875, -8.197265625, -7.90234375, -7.607421875, -7.3125, -7.017578125, -6.72265625, -6.427734375, -6.1328125, -5.837890625, -5.54296875, -5.248046875, -4.953125, -4.658203125, -4.36328125, -4.068359375, -3.7734375, -3.478515625, -3.18359375, -2.888671875, -2.59375, -2.298828125, -2.00390625, -1.708984375, -1.4140625, -1.119140625, -0.82421875, -0.529296875, -0.234375, 0.060546875, 0.35546875, 0.650390625, 0.9453125, 1.240234375, 1.53515625, 1.830078125, 2.125, 2.419921875, 2.71484375, 3.009765625, 3.3046875, 3.599609375, 3.89453125, 4.189453125, 4.484375, 4.779296875, 5.07421875, 5.369140625, 5.6640625, 5.958984375, 6.25390625, 6.548828125, 6.84375, 7.138671875, 7.43359375, 7.728515625, 8.0234375, 8.318359375, 8.61328125, 8.908203125, 9.203125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 0.0, 5.0, 6.0, 7.0, 8.0, 11.0, 15.0, 9.0, 14.0, 21.0, 26.0, 30.0, 20.0, 34.0, 37.0, 45.0, 61.0, 50.0, 62.0, 81.0, 153.0, 190.0, 1278.0, 200.0, 133.0, 98.0, 71.0, 64.0, 48.0, 38.0, 35.0, 29.0, 18.0, 28.0, 20.0, 20.0, 11.0, 12.0, 13.0, 13.0, 4.0, 8.0, 7.0, 7.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-18.453125, -17.903564453125, -17.35400390625, -16.804443359375, -16.2548828125, -15.705322265625, -15.15576171875, -14.606201171875, -14.056640625, -13.507080078125, -12.95751953125, -12.407958984375, -11.8583984375, -11.308837890625, -10.75927734375, -10.209716796875, -9.66015625, -9.110595703125, -8.56103515625, -8.011474609375, -7.4619140625, -6.912353515625, -6.36279296875, -5.813232421875, -5.263671875, -4.714111328125, -4.16455078125, -3.614990234375, -3.0654296875, -2.515869140625, -1.96630859375, -1.416748046875, -0.8671875, -0.317626953125, 0.23193359375, 0.781494140625, 1.3310546875, 1.880615234375, 2.43017578125, 2.979736328125, 3.529296875, 4.078857421875, 4.62841796875, 5.177978515625, 5.7275390625, 6.277099609375, 6.82666015625, 7.376220703125, 7.92578125, 8.475341796875, 9.02490234375, 9.574462890625, 10.1240234375, 10.673583984375, 11.22314453125, 11.772705078125, 12.322265625, 12.871826171875, 13.42138671875, 13.970947265625, 14.5205078125, 15.070068359375, 15.61962890625, 16.169189453125, 16.71875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 5.0, 6.0, 5.0, 18.0, 15.0, 13.0, 25.0, 15.0, 36.0, 37.0, 68.0, 85.0, 167.0, 283.0, 585.0, 1369.0, 3808.0, 11319.0, 37795.0, 165770.0, 1550133.0, 1182805.0, 141472.0, 33537.0, 10238.0, 3469.0, 1270.0, 547.0, 282.0, 168.0, 109.0, 60.0, 45.0, 26.0, 32.0, 14.0, 15.0, 9.0, 10.0, 9.0, 5.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.671875, -19.01513671875, -18.3583984375, -17.70166015625, -17.044921875, -16.38818359375, -15.7314453125, -15.07470703125, -14.41796875, -13.76123046875, -13.1044921875, -12.44775390625, -11.791015625, -11.13427734375, -10.4775390625, -9.82080078125, -9.1640625, -8.50732421875, -7.8505859375, -7.19384765625, -6.537109375, -5.88037109375, -5.2236328125, -4.56689453125, -3.91015625, -3.25341796875, -2.5966796875, -1.93994140625, -1.283203125, -0.62646484375, 0.0302734375, 0.68701171875, 1.34375, 2.00048828125, 2.6572265625, 3.31396484375, 3.970703125, 4.62744140625, 5.2841796875, 5.94091796875, 6.59765625, 7.25439453125, 7.9111328125, 8.56787109375, 9.224609375, 9.88134765625, 10.5380859375, 11.19482421875, 11.8515625, 12.50830078125, 13.1650390625, 13.82177734375, 14.478515625, 15.13525390625, 15.7919921875, 16.44873046875, 17.10546875, 17.76220703125, 18.4189453125, 19.07568359375, 19.732421875, 20.38916015625, 21.0458984375, 21.70263671875, 22.359375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [2.0, 14.0, 57.0, 151.0, 270.0, 319.0, 129.0, 51.0, 13.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.686716079711914, -22.20356559753418, -16.720415115356445, -11.237264633178711, -5.754114151000977, -0.2709636688232422, 5.212186813354492, 10.695337295532227, 16.17848777770996, 21.661638259887695, 27.14478874206543, 32.62793731689453, 38.11109161376953, 43.59423828125, 49.077392578125, 54.56053924560547, 60.04369354248047, 65.52684020996094, 71.00999450683594, 76.49314880371094, 81.9762954711914, 87.45944213867188, 92.94259643554688, 98.42575073242188, 103.90889739990234, 109.39204406738281, 114.87519836425781, 120.35835266113281, 125.84149932861328, 131.32464599609375, 136.80780029296875, 142.29095458984375, 147.77410888671875, 153.25726318359375, 158.74041748046875, 164.2235565185547, 169.7067108154297, 175.1898651123047, 180.67300415039062, 186.15615844726562, 191.63931274414062, 197.12246704101562, 202.60562133789062, 208.08876037597656, 213.57191467285156, 219.05506896972656, 224.5382080078125, 230.0213623046875, 235.5045166015625, 240.9876708984375, 246.4708251953125, 251.95396423339844, 257.4371337890625, 262.9202575683594, 268.4034118652344, 273.8865661621094, 279.3697204589844, 284.8528747558594, 290.3360290527344, 295.8191833496094, 301.30230712890625, 306.78546142578125, 312.26861572265625, 317.75177001953125, 323.23492431640625]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 1.0, 4.0, 3.0, 2.0, 6.0, 13.0, 11.0, 14.0, 22.0, 18.0, 17.0, 25.0, 21.0, 37.0, 36.0, 40.0, 39.0, 22.0, 44.0, 48.0, 33.0, 41.0, 33.0, 37.0, 37.0, 44.0, 39.0, 32.0, 34.0, 32.0, 35.0, 29.0, 22.0, 21.0, 19.0, 17.0, 12.0, 12.0, 10.0, 4.0, 9.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.54527282714844, -43.94932556152344, -42.35337829589844, -40.75743103027344, -39.16148376464844, -37.56553268432617, -35.96958541870117, -34.37363815307617, -32.77769088745117, -31.181743621826172, -29.585796356201172, -27.98984718322754, -26.39389991760254, -24.79795265197754, -23.202003479003906, -21.606056213378906, -20.010108947753906, -18.414161682128906, -16.818214416503906, -15.222265243530273, -13.626317977905273, -12.030370712280273, -10.434422492980957, -8.83847427368164, -7.242527008056641, -5.646579265594482, -4.050631523132324, -2.454683780670166, -0.8587360382080078, 0.7372117042541504, 2.3331594467163086, 3.929107666015625, 5.525054931640625, 7.121002674102783, 8.716950416564941, 10.312898635864258, 11.908845901489258, 13.504793167114258, 15.100741386413574, 16.69668960571289, 18.29263687133789, 19.88858413696289, 21.48453140258789, 23.080480575561523, 24.676427841186523, 26.272375106811523, 27.868324279785156, 29.464271545410156, 31.060218811035156, 32.656166076660156, 34.252113342285156, 35.848060607910156, 37.444007873535156, 39.03995895385742, 40.63590621948242, 42.23185348510742, 43.82780075073242, 45.42374801635742, 47.01969528198242, 48.61564254760742, 50.21159362792969, 51.80754089355469, 53.40348815917969, 54.99943542480469, 56.59538269042969]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 7.0, 8.0, 6.0, 6.0, 11.0, 17.0, 19.0, 17.0, 20.0, 23.0, 29.0, 32.0, 36.0, 34.0, 35.0, 46.0, 48.0, 42.0, 38.0, 52.0, 46.0, 43.0, 49.0, 30.0, 32.0, 40.0, 37.0, 30.0, 20.0, 23.0, 18.0, 14.0, 14.0, 12.0, 16.0, 12.0, 6.0, 11.0, 9.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.453125, -8.1912841796875, -7.929443359375, -7.6676025390625, -7.40576171875, -7.1439208984375, -6.882080078125, -6.6202392578125, -6.3583984375, -6.0965576171875, -5.834716796875, -5.5728759765625, -5.31103515625, -5.0491943359375, -4.787353515625, -4.5255126953125, -4.263671875, -4.0018310546875, -3.739990234375, -3.4781494140625, -3.21630859375, -2.9544677734375, -2.692626953125, -2.4307861328125, -2.1689453125, -1.9071044921875, -1.645263671875, -1.3834228515625, -1.12158203125, -0.8597412109375, -0.597900390625, -0.3360595703125, -0.07421875, 0.1876220703125, 0.449462890625, 0.7113037109375, 0.97314453125, 1.2349853515625, 1.496826171875, 1.7586669921875, 2.0205078125, 2.2823486328125, 2.544189453125, 2.8060302734375, 3.06787109375, 3.3297119140625, 3.591552734375, 3.8533935546875, 4.115234375, 4.3770751953125, 4.638916015625, 4.9007568359375, 5.16259765625, 5.4244384765625, 5.686279296875, 5.9481201171875, 6.2099609375, 6.4718017578125, 6.733642578125, 6.9954833984375, 7.25732421875, 7.5191650390625, 7.781005859375, 8.0428466796875, 8.3046875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 4.0, 8.0, 3.0, 13.0, 6.0, 13.0, 22.0, 26.0, 25.0, 28.0, 31.0, 37.0, 67.0, 75.0, 89.0, 137.0, 207.0, 276.0, 474.0, 2628.0, 217296.0, 3959431.0, 11344.0, 784.0, 329.0, 242.0, 174.0, 98.0, 75.0, 79.0, 45.0, 40.0, 24.0, 26.0, 27.0, 25.0, 10.0, 18.0, 10.0, 3.0, 6.0, 7.0, 8.0, 2.0, 7.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.5625, -83.4951171875, -80.427734375, -77.3603515625, -74.29296875, -71.2255859375, -68.158203125, -65.0908203125, -62.0234375, -58.9560546875, -55.888671875, -52.8212890625, -49.75390625, -46.6865234375, -43.619140625, -40.5517578125, -37.484375, -34.4169921875, -31.349609375, -28.2822265625, -25.21484375, -22.1474609375, -19.080078125, -16.0126953125, -12.9453125, -9.8779296875, -6.810546875, -3.7431640625, -0.67578125, 2.3916015625, 5.458984375, 8.5263671875, 11.59375, 14.6611328125, 17.728515625, 20.7958984375, 23.86328125, 26.9306640625, 29.998046875, 33.0654296875, 36.1328125, 39.2001953125, 42.267578125, 45.3349609375, 48.40234375, 51.4697265625, 54.537109375, 57.6044921875, 60.671875, 63.7392578125, 66.806640625, 69.8740234375, 72.94140625, 76.0087890625, 79.076171875, 82.1435546875, 85.2109375, 88.2783203125, 91.345703125, 94.4130859375, 97.48046875, 100.5478515625, 103.615234375, 106.6826171875, 109.75]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 9.0, 6.0, 13.0, 23.0, 34.0, 43.0, 82.0, 107.0, 161.0, 277.0, 631.0, 1131.0, 626.0, 340.0, 187.0, 122.0, 69.0, 61.0, 45.0, 22.0, 33.0, 24.0, 13.0, 3.0, 2.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9375, -13.34423828125, -12.7509765625, -12.15771484375, -11.564453125, -10.97119140625, -10.3779296875, -9.78466796875, -9.19140625, -8.59814453125, -8.0048828125, -7.41162109375, -6.818359375, -6.22509765625, -5.6318359375, -5.03857421875, -4.4453125, -3.85205078125, -3.2587890625, -2.66552734375, -2.072265625, -1.47900390625, -0.8857421875, -0.29248046875, 0.30078125, 0.89404296875, 1.4873046875, 2.08056640625, 2.673828125, 3.26708984375, 3.8603515625, 4.45361328125, 5.046875, 5.64013671875, 6.2333984375, 6.82666015625, 7.419921875, 8.01318359375, 8.6064453125, 9.19970703125, 9.79296875, 10.38623046875, 10.9794921875, 11.57275390625, 12.166015625, 12.75927734375, 13.3525390625, 13.94580078125, 14.5390625, 15.13232421875, 15.7255859375, 16.31884765625, 16.912109375, 17.50537109375, 18.0986328125, 18.69189453125, 19.28515625, 19.87841796875, 20.4716796875, 21.06494140625, 21.658203125, 22.25146484375, 22.8447265625, 23.43798828125, 24.03125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 12.0, 18.0, 20.0, 26.0, 44.0, 81.0, 120.0, 230.0, 491.0, 1931.0, 15550.0, 304799.0, 3738065.0, 122020.0, 8756.0, 1311.0, 401.0, 157.0, 74.0, 44.0, 35.0, 25.0, 20.0, 13.0, 11.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-63.96875, -62.34375, -60.71875, -59.09375, -57.46875, -55.84375, -54.21875, -52.59375, -50.96875, -49.34375, -47.71875, -46.09375, -44.46875, -42.84375, -41.21875, -39.59375, -37.96875, -36.34375, -34.71875, -33.09375, -31.46875, -29.84375, -28.21875, -26.59375, -24.96875, -23.34375, -21.71875, -20.09375, -18.46875, -16.84375, -15.21875, -13.59375, -11.96875, -10.34375, -8.71875, -7.09375, -5.46875, -3.84375, -2.21875, -0.59375, 1.03125, 2.65625, 4.28125, 5.90625, 7.53125, 9.15625, 10.78125, 12.40625, 14.03125, 15.65625, 17.28125, 18.90625, 20.53125, 22.15625, 23.78125, 25.40625, 27.03125, 28.65625, 30.28125, 31.90625, 33.53125, 35.15625, 36.78125, 38.40625, 40.03125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 63.0, 391.0, 428.0, 115.0, 10.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-235.8079376220703, -224.05015563964844, -212.2923583984375, -200.53457641601562, -188.77679443359375, -177.01901245117188, -165.26123046875, -153.50343322753906, -141.7456512451172, -129.9878692626953, -118.2300796508789, -106.4722900390625, -94.71450805664062, -82.95672607421875, -71.19893646240234, -59.44114685058594, -47.68336486816406, -35.92557907104492, -24.16779327392578, -12.41000747680664, -0.6522216796875, 11.10556411743164, 22.86334991455078, 34.62113952636719, 46.37892150878906, 58.1367073059082, 69.89449310302734, 81.65228271484375, 93.41006469726562, 105.1678466796875, 116.9256362915039, 128.6834259033203, 140.44122314453125, 152.19900512695312, 163.956787109375, 175.71458435058594, 187.4723663330078, 199.2301483154297, 210.98794555664062, 222.7457275390625, 234.50350952148438, 246.26129150390625, 258.0190734863281, 269.77685546875, 281.53466796875, 293.2924499511719, 305.05023193359375, 316.8080139160156, 328.5657958984375, 340.3235778808594, 352.08135986328125, 363.8391418457031, 375.596923828125, 387.354736328125, 399.1125183105469, 410.87030029296875, 422.6280822753906, 434.3858642578125, 446.1436462402344, 457.90142822265625, 469.65924072265625, 481.4170227050781, 493.1748046875, 504.9325866699219, 516.6903686523438]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 4.0, 5.0, 8.0, 17.0, 16.0, 23.0, 15.0, 21.0, 20.0, 26.0, 23.0, 31.0, 34.0, 46.0, 40.0, 52.0, 45.0, 44.0, 50.0, 51.0, 52.0, 34.0, 42.0, 40.0, 28.0, 44.0, 29.0, 20.0, 24.0, 22.0, 16.0, 12.0, 23.0, 11.0, 10.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.05975341796875, -58.14244842529297, -56.22514343261719, -54.307838439941406, -52.390533447265625, -50.473228454589844, -48.5559196472168, -46.638614654541016, -44.721309661865234, -42.80400466918945, -40.88669967651367, -38.96939468383789, -37.052085876464844, -35.13478088378906, -33.21747589111328, -31.3001708984375, -29.38286590576172, -27.465560913085938, -25.548255920410156, -23.630949020385742, -21.71364402770996, -19.79633903503418, -17.879032135009766, -15.961727142333984, -14.044422149658203, -12.127117156982422, -10.209811210632324, -8.292505264282227, -6.375200271606445, -4.457895278930664, -2.5405893325805664, -0.6232833862304688, 1.2940254211425781, 3.2113308906555176, 5.128636360168457, 7.0459418296813965, 8.963247299194336, 10.880552291870117, 12.797858238220215, 14.715164184570312, 16.632469177246094, 18.549774169921875, 20.467079162597656, 22.38438606262207, 24.30169105529785, 26.218996047973633, 28.136302947998047, 30.053607940673828, 31.97091293334961, 33.88821792602539, 35.80552291870117, 37.72282791137695, 39.64013671875, 41.55744171142578, 43.47474670410156, 45.392051696777344, 47.309356689453125, 49.226661682128906, 51.14396667480469, 53.06127166748047, 54.97857666015625, 56.89588165283203, 58.81319046020508, 60.73049545288086, 62.64780044555664]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 10.0, 7.0, 4.0, 11.0, 23.0, 13.0, 16.0, 26.0, 18.0, 27.0, 35.0, 26.0, 36.0, 33.0, 28.0, 37.0, 45.0, 46.0, 40.0, 41.0, 44.0, 39.0, 38.0, 44.0, 34.0, 40.0, 37.0, 29.0, 19.0, 22.0, 15.0, 14.0, 19.0, 11.0, 12.0, 10.0, 9.0, 2.0, 6.0, 10.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-8.7265625, -8.47564697265625, -8.2247314453125, -7.97381591796875, -7.722900390625, -7.47198486328125, -7.2210693359375, -6.97015380859375, -6.71923828125, -6.46832275390625, -6.2174072265625, -5.96649169921875, -5.715576171875, -5.46466064453125, -5.2137451171875, -4.96282958984375, -4.7119140625, -4.46099853515625, -4.2100830078125, -3.95916748046875, -3.708251953125, -3.45733642578125, -3.2064208984375, -2.95550537109375, -2.70458984375, -2.45367431640625, -2.2027587890625, -1.95184326171875, -1.700927734375, -1.45001220703125, -1.1990966796875, -0.94818115234375, -0.697265625, -0.44635009765625, -0.1954345703125, 0.05548095703125, 0.306396484375, 0.55731201171875, 0.8082275390625, 1.05914306640625, 1.31005859375, 1.56097412109375, 1.8118896484375, 2.06280517578125, 2.313720703125, 2.56463623046875, 2.8155517578125, 3.06646728515625, 3.3173828125, 3.56829833984375, 3.8192138671875, 4.07012939453125, 4.321044921875, 4.57196044921875, 4.8228759765625, 5.07379150390625, 5.32470703125, 5.57562255859375, 5.8265380859375, 6.07745361328125, 6.328369140625, 6.57928466796875, 6.8302001953125, 7.08111572265625, 7.33203125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 8.0, 4.0, 18.0, 24.0, 43.0, 33.0, 60.0, 110.0, 117.0, 180.0, 244.0, 371.0, 487.0, 704.0, 953.0, 1406.0, 1966.0, 2841.0, 4048.0, 6003.0, 8869.0, 13263.0, 20760.0, 32380.0, 52109.0, 89495.0, 175147.0, 273393.0, 150118.0, 79626.0, 47219.0, 29158.0, 18684.0, 12243.0, 8169.0, 5659.0, 3836.0, 2648.0, 1783.0, 1263.0, 919.0, 643.0, 413.0, 327.0, 234.0, 172.0, 118.0, 78.0, 67.0, 37.0, 40.0, 23.0, 22.0, 9.0, 7.0, 3.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.2418212890625, -0.2335948944091797, -0.22536849975585938, -0.21714210510253906, -0.20891571044921875, -0.20068931579589844, -0.19246292114257812, -0.1842365264892578, -0.1760101318359375, -0.1677837371826172, -0.15955734252929688, -0.15133094787597656, -0.14310455322265625, -0.13487815856933594, -0.12665176391601562, -0.11842536926269531, -0.110198974609375, -0.10197257995605469, -0.09374618530273438, -0.08551979064941406, -0.07729339599609375, -0.06906700134277344, -0.060840606689453125, -0.05261421203613281, -0.0443878173828125, -0.03616142272949219, -0.027935028076171875, -0.019708633422851562, -0.01148223876953125, -0.0032558441162109375, 0.004970550537109375, 0.013196945190429688, 0.02142333984375, 0.029649734497070312, 0.037876129150390625, 0.04610252380371094, 0.05432891845703125, 0.06255531311035156, 0.07078170776367188, 0.07900810241699219, 0.0872344970703125, 0.09546089172363281, 0.10368728637695312, 0.11191368103027344, 0.12014007568359375, 0.12836647033691406, 0.13659286499023438, 0.1448192596435547, 0.153045654296875, 0.1612720489501953, 0.16949844360351562, 0.17772483825683594, 0.18595123291015625, 0.19417762756347656, 0.20240402221679688, 0.2106304168701172, 0.2188568115234375, 0.2270832061767578, 0.23530960083007812, 0.24353599548339844, 0.25176239013671875, 0.25998878479003906, 0.2682151794433594, 0.2764415740966797, 0.28466796875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 5.0, 5.0, 12.0, 11.0, 8.0, 10.0, 25.0, 19.0, 19.0, 24.0, 40.0, 37.0, 33.0, 39.0, 37.0, 34.0, 41.0, 38.0, 36.0, 1078.0, 26.0, 39.0, 42.0, 43.0, 33.0, 32.0, 31.0, 35.0, 25.0, 26.0, 19.0, 21.0, 17.0, 18.0, 12.0, 14.0, 8.0, 5.0, 6.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.34375, -6.14056396484375, -5.9373779296875, -5.73419189453125, -5.531005859375, -5.32781982421875, -5.1246337890625, -4.92144775390625, -4.71826171875, -4.51507568359375, -4.3118896484375, -4.10870361328125, -3.905517578125, -3.70233154296875, -3.4991455078125, -3.29595947265625, -3.0927734375, -2.88958740234375, -2.6864013671875, -2.48321533203125, -2.280029296875, -2.07684326171875, -1.8736572265625, -1.67047119140625, -1.46728515625, -1.26409912109375, -1.0609130859375, -0.85772705078125, -0.654541015625, -0.45135498046875, -0.2481689453125, -0.04498291015625, 0.158203125, 0.36138916015625, 0.5645751953125, 0.76776123046875, 0.970947265625, 1.17413330078125, 1.3773193359375, 1.58050537109375, 1.78369140625, 1.98687744140625, 2.1900634765625, 2.39324951171875, 2.596435546875, 2.79962158203125, 3.0028076171875, 3.20599365234375, 3.4091796875, 3.61236572265625, 3.8155517578125, 4.01873779296875, 4.221923828125, 4.42510986328125, 4.6282958984375, 4.83148193359375, 5.03466796875, 5.23785400390625, 5.4410400390625, 5.64422607421875, 5.847412109375, 6.05059814453125, 6.2537841796875, 6.45697021484375, 6.66015625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 11.0, 15.0, 32.0, 45.0, 50.0, 109.0, 142.0, 216.0, 337.0, 518.0, 819.0, 1241.0, 2074.0, 3126.0, 5058.0, 8264.0, 13488.0, 22867.0, 38750.0, 68336.0, 132265.0, 1332262.0, 225989.0, 103613.0, 55838.0, 32200.0, 19000.0, 11486.0, 7061.0, 4393.0, 2691.0, 1719.0, 1065.0, 701.0, 477.0, 293.0, 203.0, 130.0, 80.0, 67.0, 32.0, 23.0, 15.0, 9.0, 4.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.234375, -0.2272357940673828, -0.22009658813476562, -0.21295738220214844, -0.20581817626953125, -0.19867897033691406, -0.19153976440429688, -0.1844005584716797, -0.1772613525390625, -0.1701221466064453, -0.16298294067382812, -0.15584373474121094, -0.14870452880859375, -0.14156532287597656, -0.13442611694335938, -0.1272869110107422, -0.120147705078125, -0.11300849914550781, -0.10586929321289062, -0.09873008728027344, -0.09159088134765625, -0.08445167541503906, -0.07731246948242188, -0.07017326354980469, -0.0630340576171875, -0.05589485168457031, -0.048755645751953125, -0.04161643981933594, -0.03447723388671875, -0.027338027954101562, -0.020198822021484375, -0.013059616088867188, -0.00592041015625, 0.0012187957763671875, 0.008358001708984375, 0.015497207641601562, 0.02263641357421875, 0.029775619506835938, 0.036914825439453125, 0.04405403137207031, 0.0511932373046875, 0.05833244323730469, 0.06547164916992188, 0.07261085510253906, 0.07975006103515625, 0.08688926696777344, 0.09402847290039062, 0.10116767883300781, 0.108306884765625, 0.11544609069824219, 0.12258529663085938, 0.12972450256347656, 0.13686370849609375, 0.14400291442871094, 0.15114212036132812, 0.1582813262939453, 0.1654205322265625, 0.1725597381591797, 0.17969894409179688, 0.18683815002441406, 0.19397735595703125, 0.20111656188964844, 0.20825576782226562, 0.2153949737548828, 0.2225341796875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 11.0, 11.0, 12.0, 28.0, 25.0, 25.0, 47.0, 40.0, 46.0, 65.0, 74.0, 52.0, 63.0, 75.0, 64.0, 54.0, 60.0, 39.0, 49.0, 27.0, 28.0, 12.0, 20.0, 19.0, 14.0, 8.0, 5.0, 3.0, 2.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011748075485229492, -0.00011343415826559067, -0.00010938756167888641, -0.00010534096509218216, -0.0001012943685054779, -9.724777191877365e-05, -9.32011753320694e-05, -8.915457874536514e-05, -8.510798215866089e-05, -8.106138557195663e-05, -7.701478898525238e-05, -7.296819239854813e-05, -6.892159581184387e-05, -6.487499922513962e-05, -6.0828402638435364e-05, -5.678180605173111e-05, -5.2735209465026855e-05, -4.86886128783226e-05, -4.464201629161835e-05, -4.059541970491409e-05, -3.654882311820984e-05, -3.2502226531505585e-05, -2.845562994480133e-05, -2.4409033358097076e-05, -2.0362436771392822e-05, -1.6315840184688568e-05, -1.2269243597984314e-05, -8.22264701128006e-06, -4.176050424575806e-06, -1.2945383787155151e-07, 3.917142748832703e-06, 7.963739335536957e-06, 1.2010335922241211e-05, 1.6056932508945465e-05, 2.010352909564972e-05, 2.4150125682353973e-05, 2.8196722269058228e-05, 3.224331885576248e-05, 3.6289915442466736e-05, 4.033651202917099e-05, 4.4383108615875244e-05, 4.84297052025795e-05, 5.247630178928375e-05, 5.6522898375988007e-05, 6.056949496269226e-05, 6.461609154939651e-05, 6.866268813610077e-05, 7.270928472280502e-05, 7.675588130950928e-05, 8.080247789621353e-05, 8.484907448291779e-05, 8.889567106962204e-05, 9.29422676563263e-05, 9.698886424303055e-05, 0.0001010354608297348, 0.00010508205741643906, 0.00010912865400314331, 0.00011317525058984756, 0.00011722184717655182, 0.00012126844376325607, 0.00012531504034996033, 0.00012936163693666458, 0.00013340823352336884, 0.0001374548301100731, 0.00014150142669677734]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 2.0, 4.0, 6.0, 5.0, 11.0, 20.0, 24.0, 25.0, 32.0, 42.0, 78.0, 130.0, 228.0, 843.0, 104607.0, 937995.0, 3553.0, 432.0, 191.0, 87.0, 63.0, 51.0, 37.0, 31.0, 16.0, 9.0, 12.0, 4.0, 5.0, 5.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00336456298828125, -0.003266274929046631, -0.0031679868698120117, -0.0030696988105773926, -0.0029714107513427734, -0.0028731226921081543, -0.002774834632873535, -0.002676546573638916, -0.002578258514404297, -0.0024799704551696777, -0.0023816823959350586, -0.0022833943367004395, -0.0021851062774658203, -0.002086818218231201, -0.001988530158996582, -0.0018902420997619629, -0.0017919540405273438, -0.0016936659812927246, -0.0015953779220581055, -0.0014970898628234863, -0.0013988018035888672, -0.001300513744354248, -0.001202225685119629, -0.0011039376258850098, -0.0010056495666503906, -0.0009073615074157715, -0.0008090734481811523, -0.0007107853889465332, -0.0006124973297119141, -0.0005142092704772949, -0.0004159212112426758, -0.00031763315200805664, -0.0002193450927734375, -0.00012105703353881836, -2.276897430419922e-05, 7.551908493041992e-05, 0.00017380714416503906, 0.0002720952033996582, 0.00037038326263427734, 0.0004686713218688965, 0.0005669593811035156, 0.0006652474403381348, 0.0007635354995727539, 0.000861823558807373, 0.0009601116180419922, 0.0010583996772766113, 0.0011566877365112305, 0.0012549757957458496, 0.0013532638549804688, 0.0014515519142150879, 0.001549839973449707, 0.0016481280326843262, 0.0017464160919189453, 0.0018447041511535645, 0.0019429922103881836, 0.0020412802696228027, 0.002139568328857422, 0.002237856388092041, 0.00233614444732666, 0.0024344325065612793, 0.0025327205657958984, 0.0026310086250305176, 0.0027292966842651367, 0.002827584743499756, 0.002925872802734375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 22.0, 442.0, 527.0, 25.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014449161244556308, -0.0001088781573344022, -7.326470222324133e-05, -3.7651247112080455e-05, -2.0377920009195805e-06, 3.3575663110241294e-05, 6.918911822140217e-05, 0.00010480257333256304, 0.00014041602844372392, 0.0001760294835548848, 0.00021164293866604567, 0.00024725639377720654, 0.0002828698488883674, 0.0003184833039995283, 0.00035409675911068916, 0.00038971021422185004, 0.0004253236693330109, 0.0004609371244441718, 0.0004965505795553327, 0.0005321640055626631, 0.0005677774897776544, 0.0006033909739926457, 0.0006390043999999762, 0.0006746178260073066, 0.0007102313102222979, 0.0007458447944372892, 0.0007814582204446197, 0.0008170716464519501, 0.0008526851306669414, 0.0008882986148819327, 0.0009239120408892632, 0.0009595254668965936, 0.000995138892903924, 0.0010307523189112544, 0.0010663657449185848, 0.001101979287341237, 0.0011375927133485675, 0.001173206139355898, 0.0012088196817785501, 0.0012444331077858806, 0.001280046533793211, 0.0013156599598005414, 0.0013512733858078718, 0.001386886928230524, 0.0014225003542378545, 0.001458113780245185, 0.0014937273226678371, 0.0015293407486751676, 0.001564954174682498, 0.0016005676006898284, 0.0016361810266971588, 0.001671794569119811, 0.0017074079951271415, 0.001743021421134472, 0.0017786349635571241, 0.0018142483895644546, 0.001849861815571785, 0.0018854752415791154, 0.0019210886675864458, 0.001956702210009098, 0.0019923155196011066, 0.002027929062023759, 0.002063542604446411, 0.0020991559140384197, 0.002134769456461072]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 5.0, 3.0, 6.0, 1.0, 20.0, 10.0, 22.0, 21.0, 16.0, 20.0, 23.0, 35.0, 32.0, 32.0, 38.0, 46.0, 53.0, 46.0, 53.0, 64.0, 45.0, 45.0, 44.0, 53.0, 31.0, 30.0, 27.0, 29.0, 24.0, 24.0, 27.0, 17.0, 10.0, 15.0, 13.0, 6.0, 12.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.518861770629883e-05, -9.264517575502396e-05, -9.010173380374908e-05, -8.755829185247421e-05, -8.501484990119934e-05, -8.247140794992447e-05, -7.99279659986496e-05, -7.738452404737473e-05, -7.484108209609985e-05, -7.229764014482498e-05, -6.975419819355011e-05, -6.721075624227524e-05, -6.466731429100037e-05, -6.21238723397255e-05, -5.958043038845062e-05, -5.703698843717575e-05, -5.449354648590088e-05, -5.195010453462601e-05, -4.9406662583351135e-05, -4.6863220632076263e-05, -4.431977868080139e-05, -4.177633672952652e-05, -3.923289477825165e-05, -3.6689452826976776e-05, -3.4146010875701904e-05, -3.160256892442703e-05, -2.905912697315216e-05, -2.651568502187729e-05, -2.3972243070602417e-05, -2.1428801119327545e-05, -1.8885359168052673e-05, -1.63419172167778e-05, -1.379847526550293e-05, -1.1255033314228058e-05, -8.711591362953186e-06, -6.168149411678314e-06, -3.6247074604034424e-06, -1.0812655091285706e-06, 1.4621764421463013e-06, 4.005618393421173e-06, 6.549060344696045e-06, 9.092502295970917e-06, 1.1635944247245789e-05, 1.417938619852066e-05, 1.6722828149795532e-05, 1.9266270101070404e-05, 2.1809712052345276e-05, 2.4353154003620148e-05, 2.689659595489502e-05, 2.944003790616989e-05, 3.198347985744476e-05, 3.4526921808719635e-05, 3.707036375999451e-05, 3.961380571126938e-05, 4.215724766254425e-05, 4.470068961381912e-05, 4.7244131565093994e-05, 4.9787573516368866e-05, 5.233101546764374e-05, 5.487445741891861e-05, 5.741789937019348e-05, 5.996134132146835e-05, 6.250478327274323e-05, 6.50482252240181e-05, 6.759166717529297e-05]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 10.0, 7.0, 4.0, 11.0, 23.0, 13.0, 16.0, 26.0, 18.0, 27.0, 35.0, 26.0, 36.0, 33.0, 28.0, 37.0, 45.0, 46.0, 40.0, 41.0, 44.0, 39.0, 38.0, 44.0, 34.0, 40.0, 37.0, 29.0, 19.0, 22.0, 15.0, 14.0, 19.0, 11.0, 12.0, 10.0, 9.0, 2.0, 6.0, 10.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-8.7265625, -8.47564697265625, -8.2247314453125, -7.97381591796875, -7.722900390625, -7.47198486328125, -7.2210693359375, -6.97015380859375, -6.71923828125, -6.46832275390625, -6.2174072265625, -5.96649169921875, -5.715576171875, -5.46466064453125, -5.2137451171875, -4.96282958984375, -4.7119140625, -4.46099853515625, -4.2100830078125, -3.95916748046875, -3.708251953125, -3.45733642578125, -3.2064208984375, -2.95550537109375, -2.70458984375, -2.45367431640625, -2.2027587890625, -1.95184326171875, -1.700927734375, -1.45001220703125, -1.1990966796875, -0.94818115234375, -0.697265625, -0.44635009765625, -0.1954345703125, 0.05548095703125, 0.306396484375, 0.55731201171875, 0.8082275390625, 1.05914306640625, 1.31005859375, 1.56097412109375, 1.8118896484375, 2.06280517578125, 2.313720703125, 2.56463623046875, 2.8155517578125, 3.06646728515625, 3.3173828125, 3.56829833984375, 3.8192138671875, 4.07012939453125, 4.321044921875, 4.57196044921875, 4.8228759765625, 5.07379150390625, 5.32470703125, 5.57562255859375, 5.8265380859375, 6.07745361328125, 6.328369140625, 6.57928466796875, 6.8302001953125, 7.08111572265625, 7.33203125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 8.0, 7.0, 8.0, 24.0, 28.0, 45.0, 65.0, 121.0, 224.0, 345.0, 617.0, 1046.0, 2066.0, 3737.0, 6968.0, 13882.0, 28570.0, 61396.0, 131333.0, 249701.0, 265547.0, 148388.0, 69733.0, 32518.0, 15415.0, 7650.0, 4067.0, 2235.0, 1179.0, 665.0, 403.0, 220.0, 142.0, 84.0, 49.0, 23.0, 17.0, 15.0, 9.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.96875, -13.5333251953125, -13.097900390625, -12.6624755859375, -12.22705078125, -11.7916259765625, -11.356201171875, -10.9207763671875, -10.4853515625, -10.0499267578125, -9.614501953125, -9.1790771484375, -8.74365234375, -8.3082275390625, -7.872802734375, -7.4373779296875, -7.001953125, -6.5665283203125, -6.131103515625, -5.6956787109375, -5.26025390625, -4.8248291015625, -4.389404296875, -3.9539794921875, -3.5185546875, -3.0831298828125, -2.647705078125, -2.2122802734375, -1.77685546875, -1.3414306640625, -0.906005859375, -0.4705810546875, -0.03515625, 0.4002685546875, 0.835693359375, 1.2711181640625, 1.70654296875, 2.1419677734375, 2.577392578125, 3.0128173828125, 3.4482421875, 3.8836669921875, 4.319091796875, 4.7545166015625, 5.18994140625, 5.6253662109375, 6.060791015625, 6.4962158203125, 6.931640625, 7.3670654296875, 7.802490234375, 8.2379150390625, 8.67333984375, 9.1087646484375, 9.544189453125, 9.9796142578125, 10.4150390625, 10.8504638671875, 11.285888671875, 11.7213134765625, 12.15673828125, 12.5921630859375, 13.027587890625, 13.4630126953125, 13.8984375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 13.0, 10.0, 7.0, 22.0, 27.0, 48.0, 47.0, 50.0, 65.0, 86.0, 143.0, 245.0, 1414.0, 288.0, 189.0, 101.0, 66.0, 65.0, 46.0, 24.0, 16.0, 19.0, 15.0, 16.0, 4.0, 6.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.375, -36.29638671875, -35.2177734375, -34.13916015625, -33.060546875, -31.98193359375, -30.9033203125, -29.82470703125, -28.74609375, -27.66748046875, -26.5888671875, -25.51025390625, -24.431640625, -23.35302734375, -22.2744140625, -21.19580078125, -20.1171875, -19.03857421875, -17.9599609375, -16.88134765625, -15.802734375, -14.72412109375, -13.6455078125, -12.56689453125, -11.48828125, -10.40966796875, -9.3310546875, -8.25244140625, -7.173828125, -6.09521484375, -5.0166015625, -3.93798828125, -2.859375, -1.78076171875, -0.7021484375, 0.37646484375, 1.455078125, 2.53369140625, 3.6123046875, 4.69091796875, 5.76953125, 6.84814453125, 7.9267578125, 9.00537109375, 10.083984375, 11.16259765625, 12.2412109375, 13.31982421875, 14.3984375, 15.47705078125, 16.5556640625, 17.63427734375, 18.712890625, 19.79150390625, 20.8701171875, 21.94873046875, 23.02734375, 24.10595703125, 25.1845703125, 26.26318359375, 27.341796875, 28.42041015625, 29.4990234375, 30.57763671875, 31.65625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 4.0, 12.0, 10.0, 6.0, 15.0, 23.0, 39.0, 50.0, 103.0, 159.0, 233.0, 530.0, 1565.0, 10420.0, 504101.0, 2594181.0, 30091.0, 2580.0, 694.0, 361.0, 174.0, 105.0, 72.0, 42.0, 40.0, 21.0, 19.0, 15.0, 10.0, 5.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-62.34375, -60.5712890625, -58.798828125, -57.0263671875, -55.25390625, -53.4814453125, -51.708984375, -49.9365234375, -48.1640625, -46.3916015625, -44.619140625, -42.8466796875, -41.07421875, -39.3017578125, -37.529296875, -35.7568359375, -33.984375, -32.2119140625, -30.439453125, -28.6669921875, -26.89453125, -25.1220703125, -23.349609375, -21.5771484375, -19.8046875, -18.0322265625, -16.259765625, -14.4873046875, -12.71484375, -10.9423828125, -9.169921875, -7.3974609375, -5.625, -3.8525390625, -2.080078125, -0.3076171875, 1.46484375, 3.2373046875, 5.009765625, 6.7822265625, 8.5546875, 10.3271484375, 12.099609375, 13.8720703125, 15.64453125, 17.4169921875, 19.189453125, 20.9619140625, 22.734375, 24.5068359375, 26.279296875, 28.0517578125, 29.82421875, 31.5966796875, 33.369140625, 35.1416015625, 36.9140625, 38.6865234375, 40.458984375, 42.2314453125, 44.00390625, 45.7763671875, 47.548828125, 49.3212890625, 51.09375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 12.0, 52.0, 212.0, 363.0, 274.0, 80.0, 13.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-466.3736267089844, -456.9913635253906, -447.6091003417969, -438.2268371582031, -428.8445739746094, -419.4623107910156, -410.0800476074219, -400.6977844238281, -391.3155212402344, -381.9332580566406, -372.5509948730469, -363.1687316894531, -353.7864685058594, -344.4042053222656, -335.0219421386719, -325.6396789550781, -316.25738525390625, -306.8751220703125, -297.49285888671875, -288.110595703125, -278.72833251953125, -269.3460693359375, -259.96380615234375, -250.58154296875, -241.19927978515625, -231.8170166015625, -222.43475341796875, -213.052490234375, -203.67022705078125, -194.2879638671875, -184.90570068359375, -175.5234375, -166.1411895751953, -156.75892639160156, -147.3766632080078, -137.99440002441406, -128.6121368408203, -119.22987365722656, -109.84760284423828, -100.46533966064453, -91.08307647705078, -81.70081329345703, -72.31855010986328, -62.936283111572266, -53.554019927978516, -44.171756744384766, -34.78948974609375, -25.4072265625, -16.02496337890625, -6.642699241638184, 2.739564895629883, 12.121829986572266, 21.504093170166016, 30.886356353759766, 40.26862335205078, 49.65088653564453, 59.03314971923828, 68.41541290283203, 77.79767608642578, 87.17994689941406, 96.56221008300781, 105.94447326660156, 115.32673645019531, 124.70899963378906, 134.0912628173828]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 6.0, 9.0, 11.0, 15.0, 18.0, 23.0, 25.0, 20.0, 36.0, 42.0, 35.0, 42.0, 52.0, 55.0, 65.0, 73.0, 60.0, 55.0, 51.0, 56.0, 56.0, 31.0, 35.0, 24.0, 24.0, 20.0, 15.0, 12.0, 8.0, 7.0, 4.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.6611785888672, -129.1174774169922, -125.57376861572266, -122.03006744384766, -118.48636627197266, -114.94265747070312, -111.39895629882812, -107.85525512695312, -104.31155395507812, -100.76785278320312, -97.2241439819336, -93.6804428100586, -90.1367416381836, -86.59303283691406, -83.04933166503906, -79.50563049316406, -75.96192169189453, -72.41822052001953, -68.87451171875, -65.330810546875, -61.787109375, -58.243404388427734, -54.69969940185547, -51.15599822998047, -47.6122932434082, -44.06858825683594, -40.52488708496094, -36.98118209838867, -33.437477111816406, -29.893775939941406, -26.35007095336914, -22.806367874145508, -19.262657165527344, -15.718954086303711, -12.175250053405762, -8.631546020507812, -5.08784294128418, -1.5441398620605469, 1.9995651245117188, 5.543268203735352, 9.086971282958984, 12.630674362182617, 16.17437744140625, 19.718082427978516, 23.26178550720215, 26.80548858642578, 30.349193572998047, 33.89289855957031, 37.43659973144531, 40.98030471801758, 44.52400588989258, 48.067710876464844, 51.611412048339844, 55.15511703491211, 58.698822021484375, 62.242523193359375, 65.78622436523438, 69.32992553710938, 72.8736343383789, 76.4173355102539, 79.9610366821289, 83.50474548339844, 87.04844665527344, 90.59214782714844, 94.13585662841797]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 1.0, 5.0, 1.0, 3.0, 6.0, 5.0, 8.0, 9.0, 17.0, 9.0, 21.0, 17.0, 23.0, 29.0, 26.0, 37.0, 34.0, 32.0, 42.0, 44.0, 39.0, 44.0, 66.0, 53.0, 52.0, 50.0, 36.0, 41.0, 41.0, 35.0, 29.0, 25.0, 30.0, 14.0, 18.0, 15.0, 11.0, 5.0, 7.0, 3.0, 9.0, 3.0, 2.0, 2.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.2904052734375, -8.994873046875, -8.6993408203125, -8.40380859375, -8.1082763671875, -7.812744140625, -7.5172119140625, -7.2216796875, -6.9261474609375, -6.630615234375, -6.3350830078125, -6.03955078125, -5.7440185546875, -5.448486328125, -5.1529541015625, -4.857421875, -4.5618896484375, -4.266357421875, -3.9708251953125, -3.67529296875, -3.3797607421875, -3.084228515625, -2.7886962890625, -2.4931640625, -2.1976318359375, -1.902099609375, -1.6065673828125, -1.31103515625, -1.0155029296875, -0.719970703125, -0.4244384765625, -0.12890625, 0.1666259765625, 0.462158203125, 0.7576904296875, 1.05322265625, 1.3487548828125, 1.644287109375, 1.9398193359375, 2.2353515625, 2.5308837890625, 2.826416015625, 3.1219482421875, 3.41748046875, 3.7130126953125, 4.008544921875, 4.3040771484375, 4.599609375, 4.8951416015625, 5.190673828125, 5.4862060546875, 5.78173828125, 6.0772705078125, 6.372802734375, 6.6683349609375, 6.9638671875, 7.2593994140625, 7.554931640625, 7.8504638671875, 8.14599609375, 8.4415283203125, 8.737060546875, 9.0325927734375, 9.328125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 16.0, 33.0, 38.0, 77.0, 124.0, 250.0, 434.0, 920.0, 1910.0, 4420.0, 12461.0, 49181.0, 382984.0, 3144909.0, 515244.0, 58612.0, 14025.0, 4803.0, 2007.0, 898.0, 410.0, 219.0, 126.0, 60.0, 34.0, 28.0, 15.0, 6.0, 2.0, 8.0, 7.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-33.0, -32.044921875, -31.08984375, -30.134765625, -29.1796875, -28.224609375, -27.26953125, -26.314453125, -25.359375, -24.404296875, -23.44921875, -22.494140625, -21.5390625, -20.583984375, -19.62890625, -18.673828125, -17.71875, -16.763671875, -15.80859375, -14.853515625, -13.8984375, -12.943359375, -11.98828125, -11.033203125, -10.078125, -9.123046875, -8.16796875, -7.212890625, -6.2578125, -5.302734375, -4.34765625, -3.392578125, -2.4375, -1.482421875, -0.52734375, 0.427734375, 1.3828125, 2.337890625, 3.29296875, 4.248046875, 5.203125, 6.158203125, 7.11328125, 8.068359375, 9.0234375, 9.978515625, 10.93359375, 11.888671875, 12.84375, 13.798828125, 14.75390625, 15.708984375, 16.6640625, 17.619140625, 18.57421875, 19.529296875, 20.484375, 21.439453125, 22.39453125, 23.349609375, 24.3046875, 25.259765625, 26.21484375, 27.169921875, 28.125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 0.0, 13.0, 9.0, 26.0, 53.0, 88.0, 235.0, 464.0, 1065.0, 1085.0, 507.0, 244.0, 134.0, 75.0, 36.0, 21.0, 14.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.9375, -51.811279296875, -50.68505859375, -49.558837890625, -48.4326171875, -47.306396484375, -46.18017578125, -45.053955078125, -43.927734375, -42.801513671875, -41.67529296875, -40.549072265625, -39.4228515625, -38.296630859375, -37.17041015625, -36.044189453125, -34.91796875, -33.791748046875, -32.66552734375, -31.539306640625, -30.4130859375, -29.286865234375, -28.16064453125, -27.034423828125, -25.908203125, -24.781982421875, -23.65576171875, -22.529541015625, -21.4033203125, -20.277099609375, -19.15087890625, -18.024658203125, -16.8984375, -15.772216796875, -14.64599609375, -13.519775390625, -12.3935546875, -11.267333984375, -10.14111328125, -9.014892578125, -7.888671875, -6.762451171875, -5.63623046875, -4.510009765625, -3.3837890625, -2.257568359375, -1.13134765625, -0.005126953125, 1.12109375, 2.247314453125, 3.37353515625, 4.499755859375, 5.6259765625, 6.752197265625, 7.87841796875, 9.004638671875, 10.130859375, 11.257080078125, 12.38330078125, 13.509521484375, 14.6357421875, 15.761962890625, 16.88818359375, 18.014404296875, 19.140625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 12.0, 16.0, 15.0, 34.0, 68.0, 121.0, 256.0, 703.0, 2487.0, 18548.0, 527641.0, 3548602.0, 87777.0, 6023.0, 1148.0, 402.0, 203.0, 99.0, 50.0, 28.0, 22.0, 11.0, 12.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.46875, -57.62548828125, -55.7822265625, -53.93896484375, -52.095703125, -50.25244140625, -48.4091796875, -46.56591796875, -44.72265625, -42.87939453125, -41.0361328125, -39.19287109375, -37.349609375, -35.50634765625, -33.6630859375, -31.81982421875, -29.9765625, -28.13330078125, -26.2900390625, -24.44677734375, -22.603515625, -20.76025390625, -18.9169921875, -17.07373046875, -15.23046875, -13.38720703125, -11.5439453125, -9.70068359375, -7.857421875, -6.01416015625, -4.1708984375, -2.32763671875, -0.484375, 1.35888671875, 3.2021484375, 5.04541015625, 6.888671875, 8.73193359375, 10.5751953125, 12.41845703125, 14.26171875, 16.10498046875, 17.9482421875, 19.79150390625, 21.634765625, 23.47802734375, 25.3212890625, 27.16455078125, 29.0078125, 30.85107421875, 32.6943359375, 34.53759765625, 36.380859375, 38.22412109375, 40.0673828125, 41.91064453125, 43.75390625, 45.59716796875, 47.4404296875, 49.28369140625, 51.126953125, 52.97021484375, 54.8134765625, 56.65673828125, 58.5]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 8.0, 133.0, 649.0, 212.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-435.26348876953125, -417.5155334472656, -399.7675476074219, -382.01959228515625, -364.2716064453125, -346.5236511230469, -328.77569580078125, -311.0277099609375, -293.27972412109375, -275.5317687988281, -257.7837829589844, -240.03582763671875, -222.287841796875, -204.53988647460938, -186.7919158935547, -169.0439453125, -151.29598999023438, -133.5480194091797, -115.800048828125, -98.05208587646484, -80.30411529541016, -62.55614471435547, -44.80818176269531, -27.060211181640625, -9.312240600585938, 8.435728073120117, 26.183696746826172, 43.931663513183594, 61.67963409423828, 79.42760467529297, 97.17556762695312, 114.92353820800781, 132.6715087890625, 150.4194793701172, 168.16744995117188, 185.9154052734375, 203.66339111328125, 221.41134643554688, 239.15931701660156, 256.90728759765625, 274.6552734375, 292.4032287597656, 310.1512145996094, 327.899169921875, 345.64715576171875, 363.3951110839844, 381.14306640625, 398.89105224609375, 416.6390075683594, 434.386962890625, 452.13494873046875, 469.8829040527344, 487.6308898925781, 505.37884521484375, 523.1268310546875, 540.874755859375, 558.6227416992188, 576.3707275390625, 594.11865234375, 611.8666381835938, 629.6146240234375, 647.3626098632812, 665.1105346679688, 682.8585205078125, 700.6065063476562]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 6.0, 11.0, 13.0, 14.0, 23.0, 18.0, 31.0, 29.0, 30.0, 41.0, 46.0, 53.0, 57.0, 48.0, 58.0, 71.0, 56.0, 49.0, 45.0, 59.0, 48.0, 41.0, 29.0, 26.0, 22.0, 11.0, 22.0, 13.0, 9.0, 4.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-107.16656494140625, -104.37073516845703, -101.57489776611328, -98.77906799316406, -95.98323059082031, -93.1874008178711, -90.39157104492188, -87.59573364257812, -84.7999038696289, -82.00407409667969, -79.20823669433594, -76.41240692138672, -73.6165771484375, -70.82073974609375, -68.02490997314453, -65.22908020019531, -62.43324279785156, -59.63740921020508, -56.841575622558594, -54.045745849609375, -51.24991226196289, -48.454078674316406, -45.65824890136719, -42.8624153137207, -40.06658172607422, -37.270748138427734, -34.47491455078125, -31.67908477783203, -28.883251190185547, -26.087417602539062, -23.29158592224121, -20.49575424194336, -17.699920654296875, -14.904088020324707, -12.108255386352539, -9.312422752380371, -6.516590118408203, -3.720757484436035, -0.9249248504638672, 1.8709068298339844, 4.666740417480469, 7.462573051452637, 10.258405685424805, 13.054238319396973, 15.85007095336914, 18.645904541015625, 21.441736221313477, 24.237567901611328, 27.033401489257812, 29.829235076904297, 32.62506866455078, 35.4208984375, 38.216732025146484, 41.01256561279297, 43.80839538574219, 46.60422897338867, 49.400062561035156, 52.19589614868164, 54.991729736328125, 57.787559509277344, 60.58339309692383, 63.37922668457031, 66.17505645751953, 68.97088623046875, 71.7667236328125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 8.0, 10.0, 14.0, 15.0, 28.0, 15.0, 17.0, 35.0, 30.0, 44.0, 49.0, 48.0, 53.0, 50.0, 57.0, 69.0, 48.0, 55.0, 54.0, 49.0, 52.0, 43.0, 26.0, 24.0, 18.0, 22.0, 12.0, 10.0, 14.0, 9.0, 6.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2578125, -8.9281005859375, -8.598388671875, -8.2686767578125, -7.93896484375, -7.6092529296875, -7.279541015625, -6.9498291015625, -6.6201171875, -6.2904052734375, -5.960693359375, -5.6309814453125, -5.30126953125, -4.9715576171875, -4.641845703125, -4.3121337890625, -3.982421875, -3.6527099609375, -3.322998046875, -2.9932861328125, -2.66357421875, -2.3338623046875, -2.004150390625, -1.6744384765625, -1.3447265625, -1.0150146484375, -0.685302734375, -0.3555908203125, -0.02587890625, 0.3038330078125, 0.633544921875, 0.9632568359375, 1.29296875, 1.6226806640625, 1.952392578125, 2.2821044921875, 2.61181640625, 2.9415283203125, 3.271240234375, 3.6009521484375, 3.9306640625, 4.2603759765625, 4.590087890625, 4.9197998046875, 5.24951171875, 5.5792236328125, 5.908935546875, 6.2386474609375, 6.568359375, 6.8980712890625, 7.227783203125, 7.5574951171875, 7.88720703125, 8.2169189453125, 8.546630859375, 8.8763427734375, 9.2060546875, 9.5357666015625, 9.865478515625, 10.1951904296875, 10.52490234375, 10.8546142578125, 11.184326171875, 11.5140380859375, 11.84375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 6.0, 10.0, 8.0, 12.0, 21.0, 42.0, 52.0, 74.0, 128.0, 199.0, 312.0, 577.0, 932.0, 1767.0, 3142.0, 5882.0, 10862.0, 20660.0, 42201.0, 96741.0, 301245.0, 357247.0, 110139.0, 47332.0, 22794.0, 11933.0, 6331.0, 3444.0, 1914.0, 1022.0, 608.0, 351.0, 210.0, 141.0, 60.0, 55.0, 38.0, 23.0, 17.0, 8.0, 6.0, 8.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.463623046875, -0.4496040344238281, -0.43558502197265625, -0.4215660095214844, -0.4075469970703125, -0.3935279846191406, -0.37950897216796875, -0.3654899597167969, -0.351470947265625, -0.3374519348144531, -0.32343292236328125, -0.3094139099121094, -0.2953948974609375, -0.2813758850097656, -0.26735687255859375, -0.2533378601074219, -0.23931884765625, -0.22529983520507812, -0.21128082275390625, -0.19726181030273438, -0.1832427978515625, -0.16922378540039062, -0.15520477294921875, -0.14118576049804688, -0.127166748046875, -0.11314773559570312, -0.09912872314453125, -0.08510971069335938, -0.0710906982421875, -0.057071685791015625, -0.04305267333984375, -0.029033660888671875, -0.0150146484375, -0.000995635986328125, 0.01302337646484375, 0.027042388916015625, 0.0410614013671875, 0.055080413818359375, 0.06909942626953125, 0.08311843872070312, 0.097137451171875, 0.11115646362304688, 0.12517547607421875, 0.13919448852539062, 0.1532135009765625, 0.16723251342773438, 0.18125152587890625, 0.19527053833007812, 0.20928955078125, 0.22330856323242188, 0.23732757568359375, 0.2513465881347656, 0.2653656005859375, 0.2793846130371094, 0.29340362548828125, 0.3074226379394531, 0.321441650390625, 0.3354606628417969, 0.34947967529296875, 0.3634986877441406, 0.3775177001953125, 0.3915367126464844, 0.40555572509765625, 0.4195747375488281, 0.43359375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 3.0, 8.0, 6.0, 10.0, 13.0, 11.0, 27.0, 14.0, 13.0, 17.0, 26.0, 16.0, 27.0, 29.0, 22.0, 29.0, 37.0, 39.0, 32.0, 38.0, 37.0, 25.0, 1052.0, 35.0, 28.0, 33.0, 32.0, 39.0, 35.0, 28.0, 36.0, 24.0, 22.0, 22.0, 22.0, 16.0, 11.0, 18.0, 13.0, 11.0, 19.0, 12.0, 13.0, 6.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.3203125, -5.137939453125, -4.95556640625, -4.773193359375, -4.5908203125, -4.408447265625, -4.22607421875, -4.043701171875, -3.861328125, -3.678955078125, -3.49658203125, -3.314208984375, -3.1318359375, -2.949462890625, -2.76708984375, -2.584716796875, -2.40234375, -2.219970703125, -2.03759765625, -1.855224609375, -1.6728515625, -1.490478515625, -1.30810546875, -1.125732421875, -0.943359375, -0.760986328125, -0.57861328125, -0.396240234375, -0.2138671875, -0.031494140625, 0.15087890625, 0.333251953125, 0.515625, 0.697998046875, 0.88037109375, 1.062744140625, 1.2451171875, 1.427490234375, 1.60986328125, 1.792236328125, 1.974609375, 2.156982421875, 2.33935546875, 2.521728515625, 2.7041015625, 2.886474609375, 3.06884765625, 3.251220703125, 3.43359375, 3.615966796875, 3.79833984375, 3.980712890625, 4.1630859375, 4.345458984375, 4.52783203125, 4.710205078125, 4.892578125, 5.074951171875, 5.25732421875, 5.439697265625, 5.6220703125, 5.804443359375, 5.98681640625, 6.169189453125, 6.3515625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 4.0, 7.0, 10.0, 18.0, 23.0, 33.0, 48.0, 64.0, 119.0, 168.0, 231.0, 414.0, 652.0, 984.0, 1446.0, 2222.0, 3463.0, 5202.0, 7954.0, 12408.0, 19276.0, 29108.0, 46736.0, 79327.0, 150575.0, 1319005.0, 179441.0, 91903.0, 52767.0, 32761.0, 21268.0, 13705.0, 8932.0, 5820.0, 3817.0, 2475.0, 1723.0, 1055.0, 667.0, 472.0, 241.0, 211.0, 138.0, 89.0, 53.0, 37.0, 25.0, 16.0, 11.0, 8.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1893310546875, -0.1829395294189453, -0.17654800415039062, -0.17015647888183594, -0.16376495361328125, -0.15737342834472656, -0.15098190307617188, -0.1445903778076172, -0.1381988525390625, -0.1318073272705078, -0.12541580200195312, -0.11902427673339844, -0.11263275146484375, -0.10624122619628906, -0.09984970092773438, -0.09345817565917969, -0.087066650390625, -0.08067512512207031, -0.07428359985351562, -0.06789207458496094, -0.06150054931640625, -0.05510902404785156, -0.048717498779296875, -0.04232597351074219, -0.0359344482421875, -0.029542922973632812, -0.023151397705078125, -0.016759872436523438, -0.01036834716796875, -0.0039768218994140625, 0.002414703369140625, 0.008806228637695312, 0.01519775390625, 0.021589279174804688, 0.027980804443359375, 0.03437232971191406, 0.04076385498046875, 0.04715538024902344, 0.053546905517578125, 0.05993843078613281, 0.0663299560546875, 0.07272148132324219, 0.07911300659179688, 0.08550453186035156, 0.09189605712890625, 0.09828758239746094, 0.10467910766601562, 0.11107063293457031, 0.117462158203125, 0.12385368347167969, 0.13024520874023438, 0.13663673400878906, 0.14302825927734375, 0.14941978454589844, 0.15581130981445312, 0.1622028350830078, 0.1685943603515625, 0.1749858856201172, 0.18137741088867188, 0.18776893615722656, 0.19416046142578125, 0.20055198669433594, 0.20694351196289062, 0.2133350372314453, 0.2197265625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 9.0, 0.0, 3.0, 5.0, 8.0, 4.0, 7.0, 7.0, 10.0, 21.0, 16.0, 16.0, 15.0, 16.0, 31.0, 34.0, 33.0, 31.0, 32.0, 51.0, 38.0, 49.0, 53.0, 41.0, 47.0, 42.0, 41.0, 36.0, 48.0, 21.0, 33.0, 30.0, 32.0, 32.0, 20.0, 22.0, 14.0, 12.0, 10.0, 6.0, 6.0, 5.0, 9.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011259317398071289, -0.00010904483497142792, -0.00010549649596214294, -0.00010194815695285797, -9.8399817943573e-05, -9.485147893428802e-05, -9.130313992500305e-05, -8.775480091571808e-05, -8.42064619064331e-05, -8.065812289714813e-05, -7.710978388786316e-05, -7.356144487857819e-05, -7.001310586929321e-05, -6.646476686000824e-05, -6.291642785072327e-05, -5.9368088841438293e-05, -5.581974983215332e-05, -5.227141082286835e-05, -4.8723071813583374e-05, -4.51747328042984e-05, -4.162639379501343e-05, -3.8078054785728455e-05, -3.452971577644348e-05, -3.098137676715851e-05, -2.7433037757873535e-05, -2.3884698748588562e-05, -2.033635973930359e-05, -1.6788020730018616e-05, -1.3239681720733643e-05, -9.69134271144867e-06, -6.143003702163696e-06, -2.594664692878723e-06, 9.5367431640625e-07, 4.502013325691223e-06, 8.050352334976196e-06, 1.159869134426117e-05, 1.5147030353546143e-05, 1.8695369362831116e-05, 2.224370837211609e-05, 2.5792047381401062e-05, 2.9340386390686035e-05, 3.288872539997101e-05, 3.643706440925598e-05, 3.9985403418540955e-05, 4.353374242782593e-05, 4.70820814371109e-05, 5.0630420446395874e-05, 5.417875945568085e-05, 5.772709846496582e-05, 6.12754374742508e-05, 6.482377648353577e-05, 6.837211549282074e-05, 7.192045450210571e-05, 7.546879351139069e-05, 7.901713252067566e-05, 8.256547152996063e-05, 8.61138105392456e-05, 8.966214954853058e-05, 9.321048855781555e-05, 9.675882756710052e-05, 0.0001003071665763855, 0.00010385550558567047, 0.00010740384459495544, 0.00011095218360424042, 0.00011450052261352539]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 7.0, 5.0, 12.0, 3.0, 4.0, 9.0, 11.0, 14.0, 14.0, 26.0, 35.0, 41.0, 35.0, 46.0, 70.0, 87.0, 144.0, 194.0, 358.0, 1323.0, 28639.0, 860643.0, 152061.0, 3392.0, 524.0, 244.0, 143.0, 105.0, 71.0, 55.0, 49.0, 33.0, 22.0, 33.0, 17.0, 22.0, 15.0, 11.0, 10.0, 7.0, 7.0, 5.0, 3.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020847320556640625, -0.002016812562942505, -0.0019488930702209473, -0.0018809735774993896, -0.001813054084777832, -0.0017451345920562744, -0.0016772150993347168, -0.0016092956066131592, -0.0015413761138916016, -0.001473456621170044, -0.0014055371284484863, -0.0013376176357269287, -0.001269698143005371, -0.0012017786502838135, -0.0011338591575622559, -0.0010659396648406982, -0.0009980201721191406, -0.000930100679397583, -0.0008621811866760254, -0.0007942616939544678, -0.0007263422012329102, -0.0006584227085113525, -0.0005905032157897949, -0.0005225837230682373, -0.0004546642303466797, -0.00038674473762512207, -0.00031882524490356445, -0.00025090575218200684, -0.00018298625946044922, -0.0001150667667388916, -4.7147274017333984e-05, 2.0772218704223633e-05, 8.869171142578125e-05, 0.00015661120414733887, 0.00022453069686889648, 0.0002924501895904541, 0.0003603696823120117, 0.00042828917503356934, 0.000496208667755127, 0.0005641281604766846, 0.0006320476531982422, 0.0006999671459197998, 0.0007678866386413574, 0.000835806131362915, 0.0009037256240844727, 0.0009716451168060303, 0.0010395646095275879, 0.0011074841022491455, 0.0011754035949707031, 0.0012433230876922607, 0.0013112425804138184, 0.001379162073135376, 0.0014470815658569336, 0.0015150010585784912, 0.0015829205513000488, 0.0016508400440216064, 0.001718759536743164, 0.0017866790294647217, 0.0018545985221862793, 0.001922518014907837, 0.0019904375076293945, 0.002058357000350952, 0.0021262764930725098, 0.0021941959857940674, 0.002262115478515625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 10.0, 14.0, 51.0, 137.0, 276.0, 284.0, 153.0, 66.0, 16.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010223874414805323, -8.94940021680668e-05, -7.674926018808037e-05, -6.400451093213633e-05, -5.12597689521499e-05, -3.851502697216347e-05, -2.5770277716219425e-05, -1.3025535736232996e-05, -2.8079375624656677e-07, 1.2463950042729266e-05, 2.52086938417051e-05, 3.7953439459670335e-05, 5.0698181439656764e-05, 6.34429234196432e-05, 7.618767267558724e-05, 8.893241465557367e-05, 0.0001016771566355601, 0.00011442189861554652, 0.00012716664059553295, 0.0001399113971274346, 0.00015265613910742104, 0.00016540088108740747, 0.0001781456230673939, 0.00019089036504738033, 0.00020363510702736676, 0.0002163798490073532, 0.00022912459098733962, 0.00024186933296732605, 0.0002546140749473125, 0.0002673588169272989, 0.0002801035880111158, 0.0002928483299911022, 0.00030559307197108865, 0.0003183378139510751, 0.0003310825559310615, 0.00034382729791104794, 0.00035657203989103436, 0.0003693167818710208, 0.0003820615238510072, 0.00039480626583099365, 0.0004075510078109801, 0.0004202957497909665, 0.00043304049177095294, 0.00044578523375093937, 0.0004585299757309258, 0.00047127471771091223, 0.00048401945969089866, 0.0004967642016708851, 0.0005095090018585324, 0.0005222537438385189, 0.0005349984858185053, 0.0005477432277984917, 0.0005604879697784781, 0.0005732327117584646, 0.000585977453738451, 0.0005987221957184374, 0.0006114669376984239, 0.0006242116796784103, 0.0006369564216583967, 0.0006497011636383832, 0.0006624459056183696, 0.000675190647598356, 0.0006879353895783424, 0.0007006801315583289, 0.0007134248735383153]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 5.0, 5.0, 5.0, 9.0, 11.0, 12.0, 13.0, 14.0, 12.0, 17.0, 14.0, 25.0, 26.0, 35.0, 27.0, 34.0, 47.0, 32.0, 44.0, 39.0, 41.0, 46.0, 44.0, 29.0, 37.0, 31.0, 36.0, 33.0, 28.0, 28.0, 33.0, 25.0, 31.0, 20.0, 19.0, 18.0, 12.0, 10.0, 11.0, 13.0, 8.0, 5.0, 5.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.434057235717773e-05, -8.173007518053055e-05, -7.911957800388336e-05, -7.650908082723618e-05, -7.389858365058899e-05, -7.12880864739418e-05, -6.867758929729462e-05, -6.606709212064743e-05, -6.345659494400024e-05, -6.084609776735306e-05, -5.823560059070587e-05, -5.5625103414058685e-05, -5.30146062374115e-05, -5.040410906076431e-05, -4.7793611884117126e-05, -4.518311470746994e-05, -4.2572617530822754e-05, -3.996212035417557e-05, -3.735162317752838e-05, -3.4741126000881195e-05, -3.213062882423401e-05, -2.9520131647586823e-05, -2.6909634470939636e-05, -2.429913729429245e-05, -2.1688640117645264e-05, -1.9078142940998077e-05, -1.646764576435089e-05, -1.3857148587703705e-05, -1.1246651411056519e-05, -8.636154234409332e-06, -6.025657057762146e-06, -3.4151598811149597e-06, -8.046627044677734e-07, 1.8058344721794128e-06, 4.416331648826599e-06, 7.026828825473785e-06, 9.637326002120972e-06, 1.2247823178768158e-05, 1.4858320355415344e-05, 1.746881753206253e-05, 2.0079314708709717e-05, 2.2689811885356903e-05, 2.530030906200409e-05, 2.7910806238651276e-05, 3.052130341529846e-05, 3.313180059194565e-05, 3.5742297768592834e-05, 3.835279494524002e-05, 4.096329212188721e-05, 4.357378929853439e-05, 4.618428647518158e-05, 4.8794783651828766e-05, 5.140528082847595e-05, 5.401577800512314e-05, 5.6626275181770325e-05, 5.923677235841751e-05, 6.18472695350647e-05, 6.445776671171188e-05, 6.706826388835907e-05, 6.967876106500626e-05, 7.228925824165344e-05, 7.489975541830063e-05, 7.751025259494781e-05, 8.0120749771595e-05, 8.273124694824219e-05]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 8.0, 10.0, 14.0, 15.0, 28.0, 15.0, 17.0, 35.0, 30.0, 44.0, 49.0, 48.0, 53.0, 50.0, 57.0, 69.0, 48.0, 55.0, 54.0, 49.0, 52.0, 43.0, 26.0, 24.0, 18.0, 22.0, 12.0, 10.0, 14.0, 9.0, 6.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2578125, -8.9281005859375, -8.598388671875, -8.2686767578125, -7.93896484375, -7.6092529296875, -7.279541015625, -6.9498291015625, -6.6201171875, -6.2904052734375, -5.960693359375, -5.6309814453125, -5.30126953125, -4.9715576171875, -4.641845703125, -4.3121337890625, -3.982421875, -3.6527099609375, -3.322998046875, -2.9932861328125, -2.66357421875, -2.3338623046875, -2.004150390625, -1.6744384765625, -1.3447265625, -1.0150146484375, -0.685302734375, -0.3555908203125, -0.02587890625, 0.3038330078125, 0.633544921875, 0.9632568359375, 1.29296875, 1.6226806640625, 1.952392578125, 2.2821044921875, 2.61181640625, 2.9415283203125, 3.271240234375, 3.6009521484375, 3.9306640625, 4.2603759765625, 4.590087890625, 4.9197998046875, 5.24951171875, 5.5792236328125, 5.908935546875, 6.2386474609375, 6.568359375, 6.8980712890625, 7.227783203125, 7.5574951171875, 7.88720703125, 8.2169189453125, 8.546630859375, 8.8763427734375, 9.2060546875, 9.5357666015625, 9.865478515625, 10.1951904296875, 10.52490234375, 10.8546142578125, 11.184326171875, 11.5140380859375, 11.84375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 5.0, 3.0, 8.0, 14.0, 16.0, 24.0, 26.0, 49.0, 55.0, 87.0, 137.0, 224.0, 381.0, 704.0, 1312.0, 2578.0, 5296.0, 12659.0, 33760.0, 102700.0, 337400.0, 371573.0, 116290.0, 37618.0, 13814.0, 5699.0, 2848.0, 1439.0, 735.0, 364.0, 258.0, 168.0, 104.0, 60.0, 45.0, 30.0, 21.0, 10.0, 9.0, 13.0, 5.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.28125, -17.744384765625, -17.20751953125, -16.670654296875, -16.1337890625, -15.596923828125, -15.06005859375, -14.523193359375, -13.986328125, -13.449462890625, -12.91259765625, -12.375732421875, -11.8388671875, -11.302001953125, -10.76513671875, -10.228271484375, -9.69140625, -9.154541015625, -8.61767578125, -8.080810546875, -7.5439453125, -7.007080078125, -6.47021484375, -5.933349609375, -5.396484375, -4.859619140625, -4.32275390625, -3.785888671875, -3.2490234375, -2.712158203125, -2.17529296875, -1.638427734375, -1.1015625, -0.564697265625, -0.02783203125, 0.509033203125, 1.0458984375, 1.582763671875, 2.11962890625, 2.656494140625, 3.193359375, 3.730224609375, 4.26708984375, 4.803955078125, 5.3408203125, 5.877685546875, 6.41455078125, 6.951416015625, 7.48828125, 8.025146484375, 8.56201171875, 9.098876953125, 9.6357421875, 10.172607421875, 10.70947265625, 11.246337890625, 11.783203125, 12.320068359375, 12.85693359375, 13.393798828125, 13.9306640625, 14.467529296875, 15.00439453125, 15.541259765625, 16.078125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 6.0, 7.0, 6.0, 5.0, 10.0, 14.0, 21.0, 15.0, 21.0, 42.0, 37.0, 48.0, 64.0, 90.0, 135.0, 177.0, 1356.0, 268.0, 193.0, 138.0, 80.0, 67.0, 58.0, 36.0, 42.0, 29.0, 22.0, 19.0, 8.0, 9.0, 10.0, 8.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.4375, -23.58984375, -22.7421875, -21.89453125, -21.046875, -20.19921875, -19.3515625, -18.50390625, -17.65625, -16.80859375, -15.9609375, -15.11328125, -14.265625, -13.41796875, -12.5703125, -11.72265625, -10.875, -10.02734375, -9.1796875, -8.33203125, -7.484375, -6.63671875, -5.7890625, -4.94140625, -4.09375, -3.24609375, -2.3984375, -1.55078125, -0.703125, 0.14453125, 0.9921875, 1.83984375, 2.6875, 3.53515625, 4.3828125, 5.23046875, 6.078125, 6.92578125, 7.7734375, 8.62109375, 9.46875, 10.31640625, 11.1640625, 12.01171875, 12.859375, 13.70703125, 14.5546875, 15.40234375, 16.25, 17.09765625, 17.9453125, 18.79296875, 19.640625, 20.48828125, 21.3359375, 22.18359375, 23.03125, 23.87890625, 24.7265625, 25.57421875, 26.421875, 27.26953125, 28.1171875, 28.96484375, 29.8125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 5.0, 10.0, 16.0, 26.0, 69.0, 119.0, 291.0, 961.0, 11646.0, 3122732.0, 8496.0, 847.0, 260.0, 108.0, 49.0, 20.0, 14.0, 15.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.1875, -122.4169921875, -118.646484375, -114.8759765625, -111.10546875, -107.3349609375, -103.564453125, -99.7939453125, -96.0234375, -92.2529296875, -88.482421875, -84.7119140625, -80.94140625, -77.1708984375, -73.400390625, -69.6298828125, -65.859375, -62.0888671875, -58.318359375, -54.5478515625, -50.77734375, -47.0068359375, -43.236328125, -39.4658203125, -35.6953125, -31.9248046875, -28.154296875, -24.3837890625, -20.61328125, -16.8427734375, -13.072265625, -9.3017578125, -5.53125, -1.7607421875, 2.009765625, 5.7802734375, 9.55078125, 13.3212890625, 17.091796875, 20.8623046875, 24.6328125, 28.4033203125, 32.173828125, 35.9443359375, 39.71484375, 43.4853515625, 47.255859375, 51.0263671875, 54.796875, 58.5673828125, 62.337890625, 66.1083984375, 69.87890625, 73.6494140625, 77.419921875, 81.1904296875, 84.9609375, 88.7314453125, 92.501953125, 96.2724609375, 100.04296875, 103.8134765625, 107.583984375, 111.3544921875, 115.125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 13.0, 18.0, 29.0, 68.0, 133.0, 195.0, 215.0, 169.0, 89.0, 49.0, 19.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-191.60662841796875, -187.16661071777344, -182.72659301757812, -178.28659057617188, -173.84657287597656, -169.40655517578125, -164.96653747558594, -160.52651977539062, -156.08651733398438, -151.64649963378906, -147.20648193359375, -142.7664794921875, -138.3264617919922, -133.88644409179688, -129.44642639160156, -125.00640869140625, -120.56639099121094, -116.12637329101562, -111.68636322021484, -107.24634552001953, -102.80633544921875, -98.36631774902344, -93.92630004882812, -89.48628234863281, -85.04627227783203, -80.60625457763672, -76.16624450683594, -71.72622680664062, -67.28620910644531, -62.84619903564453, -58.40618133544922, -53.96616744995117, -49.52616882324219, -45.08615493774414, -40.646141052246094, -36.20612335205078, -31.766109466552734, -27.326095581054688, -22.886079788208008, -18.446063995361328, -14.006050109863281, -9.566035270690918, -5.126020431518555, -0.6860055923461914, 3.754009246826172, 8.194023132324219, 12.634038925170898, 17.074054718017578, 21.514068603515625, 25.954082489013672, 30.39409828186035, 34.83411407470703, 39.27412796020508, 43.714141845703125, 48.15415954589844, 52.594173431396484, 57.03418731689453, 61.47420120239258, 65.91421508789062, 70.35423278808594, 74.79425048828125, 79.23426055908203, 83.67427825927734, 88.11428833007812, 92.55430603027344]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 9.0, 10.0, 7.0, 6.0, 13.0, 10.0, 19.0, 12.0, 18.0, 16.0, 27.0, 23.0, 36.0, 24.0, 36.0, 35.0, 31.0, 38.0, 33.0, 44.0, 53.0, 39.0, 41.0, 30.0, 36.0, 36.0, 37.0, 29.0, 34.0, 30.0, 23.0, 16.0, 26.0, 17.0, 13.0, 14.0, 11.0, 14.0, 7.0, 10.0, 9.0, 3.0, 5.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.862159729003906, -51.848602294921875, -49.83504867553711, -47.82149124145508, -45.80793380737305, -43.79438018798828, -41.78082275390625, -39.76726531982422, -37.75370788574219, -35.740150451660156, -33.72659683227539, -31.71303939819336, -29.699481964111328, -27.68592643737793, -25.67237091064453, -23.6588134765625, -21.645259857177734, -19.631704330444336, -17.618146896362305, -15.604591369628906, -13.591034889221191, -11.577478408813477, -9.563922882080078, -7.550366401672363, -5.536809921264648, -3.5232536792755127, -1.509697437286377, 0.5038585662841797, 2.5174150466918945, 4.530971527099609, 6.544527053833008, 8.558083534240723, 10.571640014648438, 12.585196495056152, 14.598752975463867, 16.612308502197266, 18.625865936279297, 20.639421463012695, 22.652976989746094, 24.666534423828125, 26.680089950561523, 28.693645477294922, 30.707202911376953, 32.72075653076172, 34.73431396484375, 36.74787139892578, 38.76142883300781, 40.77498245239258, 42.78853988647461, 44.80209732055664, 46.815650939941406, 48.82920837402344, 50.84276580810547, 52.8563232421875, 54.869876861572266, 56.8834342956543, 58.89698791503906, 60.910545349121094, 62.92409896850586, 64.93765258789062, 66.95121002197266, 68.96476745605469, 70.97832489013672, 72.99188232421875, 75.00543975830078]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 10.0, 10.0, 16.0, 12.0, 24.0, 19.0, 26.0, 39.0, 39.0, 35.0, 37.0, 53.0, 46.0, 63.0, 50.0, 49.0, 59.0, 48.0, 59.0, 54.0, 39.0, 33.0, 36.0, 29.0, 25.0, 22.0, 19.0, 9.0, 11.0, 6.0, 5.0, 4.0, 5.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.125, -9.7874755859375, -9.449951171875, -9.1124267578125, -8.77490234375, -8.4373779296875, -8.099853515625, -7.7623291015625, -7.4248046875, -7.0872802734375, -6.749755859375, -6.4122314453125, -6.07470703125, -5.7371826171875, -5.399658203125, -5.0621337890625, -4.724609375, -4.3870849609375, -4.049560546875, -3.7120361328125, -3.37451171875, -3.0369873046875, -2.699462890625, -2.3619384765625, -2.0244140625, -1.6868896484375, -1.349365234375, -1.0118408203125, -0.67431640625, -0.3367919921875, 0.000732421875, 0.3382568359375, 0.67578125, 1.0133056640625, 1.350830078125, 1.6883544921875, 2.02587890625, 2.3634033203125, 2.700927734375, 3.0384521484375, 3.3759765625, 3.7135009765625, 4.051025390625, 4.3885498046875, 4.72607421875, 5.0635986328125, 5.401123046875, 5.7386474609375, 6.076171875, 6.4136962890625, 6.751220703125, 7.0887451171875, 7.42626953125, 7.7637939453125, 8.101318359375, 8.4388427734375, 8.7763671875, 9.1138916015625, 9.451416015625, 9.7889404296875, 10.12646484375, 10.4639892578125, 10.801513671875, 11.1390380859375, 11.4765625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 6.0, 11.0, 16.0, 32.0, 50.0, 115.0, 191.0, 356.0, 651.0, 1194.0, 2366.0, 4758.0, 10994.0, 30702.0, 154525.0, 2722802.0, 1149008.0, 79987.0, 20971.0, 8094.0, 3585.0, 1864.0, 973.0, 459.0, 268.0, 127.0, 84.0, 36.0, 22.0, 10.0, 8.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.3125, -35.27001953125, -34.2275390625, -33.18505859375, -32.142578125, -31.10009765625, -30.0576171875, -29.01513671875, -27.97265625, -26.93017578125, -25.8876953125, -24.84521484375, -23.802734375, -22.76025390625, -21.7177734375, -20.67529296875, -19.6328125, -18.59033203125, -17.5478515625, -16.50537109375, -15.462890625, -14.42041015625, -13.3779296875, -12.33544921875, -11.29296875, -10.25048828125, -9.2080078125, -8.16552734375, -7.123046875, -6.08056640625, -5.0380859375, -3.99560546875, -2.953125, -1.91064453125, -0.8681640625, 0.17431640625, 1.216796875, 2.25927734375, 3.3017578125, 4.34423828125, 5.38671875, 6.42919921875, 7.4716796875, 8.51416015625, 9.556640625, 10.59912109375, 11.6416015625, 12.68408203125, 13.7265625, 14.76904296875, 15.8115234375, 16.85400390625, 17.896484375, 18.93896484375, 19.9814453125, 21.02392578125, 22.06640625, 23.10888671875, 24.1513671875, 25.19384765625, 26.236328125, 27.27880859375, 28.3212890625, 29.36376953125, 30.40625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 5.0, 12.0, 9.0, 18.0, 41.0, 73.0, 116.0, 243.0, 440.0, 864.0, 1032.0, 575.0, 278.0, 140.0, 103.0, 43.0, 24.0, 19.0, 10.0, 4.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0], "bins": [-48.21875, -47.197509765625, -46.17626953125, -45.155029296875, -44.1337890625, -43.112548828125, -42.09130859375, -41.070068359375, -40.048828125, -39.027587890625, -38.00634765625, -36.985107421875, -35.9638671875, -34.942626953125, -33.92138671875, -32.900146484375, -31.87890625, -30.857666015625, -29.83642578125, -28.815185546875, -27.7939453125, -26.772705078125, -25.75146484375, -24.730224609375, -23.708984375, -22.687744140625, -21.66650390625, -20.645263671875, -19.6240234375, -18.602783203125, -17.58154296875, -16.560302734375, -15.5390625, -14.517822265625, -13.49658203125, -12.475341796875, -11.4541015625, -10.432861328125, -9.41162109375, -8.390380859375, -7.369140625, -6.347900390625, -5.32666015625, -4.305419921875, -3.2841796875, -2.262939453125, -1.24169921875, -0.220458984375, 0.80078125, 1.822021484375, 2.84326171875, 3.864501953125, 4.8857421875, 5.906982421875, 6.92822265625, 7.949462890625, 8.970703125, 9.991943359375, 11.01318359375, 12.034423828125, 13.0556640625, 14.076904296875, 15.09814453125, 16.119384765625, 17.140625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 8.0, 4.0, 10.0, 17.0, 23.0, 29.0, 52.0, 78.0, 145.0, 259.0, 593.0, 1542.0, 5972.0, 43770.0, 1539352.0, 2535884.0, 56284.0, 7240.0, 1725.0, 610.0, 289.0, 149.0, 91.0, 50.0, 31.0, 10.0, 20.0, 11.0, 7.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.625, -31.0751953125, -29.525390625, -27.9755859375, -26.42578125, -24.8759765625, -23.326171875, -21.7763671875, -20.2265625, -18.6767578125, -17.126953125, -15.5771484375, -14.02734375, -12.4775390625, -10.927734375, -9.3779296875, -7.828125, -6.2783203125, -4.728515625, -3.1787109375, -1.62890625, -0.0791015625, 1.470703125, 3.0205078125, 4.5703125, 6.1201171875, 7.669921875, 9.2197265625, 10.76953125, 12.3193359375, 13.869140625, 15.4189453125, 16.96875, 18.5185546875, 20.068359375, 21.6181640625, 23.16796875, 24.7177734375, 26.267578125, 27.8173828125, 29.3671875, 30.9169921875, 32.466796875, 34.0166015625, 35.56640625, 37.1162109375, 38.666015625, 40.2158203125, 41.765625, 43.3154296875, 44.865234375, 46.4150390625, 47.96484375, 49.5146484375, 51.064453125, 52.6142578125, 54.1640625, 55.7138671875, 57.263671875, 58.8134765625, 60.36328125, 61.9130859375, 63.462890625, 65.0126953125, 66.5625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 14.0, 90.0, 335.0, 405.0, 144.0, 24.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-406.2010498046875, -393.9336242675781, -381.66619873046875, -369.39874267578125, -357.1313171386719, -344.8638916015625, -332.5964660644531, -320.32904052734375, -308.06158447265625, -295.7941589355469, -283.5267333984375, -271.25927734375, -258.9918518066406, -246.72442626953125, -234.45700073242188, -222.1895751953125, -209.92214965820312, -197.65472412109375, -185.3872833251953, -173.11985778808594, -160.8524169921875, -148.58499145507812, -136.31756591796875, -124.05013275146484, -111.78269958496094, -99.51526641845703, -87.24783325195312, -74.98040771484375, -62.712974548339844, -50.44554138183594, -38.17811584472656, -25.910682678222656, -13.643280029296875, -1.3758487701416016, 10.891582489013672, 23.159011840820312, 35.42644500732422, 47.693878173828125, 59.9613037109375, 72.2287368774414, 84.49617004394531, 96.76360321044922, 109.03103637695312, 121.2984619140625, 133.56588745117188, 145.8333282470703, 158.1007537841797, 170.36819458007812, 182.6356201171875, 194.90304565429688, 207.1704864501953, 219.4379119873047, 231.70535278320312, 243.9727783203125, 256.2402038574219, 268.50762939453125, 280.77508544921875, 293.0425109863281, 305.3099365234375, 317.577392578125, 329.8448181152344, 342.11224365234375, 354.3796691894531, 366.6470947265625, 378.9145202636719]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 11.0, 18.0, 29.0, 46.0, 58.0, 46.0, 61.0, 89.0, 88.0, 94.0, 89.0, 78.0, 58.0, 63.0, 38.0, 42.0, 33.0, 16.0, 16.0, 14.0, 4.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.41453552246094, -121.85604858398438, -117.29756164550781, -112.73908233642578, -108.18059539794922, -103.62210845947266, -99.06362915039062, -94.50514221191406, -89.9466552734375, -85.38816833496094, -80.82968139648438, -76.27120208740234, -71.71271514892578, -67.15422821044922, -62.59574508666992, -58.037261962890625, -53.47877502441406, -48.9202880859375, -44.3618049621582, -39.803321838378906, -35.244834899902344, -30.686349868774414, -26.127864837646484, -21.569379806518555, -17.010894775390625, -12.452409744262695, -7.893924713134766, -3.335439682006836, 1.2230453491210938, 5.781530380249023, 10.340015411376953, 14.898500442504883, 19.457000732421875, 24.015485763549805, 28.573970794677734, 33.13245391845703, 37.690940856933594, 42.249427795410156, 46.80791091918945, 51.36639404296875, 55.92488098144531, 60.483367919921875, 65.04185485839844, 69.60033416748047, 74.15882110595703, 78.7173080444336, 83.27578735351562, 87.83427429199219, 92.39276123046875, 96.95124816894531, 101.50973510742188, 106.0682144165039, 110.62670135498047, 115.18518829345703, 119.74366760253906, 124.30215454101562, 128.8606414794922, 133.41912841796875, 137.9776153564453, 142.53610229492188, 147.09457397460938, 151.65306091308594, 156.2115478515625, 160.77003479003906, 165.32852172851562]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 5.0, 10.0, 12.0, 9.0, 22.0, 19.0, 19.0, 14.0, 25.0, 35.0, 34.0, 31.0, 27.0, 39.0, 33.0, 38.0, 45.0, 35.0, 39.0, 43.0, 43.0, 43.0, 43.0, 49.0, 42.0, 23.0, 28.0, 36.0, 24.0, 25.0, 22.0, 21.0, 8.0, 16.0, 3.0, 11.0, 6.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1796875, -7.893798828125, -7.60791015625, -7.322021484375, -7.0361328125, -6.750244140625, -6.46435546875, -6.178466796875, -5.892578125, -5.606689453125, -5.32080078125, -5.034912109375, -4.7490234375, -4.463134765625, -4.17724609375, -3.891357421875, -3.60546875, -3.319580078125, -3.03369140625, -2.747802734375, -2.4619140625, -2.176025390625, -1.89013671875, -1.604248046875, -1.318359375, -1.032470703125, -0.74658203125, -0.460693359375, -0.1748046875, 0.111083984375, 0.39697265625, 0.682861328125, 0.96875, 1.254638671875, 1.54052734375, 1.826416015625, 2.1123046875, 2.398193359375, 2.68408203125, 2.969970703125, 3.255859375, 3.541748046875, 3.82763671875, 4.113525390625, 4.3994140625, 4.685302734375, 4.97119140625, 5.257080078125, 5.54296875, 5.828857421875, 6.11474609375, 6.400634765625, 6.6865234375, 6.972412109375, 7.25830078125, 7.544189453125, 7.830078125, 8.115966796875, 8.40185546875, 8.687744140625, 8.9736328125, 9.259521484375, 9.54541015625, 9.831298828125, 10.1171875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 0.0, 10.0, 10.0, 7.0, 25.0, 12.0, 35.0, 60.0, 73.0, 126.0, 183.0, 261.0, 377.0, 589.0, 885.0, 1371.0, 2053.0, 3209.0, 4982.0, 7579.0, 11537.0, 18047.0, 28867.0, 45953.0, 75391.0, 139586.0, 281258.0, 184898.0, 92349.0, 54632.0, 33760.0, 21442.0, 13662.0, 8709.0, 5684.0, 3783.0, 2424.0, 1590.0, 1040.0, 693.0, 475.0, 298.0, 212.0, 122.0, 111.0, 62.0, 38.0, 30.0, 17.0, 14.0, 12.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0], "bins": [-0.376953125, -0.36576080322265625, -0.3545684814453125, -0.34337615966796875, -0.332183837890625, -0.32099151611328125, -0.3097991943359375, -0.29860687255859375, -0.28741455078125, -0.27622222900390625, -0.2650299072265625, -0.25383758544921875, -0.242645263671875, -0.23145294189453125, -0.2202606201171875, -0.20906829833984375, -0.1978759765625, -0.18668365478515625, -0.1754913330078125, -0.16429901123046875, -0.153106689453125, -0.14191436767578125, -0.1307220458984375, -0.11952972412109375, -0.10833740234375, -0.09714508056640625, -0.0859527587890625, -0.07476043701171875, -0.063568115234375, -0.05237579345703125, -0.0411834716796875, -0.02999114990234375, -0.018798828125, -0.00760650634765625, 0.0035858154296875, 0.01477813720703125, 0.025970458984375, 0.03716278076171875, 0.0483551025390625, 0.05954742431640625, 0.07073974609375, 0.08193206787109375, 0.0931243896484375, 0.10431671142578125, 0.115509033203125, 0.12670135498046875, 0.1378936767578125, 0.14908599853515625, 0.1602783203125, 0.17147064208984375, 0.1826629638671875, 0.19385528564453125, 0.205047607421875, 0.21623992919921875, 0.2274322509765625, 0.23862457275390625, 0.24981689453125, 0.26100921630859375, 0.2722015380859375, 0.28339385986328125, 0.294586181640625, 0.30577850341796875, 0.3169708251953125, 0.32816314697265625, 0.33935546875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 6.0, 1.0, 8.0, 5.0, 6.0, 7.0, 13.0, 12.0, 8.0, 13.0, 21.0, 9.0, 22.0, 28.0, 31.0, 25.0, 27.0, 24.0, 32.0, 29.0, 43.0, 30.0, 43.0, 32.0, 1049.0, 39.0, 37.0, 44.0, 36.0, 30.0, 33.0, 30.0, 34.0, 30.0, 27.0, 15.0, 22.0, 20.0, 14.0, 14.0, 17.0, 11.0, 13.0, 8.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0], "bins": [-6.43359375, -6.24078369140625, -6.0479736328125, -5.85516357421875, -5.662353515625, -5.46954345703125, -5.2767333984375, -5.08392333984375, -4.89111328125, -4.69830322265625, -4.5054931640625, -4.31268310546875, -4.119873046875, -3.92706298828125, -3.7342529296875, -3.54144287109375, -3.3486328125, -3.15582275390625, -2.9630126953125, -2.77020263671875, -2.577392578125, -2.38458251953125, -2.1917724609375, -1.99896240234375, -1.80615234375, -1.61334228515625, -1.4205322265625, -1.22772216796875, -1.034912109375, -0.84210205078125, -0.6492919921875, -0.45648193359375, -0.263671875, -0.07086181640625, 0.1219482421875, 0.31475830078125, 0.507568359375, 0.70037841796875, 0.8931884765625, 1.08599853515625, 1.27880859375, 1.47161865234375, 1.6644287109375, 1.85723876953125, 2.050048828125, 2.24285888671875, 2.4356689453125, 2.62847900390625, 2.8212890625, 3.01409912109375, 3.2069091796875, 3.39971923828125, 3.592529296875, 3.78533935546875, 3.9781494140625, 4.17095947265625, 4.36376953125, 4.55657958984375, 4.7493896484375, 4.94219970703125, 5.135009765625, 5.32781982421875, 5.5206298828125, 5.71343994140625, 5.90625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 12.0, 9.0, 14.0, 33.0, 45.0, 69.0, 115.0, 185.0, 298.0, 404.0, 651.0, 1028.0, 1575.0, 2378.0, 3702.0, 5887.0, 9381.0, 15122.0, 24297.0, 40727.0, 71490.0, 140912.0, 1331946.0, 211261.0, 98835.0, 53627.0, 31712.0, 18952.0, 11906.0, 7448.0, 4704.0, 2962.0, 1919.0, 1258.0, 776.0, 520.0, 330.0, 257.0, 137.0, 91.0, 63.0, 30.0, 26.0, 10.0, 7.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.23486328125, -0.22746658325195312, -0.22006988525390625, -0.21267318725585938, -0.2052764892578125, -0.19787979125976562, -0.19048309326171875, -0.18308639526367188, -0.175689697265625, -0.16829299926757812, -0.16089630126953125, -0.15349960327148438, -0.1461029052734375, -0.13870620727539062, -0.13130950927734375, -0.12391281127929688, -0.11651611328125, -0.10911941528320312, -0.10172271728515625, -0.09432601928710938, -0.0869293212890625, -0.07953262329101562, -0.07213592529296875, -0.06473922729492188, -0.057342529296875, -0.049945831298828125, -0.04254913330078125, -0.035152435302734375, -0.0277557373046875, -0.020359039306640625, -0.01296234130859375, -0.005565643310546875, 0.0018310546875, 0.009227752685546875, 0.01662445068359375, 0.024021148681640625, 0.0314178466796875, 0.038814544677734375, 0.04621124267578125, 0.053607940673828125, 0.061004638671875, 0.06840133666992188, 0.07579803466796875, 0.08319473266601562, 0.0905914306640625, 0.09798812866210938, 0.10538482666015625, 0.11278152465820312, 0.12017822265625, 0.12757492065429688, 0.13497161865234375, 0.14236831665039062, 0.1497650146484375, 0.15716171264648438, 0.16455841064453125, 0.17195510864257812, 0.179351806640625, 0.18674850463867188, 0.19414520263671875, 0.20154190063476562, 0.2089385986328125, 0.21633529663085938, 0.22373199462890625, 0.23112869262695312, 0.238525390625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 10.0, 4.0, 6.0, 11.0, 12.0, 11.0, 14.0, 19.0, 22.0, 21.0, 30.0, 32.0, 46.0, 49.0, 45.0, 32.0, 49.0, 48.0, 51.0, 47.0, 44.0, 35.0, 44.0, 41.0, 38.0, 41.0, 30.0, 28.0, 23.0, 24.0, 18.0, 15.0, 12.0, 7.0, 7.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00017964839935302734, -0.00017410330474376678, -0.00016855821013450623, -0.00016301311552524567, -0.0001574680209159851, -0.00015192292630672455, -0.000146377831697464, -0.00014083273708820343, -0.00013528764247894287, -0.0001297425478696823, -0.00012419745326042175, -0.0001186523586511612, -0.00011310726404190063, -0.00010756216943264008, -0.00010201707482337952, -9.647198021411896e-05, -9.09268856048584e-05, -8.538179099559784e-05, -7.983669638633728e-05, -7.429160177707672e-05, -6.874650716781616e-05, -6.32014125585556e-05, -5.7656317949295044e-05, -5.2111223340034485e-05, -4.6566128730773926e-05, -4.102103412151337e-05, -3.547593951225281e-05, -2.993084490299225e-05, -2.438575029373169e-05, -1.884065568447113e-05, -1.3295561075210571e-05, -7.750466465950012e-06, -2.205371856689453e-06, 3.339722752571106e-06, 8.884817361831665e-06, 1.4429911971092224e-05, 1.9975006580352783e-05, 2.5520101189613342e-05, 3.10651957988739e-05, 3.661029040813446e-05, 4.215538501739502e-05, 4.770047962665558e-05, 5.324557423591614e-05, 5.87906688451767e-05, 6.433576345443726e-05, 6.988085806369781e-05, 7.542595267295837e-05, 8.097104728221893e-05, 8.651614189147949e-05, 9.206123650074005e-05, 9.760633111000061e-05, 0.00010315142571926117, 0.00010869652032852173, 0.00011424161493778229, 0.00011978670954704285, 0.0001253318041563034, 0.00013087689876556396, 0.00013642199337482452, 0.00014196708798408508, 0.00014751218259334564, 0.0001530572772026062, 0.00015860237181186676, 0.00016414746642112732, 0.00016969256103038788, 0.00017523765563964844]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 4.0, 5.0, 3.0, 6.0, 9.0, 7.0, 5.0, 16.0, 15.0, 15.0, 25.0, 43.0, 44.0, 66.0, 63.0, 87.0, 120.0, 178.0, 204.0, 407.0, 779.0, 4518.0, 409969.0, 623287.0, 6450.0, 908.0, 383.0, 242.0, 183.0, 129.0, 87.0, 51.0, 50.0, 40.0, 33.0, 36.0, 17.0, 23.0, 12.0, 8.0, 4.0, 7.0, 3.0, 9.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0027618408203125, -0.0026668012142181396, -0.0025717616081237793, -0.002476722002029419, -0.0023816823959350586, -0.0022866427898406982, -0.002191603183746338, -0.0020965635776519775, -0.002001523971557617, -0.0019064843654632568, -0.0018114447593688965, -0.0017164051532745361, -0.0016213655471801758, -0.0015263259410858154, -0.001431286334991455, -0.0013362467288970947, -0.0012412071228027344, -0.001146167516708374, -0.0010511279106140137, -0.0009560883045196533, -0.000861048698425293, -0.0007660090923309326, -0.0006709694862365723, -0.0005759298801422119, -0.00048089027404785156, -0.0003858506679534912, -0.00029081106185913086, -0.0001957714557647705, -0.00010073184967041016, -5.692243576049805e-06, 8.934736251831055e-05, 0.0001843869686126709, 0.00027942657470703125, 0.0003744661808013916, 0.00046950578689575195, 0.0005645453929901123, 0.0006595849990844727, 0.000754624605178833, 0.0008496642112731934, 0.0009447038173675537, 0.001039743423461914, 0.0011347830295562744, 0.0012298226356506348, 0.0013248622417449951, 0.0014199018478393555, 0.0015149414539337158, 0.0016099810600280762, 0.0017050206661224365, 0.0018000602722167969, 0.0018950998783111572, 0.0019901394844055176, 0.002085179090499878, 0.0021802186965942383, 0.0022752583026885986, 0.002370297908782959, 0.0024653375148773193, 0.0025603771209716797, 0.00265541672706604, 0.0027504563331604004, 0.0028454959392547607, 0.002940535545349121, 0.0030355751514434814, 0.003130614757537842, 0.003225654363632202, 0.0033206939697265625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 33.0, 291.0, 538.0, 134.0, 13.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004836737643927336, -0.00044425265514291823, -0.0004048315458931029, -0.000365410465747118, -0.00032598935649730265, -0.0002865682472474873, -0.0002471471671015024, -0.00020772605785168707, -0.00016830494860187173, -0.00012888383935205638, -8.946274465415627e-05, -5.004164268029854e-05, -1.0620540706440806e-05, 2.880056854337454e-05, 6.822166324127465e-05, 0.00010764275793917477, 0.00014706386718899012, 0.00018648497643880546, 0.00022590607113670558, 0.0002653271658346057, 0.00030474827508442104, 0.0003441693843342364, 0.00038359046448022127, 0.0004230115737300366, 0.00046243268297985196, 0.0005018537631258368, 0.0005412749014794827, 0.0005806959816254675, 0.0006201170617714524, 0.0006595382001250982, 0.0006989592802710831, 0.000738380360417068, 0.0007778014987707138, 0.0008172225789166987, 0.0008566437172703445, 0.0008960647974163294, 0.0009354859357699752, 0.0009749070159159601, 0.001014328096061945, 0.0010537492344155908, 0.0010931703727692366, 0.0011325915111228824, 0.0011720125330612063, 0.0012114336714148521, 0.001250854809768498, 0.0012902759481221437, 0.0013296969700604677, 0.0013691181084141135, 0.0014085391303524375, 0.0014479602687060833, 0.0014873812906444073, 0.001526802428998053, 0.0015662235673516989, 0.0016056445892900229, 0.0016450657276436687, 0.0016844868659973145, 0.0017239078879356384, 0.0017633290262892842, 0.0018027500482276082, 0.001842171186581254, 0.0018815923249348998, 0.0019210134632885456, 0.0019604344852268696, 0.0019998555071651936, 0.002039276761934161]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 5.0, 3.0, 4.0, 9.0, 8.0, 10.0, 10.0, 18.0, 16.0, 13.0, 32.0, 38.0, 29.0, 45.0, 47.0, 56.0, 32.0, 52.0, 53.0, 50.0, 36.0, 47.0, 53.0, 52.0, 49.0, 45.0, 28.0, 40.0, 24.0, 16.0, 16.0, 20.0, 13.0, 13.0, 6.0, 5.0, 7.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013780593872070312, -0.0001315521076321602, -0.00012529827654361725, -0.00011904444545507431, -0.00011279061436653137, -0.00010653678327798843, -0.0001002829521894455, -9.402912110090256e-05, -8.777529001235962e-05, -8.152145892381668e-05, -7.526762783527374e-05, -6.90137967467308e-05, -6.275996565818787e-05, -5.650613456964493e-05, -5.025230348110199e-05, -4.399847239255905e-05, -3.774464130401611e-05, -3.1490810215473175e-05, -2.5236979126930237e-05, -1.89831480383873e-05, -1.272931694984436e-05, -6.475485861301422e-06, -2.2165477275848389e-07, 6.032176315784454e-06, 1.2286007404327393e-05, 1.853983849287033e-05, 2.479366958141327e-05, 3.104750066995621e-05, 3.7301331758499146e-05, 4.3555162847042084e-05, 4.980899393558502e-05, 5.606282502412796e-05, 6.23166561126709e-05, 6.857048720121384e-05, 7.482431828975677e-05, 8.107814937829971e-05, 8.733198046684265e-05, 9.358581155538559e-05, 9.983964264392853e-05, 0.00010609347373247147, 0.0001123473048210144, 0.00011860113590955734, 0.00012485496699810028, 0.00013110879808664322, 0.00013736262917518616, 0.0001436164602637291, 0.00014987029135227203, 0.00015612412244081497, 0.0001623779535293579, 0.00016863178461790085, 0.0001748856157064438, 0.00018113944679498672, 0.00018739327788352966, 0.0001936471089720726, 0.00019990094006061554, 0.00020615477114915848, 0.00021240860223770142, 0.00021866243332624435, 0.0002249162644147873, 0.00023117009550333023, 0.00023742392659187317, 0.0002436777576804161, 0.00024993158876895905, 0.000256185419857502, 0.0002624392509460449]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 5.0, 10.0, 12.0, 9.0, 22.0, 19.0, 19.0, 14.0, 25.0, 35.0, 34.0, 31.0, 27.0, 39.0, 33.0, 38.0, 45.0, 35.0, 39.0, 43.0, 43.0, 43.0, 43.0, 49.0, 42.0, 23.0, 28.0, 36.0, 24.0, 25.0, 22.0, 21.0, 8.0, 16.0, 3.0, 11.0, 6.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1796875, -7.893798828125, -7.60791015625, -7.322021484375, -7.0361328125, -6.750244140625, -6.46435546875, -6.178466796875, -5.892578125, -5.606689453125, -5.32080078125, -5.034912109375, -4.7490234375, -4.463134765625, -4.17724609375, -3.891357421875, -3.60546875, -3.319580078125, -3.03369140625, -2.747802734375, -2.4619140625, -2.176025390625, -1.89013671875, -1.604248046875, -1.318359375, -1.032470703125, -0.74658203125, -0.460693359375, -0.1748046875, 0.111083984375, 0.39697265625, 0.682861328125, 0.96875, 1.254638671875, 1.54052734375, 1.826416015625, 2.1123046875, 2.398193359375, 2.68408203125, 2.969970703125, 3.255859375, 3.541748046875, 3.82763671875, 4.113525390625, 4.3994140625, 4.685302734375, 4.97119140625, 5.257080078125, 5.54296875, 5.828857421875, 6.11474609375, 6.400634765625, 6.6865234375, 6.972412109375, 7.25830078125, 7.544189453125, 7.830078125, 8.115966796875, 8.40185546875, 8.687744140625, 8.9736328125, 9.259521484375, 9.54541015625, 9.831298828125, 10.1171875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 4.0, 9.0, 12.0, 14.0, 32.0, 34.0, 61.0, 75.0, 133.0, 184.0, 291.0, 382.0, 609.0, 902.0, 1459.0, 2154.0, 3440.0, 5791.0, 9540.0, 17295.0, 34955.0, 75477.0, 169334.0, 312366.0, 218262.0, 99314.0, 44848.0, 21780.0, 11795.0, 6748.0, 4025.0, 2467.0, 1622.0, 1031.0, 698.0, 446.0, 324.0, 212.0, 162.0, 95.0, 57.0, 40.0, 28.0, 17.0, 12.0, 9.0, 5.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1328125, -7.8388671875, -7.544921875, -7.2509765625, -6.95703125, -6.6630859375, -6.369140625, -6.0751953125, -5.78125, -5.4873046875, -5.193359375, -4.8994140625, -4.60546875, -4.3115234375, -4.017578125, -3.7236328125, -3.4296875, -3.1357421875, -2.841796875, -2.5478515625, -2.25390625, -1.9599609375, -1.666015625, -1.3720703125, -1.078125, -0.7841796875, -0.490234375, -0.1962890625, 0.09765625, 0.3916015625, 0.685546875, 0.9794921875, 1.2734375, 1.5673828125, 1.861328125, 2.1552734375, 2.44921875, 2.7431640625, 3.037109375, 3.3310546875, 3.625, 3.9189453125, 4.212890625, 4.5068359375, 4.80078125, 5.0947265625, 5.388671875, 5.6826171875, 5.9765625, 6.2705078125, 6.564453125, 6.8583984375, 7.15234375, 7.4462890625, 7.740234375, 8.0341796875, 8.328125, 8.6220703125, 8.916015625, 9.2099609375, 9.50390625, 9.7978515625, 10.091796875, 10.3857421875, 10.6796875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 5.0, 4.0, 7.0, 5.0, 7.0, 10.0, 7.0, 9.0, 14.0, 18.0, 18.0, 24.0, 20.0, 30.0, 31.0, 39.0, 49.0, 63.0, 85.0, 113.0, 241.0, 1474.0, 225.0, 116.0, 78.0, 64.0, 51.0, 36.0, 32.0, 31.0, 35.0, 25.0, 13.0, 15.0, 4.0, 8.0, 6.0, 3.0, 11.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.453125, -25.556884765625, -24.66064453125, -23.764404296875, -22.8681640625, -21.971923828125, -21.07568359375, -20.179443359375, -19.283203125, -18.386962890625, -17.49072265625, -16.594482421875, -15.6982421875, -14.802001953125, -13.90576171875, -13.009521484375, -12.11328125, -11.217041015625, -10.32080078125, -9.424560546875, -8.5283203125, -7.632080078125, -6.73583984375, -5.839599609375, -4.943359375, -4.047119140625, -3.15087890625, -2.254638671875, -1.3583984375, -0.462158203125, 0.43408203125, 1.330322265625, 2.2265625, 3.122802734375, 4.01904296875, 4.915283203125, 5.8115234375, 6.707763671875, 7.60400390625, 8.500244140625, 9.396484375, 10.292724609375, 11.18896484375, 12.085205078125, 12.9814453125, 13.877685546875, 14.77392578125, 15.670166015625, 16.56640625, 17.462646484375, 18.35888671875, 19.255126953125, 20.1513671875, 21.047607421875, 21.94384765625, 22.840087890625, 23.736328125, 24.632568359375, 25.52880859375, 26.425048828125, 27.3212890625, 28.217529296875, 29.11376953125, 30.010009765625, 30.90625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 0.0, 4.0, 8.0, 6.0, 10.0, 6.0, 12.0, 17.0, 28.0, 37.0, 46.0, 61.0, 95.0, 136.0, 243.0, 396.0, 1001.0, 7591.0, 2800823.0, 329780.0, 3591.0, 747.0, 340.0, 222.0, 141.0, 84.0, 72.0, 41.0, 31.0, 24.0, 26.0, 14.0, 16.0, 10.0, 9.0, 11.0, 5.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-64.8125, -62.84033203125, -60.8681640625, -58.89599609375, -56.923828125, -54.95166015625, -52.9794921875, -51.00732421875, -49.03515625, -47.06298828125, -45.0908203125, -43.11865234375, -41.146484375, -39.17431640625, -37.2021484375, -35.22998046875, -33.2578125, -31.28564453125, -29.3134765625, -27.34130859375, -25.369140625, -23.39697265625, -21.4248046875, -19.45263671875, -17.48046875, -15.50830078125, -13.5361328125, -11.56396484375, -9.591796875, -7.61962890625, -5.6474609375, -3.67529296875, -1.703125, 0.26904296875, 2.2412109375, 4.21337890625, 6.185546875, 8.15771484375, 10.1298828125, 12.10205078125, 14.07421875, 16.04638671875, 18.0185546875, 19.99072265625, 21.962890625, 23.93505859375, 25.9072265625, 27.87939453125, 29.8515625, 31.82373046875, 33.7958984375, 35.76806640625, 37.740234375, 39.71240234375, 41.6845703125, 43.65673828125, 45.62890625, 47.60107421875, 49.5732421875, 51.54541015625, 53.517578125, 55.48974609375, 57.4619140625, 59.43408203125, 61.40625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 22.0, 215.0, 513.0, 222.0, 33.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.35731506347656, -183.7769317626953, -175.19656372070312, -166.61618041992188, -158.03579711914062, -149.45541381835938, -140.8750457763672, -132.29466247558594, -123.71428680419922, -115.1339111328125, -106.55352783203125, -97.97315216064453, -89.39277648925781, -80.81239318847656, -72.23201751708984, -63.65163803100586, -55.071258544921875, -46.49087905883789, -37.910499572753906, -29.330123901367188, -20.749744415283203, -12.169364929199219, -3.5889892578125, 4.991390228271484, 13.571769714355469, 22.152149200439453, 30.732526779174805, 39.312904357910156, 47.89328384399414, 56.473663330078125, 65.05403900146484, 73.63441467285156, 82.21481323242188, 90.7951889038086, 99.37557220458984, 107.95594787597656, 116.53633117675781, 125.11670684814453, 133.69708251953125, 142.2774658203125, 150.85784912109375, 159.438232421875, 168.0186004638672, 176.59898376464844, 185.1793670654297, 193.75973510742188, 202.34011840820312, 210.92050170898438, 219.50086975097656, 228.0812530517578, 236.66162109375, 245.24200439453125, 253.8223876953125, 262.40277099609375, 270.983154296875, 279.5635070800781, 288.1438903808594, 296.7242736816406, 305.3046569824219, 313.885009765625, 322.46539306640625, 331.0457763671875, 339.62615966796875, 348.20654296875, 356.78692626953125]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 9.0, 8.0, 12.0, 21.0, 23.0, 24.0, 29.0, 28.0, 34.0, 34.0, 30.0, 38.0, 42.0, 47.0, 42.0, 42.0, 44.0, 31.0, 46.0, 45.0, 45.0, 43.0, 50.0, 34.0, 33.0, 26.0, 24.0, 24.0, 13.0, 15.0, 11.0, 13.0, 9.0, 9.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.67426300048828, -97.41069030761719, -94.14712524414062, -90.88355255126953, -87.61997985839844, -84.35641479492188, -81.09284210205078, -77.82926940917969, -74.56570434570312, -71.30213165283203, -68.03856658935547, -64.77499389648438, -61.51142501831055, -58.24785614013672, -54.984283447265625, -51.7207145690918, -48.45714569091797, -45.19357681274414, -41.93000793457031, -38.66643524169922, -35.40286636352539, -32.13929748535156, -28.8757266998291, -25.61215591430664, -22.348587036132812, -19.085018157958984, -15.821447372436523, -12.557877540588379, -9.294307708740234, -6.030738830566406, -2.7671680450439453, 0.4964027404785156, 3.7599639892578125, 7.023533821105957, 10.287103652954102, 13.550673484802246, 16.81424331665039, 20.07781219482422, 23.34138298034668, 26.60495376586914, 29.86852264404297, 33.1320915222168, 36.395660400390625, 39.65923309326172, 42.92280197143555, 46.186370849609375, 49.44994354248047, 52.7135124206543, 55.977081298828125, 59.24065017700195, 62.50421905517578, 65.76779174804688, 69.03135681152344, 72.29492950439453, 75.55850219726562, 78.82206726074219, 82.08563995361328, 85.34921264648438, 88.61277770996094, 91.87635040283203, 95.13992309570312, 98.40348815917969, 101.66706085205078, 104.93063354492188, 108.19419860839844]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 8.0, 7.0, 11.0, 19.0, 16.0, 21.0, 21.0, 22.0, 24.0, 23.0, 22.0, 31.0, 29.0, 36.0, 40.0, 39.0, 46.0, 38.0, 37.0, 39.0, 51.0, 52.0, 28.0, 36.0, 36.0, 43.0, 32.0, 29.0, 29.0, 26.0, 16.0, 15.0, 17.0, 10.0, 10.0, 13.0, 8.0, 9.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.0859375, -8.7813720703125, -8.476806640625, -8.1722412109375, -7.86767578125, -7.5631103515625, -7.258544921875, -6.9539794921875, -6.6494140625, -6.3448486328125, -6.040283203125, -5.7357177734375, -5.43115234375, -5.1265869140625, -4.822021484375, -4.5174560546875, -4.212890625, -3.9083251953125, -3.603759765625, -3.2991943359375, -2.99462890625, -2.6900634765625, -2.385498046875, -2.0809326171875, -1.7763671875, -1.4718017578125, -1.167236328125, -0.8626708984375, -0.55810546875, -0.2535400390625, 0.051025390625, 0.3555908203125, 0.66015625, 0.9647216796875, 1.269287109375, 1.5738525390625, 1.87841796875, 2.1829833984375, 2.487548828125, 2.7921142578125, 3.0966796875, 3.4012451171875, 3.705810546875, 4.0103759765625, 4.31494140625, 4.6195068359375, 4.924072265625, 5.2286376953125, 5.533203125, 5.8377685546875, 6.142333984375, 6.4468994140625, 6.75146484375, 7.0560302734375, 7.360595703125, 7.6651611328125, 7.9697265625, 8.2742919921875, 8.578857421875, 8.8834228515625, 9.18798828125, 9.4925537109375, 9.797119140625, 10.1016845703125, 10.40625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 11.0, 9.0, 12.0, 12.0, 15.0, 22.0, 43.0, 42.0, 63.0, 90.0, 125.0, 171.0, 224.0, 285.0, 400.0, 617.0, 1011.0, 2037.0, 6059.0, 30640.0, 272736.0, 3397397.0, 429825.0, 39615.0, 7240.0, 2253.0, 1086.0, 627.0, 464.0, 324.0, 224.0, 159.0, 112.0, 90.0, 62.0, 53.0, 43.0, 22.0, 18.0, 10.0, 8.0, 5.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-53.375, -51.62939453125, -49.8837890625, -48.13818359375, -46.392578125, -44.64697265625, -42.9013671875, -41.15576171875, -39.41015625, -37.66455078125, -35.9189453125, -34.17333984375, -32.427734375, -30.68212890625, -28.9365234375, -27.19091796875, -25.4453125, -23.69970703125, -21.9541015625, -20.20849609375, -18.462890625, -16.71728515625, -14.9716796875, -13.22607421875, -11.48046875, -9.73486328125, -7.9892578125, -6.24365234375, -4.498046875, -2.75244140625, -1.0068359375, 0.73876953125, 2.484375, 4.22998046875, 5.9755859375, 7.72119140625, 9.466796875, 11.21240234375, 12.9580078125, 14.70361328125, 16.44921875, 18.19482421875, 19.9404296875, 21.68603515625, 23.431640625, 25.17724609375, 26.9228515625, 28.66845703125, 30.4140625, 32.15966796875, 33.9052734375, 35.65087890625, 37.396484375, 39.14208984375, 40.8876953125, 42.63330078125, 44.37890625, 46.12451171875, 47.8701171875, 49.61572265625, 51.361328125, 53.10693359375, 54.8525390625, 56.59814453125, 58.34375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 4.0, 7.0, 8.0, 10.0, 18.0, 25.0, 39.0, 44.0, 56.0, 74.0, 105.0, 171.0, 211.0, 276.0, 387.0, 518.0, 562.0, 456.0, 293.0, 225.0, 158.0, 103.0, 76.0, 70.0, 45.0, 29.0, 24.0, 16.0, 12.0, 9.0, 3.0, 4.0, 6.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-28.078125, -27.36181640625, -26.6455078125, -25.92919921875, -25.212890625, -24.49658203125, -23.7802734375, -23.06396484375, -22.34765625, -21.63134765625, -20.9150390625, -20.19873046875, -19.482421875, -18.76611328125, -18.0498046875, -17.33349609375, -16.6171875, -15.90087890625, -15.1845703125, -14.46826171875, -13.751953125, -13.03564453125, -12.3193359375, -11.60302734375, -10.88671875, -10.17041015625, -9.4541015625, -8.73779296875, -8.021484375, -7.30517578125, -6.5888671875, -5.87255859375, -5.15625, -4.43994140625, -3.7236328125, -3.00732421875, -2.291015625, -1.57470703125, -0.8583984375, -0.14208984375, 0.57421875, 1.29052734375, 2.0068359375, 2.72314453125, 3.439453125, 4.15576171875, 4.8720703125, 5.58837890625, 6.3046875, 7.02099609375, 7.7373046875, 8.45361328125, 9.169921875, 9.88623046875, 10.6025390625, 11.31884765625, 12.03515625, 12.75146484375, 13.4677734375, 14.18408203125, 14.900390625, 15.61669921875, 16.3330078125, 17.04931640625, 17.765625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 12.0, 7.0, 10.0, 17.0, 17.0, 24.0, 41.0, 59.0, 83.0, 125.0, 194.0, 277.0, 476.0, 831.0, 1662.0, 3739.0, 10385.0, 35417.0, 155216.0, 965970.0, 2550630.0, 365915.0, 72655.0, 18931.0, 6195.0, 2539.0, 1155.0, 609.0, 367.0, 212.0, 183.0, 109.0, 56.0, 49.0, 32.0, 24.0, 14.0, 9.0, 12.0, 13.0, 6.0, 3.0, 3.0, 3.0, 2.0], "bins": [-37.03125, -36.087890625, -35.14453125, -34.201171875, -33.2578125, -32.314453125, -31.37109375, -30.427734375, -29.484375, -28.541015625, -27.59765625, -26.654296875, -25.7109375, -24.767578125, -23.82421875, -22.880859375, -21.9375, -20.994140625, -20.05078125, -19.107421875, -18.1640625, -17.220703125, -16.27734375, -15.333984375, -14.390625, -13.447265625, -12.50390625, -11.560546875, -10.6171875, -9.673828125, -8.73046875, -7.787109375, -6.84375, -5.900390625, -4.95703125, -4.013671875, -3.0703125, -2.126953125, -1.18359375, -0.240234375, 0.703125, 1.646484375, 2.58984375, 3.533203125, 4.4765625, 5.419921875, 6.36328125, 7.306640625, 8.25, 9.193359375, 10.13671875, 11.080078125, 12.0234375, 12.966796875, 13.91015625, 14.853515625, 15.796875, 16.740234375, 17.68359375, 18.626953125, 19.5703125, 20.513671875, 21.45703125, 22.400390625, 23.34375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 11.0, 10.0, 17.0, 19.0, 30.0, 33.0, 46.0, 53.0, 70.0, 60.0, 72.0, 97.0, 89.0, 80.0, 54.0, 55.0, 46.0, 33.0, 27.0, 23.0, 18.0, 12.0, 14.0, 6.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.49395751953125, -116.76133728027344, -111.0287094116211, -105.29608154296875, -99.56346130371094, -93.83084106445312, -88.09821319580078, -82.36558532714844, -76.63296508789062, -70.90034484863281, -65.16771697998047, -59.43509292602539, -53.70246887207031, -47.969844818115234, -42.237220764160156, -36.50459671020508, -30.77197265625, -25.039348602294922, -19.306724548339844, -13.574100494384766, -7.8414764404296875, -2.1088523864746094, 3.6237716674804688, 9.356395721435547, 15.089019775390625, 20.821643829345703, 26.55426788330078, 32.28689193725586, 38.01951599121094, 43.752140045166016, 49.484764099121094, 55.21738815307617, 60.95002746582031, 66.68264770507812, 72.41527557373047, 78.14790344238281, 83.88052368164062, 89.61314392089844, 95.34577178955078, 101.07839965820312, 106.81101989746094, 112.54364013671875, 118.2762680053711, 124.00889587402344, 129.74151611328125, 135.47413635253906, 141.20675659179688, 146.93939208984375, 152.67201232910156, 158.40463256835938, 164.13726806640625, 169.86988830566406, 175.60250854492188, 181.3351287841797, 187.0677490234375, 192.80038452148438, 198.5330047607422, 204.265625, 209.99826049804688, 215.7308807373047, 221.4635009765625, 227.1961212158203, 232.92874145507812, 238.661376953125, 244.3939971923828]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 10.0, 5.0, 12.0, 9.0, 8.0, 22.0, 10.0, 27.0, 16.0, 18.0, 36.0, 27.0, 25.0, 46.0, 41.0, 41.0, 55.0, 51.0, 38.0, 45.0, 54.0, 42.0, 37.0, 47.0, 34.0, 29.0, 35.0, 17.0, 29.0, 26.0, 19.0, 28.0, 13.0, 15.0, 8.0, 5.0, 3.0, 8.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.17784118652344, -100.6960220336914, -97.21420288085938, -93.73239135742188, -90.25057220458984, -86.76875305175781, -83.28693389892578, -79.80511474609375, -76.32330322265625, -72.84148406982422, -69.35966491699219, -65.87785339355469, -62.396034240722656, -58.914215087890625, -55.432395935058594, -51.95057678222656, -48.46875762939453, -44.9869384765625, -41.505123138427734, -38.0233039855957, -34.54148864746094, -31.059669494628906, -27.577850341796875, -24.096033096313477, -20.614215850830078, -17.13239860534668, -13.650580406188965, -10.16876220703125, -6.686944961547852, -3.205127716064453, 0.2766914367675781, 3.7585086822509766, 7.240325927734375, 10.722143173217773, 14.203961372375488, 17.685779571533203, 21.1675968170166, 24.6494140625, 28.13123321533203, 31.61305046081543, 35.09486770629883, 38.57668685913086, 42.058502197265625, 45.540321350097656, 49.02214050292969, 52.50395584106445, 55.985774993896484, 59.46759033203125, 62.94940948486328, 66.43122863769531, 69.91304779052734, 73.39486694335938, 76.87667846679688, 80.3584976196289, 83.84031677246094, 87.32213592529297, 90.803955078125, 94.28577423095703, 97.76759338378906, 101.24940490722656, 104.7312240600586, 108.21304321289062, 111.69486236572266, 115.17668151855469, 118.65849304199219]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 8.0, 2.0, 9.0, 3.0, 17.0, 13.0, 18.0, 21.0, 17.0, 26.0, 32.0, 32.0, 37.0, 41.0, 57.0, 53.0, 61.0, 47.0, 59.0, 49.0, 42.0, 43.0, 47.0, 35.0, 30.0, 32.0, 32.0, 24.0, 27.0, 19.0, 12.0, 17.0, 10.0, 8.0, 6.0, 7.0, 8.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.75, -204.296875, -196.84375, -189.390625, -181.9375, -174.484375, -167.03125, -159.578125, -152.125, -144.671875, -137.21875, -129.765625, -122.3125, -114.859375, -107.40625, -99.953125, -92.5, -85.046875, -77.59375, -70.140625, -62.6875, -55.234375, -47.78125, -40.328125, -32.875, -25.421875, -17.96875, -10.515625, -3.0625, 4.390625, 11.84375, 19.296875, 26.75, 34.203125, 41.65625, 49.109375, 56.5625, 64.015625, 71.46875, 78.921875, 86.375, 93.828125, 101.28125, 108.734375, 116.1875, 123.640625, 131.09375, 138.546875, 146.0, 153.453125, 160.90625, 168.359375, 175.8125, 183.265625, 190.71875, 198.171875, 205.625, 213.078125, 220.53125, 227.984375, 235.4375, 242.890625, 250.34375, 257.796875, 265.25]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 8.0, 15.0, 26.0, 32.0, 45.0, 71.0, 119.0, 151.0, 266.0, 454.0, 779.0, 1299.0, 2286.0, 4155.0, 7429.0, 13640.0, 26047.0, 51268.0, 112586.0, 329305.0, 294046.0, 103305.0, 47945.0, 24339.0, 12815.0, 7012.0, 3914.0, 2162.0, 1199.0, 708.0, 400.0, 284.0, 147.0, 107.0, 68.0, 39.0, 28.0, 18.0, 13.0, 5.0, 6.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.1640625, -13.7587890625, -13.353515625, -12.9482421875, -12.54296875, -12.1376953125, -11.732421875, -11.3271484375, -10.921875, -10.5166015625, -10.111328125, -9.7060546875, -9.30078125, -8.8955078125, -8.490234375, -8.0849609375, -7.6796875, -7.2744140625, -6.869140625, -6.4638671875, -6.05859375, -5.6533203125, -5.248046875, -4.8427734375, -4.4375, -4.0322265625, -3.626953125, -3.2216796875, -2.81640625, -2.4111328125, -2.005859375, -1.6005859375, -1.1953125, -0.7900390625, -0.384765625, 0.0205078125, 0.42578125, 0.8310546875, 1.236328125, 1.6416015625, 2.046875, 2.4521484375, 2.857421875, 3.2626953125, 3.66796875, 4.0732421875, 4.478515625, 4.8837890625, 5.2890625, 5.6943359375, 6.099609375, 6.5048828125, 6.91015625, 7.3154296875, 7.720703125, 8.1259765625, 8.53125, 8.9365234375, 9.341796875, 9.7470703125, 10.15234375, 10.5576171875, 10.962890625, 11.3681640625, 11.7734375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 6.0, 10.0, 7.0, 13.0, 7.0, 15.0, 19.0, 27.0, 22.0, 27.0, 26.0, 29.0, 37.0, 27.0, 33.0, 32.0, 41.0, 30.0, 40.0, 1059.0, 42.0, 38.0, 42.0, 43.0, 38.0, 36.0, 33.0, 39.0, 28.0, 23.0, 30.0, 13.0, 12.0, 15.0, 10.0, 13.0, 16.0, 10.0, 6.0, 7.0, 4.0, 7.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-164.25, -159.10546875, -153.9609375, -148.81640625, -143.671875, -138.52734375, -133.3828125, -128.23828125, -123.09375, -117.94921875, -112.8046875, -107.66015625, -102.515625, -97.37109375, -92.2265625, -87.08203125, -81.9375, -76.79296875, -71.6484375, -66.50390625, -61.359375, -56.21484375, -51.0703125, -45.92578125, -40.78125, -35.63671875, -30.4921875, -25.34765625, -20.203125, -15.05859375, -9.9140625, -4.76953125, 0.375, 5.51953125, 10.6640625, 15.80859375, 20.953125, 26.09765625, 31.2421875, 36.38671875, 41.53125, 46.67578125, 51.8203125, 56.96484375, 62.109375, 67.25390625, 72.3984375, 77.54296875, 82.6875, 87.83203125, 92.9765625, 98.12109375, 103.265625, 108.41015625, 113.5546875, 118.69921875, 123.84375, 128.98828125, 134.1328125, 139.27734375, 144.421875, 149.56640625, 154.7109375, 159.85546875, 165.0]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 3.0, 6.0, 12.0, 19.0, 30.0, 49.0, 62.0, 93.0, 156.0, 228.0, 349.0, 529.0, 870.0, 1288.0, 1995.0, 3080.0, 4808.0, 7543.0, 12568.0, 20088.0, 32865.0, 56048.0, 103534.0, 224629.0, 1326988.0, 130616.0, 67601.0, 38658.0, 23343.0, 14408.0, 8887.0, 5682.0, 3643.0, 2303.0, 1435.0, 950.0, 621.0, 406.0, 240.0, 159.0, 115.0, 81.0, 48.0, 43.0, 23.0, 7.0, 13.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.79296875, -5.61285400390625, -5.4327392578125, -5.25262451171875, -5.072509765625, -4.89239501953125, -4.7122802734375, -4.53216552734375, -4.35205078125, -4.17193603515625, -3.9918212890625, -3.81170654296875, -3.631591796875, -3.45147705078125, -3.2713623046875, -3.09124755859375, -2.9111328125, -2.73101806640625, -2.5509033203125, -2.37078857421875, -2.190673828125, -2.01055908203125, -1.8304443359375, -1.65032958984375, -1.47021484375, -1.29010009765625, -1.1099853515625, -0.92987060546875, -0.749755859375, -0.56964111328125, -0.3895263671875, -0.20941162109375, -0.029296875, 0.15081787109375, 0.3309326171875, 0.51104736328125, 0.691162109375, 0.87127685546875, 1.0513916015625, 1.23150634765625, 1.41162109375, 1.59173583984375, 1.7718505859375, 1.95196533203125, 2.132080078125, 2.31219482421875, 2.4923095703125, 2.67242431640625, 2.8525390625, 3.03265380859375, 3.2127685546875, 3.39288330078125, 3.572998046875, 3.75311279296875, 3.9332275390625, 4.11334228515625, 4.29345703125, 4.47357177734375, 4.6536865234375, 4.83380126953125, 5.013916015625, 5.19403076171875, 5.3741455078125, 5.55426025390625, 5.734375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 11.0, 12.0, 12.0, 23.0, 23.0, 20.0, 30.0, 41.0, 47.0, 63.0, 55.0, 65.0, 55.0, 66.0, 66.0, 73.0, 54.0, 44.0, 39.0, 34.0, 32.0, 37.0, 20.0, 20.0, 14.0, 8.0, 8.0, 9.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004856109619140625, -0.004707217216491699, -0.0045583248138427734, -0.004409432411193848, -0.004260540008544922, -0.004111647605895996, -0.00396275520324707, -0.0038138628005981445, -0.0036649703979492188, -0.003516077995300293, -0.003367185592651367, -0.0032182931900024414, -0.0030694007873535156, -0.00292050838470459, -0.002771615982055664, -0.0026227235794067383, -0.0024738311767578125, -0.0023249387741088867, -0.002176046371459961, -0.002027153968811035, -0.0018782615661621094, -0.0017293691635131836, -0.0015804767608642578, -0.001431584358215332, -0.0012826919555664062, -0.0011337995529174805, -0.0009849071502685547, -0.0008360147476196289, -0.0006871223449707031, -0.0005382299423217773, -0.00038933753967285156, -0.00024044513702392578, -9.1552734375e-05, 5.733966827392578e-05, 0.00020623207092285156, 0.00035512447357177734, 0.0005040168762207031, 0.0006529092788696289, 0.0008018016815185547, 0.0009506940841674805, 0.0010995864868164062, 0.001248478889465332, 0.0013973712921142578, 0.0015462636947631836, 0.0016951560974121094, 0.0018440485000610352, 0.001992940902709961, 0.0021418333053588867, 0.0022907257080078125, 0.0024396181106567383, 0.002588510513305664, 0.00273740291595459, 0.0028862953186035156, 0.0030351877212524414, 0.003184080123901367, 0.003332972526550293, 0.0034818649291992188, 0.0036307573318481445, 0.0037796497344970703, 0.003928542137145996, 0.004077434539794922, 0.004226326942443848, 0.0043752193450927734, 0.004524111747741699, 0.004673004150390625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 10.0, 11.0, 8.0, 17.0, 27.0, 53.0, 72.0, 110.0, 195.0, 376.0, 677.0, 1268.0, 2341.0, 4920.0, 10375.0, 22791.0, 52529.0, 119855.0, 237491.0, 281996.0, 172110.0, 78535.0, 33852.0, 14987.0, 6864.0, 3353.0, 1701.0, 870.0, 464.0, 283.0, 160.0, 91.0, 63.0, 32.0, 24.0, 13.0, 15.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0196380615234375, -0.019028902053833008, -0.018419742584228516, -0.017810583114624023, -0.01720142364501953, -0.01659226417541504, -0.015983104705810547, -0.015373945236206055, -0.014764785766601562, -0.01415562629699707, -0.013546466827392578, -0.012937307357788086, -0.012328147888183594, -0.011718988418579102, -0.01110982894897461, -0.010500669479370117, -0.009891510009765625, -0.009282350540161133, -0.00867319107055664, -0.008064031600952148, -0.007454872131347656, -0.006845712661743164, -0.006236553192138672, -0.00562739372253418, -0.0050182342529296875, -0.004409074783325195, -0.003799915313720703, -0.003190755844116211, -0.0025815963745117188, -0.0019724369049072266, -0.0013632774353027344, -0.0007541179656982422, -0.00014495849609375, 0.0004642009735107422, 0.0010733604431152344, 0.0016825199127197266, 0.0022916793823242188, 0.002900838851928711, 0.003509998321533203, 0.004119157791137695, 0.0047283172607421875, 0.00533747673034668, 0.005946636199951172, 0.006555795669555664, 0.007164955139160156, 0.0077741146087646484, 0.00838327407836914, 0.008992433547973633, 0.009601593017578125, 0.010210752487182617, 0.01081991195678711, 0.011429071426391602, 0.012038230895996094, 0.012647390365600586, 0.013256549835205078, 0.01386570930480957, 0.014474868774414062, 0.015084028244018555, 0.015693187713623047, 0.01630234718322754, 0.01691150665283203, 0.017520666122436523, 0.018129825592041016, 0.018738985061645508, 0.01934814453125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 2.0, 9.0, 7.0, 10.0, 9.0, 22.0, 37.0, 35.0, 53.0, 59.0, 86.0, 92.0, 74.0, 84.0, 95.0, 78.0, 57.0, 33.0, 43.0, 26.0, 26.0, 19.0, 5.0, 9.0, 6.0, 6.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.011856141500175, -0.011549847200512886, -0.011243552900850773, -0.010937259532511234, -0.010630965232849121, -0.010324670933187008, -0.010018376633524895, -0.009712083265185356, -0.009405788965523243, -0.00909949466586113, -0.008793200366199017, -0.008486906997859478, -0.008180612698197365, -0.007874318398535252, -0.007568024098873138, -0.0072617302648723125, -0.006955435965210199, -0.006649141665548086, -0.00634284783154726, -0.006036553531885147, -0.005730259697884321, -0.005423965398222208, -0.005117671564221382, -0.004811377264559269, -0.004505082964897156, -0.004198788665235043, -0.0038924948312342167, -0.0035862005315721035, -0.0032799066975712776, -0.0029736123979091644, -0.002667318331077695, -0.0023610242642462254, -0.0020547308959066868, -0.0017484368290752172, -0.0014421427622437477, -0.0011358485789969563, -0.0008295545121654868, -0.0005232604453340173, -0.00021696626208722591, 8.932780474424362e-05, 0.00039562187157571316, 0.0007019159384071827, 0.0010082100052386522, 0.0013145041884854436, 0.0016207982553169131, 0.0019270923221483827, 0.002233386505395174, 0.0025396805722266436, 0.002845974639058113, 0.0031522687058895826, 0.003458562772721052, 0.0037648570723831654, 0.004071150906383991, 0.004377445206046104, 0.004683739505708218, 0.0049900333397090435, 0.005296327173709869, 0.005602621473371983, 0.0059089153073728085, 0.006215209607034922, 0.0065215034410357475, 0.006827797740697861, 0.007134092040359974, 0.0074403858743608, 0.007746680174022913]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 6.0, 5.0, 5.0, 4.0, 4.0, 13.0, 7.0, 9.0, 15.0, 16.0, 22.0, 24.0, 14.0, 29.0, 28.0, 43.0, 34.0, 31.0, 32.0, 40.0, 37.0, 45.0, 36.0, 32.0, 38.0, 42.0, 37.0, 28.0, 32.0, 30.0, 35.0, 28.0, 17.0, 29.0, 27.0, 22.0, 15.0, 14.0, 16.0, 5.0, 17.0, 5.0, 9.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.003509044647216797, -0.0034059500321745872, -0.0033028554171323776, -0.003199760802090168, -0.0030966661870479584, -0.0029935715720057487, -0.002890476956963539, -0.0027873823419213295, -0.00268428772687912, -0.0025811931118369102, -0.0024780984967947006, -0.002375003881752491, -0.0022719092667102814, -0.0021688146516680717, -0.002065720036625862, -0.0019626254215836525, -0.0018595308065414429, -0.0017564361914992332, -0.0016533415764570236, -0.001550246961414814, -0.0014471523463726044, -0.0013440577313303947, -0.0012409631162881851, -0.0011378685012459755, -0.0010347738862037659, -0.0009316792711615562, -0.0008285846561193466, -0.000725490041077137, -0.0006223954260349274, -0.0005193008109927177, -0.0004162061959505081, -0.0003131115809082985, -0.00021001696586608887, -0.00010692235082387924, -3.827735781669617e-06, 9.926687926054001e-05, 0.00020236149430274963, 0.00030545610934495926, 0.0004085507243871689, 0.0005116453394293785, 0.0006147399544715881, 0.0007178345695137978, 0.0008209291845560074, 0.000924023799598217, 0.0010271184146404266, 0.0011302130296826363, 0.0012333076447248459, 0.0013364022597670555, 0.0014394968748092651, 0.0015425914898514748, 0.0016456861048936844, 0.001748780719935894, 0.0018518753349781036, 0.0019549699500203133, 0.002058064565062523, 0.0021611591801047325, 0.002264253795146942, 0.0023673484101891518, 0.0024704430252313614, 0.002573537640273571, 0.0026766322553157806, 0.0027797268703579903, 0.0028828214854002, 0.0029859161004424095, 0.003089010715484619]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 8.0, 2.0, 9.0, 3.0, 17.0, 13.0, 18.0, 21.0, 17.0, 26.0, 32.0, 32.0, 37.0, 41.0, 57.0, 53.0, 61.0, 47.0, 59.0, 49.0, 42.0, 43.0, 47.0, 35.0, 30.0, 32.0, 32.0, 24.0, 27.0, 19.0, 12.0, 17.0, 10.0, 8.0, 6.0, 7.0, 7.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.75, -204.296875, -196.84375, -189.390625, -181.9375, -174.484375, -167.03125, -159.578125, -152.125, -144.671875, -137.21875, -129.765625, -122.3125, -114.859375, -107.40625, -99.953125, -92.5, -85.046875, -77.59375, -70.140625, -62.6875, -55.234375, -47.78125, -40.328125, -32.875, -25.421875, -17.96875, -10.515625, -3.0625, 4.390625, 11.84375, 19.296875, 26.75, 34.203125, 41.65625, 49.109375, 56.5625, 64.015625, 71.46875, 78.921875, 86.375, 93.828125, 101.28125, 108.734375, 116.1875, 123.640625, 131.09375, 138.546875, 146.0, 153.453125, 160.90625, 168.359375, 175.8125, 183.265625, 190.71875, 198.171875, 205.625, 213.078125, 220.53125, 227.984375, 235.4375, 242.890625, 250.34375, 257.796875, 265.25]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 11.0, 8.0, 8.0, 15.0, 25.0, 24.0, 27.0, 38.0, 35.0, 78.0, 98.0, 163.0, 364.0, 1003.0, 3312.0, 12105.0, 52519.0, 266124.0, 518612.0, 152183.0, 30660.0, 7539.0, 2191.0, 668.0, 267.0, 142.0, 89.0, 55.0, 51.0, 41.0, 18.0, 27.0, 14.0, 8.0, 11.0, 10.0, 7.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.0625, -37.73046875, -36.3984375, -35.06640625, -33.734375, -32.40234375, -31.0703125, -29.73828125, -28.40625, -27.07421875, -25.7421875, -24.41015625, -23.078125, -21.74609375, -20.4140625, -19.08203125, -17.75, -16.41796875, -15.0859375, -13.75390625, -12.421875, -11.08984375, -9.7578125, -8.42578125, -7.09375, -5.76171875, -4.4296875, -3.09765625, -1.765625, -0.43359375, 0.8984375, 2.23046875, 3.5625, 4.89453125, 6.2265625, 7.55859375, 8.890625, 10.22265625, 11.5546875, 12.88671875, 14.21875, 15.55078125, 16.8828125, 18.21484375, 19.546875, 20.87890625, 22.2109375, 23.54296875, 24.875, 26.20703125, 27.5390625, 28.87109375, 30.203125, 31.53515625, 32.8671875, 34.19921875, 35.53125, 36.86328125, 38.1953125, 39.52734375, 40.859375, 42.19140625, 43.5234375, 44.85546875, 46.1875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 6.0, 6.0, 14.0, 16.0, 16.0, 25.0, 26.0, 39.0, 53.0, 62.0, 70.0, 59.0, 80.0, 2119.0, 68.0, 50.0, 62.0, 45.0, 53.0, 37.0, 27.0, 28.0, 23.0, 23.0, 16.0, 15.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-393.0, -380.04296875, -367.0859375, -354.12890625, -341.171875, -328.21484375, -315.2578125, -302.30078125, -289.34375, -276.38671875, -263.4296875, -250.47265625, -237.515625, -224.55859375, -211.6015625, -198.64453125, -185.6875, -172.73046875, -159.7734375, -146.81640625, -133.859375, -120.90234375, -107.9453125, -94.98828125, -82.03125, -69.07421875, -56.1171875, -43.16015625, -30.203125, -17.24609375, -4.2890625, 8.66796875, 21.625, 34.58203125, 47.5390625, 60.49609375, 73.453125, 86.41015625, 99.3671875, 112.32421875, 125.28125, 138.23828125, 151.1953125, 164.15234375, 177.109375, 190.06640625, 203.0234375, 215.98046875, 228.9375, 241.89453125, 254.8515625, 267.80859375, 280.765625, 293.72265625, 306.6796875, 319.63671875, 332.59375, 345.55078125, 358.5078125, 371.46484375, 384.421875, 397.37890625, 410.3359375, 423.29296875, 436.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 11.0, 8.0, 22.0, 35.0, 45.0, 98.0, 128.0, 264.0, 516.0, 1178.0, 3679.0, 20693.0, 249332.0, 2779169.0, 78138.0, 8670.0, 2084.0, 805.0, 375.0, 178.0, 129.0, 47.0, 38.0, 24.0, 15.0, 13.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.28125, -35.91455078125, -34.5478515625, -33.18115234375, -31.814453125, -30.44775390625, -29.0810546875, -27.71435546875, -26.34765625, -24.98095703125, -23.6142578125, -22.24755859375, -20.880859375, -19.51416015625, -18.1474609375, -16.78076171875, -15.4140625, -14.04736328125, -12.6806640625, -11.31396484375, -9.947265625, -8.58056640625, -7.2138671875, -5.84716796875, -4.48046875, -3.11376953125, -1.7470703125, -0.38037109375, 0.986328125, 2.35302734375, 3.7197265625, 5.08642578125, 6.453125, 7.81982421875, 9.1865234375, 10.55322265625, 11.919921875, 13.28662109375, 14.6533203125, 16.02001953125, 17.38671875, 18.75341796875, 20.1201171875, 21.48681640625, 22.853515625, 24.22021484375, 25.5869140625, 26.95361328125, 28.3203125, 29.68701171875, 31.0537109375, 32.42041015625, 33.787109375, 35.15380859375, 36.5205078125, 37.88720703125, 39.25390625, 40.62060546875, 41.9873046875, 43.35400390625, 44.720703125, 46.08740234375, 47.4541015625, 48.82080078125, 50.1875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 7.0, 10.0, 18.0, 38.0, 115.0, 178.0, 194.0, 173.0, 108.0, 59.0, 29.0, 17.0, 12.0, 7.0, 8.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1047.2930908203125, -1024.2669677734375, -1001.2409057617188, -978.21484375, -955.1887817382812, -932.1627197265625, -909.1365966796875, -886.1105346679688, -863.08447265625, -840.0584106445312, -817.0322875976562, -794.0062255859375, -770.9801635742188, -747.9541015625, -724.927978515625, -701.9019165039062, -678.8758544921875, -655.8497924804688, -632.8236694335938, -609.797607421875, -586.7715454101562, -563.7454833984375, -540.7193603515625, -517.6932983398438, -494.66717529296875, -471.6410827636719, -448.6150207519531, -425.58892822265625, -402.5628662109375, -379.5367736816406, -356.51068115234375, -333.484619140625, -310.45855712890625, -287.4324645996094, -264.4064025878906, -241.38031005859375, -218.354248046875, -195.32815551757812, -172.3020782470703, -149.2760009765625, -126.24992370605469, -103.22384643554688, -80.19776916503906, -57.17168426513672, -34.145606994628906, -11.119529724121094, 11.90655517578125, 34.93263244628906, 57.958709716796875, 80.98478698730469, 104.0108642578125, 127.03694915771484, 150.06301879882812, 173.089111328125, 196.1151885986328, 219.14126586914062, 242.16734313964844, 265.19342041015625, 288.2195129394531, 311.2455749511719, 334.27166748046875, 357.2977294921875, 380.3238220214844, 403.34991455078125, 426.3759765625]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 5.0, 6.0, 6.0, 9.0, 5.0, 14.0, 9.0, 10.0, 15.0, 16.0, 18.0, 24.0, 24.0, 31.0, 32.0, 33.0, 29.0, 52.0, 35.0, 38.0, 36.0, 46.0, 38.0, 44.0, 37.0, 31.0, 37.0, 29.0, 44.0, 29.0, 33.0, 28.0, 19.0, 24.0, 21.0, 15.0, 21.0, 8.0, 7.0, 10.0, 6.0, 7.0, 6.0, 7.0, 7.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-446.8499450683594, -432.5949401855469, -418.33990478515625, -404.08489990234375, -389.8298645019531, -375.5748596191406, -361.31982421875, -347.0648193359375, -332.809814453125, -318.5548095703125, -304.2997741699219, -290.0447692871094, -275.78973388671875, -261.53472900390625, -247.2797088623047, -233.02468872070312, -218.7696533203125, -204.51463317871094, -190.25961303710938, -176.00460815429688, -161.74957275390625, -147.49456787109375, -133.2395477294922, -118.98452758789062, -104.72950744628906, -90.4744873046875, -76.21946716308594, -61.964454650878906, -47.709434509277344, -33.45441436767578, -19.19940185546875, -4.9443817138671875, 9.31060791015625, 23.56562614440918, 37.82064437866211, 52.075660705566406, 66.33068084716797, 80.58570098876953, 94.84071350097656, 109.09573364257812, 123.35075378417969, 137.60577392578125, 151.8607940673828, 166.11581420898438, 180.37081909179688, 194.6258544921875, 208.880859375, 223.13587951660156, 237.39089965820312, 251.6459197998047, 265.90093994140625, 280.15594482421875, 294.4109802246094, 308.6659851074219, 322.9210205078125, 337.176025390625, 351.4310302734375, 365.68603515625, 379.9410705566406, 394.1960754394531, 408.45111083984375, 422.70611572265625, 436.96112060546875, 451.2161560058594, 465.47119140625]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 12.0, 12.0, 14.0, 27.0, 29.0, 38.0, 65.0, 88.0, 100.0, 154.0, 247.0, 273.0, 381.0, 557.0, 731.0, 1130.0, 1041128.0, 995.0, 700.0, 514.0, 373.0, 257.0, 186.0, 158.0, 99.0, 74.0, 65.0, 39.0, 30.0, 15.0, 16.0, 2.0, 9.0, 6.0, 10.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.6254425048828, -158.5720977783203, -153.5187530517578, -148.4654083251953, -143.4120635986328, -138.3587188720703, -133.3053741455078, -128.25204467773438, -123.19869232177734, -118.14534759521484, -113.09200286865234, -108.03865814208984, -102.98532104492188, -97.93197631835938, -92.87863159179688, -87.82528686523438, -82.77194213867188, -77.71859741210938, -72.66525268554688, -67.61190795898438, -62.55856704711914, -57.50522232055664, -52.451881408691406, -47.398536682128906, -42.345191955566406, -37.291847229003906, -32.238502502441406, -27.185161590576172, -22.131816864013672, -17.078472137451172, -12.025129318237305, -6.9717864990234375, -1.9184417724609375, 3.134902000427246, 8.18824577331543, 13.241589546203613, 18.294933319091797, 23.348278045654297, 28.401620864868164, 33.45496368408203, 38.50830841064453, 43.56165313720703, 48.61499786376953, 53.668338775634766, 58.721683502197266, 63.775028228759766, 68.828369140625, 73.8817138671875, 78.93505859375, 83.9884033203125, 89.041748046875, 94.0950927734375, 99.1484375, 104.2017822265625, 109.25511932373047, 114.30846405029297, 119.36180877685547, 124.41515350341797, 129.46849060058594, 134.52183532714844, 139.57518005371094, 144.62852478027344, 149.68186950683594, 154.73521423339844, 159.78855895996094]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 5.0, 10.0, 7.0, 14.0, 15.0, 24.0, 31.0, 130.0, 1065.0, 51457080.0, 4463.0, 156.0, 57.0, 22.0, 15.0, 18.0, 8.0, 5.0, 7.0, 6.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1546.0, -1463.11474609375, -1380.2293701171875, -1297.3441162109375, -1214.458740234375, -1131.573486328125, -1048.688232421875, -965.8029174804688, -882.9176025390625, -800.0322875976562, -717.14697265625, -634.26171875, -551.3764038085938, -468.4910888671875, -385.6058044433594, -302.72052001953125, -219.835205078125, -136.9499053955078, -54.064605712890625, 28.820693969726562, 111.70599365234375, 194.59130859375, 277.4765930175781, 360.36187744140625, 443.2471923828125, 526.1325073242188, 609.017822265625, 691.903076171875, 774.7883911132812, 857.6737060546875, 940.5589599609375, 1023.4442749023438, 1106.329345703125, 1189.214599609375, 1272.0999755859375, 1354.9852294921875, 1437.87060546875, 1520.755859375, 1603.64111328125, 1686.5263671875, 1769.4117431640625, 1852.2969970703125, 1935.182373046875, 2018.067626953125, 2100.952880859375, 2183.83837890625, 2266.7236328125, 2349.60888671875, 2432.494140625, 2515.37939453125, 2598.2646484375, 2681.150146484375, 2764.035400390625, 2846.920654296875, 2929.805908203125, 3012.691162109375, 3095.57666015625, 3178.4619140625, 3261.34716796875, 3344.232666015625, 3427.117919921875, 3510.003173828125, 3592.888427734375, 3675.773681640625, 3758.658935546875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 8.0, 7.0, 14.0, 27.0, 34.0, 54.0, 87.0, 137.0, 195.0, 317.0, 457.0, 853.0, 1297.0, 1931.0, 2894.0, 4833.0, 7239.0, 11144.0, 17371.0, 26815.0, 41376.0, 64451.0, 100876.0, 162293.0, 278835.0, 570150.0, 3964363.0, 430538.0, 227760.0, 135713.0, 85181.0, 54167.0, 35340.0, 22956.0, 14850.0, 9479.0, 6263.0, 4014.0, 2579.0, 1674.0, 1042.0, 647.0, 427.0, 288.0, 181.0, 106.0, 65.0, 43.0, 34.0, 15.0, 10.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.14453125, -2.07379150390625, -2.0030517578125, -1.93231201171875, -1.861572265625, -1.79083251953125, -1.7200927734375, -1.64935302734375, -1.57861328125, -1.50787353515625, -1.4371337890625, -1.36639404296875, -1.295654296875, -1.22491455078125, -1.1541748046875, -1.08343505859375, -1.0126953125, -0.94195556640625, -0.8712158203125, -0.80047607421875, -0.729736328125, -0.65899658203125, -0.5882568359375, -0.51751708984375, -0.44677734375, -0.37603759765625, -0.3052978515625, -0.23455810546875, -0.163818359375, -0.09307861328125, -0.0223388671875, 0.04840087890625, 0.119140625, 0.18988037109375, 0.2606201171875, 0.33135986328125, 0.402099609375, 0.47283935546875, 0.5435791015625, 0.61431884765625, 0.68505859375, 0.75579833984375, 0.8265380859375, 0.89727783203125, 0.968017578125, 1.03875732421875, 1.1094970703125, 1.18023681640625, 1.2509765625, 1.32171630859375, 1.3924560546875, 1.46319580078125, 1.533935546875, 1.60467529296875, 1.6754150390625, 1.74615478515625, 1.81689453125, 1.88763427734375, 1.9583740234375, 2.02911376953125, 2.099853515625, 2.17059326171875, 2.2413330078125, 2.31207275390625, 2.3828125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 8.0, 9.0, 7.0, 12.0, 12.0, 17.0, 26.0, 23.0, 28.0, 28.0, 29.0, 31.0, 43.0, 25.0, 31.0, 38.0, 29.0, 45.0, 34.0, 1050.0, 61.0, 41.0, 33.0, 38.0, 31.0, 22.0, 32.0, 20.0, 33.0, 25.0, 17.0, 25.0, 17.0, 19.0, 14.0, 16.0, 16.0, 9.0, 6.0, 3.0, 6.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-101.3125, -98.220703125, -95.12890625, -92.037109375, -88.9453125, -85.853515625, -82.76171875, -79.669921875, -76.578125, -73.486328125, -70.39453125, -67.302734375, -64.2109375, -61.119140625, -58.02734375, -54.935546875, -51.84375, -48.751953125, -45.66015625, -42.568359375, -39.4765625, -36.384765625, -33.29296875, -30.201171875, -27.109375, -24.017578125, -20.92578125, -17.833984375, -14.7421875, -11.650390625, -8.55859375, -5.466796875, -2.375, 0.716796875, 3.80859375, 6.900390625, 9.9921875, 13.083984375, 16.17578125, 19.267578125, 22.359375, 25.451171875, 28.54296875, 31.634765625, 34.7265625, 37.818359375, 40.91015625, 44.001953125, 47.09375, 50.185546875, 53.27734375, 56.369140625, 59.4609375, 62.552734375, 65.64453125, 68.736328125, 71.828125, 74.919921875, 78.01171875, 81.103515625, 84.1953125, 87.287109375, 90.37890625, 93.470703125, 96.5625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [4.0, 3.0, 9.0, 11.0, 11.0, 19.0, 24.0, 44.0, 74.0, 139.0, 178.0, 257.0, 383.0, 520.0, 779.0, 1084.0, 1568.0, 2342.0, 3324.0, 4751.0, 7094.0, 9699.0, 14167.0, 21022.0, 30238.0, 44303.0, 66780.0, 105286.0, 171900.0, 307493.0, 555192.0, 3828524.0, 453302.0, 247063.0, 143698.0, 88866.0, 57552.0, 38200.0, 26226.0, 18260.0, 12424.0, 8763.0, 6003.0, 4215.0, 3033.0, 2040.0, 1423.0, 979.0, 644.0, 489.0, 331.0, 217.0, 139.0, 104.0, 84.0, 48.0, 38.0, 29.0, 17.0, 20.0, 14.0, 8.0, 1.0, 4.0], "bins": [-1.796875, -1.739501953125, -1.68212890625, -1.624755859375, -1.5673828125, -1.510009765625, -1.45263671875, -1.395263671875, -1.337890625, -1.280517578125, -1.22314453125, -1.165771484375, -1.1083984375, -1.051025390625, -0.99365234375, -0.936279296875, -0.87890625, -0.821533203125, -0.76416015625, -0.706787109375, -0.6494140625, -0.592041015625, -0.53466796875, -0.477294921875, -0.419921875, -0.362548828125, -0.30517578125, -0.247802734375, -0.1904296875, -0.133056640625, -0.07568359375, -0.018310546875, 0.0390625, 0.096435546875, 0.15380859375, 0.211181640625, 0.2685546875, 0.325927734375, 0.38330078125, 0.440673828125, 0.498046875, 0.555419921875, 0.61279296875, 0.670166015625, 0.7275390625, 0.784912109375, 0.84228515625, 0.899658203125, 0.95703125, 1.014404296875, 1.07177734375, 1.129150390625, 1.1865234375, 1.243896484375, 1.30126953125, 1.358642578125, 1.416015625, 1.473388671875, 1.53076171875, 1.588134765625, 1.6455078125, 1.702880859375, 1.76025390625, 1.817626953125, 1.875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 11.0, 11.0, 6.0, 4.0, 10.0, 9.0, 11.0, 9.0, 13.0, 14.0, 19.0, 18.0, 18.0, 23.0, 30.0, 27.0, 35.0, 25.0, 39.0, 29.0, 30.0, 42.0, 1004.0, 104.0, 36.0, 36.0, 36.0, 43.0, 37.0, 41.0, 25.0, 20.0, 22.0, 22.0, 26.0, 18.0, 18.0, 10.0, 14.0, 8.0, 11.0, 12.0, 14.0, 10.0, 4.0, 3.0, 6.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0], "bins": [-94.6875, -91.7177734375, -88.748046875, -85.7783203125, -82.80859375, -79.8388671875, -76.869140625, -73.8994140625, -70.9296875, -67.9599609375, -64.990234375, -62.0205078125, -59.05078125, -56.0810546875, -53.111328125, -50.1416015625, -47.171875, -44.2021484375, -41.232421875, -38.2626953125, -35.29296875, -32.3232421875, -29.353515625, -26.3837890625, -23.4140625, -20.4443359375, -17.474609375, -14.5048828125, -11.53515625, -8.5654296875, -5.595703125, -2.6259765625, 0.34375, 3.3134765625, 6.283203125, 9.2529296875, 12.22265625, 15.1923828125, 18.162109375, 21.1318359375, 24.1015625, 27.0712890625, 30.041015625, 33.0107421875, 35.98046875, 38.9501953125, 41.919921875, 44.8896484375, 47.859375, 50.8291015625, 53.798828125, 56.7685546875, 59.73828125, 62.7080078125, 65.677734375, 68.6474609375, 71.6171875, 74.5869140625, 77.556640625, 80.5263671875, 83.49609375, 86.4658203125, 89.435546875, 92.4052734375, 95.375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 16.0, 20.0, 18.0, 21.0, 29.0, 35.0, 74.0, 84.0, 108.0, 143.0, 208.0, 260.0, 427.0, 573.0, 820.0, 1159.0, 1758.0, 2765.0, 4329.0, 6977.0, 11145.0, 19208.0, 36271.0, 84451.0, 914643.0, 5017124.0, 96060.0, 38967.0, 20871.0, 12191.0, 7367.0, 4455.0, 2880.0, 1774.0, 1239.0, 858.0, 589.0, 416.0, 298.0, 214.0, 170.0, 101.0, 100.0, 71.0, 30.0, 29.0, 18.0, 31.0, 12.0, 9.0, 10.0, 7.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-4.37890625, -4.2423095703125, -4.105712890625, -3.9691162109375, -3.83251953125, -3.6959228515625, -3.559326171875, -3.4227294921875, -3.2861328125, -3.1495361328125, -3.012939453125, -2.8763427734375, -2.73974609375, -2.6031494140625, -2.466552734375, -2.3299560546875, -2.193359375, -2.0567626953125, -1.920166015625, -1.7835693359375, -1.64697265625, -1.5103759765625, -1.373779296875, -1.2371826171875, -1.1005859375, -0.9639892578125, -0.827392578125, -0.6907958984375, -0.55419921875, -0.4176025390625, -0.281005859375, -0.1444091796875, -0.0078125, 0.1287841796875, 0.265380859375, 0.4019775390625, 0.53857421875, 0.6751708984375, 0.811767578125, 0.9483642578125, 1.0849609375, 1.2215576171875, 1.358154296875, 1.4947509765625, 1.63134765625, 1.7679443359375, 1.904541015625, 2.0411376953125, 2.177734375, 2.3143310546875, 2.450927734375, 2.5875244140625, 2.72412109375, 2.8607177734375, 2.997314453125, 3.1339111328125, 3.2705078125, 3.4071044921875, 3.543701171875, 3.6802978515625, 3.81689453125, 3.9534912109375, 4.090087890625, 4.2266845703125, 4.36328125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 8.0, 15.0, 7.0, 6.0, 17.0, 15.0, 15.0, 26.0, 24.0, 19.0, 35.0, 52.0, 30.0, 40.0, 43.0, 33.0, 51.0, 41.0, 1062.0, 44.0, 47.0, 36.0, 39.0, 37.0, 30.0, 35.0, 16.0, 35.0, 22.0, 17.0, 20.0, 23.0, 10.0, 12.0, 11.0, 10.0, 6.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-82.5625, -79.75, -76.9375, -74.125, -71.3125, -68.5, -65.6875, -62.875, -60.0625, -57.25, -54.4375, -51.625, -48.8125, -46.0, -43.1875, -40.375, -37.5625, -34.75, -31.9375, -29.125, -26.3125, -23.5, -20.6875, -17.875, -15.0625, -12.25, -9.4375, -6.625, -3.8125, -1.0, 1.8125, 4.625, 7.4375, 10.25, 13.0625, 15.875, 18.6875, 21.5, 24.3125, 27.125, 29.9375, 32.75, 35.5625, 38.375, 41.1875, 44.0, 46.8125, 49.625, 52.4375, 55.25, 58.0625, 60.875, 63.6875, 66.5, 69.3125, 72.125, 74.9375, 77.75, 80.5625, 83.375, 86.1875, 89.0, 91.8125, 94.625, 97.4375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 932.0, 66.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2995.4453125, -2939.714599609375, -2883.98388671875, -2828.2529296875, -2772.522216796875, -2716.79150390625, -2661.060791015625, -2605.329833984375, -2549.59912109375, -2493.868408203125, -2438.1376953125, -2382.40673828125, -2326.676025390625, -2270.9453125, -2215.214599609375, -2159.483642578125, -2103.7529296875, -2048.022216796875, -1992.2913818359375, -1936.5606689453125, -1880.829833984375, -1825.09912109375, -1769.3682861328125, -1713.6375732421875, -1657.9068603515625, -1602.1761474609375, -1546.4453125, -1490.714599609375, -1434.9837646484375, -1379.2530517578125, -1323.522216796875, -1267.79150390625, -1212.060791015625, -1156.330078125, -1100.5992431640625, -1044.8685302734375, -989.1376953125, -933.406982421875, -877.6761474609375, -821.9454345703125, -766.214599609375, -710.4838256835938, -654.7530517578125, -599.0222778320312, -543.29150390625, -487.5607604980469, -431.8299865722656, -376.0992126464844, -320.368408203125, -264.63763427734375, -208.9068603515625, -153.1761016845703, -97.44532775878906, -41.714569091796875, 14.016204833984375, 69.74697875976562, 125.47775268554688, 181.20852661132812, 236.93930053710938, 292.6700439453125, 348.40081787109375, 404.131591796875, 459.86236572265625, 515.5931396484375, 571.3239135742188]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 9.0, 8.0, 6.0, 7.0, 10.0, 8.0, 9.0, 18.0, 16.0, 18.0, 23.0, 24.0, 22.0, 26.0, 37.0, 35.0, 40.0, 50.0, 47.0, 32.0, 37.0, 47.0, 40.0, 37.0, 46.0, 25.0, 40.0, 35.0, 35.0, 24.0, 24.0, 28.0, 19.0, 20.0, 11.0, 12.0, 14.0, 12.0, 4.0, 9.0, 7.0, 10.0, 5.0, 1.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-203.13497924804688, -196.5615997314453, -189.98822021484375, -183.4148406982422, -176.84146118164062, -170.26808166503906, -163.6947021484375, -157.121337890625, -150.54794311523438, -143.9745635986328, -137.40118408203125, -130.8278045654297, -124.25442504882812, -117.68104553222656, -111.10767364501953, -104.53429412841797, -97.96092224121094, -91.38754272460938, -84.81416320800781, -78.24078369140625, -71.66740417480469, -65.09402465820312, -58.520652770996094, -51.94727325439453, -45.37389373779297, -38.800514221191406, -32.227134704589844, -25.653759002685547, -19.080379486083984, -12.506999969482422, -5.933624267578125, 0.6397552490234375, 7.213134765625, 13.786513328552246, 20.359891891479492, 26.933269500732422, 33.506649017333984, 40.08002853393555, 46.653404235839844, 53.226783752441406, 59.80016326904297, 66.37354278564453, 72.9469223022461, 79.52029418945312, 86.09367370605469, 92.66705322265625, 99.24043273925781, 105.81381225585938, 112.38719177246094, 118.9605712890625, 125.53395080566406, 132.10733032226562, 138.6807098388672, 145.25408935546875, 151.82745361328125, 158.40084838867188, 164.97421264648438, 171.54759216308594, 178.1209716796875, 184.69435119628906, 191.26773071289062, 197.8411102294922, 204.41448974609375, 210.98785400390625, 217.56124877929688]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 3.0, 2.0, 0.0, 4.0, 9.0, 4.0, 4.0, 12.0, 9.0, 5.0, 6.0, 7.0, 11.0, 6.0, 18.0, 21.0, 25.0, 17.0, 53.0, 72.0, 132.0, 276.0, 1414.0, 24070.0, 4136401.0, 27445.0, 3335.0, 535.0, 110.0, 74.0, 54.0, 22.0, 22.0, 16.0, 17.0, 11.0, 17.0, 13.0, 0.0, 8.0, 6.0, 5.0, 3.0, 3.0, 9.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.5009765625, -0.4868659973144531, -0.47275543212890625, -0.4586448669433594, -0.4445343017578125, -0.4304237365722656, -0.41631317138671875, -0.4022026062011719, -0.388092041015625, -0.3739814758300781, -0.35987091064453125, -0.3457603454589844, -0.3316497802734375, -0.3175392150878906, -0.30342864990234375, -0.2893180847167969, -0.27520751953125, -0.2610969543457031, -0.24698638916015625, -0.23287582397460938, -0.2187652587890625, -0.20465469360351562, -0.19054412841796875, -0.17643356323242188, -0.162322998046875, -0.14821243286132812, -0.13410186767578125, -0.11999130249023438, -0.1058807373046875, -0.09177017211914062, -0.07765960693359375, -0.06354904174804688, -0.0494384765625, -0.035327911376953125, -0.02121734619140625, -0.007106781005859375, 0.0070037841796875, 0.021114349365234375, 0.03522491455078125, 0.049335479736328125, 0.063446044921875, 0.07755661010742188, 0.09166717529296875, 0.10577774047851562, 0.1198883056640625, 0.13399887084960938, 0.14810943603515625, 0.16222000122070312, 0.17633056640625, 0.19044113159179688, 0.20455169677734375, 0.21866226196289062, 0.2327728271484375, 0.24688339233398438, 0.26099395751953125, 0.2751045227050781, 0.289215087890625, 0.3033256530761719, 0.31743621826171875, 0.3315467834472656, 0.3456573486328125, 0.3597679138183594, 0.37387847900390625, 0.3879890441894531, 0.402099609375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 1.0, 6.0, 7.0, 15.0, 14.0, 19.0, 23.0, 781.0, 22.0, 14.0, 15.0, 13.0, 12.0, 9.0, 4.0, 2.0, 6.0, 5.0, 5.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310791015625, -0.3019981384277344, -0.29320526123046875, -0.2844123840332031, -0.2756195068359375, -0.2668266296386719, -0.25803375244140625, -0.24924087524414062, -0.240447998046875, -0.23165512084960938, -0.22286224365234375, -0.21406936645507812, -0.2052764892578125, -0.19648361206054688, -0.18769073486328125, -0.17889785766601562, -0.17010498046875, -0.16131210327148438, -0.15251922607421875, -0.14372634887695312, -0.1349334716796875, -0.12614059448242188, -0.11734771728515625, -0.10855484008789062, -0.099761962890625, -0.09096908569335938, -0.08217620849609375, -0.07338333129882812, -0.0645904541015625, -0.055797576904296875, -0.04700469970703125, -0.038211822509765625, -0.0294189453125, -0.020626068115234375, -0.01183319091796875, -0.003040313720703125, 0.0057525634765625, 0.014545440673828125, 0.02333831787109375, 0.032131195068359375, 0.040924072265625, 0.049716949462890625, 0.05850982666015625, 0.06730270385742188, 0.0760955810546875, 0.08488845825195312, 0.09368133544921875, 0.10247421264648438, 0.11126708984375, 0.12005996704101562, 0.12885284423828125, 0.13764572143554688, 0.1464385986328125, 0.15523147583007812, 0.16402435302734375, 0.17281723022460938, 0.181610107421875, 0.19040298461914062, 0.19919586181640625, 0.20798873901367188, 0.2167816162109375, 0.22557449340820312, 0.23436737060546875, 0.24316024780273438, 0.251953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 10.0, 24.0, 22.0, 29.0, 52.0, 116.0, 270.0, 572.0, 1960.0, 10904.0, 4145896.0, 31254.0, 2314.0, 500.0, 165.0, 66.0, 44.0, 28.0, 15.0, 19.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.732421875, -0.7118911743164062, -0.6913604736328125, -0.6708297729492188, -0.650299072265625, -0.6297683715820312, -0.6092376708984375, -0.5887069702148438, -0.56817626953125, -0.5476455688476562, -0.5271148681640625, -0.5065841674804688, -0.486053466796875, -0.46552276611328125, -0.4449920654296875, -0.42446136474609375, -0.4039306640625, -0.38339996337890625, -0.3628692626953125, -0.34233856201171875, -0.321807861328125, -0.30127716064453125, -0.2807464599609375, -0.26021575927734375, -0.23968505859375, -0.21915435791015625, -0.1986236572265625, -0.17809295654296875, -0.157562255859375, -0.13703155517578125, -0.1165008544921875, -0.09597015380859375, -0.075439453125, -0.05490875244140625, -0.0343780517578125, -0.01384735107421875, 0.006683349609375, 0.02721405029296875, 0.0477447509765625, 0.06827545166015625, 0.08880615234375, 0.10933685302734375, 0.1298675537109375, 0.15039825439453125, 0.170928955078125, 0.19145965576171875, 0.2119903564453125, 0.23252105712890625, 0.2530517578125, 0.27358245849609375, 0.2941131591796875, 0.31464385986328125, 0.335174560546875, 0.35570526123046875, 0.3762359619140625, 0.39676666259765625, 0.41729736328125, 0.43782806396484375, 0.4583587646484375, 0.47888946533203125, 0.499420166015625, 0.5199508666992188, 0.5404815673828125, 0.5610122680664062, 0.58154296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 2.0, 7.0, 5.0, 14.0, 15.0, 41.0, 160.0, 801.0, 2599.0, 288.0, 69.0, 18.0, 19.0, 5.0, 4.0, 4.0, 1.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.332763671875, -0.3238239288330078, -0.3148841857910156, -0.30594444274902344, -0.29700469970703125, -0.28806495666503906, -0.2791252136230469, -0.2701854705810547, -0.2612457275390625, -0.2523059844970703, -0.24336624145507812, -0.23442649841308594, -0.22548675537109375, -0.21654701232910156, -0.20760726928710938, -0.1986675262451172, -0.189727783203125, -0.1807880401611328, -0.17184829711914062, -0.16290855407714844, -0.15396881103515625, -0.14502906799316406, -0.13608932495117188, -0.1271495819091797, -0.1182098388671875, -0.10927009582519531, -0.10033035278320312, -0.09139060974121094, -0.08245086669921875, -0.07351112365722656, -0.06457138061523438, -0.05563163757324219, -0.04669189453125, -0.03775215148925781, -0.028812408447265625, -0.019872665405273438, -0.01093292236328125, -0.0019931793212890625, 0.006946563720703125, 0.015886306762695312, 0.0248260498046875, 0.03376579284667969, 0.042705535888671875, 0.05164527893066406, 0.06058502197265625, 0.06952476501464844, 0.07846450805664062, 0.08740425109863281, 0.096343994140625, 0.10528373718261719, 0.11422348022460938, 0.12316322326660156, 0.13210296630859375, 0.14104270935058594, 0.14998245239257812, 0.1589221954345703, 0.1678619384765625, 0.1768016815185547, 0.18574142456054688, 0.19468116760253906, 0.20362091064453125, 0.21256065368652344, 0.22150039672851562, 0.2304401397705078, 0.2393798828125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 11.0, 28.0, 104.0, 557.0, 198.0, 49.0, 27.0, 11.0, 7.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5676230192184448, -0.5529505014419556, -0.5382780432701111, -0.5236055254936218, -0.5089330673217773, -0.4942605495452881, -0.4795880615711212, -0.46491557359695435, -0.4502430558204651, -0.4355705678462982, -0.42089807987213135, -0.4062255620956421, -0.3915530741214752, -0.37688058614730835, -0.3622080981731415, -0.3475356101989746, -0.33286312222480774, -0.31819063425064087, -0.303518146276474, -0.28884565830230713, -0.27417314052581787, -0.259500652551651, -0.24482816457748413, -0.23015567660331726, -0.2154831737279892, -0.20081068575382233, -0.18613818287849426, -0.1714656949043274, -0.15679320693016052, -0.14212070405483246, -0.1274482160806656, -0.11277572065591812, -0.09810322523117065, -0.08343072980642319, -0.06875823438167572, -0.05408574640750885, -0.03941325098276138, -0.024740755558013916, -0.010068267583847046, 0.004604227840900421, 0.019276723265647888, 0.033949218690395355, 0.048621710389852524, 0.06329420208930969, 0.07796669751405716, 0.09263919293880463, 0.1073116809129715, 0.12198417633771896, 0.13665667176246643, 0.1513291597366333, 0.16600166261196136, 0.18067415058612823, 0.1953466534614563, 0.21001914143562317, 0.22469162940979004, 0.2393641173839569, 0.2540366053581238, 0.26870909333229065, 0.2833815813064575, 0.2980540990829468, 0.31272658705711365, 0.3273990750312805, 0.3420715630054474, 0.35674405097961426, 0.3714165687561035]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 2.0, 0.0, 4.0, 4.0, 5.0, 6.0, 9.0, 4.0, 8.0, 14.0, 26.0, 48.0, 83.0, 100.0, 115.0, 143.0, 117.0, 95.0, 61.0, 46.0, 27.0, 16.0, 17.0, 6.0, 8.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1085833311080933, -1.0783967971801758, -1.0482103824615479, -1.01802396774292, -0.9878374338150024, -0.9576509594917297, -0.927464485168457, -0.8972780108451843, -0.8670915365219116, -0.8369050621986389, -0.8067185878753662, -0.7765321135520935, -0.7463456392288208, -0.7161591649055481, -0.6859726905822754, -0.6557862162590027, -0.62559974193573, -0.5954132676124573, -0.5652267932891846, -0.5350403189659119, -0.5048538446426392, -0.47466737031936646, -0.44448089599609375, -0.41429442167282104, -0.38410794734954834, -0.35392147302627563, -0.32373499870300293, -0.2935485243797302, -0.2633620500564575, -0.23317557573318481, -0.2029891014099121, -0.1728026270866394, -0.1426161527633667, -0.112429678440094, -0.08224320411682129, -0.052056729793548584, -0.02187025547027588, 0.008316218852996826, 0.03850269317626953, 0.06868916749954224, 0.09887564182281494, 0.12906211614608765, 0.15924859046936035, 0.18943506479263306, 0.21962153911590576, 0.24980801343917847, 0.27999448776245117, 0.3101809620857239, 0.3403674364089966, 0.3705539107322693, 0.400740385055542, 0.4309268593788147, 0.4611133337020874, 0.4912998080253601, 0.5214862823486328, 0.5516727566719055, 0.5818592309951782, 0.6120457053184509, 0.6422321796417236, 0.6724186539649963, 0.702605128288269, 0.7327916026115417, 0.7629780769348145, 0.7931645512580872, 0.8233510255813599]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 11.0, 9.0, 13.0, 26.0, 23.0, 42.0, 59.0, 75.0, 87.0, 138.0, 192.0, 301.0, 394.0, 583.0, 838.0, 1261.0, 1947.0, 3203.0, 5594.0, 11846.0, 33046.0, 921792.0, 38321.0, 13032.0, 6133.0, 3414.0, 2112.0, 1305.0, 838.0, 578.0, 362.0, 281.0, 177.0, 128.0, 107.0, 63.0, 56.0, 33.0, 40.0, 24.0, 15.0, 13.0, 5.0, 10.0, 8.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.9990234375, -0.9640350341796875, -0.929046630859375, -0.8940582275390625, -0.85906982421875, -0.8240814208984375, -0.789093017578125, -0.7541046142578125, -0.7191162109375, -0.6841278076171875, -0.649139404296875, -0.6141510009765625, -0.57916259765625, -0.5441741943359375, -0.509185791015625, -0.4741973876953125, -0.439208984375, -0.4042205810546875, -0.369232177734375, -0.3342437744140625, -0.29925537109375, -0.2642669677734375, -0.229278564453125, -0.1942901611328125, -0.1593017578125, -0.1243133544921875, -0.089324951171875, -0.0543365478515625, -0.01934814453125, 0.0156402587890625, 0.050628662109375, 0.0856170654296875, 0.12060546875, 0.1555938720703125, 0.190582275390625, 0.2255706787109375, 0.26055908203125, 0.2955474853515625, 0.330535888671875, 0.3655242919921875, 0.4005126953125, 0.4355010986328125, 0.470489501953125, 0.5054779052734375, 0.54046630859375, 0.5754547119140625, 0.610443115234375, 0.6454315185546875, 0.680419921875, 0.7154083251953125, 0.750396728515625, 0.7853851318359375, 0.82037353515625, 0.8553619384765625, 0.890350341796875, 0.9253387451171875, 0.9603271484375, 0.9953155517578125, 1.030303955078125, 1.0652923583984375, 1.10028076171875, 1.1352691650390625, 1.170257568359375, 1.2052459716796875, 1.240234375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 6.0, 3.0, 18.0, 11.0, 17.0, 20.0, 739.0, 65.0, 15.0, 14.0, 17.0, 8.0, 15.0, 5.0, 2.0, 4.0, 7.0, 5.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30859375, -0.2999687194824219, -0.29134368896484375, -0.2827186584472656, -0.2740936279296875, -0.2654685974121094, -0.25684356689453125, -0.24821853637695312, -0.239593505859375, -0.23096847534179688, -0.22234344482421875, -0.21371841430664062, -0.2050933837890625, -0.19646835327148438, -0.18784332275390625, -0.17921829223632812, -0.17059326171875, -0.16196823120117188, -0.15334320068359375, -0.14471817016601562, -0.1360931396484375, -0.12746810913085938, -0.11884307861328125, -0.11021804809570312, -0.101593017578125, -0.09296798706054688, -0.08434295654296875, -0.07571792602539062, -0.0670928955078125, -0.058467864990234375, -0.04984283447265625, -0.041217803955078125, -0.0325927734375, -0.023967742919921875, -0.01534271240234375, -0.006717681884765625, 0.0019073486328125, 0.010532379150390625, 0.01915740966796875, 0.027782440185546875, 0.036407470703125, 0.045032501220703125, 0.05365753173828125, 0.062282562255859375, 0.0709075927734375, 0.07953262329101562, 0.08815765380859375, 0.09678268432617188, 0.10540771484375, 0.11403274536132812, 0.12265777587890625, 0.13128280639648438, 0.1399078369140625, 0.14853286743164062, 0.15715789794921875, 0.16578292846679688, 0.174407958984375, 0.18303298950195312, 0.19165802001953125, 0.20028305053710938, 0.2089080810546875, 0.21753311157226562, 0.22615814208984375, 0.23478317260742188, 0.243408203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 7.0, 5.0, 18.0, 20.0, 22.0, 21.0, 32.0, 42.0, 51.0, 60.0, 74.0, 107.0, 160.0, 265.0, 550.0, 1140.0, 2855.0, 8891.0, 36238.0, 324032.0, 607683.0, 48886.0, 11054.0, 3414.0, 1381.0, 591.0, 279.0, 155.0, 101.0, 80.0, 68.0, 57.0, 45.0, 47.0, 31.0, 18.0, 13.0, 12.0, 9.0, 10.0, 8.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.83251953125, -0.8087921142578125, -0.785064697265625, -0.7613372802734375, -0.73760986328125, -0.7138824462890625, -0.690155029296875, -0.6664276123046875, -0.6427001953125, -0.6189727783203125, -0.595245361328125, -0.5715179443359375, -0.54779052734375, -0.5240631103515625, -0.500335693359375, -0.4766082763671875, -0.452880859375, -0.4291534423828125, -0.405426025390625, -0.3816986083984375, -0.35797119140625, -0.3342437744140625, -0.310516357421875, -0.2867889404296875, -0.2630615234375, -0.2393341064453125, -0.215606689453125, -0.1918792724609375, -0.16815185546875, -0.1444244384765625, -0.120697021484375, -0.0969696044921875, -0.0732421875, -0.0495147705078125, -0.025787353515625, -0.0020599365234375, 0.02166748046875, 0.0453948974609375, 0.069122314453125, 0.0928497314453125, 0.1165771484375, 0.1403045654296875, 0.164031982421875, 0.1877593994140625, 0.21148681640625, 0.2352142333984375, 0.258941650390625, 0.2826690673828125, 0.306396484375, 0.3301239013671875, 0.353851318359375, 0.3775787353515625, 0.40130615234375, 0.4250335693359375, 0.448760986328125, 0.4724884033203125, 0.4962158203125, 0.5199432373046875, 0.543670654296875, 0.5673980712890625, 0.59112548828125, 0.6148529052734375, 0.638580322265625, 0.6623077392578125, 0.68603515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 11.0, 9.0, 2.0, 7.0, 20.0, 11.0, 9.0, 14.0, 18.0, 20.0, 16.0, 19.0, 32.0, 29.0, 29.0, 27.0, 38.0, 40.0, 30.0, 37.0, 35.0, 32.0, 48.0, 34.0, 26.0, 39.0, 25.0, 23.0, 39.0, 25.0, 29.0, 29.0, 28.0, 29.0, 19.0, 20.0, 24.0, 15.0, 12.0, 4.0, 10.0, 8.0, 6.0, 3.0, 5.0, 5.0, 6.0, 3.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.9501953125, -0.92230224609375, -0.8944091796875, -0.86651611328125, -0.838623046875, -0.81072998046875, -0.7828369140625, -0.75494384765625, -0.72705078125, -0.69915771484375, -0.6712646484375, -0.64337158203125, -0.615478515625, -0.58758544921875, -0.5596923828125, -0.53179931640625, -0.50390625, -0.47601318359375, -0.4481201171875, -0.42022705078125, -0.392333984375, -0.36444091796875, -0.3365478515625, -0.30865478515625, -0.28076171875, -0.25286865234375, -0.2249755859375, -0.19708251953125, -0.169189453125, -0.14129638671875, -0.1134033203125, -0.08551025390625, -0.0576171875, -0.02972412109375, -0.0018310546875, 0.02606201171875, 0.053955078125, 0.08184814453125, 0.1097412109375, 0.13763427734375, 0.16552734375, 0.19342041015625, 0.2213134765625, 0.24920654296875, 0.277099609375, 0.30499267578125, 0.3328857421875, 0.36077880859375, 0.388671875, 0.41656494140625, 0.4444580078125, 0.47235107421875, 0.500244140625, 0.52813720703125, 0.5560302734375, 0.58392333984375, 0.61181640625, 0.63970947265625, 0.6676025390625, 0.69549560546875, 0.723388671875, 0.75128173828125, 0.7791748046875, 0.80706787109375, 0.8349609375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 15.0, 22.0, 32.0, 56.0, 102.0, 260.0, 595.0, 1904.0, 16153.0, 1012378.0, 14131.0, 1725.0, 593.0, 274.0, 114.0, 64.0, 40.0, 14.0, 16.0, 14.0, 4.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.240234375, -0.230804443359375, -0.22137451171875, -0.211944580078125, -0.2025146484375, -0.193084716796875, -0.18365478515625, -0.174224853515625, -0.164794921875, -0.155364990234375, -0.14593505859375, -0.136505126953125, -0.1270751953125, -0.117645263671875, -0.10821533203125, -0.098785400390625, -0.08935546875, -0.079925537109375, -0.07049560546875, -0.061065673828125, -0.0516357421875, -0.042205810546875, -0.03277587890625, -0.023345947265625, -0.013916015625, -0.004486083984375, 0.00494384765625, 0.014373779296875, 0.0238037109375, 0.033233642578125, 0.04266357421875, 0.052093505859375, 0.0615234375, 0.070953369140625, 0.08038330078125, 0.089813232421875, 0.0992431640625, 0.108673095703125, 0.11810302734375, 0.127532958984375, 0.136962890625, 0.146392822265625, 0.15582275390625, 0.165252685546875, 0.1746826171875, 0.184112548828125, 0.19354248046875, 0.202972412109375, 0.21240234375, 0.221832275390625, 0.23126220703125, 0.240692138671875, 0.2501220703125, 0.259552001953125, 0.26898193359375, 0.278411865234375, 0.287841796875, 0.297271728515625, 0.30670166015625, 0.316131591796875, 0.3255615234375, 0.334991455078125, 0.34442138671875, 0.353851318359375, 0.36328125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 7.0, 6.0, 13.0, 16.0, 41.0, 91.0, 234.0, 309.0, 161.0, 52.0, 34.0, 17.0, 9.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2292137145996094e-05, -2.1676532924175262e-05, -2.106092870235443e-05, -2.04453244805336e-05, -1.982972025871277e-05, -1.9214116036891937e-05, -1.8598511815071106e-05, -1.7982907593250275e-05, -1.7367303371429443e-05, -1.6751699149608612e-05, -1.613609492778778e-05, -1.552049070596695e-05, -1.4904886484146118e-05, -1.4289282262325287e-05, -1.3673678040504456e-05, -1.3058073818683624e-05, -1.2442469596862793e-05, -1.1826865375041962e-05, -1.121126115322113e-05, -1.0595656931400299e-05, -9.980052709579468e-06, -9.364448487758636e-06, -8.748844265937805e-06, -8.133240044116974e-06, -7.517635822296143e-06, -6.902031600475311e-06, -6.28642737865448e-06, -5.670823156833649e-06, -5.055218935012817e-06, -4.439614713191986e-06, -3.824010491371155e-06, -3.2084062695503235e-06, -2.592802047729492e-06, -1.977197825908661e-06, -1.3615936040878296e-06, -7.459893822669983e-07, -1.30385160446167e-07, 4.852190613746643e-07, 1.1008232831954956e-06, 1.716427505016327e-06, 2.332031726837158e-06, 2.9476359486579895e-06, 3.563240170478821e-06, 4.178844392299652e-06, 4.794448614120483e-06, 5.410052835941315e-06, 6.025657057762146e-06, 6.641261279582977e-06, 7.256865501403809e-06, 7.87246972322464e-06, 8.488073945045471e-06, 9.103678166866302e-06, 9.719282388687134e-06, 1.0334886610507965e-05, 1.0950490832328796e-05, 1.1566095054149628e-05, 1.2181699275970459e-05, 1.279730349779129e-05, 1.3412907719612122e-05, 1.4028511941432953e-05, 1.4644116163253784e-05, 1.5259720385074615e-05, 1.5875324606895447e-05, 1.6490928828716278e-05, 1.710653305053711e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 9.0, 16.0, 38.0, 57.0, 96.0, 197.0, 748.0, 5253.0, 1008671.0, 31110.0, 1621.0, 435.0, 138.0, 69.0, 28.0, 24.0, 14.0, 11.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4365234375, -0.417327880859375, -0.39813232421875, -0.378936767578125, -0.3597412109375, -0.340545654296875, -0.32135009765625, -0.302154541015625, -0.282958984375, -0.263763427734375, -0.24456787109375, -0.225372314453125, -0.2061767578125, -0.186981201171875, -0.16778564453125, -0.148590087890625, -0.12939453125, -0.110198974609375, -0.09100341796875, -0.071807861328125, -0.0526123046875, -0.033416748046875, -0.01422119140625, 0.004974365234375, 0.024169921875, 0.043365478515625, 0.06256103515625, 0.081756591796875, 0.1009521484375, 0.120147705078125, 0.13934326171875, 0.158538818359375, 0.177734375, 0.196929931640625, 0.21612548828125, 0.235321044921875, 0.2545166015625, 0.273712158203125, 0.29290771484375, 0.312103271484375, 0.331298828125, 0.350494384765625, 0.36968994140625, 0.388885498046875, 0.4080810546875, 0.427276611328125, 0.44647216796875, 0.465667724609375, 0.48486328125, 0.504058837890625, 0.52325439453125, 0.542449951171875, 0.5616455078125, 0.580841064453125, 0.60003662109375, 0.619232177734375, 0.638427734375, 0.657623291015625, 0.67681884765625, 0.696014404296875, 0.7152099609375, 0.734405517578125, 0.75360107421875, 0.772796630859375, 0.7919921875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 16.0, 16.0, 29.0, 35.0, 84.0, 228.0, 307.0, 141.0, 48.0, 34.0, 14.0, 15.0, 5.0, 4.0, 4.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36572265625, -0.3456573486328125, -0.325592041015625, -0.3055267333984375, -0.28546142578125, -0.2653961181640625, -0.245330810546875, -0.2252655029296875, -0.2052001953125, -0.1851348876953125, -0.165069580078125, -0.1450042724609375, -0.12493896484375, -0.1048736572265625, -0.084808349609375, -0.0647430419921875, -0.044677734375, -0.0246124267578125, -0.004547119140625, 0.0155181884765625, 0.03558349609375, 0.0556488037109375, 0.075714111328125, 0.0957794189453125, 0.1158447265625, 0.1359100341796875, 0.155975341796875, 0.1760406494140625, 0.19610595703125, 0.2161712646484375, 0.236236572265625, 0.2563018798828125, 0.2763671875, 0.2964324951171875, 0.316497802734375, 0.3365631103515625, 0.35662841796875, 0.3766937255859375, 0.396759033203125, 0.4168243408203125, 0.4368896484375, 0.4569549560546875, 0.477020263671875, 0.4970855712890625, 0.51715087890625, 0.5372161865234375, 0.557281494140625, 0.5773468017578125, 0.597412109375, 0.6174774169921875, 0.637542724609375, 0.6576080322265625, 0.67767333984375, 0.6977386474609375, 0.717803955078125, 0.7378692626953125, 0.7579345703125, 0.7779998779296875, 0.798065185546875, 0.8181304931640625, 0.83819580078125, 0.8582611083984375, 0.878326416015625, 0.8983917236328125, 0.91845703125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 9.0, 33.0, 71.0, 666.0, 164.0, 49.0, 9.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.288055896759033, -2.9463248252868652, -2.6045937538146973, -2.2628629207611084, -1.9211318492889404, -1.5794007778167725, -1.2376699447631836, -0.8959388732910156, -0.5542078018188477, -0.21247678995132446, 0.12925422191619873, 0.47098517417907715, 0.8127162456512451, 1.154447317123413, 1.496178150177002, 1.83790922164917, 2.179640293121338, 2.521371364593506, 2.863102436065674, 3.2048332691192627, 3.5465643405914307, 3.8882954120635986, 4.2300262451171875, 4.5717573165893555, 4.913488388061523, 5.255219459533691, 5.596950531005859, 5.938681602478027, 6.280412673950195, 6.622143745422363, 6.963874340057373, 7.305605411529541, 7.647336959838867, 7.989068031311035, 8.330799102783203, 8.672530174255371, 9.014261245727539, 9.355992317199707, 9.697723388671875, 10.039453506469727, 10.381185531616211, 10.722916603088379, 11.064647674560547, 11.406378746032715, 11.748109817504883, 12.08984088897705, 12.431571960449219, 12.77330207824707, 13.115033149719238, 13.456764221191406, 13.798495292663574, 14.140226364135742, 14.48195743560791, 14.823688507080078, 15.16541862487793, 15.507150650024414, 15.848880767822266, 16.190610885620117, 16.5323429107666, 16.874073028564453, 17.215805053710938, 17.55753517150879, 17.899267196655273, 18.240997314453125, 18.58272933959961]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 3.0, 3.0, 5.0, 7.0, 11.0, 15.0, 15.0, 32.0, 47.0, 85.0, 150.0, 202.0, 173.0, 97.0, 55.0, 24.0, 15.0, 14.0, 10.0, 7.0, 7.0, 2.0, 2.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.72482681274414, -22.995487213134766, -22.26614761352539, -21.536808013916016, -20.80746841430664, -20.078128814697266, -19.34878921508789, -18.619449615478516, -17.89011001586914, -17.160770416259766, -16.43143081665039, -15.702091217041016, -14.97275161743164, -14.243412017822266, -13.514073371887207, -12.784733772277832, -12.055395126342773, -11.326055526733398, -10.596715927124023, -9.867376327514648, -9.138036727905273, -8.408697128295898, -7.67935848236084, -6.950018882751465, -6.22067928314209, -5.491339683532715, -4.76200008392334, -4.032660961151123, -3.303321361541748, -2.573981761932373, -1.8446426391601562, -1.1153030395507812, -0.38596153259277344, 0.343377947807312, 1.0727174282073975, 1.8020567893981934, 2.5313963890075684, 3.2607359886169434, 3.99007511138916, 4.719414710998535, 5.44875431060791, 6.178093910217285, 6.90743350982666, 7.636772632598877, 8.366111755371094, 9.095451354980469, 9.824790954589844, 10.554130554199219, 11.283470153808594, 12.012809753417969, 12.742149353027344, 13.471488952636719, 14.200828552246094, 14.930168151855469, 15.659506797790527, 16.38884735107422, 17.118186950683594, 17.84752655029297, 18.576866149902344, 19.30620574951172, 20.035545349121094, 20.76488494873047, 21.494224548339844, 22.22356414794922, 22.95290184020996]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 4.0, 6.0, 6.0, 6.0, 10.0, 14.0, 20.0, 18.0, 36.0, 37.0, 49.0, 78.0, 138.0, 219.0, 349.0, 545.0, 803.0, 1421.0, 2305.0, 4608.0, 10417.0, 34878.0, 4080996.0, 37522.0, 10805.0, 4389.0, 2115.0, 1097.0, 571.0, 344.0, 191.0, 117.0, 60.0, 45.0, 19.0, 13.0, 11.0, 10.0, 4.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.228515625, -2.1690826416015625, -2.109649658203125, -2.0502166748046875, -1.99078369140625, -1.9313507080078125, -1.871917724609375, -1.8124847412109375, -1.7530517578125, -1.6936187744140625, -1.634185791015625, -1.5747528076171875, -1.51531982421875, -1.4558868408203125, -1.396453857421875, -1.3370208740234375, -1.277587890625, -1.2181549072265625, -1.158721923828125, -1.0992889404296875, -1.03985595703125, -0.9804229736328125, -0.920989990234375, -0.8615570068359375, -0.8021240234375, -0.7426910400390625, -0.683258056640625, -0.6238250732421875, -0.56439208984375, -0.5049591064453125, -0.445526123046875, -0.3860931396484375, -0.32666015625, -0.2672271728515625, -0.207794189453125, -0.1483612060546875, -0.08892822265625, -0.0294952392578125, 0.029937744140625, 0.0893707275390625, 0.1488037109375, 0.2082366943359375, 0.267669677734375, 0.3271026611328125, 0.38653564453125, 0.4459686279296875, 0.505401611328125, 0.5648345947265625, 0.624267578125, 0.6837005615234375, 0.743133544921875, 0.8025665283203125, 0.86199951171875, 0.9214324951171875, 0.980865478515625, 1.0402984619140625, 1.0997314453125, 1.1591644287109375, 1.218597412109375, 1.2780303955078125, 1.33746337890625, 1.3968963623046875, 1.456329345703125, 1.5157623291015625, 1.5751953125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 6.0, 6.0, 15.0, 11.0, 8.0, 11.0, 20.0, 223.0, 553.0, 34.0, 13.0, 7.0, 13.0, 14.0, 15.0, 4.0, 10.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2432861328125, -0.23690032958984375, -0.2305145263671875, -0.22412872314453125, -0.217742919921875, -0.21135711669921875, -0.2049713134765625, -0.19858551025390625, -0.19219970703125, -0.18581390380859375, -0.1794281005859375, -0.17304229736328125, -0.166656494140625, -0.16027069091796875, -0.1538848876953125, -0.14749908447265625, -0.14111328125, -0.13472747802734375, -0.1283416748046875, -0.12195587158203125, -0.115570068359375, -0.10918426513671875, -0.1027984619140625, -0.09641265869140625, -0.09002685546875, -0.08364105224609375, -0.0772552490234375, -0.07086944580078125, -0.064483642578125, -0.05809783935546875, -0.0517120361328125, -0.04532623291015625, -0.0389404296875, -0.03255462646484375, -0.0261688232421875, -0.01978302001953125, -0.013397216796875, -0.00701141357421875, -0.0006256103515625, 0.00576019287109375, 0.01214599609375, 0.01853179931640625, 0.0249176025390625, 0.03130340576171875, 0.037689208984375, 0.04407501220703125, 0.0504608154296875, 0.05684661865234375, 0.063232421875, 0.06961822509765625, 0.0760040283203125, 0.08238983154296875, 0.088775634765625, 0.09516143798828125, 0.1015472412109375, 0.10793304443359375, 0.11431884765625, 0.12070465087890625, 0.1270904541015625, 0.13347625732421875, 0.139862060546875, 0.14624786376953125, 0.1526336669921875, 0.15901947021484375, 0.1654052734375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 4.0, 3.0, 6.0, 11.0, 9.0, 15.0, 11.0, 20.0, 26.0, 41.0, 73.0, 104.0, 228.0, 502.0, 1640.0, 6391.0, 48980.0, 4051227.0, 73738.0, 8093.0, 1889.0, 644.0, 256.0, 117.0, 65.0, 41.0, 22.0, 23.0, 23.0, 13.0, 16.0, 7.0, 10.0, 4.0, 6.0, 0.0, 5.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4189453125, -1.3753814697265625, -1.331817626953125, -1.2882537841796875, -1.24468994140625, -1.2011260986328125, -1.157562255859375, -1.1139984130859375, -1.0704345703125, -1.0268707275390625, -0.983306884765625, -0.9397430419921875, -0.89617919921875, -0.8526153564453125, -0.809051513671875, -0.7654876708984375, -0.721923828125, -0.6783599853515625, -0.634796142578125, -0.5912322998046875, -0.54766845703125, -0.5041046142578125, -0.460540771484375, -0.4169769287109375, -0.3734130859375, -0.3298492431640625, -0.286285400390625, -0.2427215576171875, -0.19915771484375, -0.1555938720703125, -0.112030029296875, -0.0684661865234375, -0.02490234375, 0.0186614990234375, 0.062225341796875, 0.1057891845703125, 0.14935302734375, 0.1929168701171875, 0.236480712890625, 0.2800445556640625, 0.3236083984375, 0.3671722412109375, 0.410736083984375, 0.4542999267578125, 0.49786376953125, 0.5414276123046875, 0.584991455078125, 0.6285552978515625, 0.672119140625, 0.7156829833984375, 0.759246826171875, 0.8028106689453125, 0.84637451171875, 0.8899383544921875, 0.933502197265625, 0.9770660400390625, 1.0206298828125, 1.0641937255859375, 1.107757568359375, 1.1513214111328125, 1.19488525390625, 1.2384490966796875, 1.282012939453125, 1.3255767822265625, 1.369140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 8.0, 8.0, 4.0, 7.0, 9.0, 7.0, 14.0, 14.0, 26.0, 31.0, 35.0, 68.0, 100.0, 196.0, 2470.0, 672.0, 126.0, 78.0, 42.0, 22.0, 22.0, 18.0, 12.0, 11.0, 7.0, 9.0, 7.0, 6.0, 6.0, 3.0, 5.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2734375, -0.2651214599609375, -0.256805419921875, -0.2484893798828125, -0.24017333984375, -0.2318572998046875, -0.223541259765625, -0.2152252197265625, -0.2069091796875, -0.1985931396484375, -0.190277099609375, -0.1819610595703125, -0.17364501953125, -0.1653289794921875, -0.157012939453125, -0.1486968994140625, -0.140380859375, -0.1320648193359375, -0.123748779296875, -0.1154327392578125, -0.10711669921875, -0.0988006591796875, -0.090484619140625, -0.0821685791015625, -0.0738525390625, -0.0655364990234375, -0.057220458984375, -0.0489044189453125, -0.04058837890625, -0.0322723388671875, -0.023956298828125, -0.0156402587890625, -0.00732421875, 0.0009918212890625, 0.009307861328125, 0.0176239013671875, 0.02593994140625, 0.0342559814453125, 0.042572021484375, 0.0508880615234375, 0.0592041015625, 0.0675201416015625, 0.075836181640625, 0.0841522216796875, 0.09246826171875, 0.1007843017578125, 0.109100341796875, 0.1174163818359375, 0.125732421875, 0.1340484619140625, 0.142364501953125, 0.1506805419921875, 0.15899658203125, 0.1673126220703125, 0.175628662109375, 0.1839447021484375, 0.1922607421875, 0.2005767822265625, 0.208892822265625, 0.2172088623046875, 0.22552490234375, 0.2338409423828125, 0.242156982421875, 0.2504730224609375, 0.2587890625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 31.0, 970.0, 10.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5032474994659424, -1.225464105606079, -0.9476807713508606, -0.6698974370956421, -0.3921140432357788, -0.11433064937591553, 0.1634526252746582, 0.4412360191345215, 0.7190194129943848, 0.996802806854248, 1.2745862007141113, 1.552369475364685, 1.8301528692245483, 2.107936382293701, 2.3857195377349854, 2.6635029315948486, 2.941286325454712, 3.219069719314575, 3.4968531131744385, 3.7746362686157227, 4.052419662475586, 4.330203056335449, 4.6079864501953125, 4.885769844055176, 5.163553237915039, 5.441336631774902, 5.719120025634766, 5.996903419494629, 6.274686813354492, 6.5524702072143555, 6.830253601074219, 7.108036994934082, 7.385819435119629, 7.663602828979492, 7.9413862228393555, 8.219169616699219, 8.496953010559082, 8.774736404418945, 9.052519798278809, 9.330303192138672, 9.608086585998535, 9.885869979858398, 10.163653373718262, 10.441436767578125, 10.719220161437988, 10.997003555297852, 11.274786949157715, 11.552570343017578, 11.830352783203125, 12.108136177062988, 12.385919570922852, 12.663702964782715, 12.941486358642578, 13.219269752502441, 13.497053146362305, 13.774836540222168, 14.052619934082031, 14.330403327941895, 14.608186721801758, 14.885970115661621, 15.163753509521484, 15.441536903381348, 15.719320297241211, 15.997103691101074, 16.274887084960938]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 4.0, 6.0, 4.0, 5.0, 6.0, 9.0, 14.0, 24.0, 42.0, 40.0, 59.0, 79.0, 103.0, 102.0, 113.0, 96.0, 73.0, 73.0, 47.0, 22.0, 18.0, 6.0, 6.0, 5.0, 4.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2213718891143799, -1.1778141260147095, -1.134256362915039, -1.0906985998153687, -1.0471408367156982, -1.0035831928253174, -0.960025429725647, -0.9164676666259766, -0.8729099035263062, -0.8293521404266357, -0.7857943773269653, -0.7422366738319397, -0.6986789107322693, -0.6551211476325989, -0.6115634441375732, -0.5680056810379028, -0.5244479179382324, -0.480890154838562, -0.437332421541214, -0.39377468824386597, -0.35021692514419556, -0.30665916204452515, -0.2631014287471771, -0.2195436954498291, -0.1759859323501587, -0.13242818415164948, -0.08887043595314026, -0.04531268775463104, -0.0017549395561218262, 0.04180280864238739, 0.0853605568408966, 0.12891829013824463, 0.17247605323791504, 0.21603380143642426, 0.25959154963493347, 0.3031492829322815, 0.3467070460319519, 0.3902648091316223, 0.43382254242897034, 0.47738027572631836, 0.5209380388259888, 0.5644958019256592, 0.6080535650253296, 0.6516112685203552, 0.6951690316200256, 0.738726794719696, 0.7822844982147217, 0.8258422613143921, 0.8694000244140625, 0.9129577875137329, 0.9565155506134033, 1.0000733137130737, 1.0436310768127441, 1.087188720703125, 1.1307464838027954, 1.1743042469024658, 1.2178620100021362, 1.2614197731018066, 1.304977536201477, 1.3485352993011475, 1.3920929431915283, 1.4356507062911987, 1.4792084693908691, 1.5227662324905396, 1.56632399559021]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 3.0, 14.0, 11.0, 16.0, 37.0, 39.0, 62.0, 108.0, 129.0, 237.0, 453.0, 760.0, 1480.0, 2873.0, 5932.0, 14959.0, 55013.0, 912031.0, 33117.0, 11224.0, 4853.0, 2309.0, 1226.0, 631.0, 406.0, 230.0, 137.0, 82.0, 64.0, 36.0, 23.0, 18.0, 10.0, 13.0, 6.0, 3.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0439453125, -1.009552001953125, -0.97515869140625, -0.940765380859375, -0.9063720703125, -0.871978759765625, -0.83758544921875, -0.803192138671875, -0.768798828125, -0.734405517578125, -0.70001220703125, -0.665618896484375, -0.6312255859375, -0.596832275390625, -0.56243896484375, -0.528045654296875, -0.49365234375, -0.459259033203125, -0.42486572265625, -0.390472412109375, -0.3560791015625, -0.321685791015625, -0.28729248046875, -0.252899169921875, -0.218505859375, -0.184112548828125, -0.14971923828125, -0.115325927734375, -0.0809326171875, -0.046539306640625, -0.01214599609375, 0.022247314453125, 0.056640625, 0.091033935546875, 0.12542724609375, 0.159820556640625, 0.1942138671875, 0.228607177734375, 0.26300048828125, 0.297393798828125, 0.331787109375, 0.366180419921875, 0.40057373046875, 0.434967041015625, 0.4693603515625, 0.503753662109375, 0.53814697265625, 0.572540283203125, 0.60693359375, 0.641326904296875, 0.67572021484375, 0.710113525390625, 0.7445068359375, 0.778900146484375, 0.81329345703125, 0.847686767578125, 0.882080078125, 0.916473388671875, 0.95086669921875, 0.985260009765625, 1.0196533203125, 1.054046630859375, 1.08843994140625, 1.122833251953125, 1.1572265625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 4.0, 10.0, 12.0, 7.0, 11.0, 18.0, 25.0, 303.0, 441.0, 50.0, 12.0, 16.0, 11.0, 13.0, 7.0, 11.0, 6.0, 2.0, 9.0, 3.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2109375, -0.20508766174316406, -0.19923782348632812, -0.1933879852294922, -0.18753814697265625, -0.1816883087158203, -0.17583847045898438, -0.16998863220214844, -0.1641387939453125, -0.15828895568847656, -0.15243911743164062, -0.1465892791748047, -0.14073944091796875, -0.1348896026611328, -0.12903976440429688, -0.12318992614746094, -0.117340087890625, -0.11149024963378906, -0.10564041137695312, -0.09979057312011719, -0.09394073486328125, -0.08809089660644531, -0.08224105834960938, -0.07639122009277344, -0.0705413818359375, -0.06469154357910156, -0.058841705322265625, -0.05299186706542969, -0.04714202880859375, -0.04129219055175781, -0.035442352294921875, -0.029592514038085938, -0.02374267578125, -0.017892837524414062, -0.012042999267578125, -0.0061931610107421875, -0.00034332275390625, 0.0055065155029296875, 0.011356353759765625, 0.017206192016601562, 0.0230560302734375, 0.028905868530273438, 0.034755706787109375, 0.04060554504394531, 0.04645538330078125, 0.05230522155761719, 0.058155059814453125, 0.06400489807128906, 0.069854736328125, 0.07570457458496094, 0.08155441284179688, 0.08740425109863281, 0.09325408935546875, 0.09910392761230469, 0.10495376586914062, 0.11080360412597656, 0.1166534423828125, 0.12250328063964844, 0.12835311889648438, 0.1342029571533203, 0.14005279541015625, 0.1459026336669922, 0.15175247192382812, 0.15760231018066406, 0.1634521484375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 7.0, 7.0, 6.0, 12.0, 17.0, 15.0, 19.0, 20.0, 20.0, 37.0, 48.0, 40.0, 83.0, 116.0, 205.0, 539.0, 2788.0, 58402.0, 941473.0, 40812.0, 2665.0, 549.0, 210.0, 126.0, 68.0, 50.0, 26.0, 41.0, 24.0, 27.0, 18.0, 22.0, 10.0, 13.0, 15.0, 5.0, 7.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9482421875, -0.9136810302734375, -0.879119873046875, -0.8445587158203125, -0.80999755859375, -0.7754364013671875, -0.740875244140625, -0.7063140869140625, -0.6717529296875, -0.6371917724609375, -0.602630615234375, -0.5680694580078125, -0.53350830078125, -0.4989471435546875, -0.464385986328125, -0.4298248291015625, -0.395263671875, -0.3607025146484375, -0.326141357421875, -0.2915802001953125, -0.25701904296875, -0.2224578857421875, -0.187896728515625, -0.1533355712890625, -0.1187744140625, -0.0842132568359375, -0.049652099609375, -0.0150909423828125, 0.01947021484375, 0.0540313720703125, 0.088592529296875, 0.1231536865234375, 0.15771484375, 0.1922760009765625, 0.226837158203125, 0.2613983154296875, 0.29595947265625, 0.3305206298828125, 0.365081787109375, 0.3996429443359375, 0.4342041015625, 0.4687652587890625, 0.503326416015625, 0.5378875732421875, 0.57244873046875, 0.6070098876953125, 0.641571044921875, 0.6761322021484375, 0.710693359375, 0.7452545166015625, 0.779815673828125, 0.8143768310546875, 0.84893798828125, 0.8834991455078125, 0.918060302734375, 0.9526214599609375, 0.9871826171875, 1.0217437744140625, 1.056304931640625, 1.0908660888671875, 1.12542724609375, 1.1599884033203125, 1.194549560546875, 1.2291107177734375, 1.263671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 9.0, 6.0, 18.0, 11.0, 15.0, 15.0, 19.0, 30.0, 27.0, 34.0, 35.0, 33.0, 36.0, 45.0, 45.0, 43.0, 49.0, 44.0, 42.0, 56.0, 41.0, 50.0, 37.0, 30.0, 34.0, 23.0, 31.0, 15.0, 19.0, 23.0, 16.0, 17.0, 15.0, 6.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.48046875, -0.46387481689453125, -0.4472808837890625, -0.43068695068359375, -0.414093017578125, -0.39749908447265625, -0.3809051513671875, -0.36431121826171875, -0.34771728515625, -0.33112335205078125, -0.3145294189453125, -0.29793548583984375, -0.281341552734375, -0.26474761962890625, -0.2481536865234375, -0.23155975341796875, -0.2149658203125, -0.19837188720703125, -0.1817779541015625, -0.16518402099609375, -0.148590087890625, -0.13199615478515625, -0.1154022216796875, -0.09880828857421875, -0.08221435546875, -0.06562042236328125, -0.0490264892578125, -0.03243255615234375, -0.015838623046875, 0.00075531005859375, 0.0173492431640625, 0.03394317626953125, 0.050537109375, 0.06713104248046875, 0.0837249755859375, 0.10031890869140625, 0.116912841796875, 0.13350677490234375, 0.1501007080078125, 0.16669464111328125, 0.18328857421875, 0.19988250732421875, 0.2164764404296875, 0.23307037353515625, 0.249664306640625, 0.26625823974609375, 0.2828521728515625, 0.29944610595703125, 0.3160400390625, 0.33263397216796875, 0.3492279052734375, 0.36582183837890625, 0.382415771484375, 0.39900970458984375, 0.4156036376953125, 0.43219757080078125, 0.44879150390625, 0.46538543701171875, 0.4819793701171875, 0.49857330322265625, 0.515167236328125, 0.5317611694335938, 0.5483551025390625, 0.5649490356445312, 0.58154296875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 2.0, 7.0, 10.0, 16.0, 32.0, 47.0, 115.0, 239.0, 879.0, 8536.0, 1034057.0, 3641.0, 605.0, 185.0, 73.0, 38.0, 23.0, 11.0, 10.0, 5.0, 4.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62744140625, -0.6086349487304688, -0.5898284912109375, -0.5710220336914062, -0.552215576171875, -0.5334091186523438, -0.5146026611328125, -0.49579620361328125, -0.47698974609375, -0.45818328857421875, -0.4393768310546875, -0.42057037353515625, -0.401763916015625, -0.38295745849609375, -0.3641510009765625, -0.34534454345703125, -0.3265380859375, -0.30773162841796875, -0.2889251708984375, -0.27011871337890625, -0.251312255859375, -0.23250579833984375, -0.2136993408203125, -0.19489288330078125, -0.17608642578125, -0.15727996826171875, -0.1384735107421875, -0.11966705322265625, -0.100860595703125, -0.08205413818359375, -0.0632476806640625, -0.04444122314453125, -0.025634765625, -0.00682830810546875, 0.0119781494140625, 0.03078460693359375, 0.049591064453125, 0.06839752197265625, 0.0872039794921875, 0.10601043701171875, 0.12481689453125, 0.14362335205078125, 0.1624298095703125, 0.18123626708984375, 0.200042724609375, 0.21884918212890625, 0.2376556396484375, 0.25646209716796875, 0.2752685546875, 0.29407501220703125, 0.3128814697265625, 0.33168792724609375, 0.350494384765625, 0.36930084228515625, 0.3881072998046875, 0.40691375732421875, 0.42572021484375, 0.44452667236328125, 0.4633331298828125, 0.48213958740234375, 0.500946044921875, 0.5197525024414062, 0.5385589599609375, 0.5573654174804688, 0.576171875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 6.0, 5.0, 19.0, 31.0, 83.0, 118.0, 204.0, 197.0, 149.0, 79.0, 43.0, 23.0, 9.0, 5.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5020370483398438e-05, -1.4564022421836853e-05, -1.4107674360275269e-05, -1.3651326298713684e-05, -1.31949782371521e-05, -1.2738630175590515e-05, -1.228228211402893e-05, -1.1825934052467346e-05, -1.1369585990905762e-05, -1.0913237929344177e-05, -1.0456889867782593e-05, -1.0000541806221008e-05, -9.544193744659424e-06, -9.08784568309784e-06, -8.631497621536255e-06, -8.17514955997467e-06, -7.718801498413086e-06, -7.2624534368515015e-06, -6.806105375289917e-06, -6.3497573137283325e-06, -5.893409252166748e-06, -5.4370611906051636e-06, -4.980713129043579e-06, -4.524365067481995e-06, -4.06801700592041e-06, -3.6116689443588257e-06, -3.155320882797241e-06, -2.6989728212356567e-06, -2.2426247596740723e-06, -1.7862766981124878e-06, -1.3299286365509033e-06, -8.735805749893188e-07, -4.172325134277344e-07, 3.91155481338501e-08, 4.954636096954346e-07, 9.51811671257019e-07, 1.4081597328186035e-06, 1.864507794380188e-06, 2.3208558559417725e-06, 2.777203917503357e-06, 3.2335519790649414e-06, 3.689900040626526e-06, 4.14624810218811e-06, 4.602596163749695e-06, 5.058944225311279e-06, 5.515292286872864e-06, 5.971640348434448e-06, 6.427988409996033e-06, 6.884336471557617e-06, 7.340684533119202e-06, 7.797032594680786e-06, 8.25338065624237e-06, 8.709728717803955e-06, 9.16607677936554e-06, 9.622424840927124e-06, 1.0078772902488708e-05, 1.0535120964050293e-05, 1.0991469025611877e-05, 1.1447817087173462e-05, 1.1904165148735046e-05, 1.2360513210296631e-05, 1.2816861271858215e-05, 1.32732093334198e-05, 1.3729557394981384e-05, 1.4185905456542969e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 0.0, 5.0, 1.0, 9.0, 18.0, 17.0, 28.0, 51.0, 142.0, 400.0, 2134.0, 123357.0, 918986.0, 2867.0, 307.0, 108.0, 37.0, 18.0, 19.0, 13.0, 7.0, 7.0, 9.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53076171875, -0.5175247192382812, -0.5042877197265625, -0.49105072021484375, -0.477813720703125, -0.46457672119140625, -0.4513397216796875, -0.43810272216796875, -0.42486572265625, -0.41162872314453125, -0.3983917236328125, -0.38515472412109375, -0.371917724609375, -0.35868072509765625, -0.3454437255859375, -0.33220672607421875, -0.3189697265625, -0.30573272705078125, -0.2924957275390625, -0.27925872802734375, -0.266021728515625, -0.25278472900390625, -0.2395477294921875, -0.22631072998046875, -0.21307373046875, -0.19983673095703125, -0.1865997314453125, -0.17336273193359375, -0.160125732421875, -0.14688873291015625, -0.1336517333984375, -0.12041473388671875, -0.107177734375, -0.09394073486328125, -0.0807037353515625, -0.06746673583984375, -0.054229736328125, -0.04099273681640625, -0.0277557373046875, -0.01451873779296875, -0.00128173828125, 0.01195526123046875, 0.0251922607421875, 0.03842926025390625, 0.051666259765625, 0.06490325927734375, 0.0781402587890625, 0.09137725830078125, 0.1046142578125, 0.11785125732421875, 0.1310882568359375, 0.14432525634765625, 0.157562255859375, 0.17079925537109375, 0.1840362548828125, 0.19727325439453125, 0.21051025390625, 0.22374725341796875, 0.2369842529296875, 0.25022125244140625, 0.263458251953125, 0.27669525146484375, 0.2899322509765625, 0.30316925048828125, 0.31640625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 11.0, 6.0, 10.0, 11.0, 20.0, 39.0, 49.0, 94.0, 203.0, 260.0, 122.0, 52.0, 36.0, 21.0, 8.0, 13.0, 7.0, 7.0, 4.0, 10.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26171875, -0.25536155700683594, -0.24900436401367188, -0.2426471710205078, -0.23628997802734375, -0.2299327850341797, -0.22357559204101562, -0.21721839904785156, -0.2108612060546875, -0.20450401306152344, -0.19814682006835938, -0.1917896270751953, -0.18543243408203125, -0.1790752410888672, -0.17271804809570312, -0.16636085510253906, -0.160003662109375, -0.15364646911621094, -0.14728927612304688, -0.1409320831298828, -0.13457489013671875, -0.1282176971435547, -0.12186050415039062, -0.11550331115722656, -0.1091461181640625, -0.10278892517089844, -0.09643173217773438, -0.09007453918457031, -0.08371734619140625, -0.07736015319824219, -0.07100296020507812, -0.06464576721191406, -0.05828857421875, -0.05193138122558594, -0.045574188232421875, -0.03921699523925781, -0.03285980224609375, -0.026502609252929688, -0.020145416259765625, -0.013788223266601562, -0.0074310302734375, -0.0010738372802734375, 0.005283355712890625, 0.011640548706054688, 0.01799774169921875, 0.024354934692382812, 0.030712127685546875, 0.03706932067871094, 0.043426513671875, 0.04978370666503906, 0.056140899658203125, 0.06249809265136719, 0.06885528564453125, 0.07521247863769531, 0.08156967163085938, 0.08792686462402344, 0.0942840576171875, 0.10064125061035156, 0.10699844360351562, 0.11335563659667969, 0.11971282958984375, 0.1260700225830078, 0.13242721557617188, 0.13878440856933594, 0.1451416015625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 13.0, 83.0, 803.0, 96.0, 11.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0751290321350098, -1.829355239868164, -1.5835813283920288, -1.3378074169158936, -1.0920336246490479, -0.8462598323822021, -0.6004859209060669, -0.35471200942993164, -0.10893821716308594, 0.13683563470840454, 0.382609486579895, 0.6283833384513855, 0.874157190322876, 1.1199309825897217, 1.365704894065857, 1.6114788055419922, 1.857252597808838, 2.1030263900756836, 2.3488001823425293, 2.594574213027954, 2.8403480052948, 3.0861217975616455, 3.3318958282470703, 3.577669620513916, 3.8234434127807617, 4.069217205047607, 4.314990997314453, 4.560764789581299, 4.8065385818481445, 5.052312850952148, 5.298086643218994, 5.54386043548584, 5.789633750915527, 6.035407543182373, 6.281181335449219, 6.5269551277160645, 6.77272891998291, 7.018503189086914, 7.26427698135376, 7.5100507736206055, 7.755824565887451, 8.001598358154297, 8.2473726272583, 8.493145942687988, 8.738920211791992, 8.98469352722168, 9.230467796325684, 9.476242065429688, 9.722015380859375, 9.967789649963379, 10.213562965393066, 10.45933723449707, 10.705110549926758, 10.950884819030762, 11.19665813446045, 11.442432403564453, 11.68820571899414, 11.933979988098145, 12.179753303527832, 12.425527572631836, 12.671300888061523, 12.917075157165527, 13.162848472595215, 13.408622741699219, 13.654397010803223]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 11.0, 8.0, 10.0, 16.0, 30.0, 35.0, 58.0, 78.0, 95.0, 99.0, 110.0, 95.0, 87.0, 86.0, 57.0, 34.0, 28.0, 19.0, 7.0, 6.0, 4.0, 1.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.831767559051514, -7.628604412078857, -7.425441265106201, -7.222278118133545, -7.019115447998047, -6.815952301025391, -6.612789154052734, -6.409626007080078, -6.206462860107422, -6.003299713134766, -5.800136566162109, -5.596973419189453, -5.393810272216797, -5.190647125244141, -4.987484455108643, -4.784321308135986, -4.58115816116333, -4.377995014190674, -4.174831867218018, -3.9716689586639404, -3.768505811691284, -3.565342664718628, -3.362179756164551, -3.1590166091918945, -2.9558534622192383, -2.752690315246582, -2.549527168273926, -2.3463642597198486, -2.1432011127471924, -1.9400379657745361, -1.7368749380111694, -1.5337119102478027, -1.3305482864379883, -1.127385139465332, -0.9242221117019653, -0.7210590243339539, -0.5178959369659424, -0.31473278999328613, -0.11156976222991943, 0.09159326553344727, 0.2947564125061035, 0.497919499874115, 0.7010825872421265, 0.9042456746101379, 1.1074087619781494, 1.3105719089508057, 1.5137349367141724, 1.716897964477539, 1.9200611114501953, 2.1232242584228516, 2.326387405395508, 2.529550313949585, 2.732713460922241, 2.9358766078948975, 3.1390395164489746, 3.342202663421631, 3.545365810394287, 3.7485289573669434, 3.9516921043395996, 4.154855251312256, 4.358017921447754, 4.56118106842041, 4.764344215393066, 4.967507362365723, 5.170670509338379]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 12.0, 10.0, 10.0, 13.0, 30.0, 36.0, 58.0, 90.0, 111.0, 187.0, 348.0, 495.0, 807.0, 1454.0, 2758.0, 6191.0, 27094.0, 4114385.0, 28525.0, 6119.0, 2589.0, 1335.0, 698.0, 366.0, 218.0, 122.0, 59.0, 50.0, 27.0, 22.0, 19.0, 8.0, 7.0, 12.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.927734375, -1.868408203125, -1.80908203125, -1.749755859375, -1.6904296875, -1.631103515625, -1.57177734375, -1.512451171875, -1.453125, -1.393798828125, -1.33447265625, -1.275146484375, -1.2158203125, -1.156494140625, -1.09716796875, -1.037841796875, -0.978515625, -0.919189453125, -0.85986328125, -0.800537109375, -0.7412109375, -0.681884765625, -0.62255859375, -0.563232421875, -0.50390625, -0.444580078125, -0.38525390625, -0.325927734375, -0.2666015625, -0.207275390625, -0.14794921875, -0.088623046875, -0.029296875, 0.030029296875, 0.08935546875, 0.148681640625, 0.2080078125, 0.267333984375, 0.32666015625, 0.385986328125, 0.4453125, 0.504638671875, 0.56396484375, 0.623291015625, 0.6826171875, 0.741943359375, 0.80126953125, 0.860595703125, 0.919921875, 0.979248046875, 1.03857421875, 1.097900390625, 1.1572265625, 1.216552734375, 1.27587890625, 1.335205078125, 1.39453125, 1.453857421875, 1.51318359375, 1.572509765625, 1.6318359375, 1.691162109375, 1.75048828125, 1.809814453125, 1.869140625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 2.0, 0.0, 4.0, 7.0, 4.0, 3.0, 8.0, 8.0, 18.0, 9.0, 14.0, 27.0, 159.0, 498.0, 138.0, 17.0, 15.0, 11.0, 12.0, 10.0, 10.0, 5.0, 9.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18212890625, -0.17650413513183594, -0.17087936401367188, -0.1652545928955078, -0.15962982177734375, -0.1540050506591797, -0.14838027954101562, -0.14275550842285156, -0.1371307373046875, -0.13150596618652344, -0.12588119506835938, -0.12025642395019531, -0.11463165283203125, -0.10900688171386719, -0.10338211059570312, -0.09775733947753906, -0.092132568359375, -0.08650779724121094, -0.08088302612304688, -0.07525825500488281, -0.06963348388671875, -0.06400871276855469, -0.058383941650390625, -0.05275917053222656, -0.0471343994140625, -0.04150962829589844, -0.035884857177734375, -0.030260086059570312, -0.02463531494140625, -0.019010543823242188, -0.013385772705078125, -0.0077610015869140625, -0.00213623046875, 0.0034885406494140625, 0.009113311767578125, 0.014738082885742188, 0.02036285400390625, 0.025987625122070312, 0.031612396240234375, 0.03723716735839844, 0.0428619384765625, 0.04848670959472656, 0.054111480712890625, 0.05973625183105469, 0.06536102294921875, 0.07098579406738281, 0.07661056518554688, 0.08223533630371094, 0.087860107421875, 0.09348487854003906, 0.09910964965820312, 0.10473442077636719, 0.11035919189453125, 0.11598396301269531, 0.12160873413085938, 0.12723350524902344, 0.1328582763671875, 0.13848304748535156, 0.14410781860351562, 0.1497325897216797, 0.15535736083984375, 0.1609821319580078, 0.16660690307617188, 0.17223167419433594, 0.1778564453125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 8.0, 11.0, 12.0, 6.0, 25.0, 23.0, 35.0, 36.0, 81.0, 104.0, 214.0, 777.0, 5948.0, 4059704.0, 123447.0, 2844.0, 535.0, 171.0, 90.0, 71.0, 30.0, 29.0, 16.0, 11.0, 10.0, 10.0, 10.0, 6.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.33984375, -2.26861572265625, -2.1973876953125, -2.12615966796875, -2.054931640625, -1.98370361328125, -1.9124755859375, -1.84124755859375, -1.77001953125, -1.69879150390625, -1.6275634765625, -1.55633544921875, -1.485107421875, -1.41387939453125, -1.3426513671875, -1.27142333984375, -1.2001953125, -1.12896728515625, -1.0577392578125, -0.98651123046875, -0.915283203125, -0.84405517578125, -0.7728271484375, -0.70159912109375, -0.63037109375, -0.55914306640625, -0.4879150390625, -0.41668701171875, -0.345458984375, -0.27423095703125, -0.2030029296875, -0.13177490234375, -0.060546875, 0.01068115234375, 0.0819091796875, 0.15313720703125, 0.224365234375, 0.29559326171875, 0.3668212890625, 0.43804931640625, 0.50927734375, 0.58050537109375, 0.6517333984375, 0.72296142578125, 0.794189453125, 0.86541748046875, 0.9366455078125, 1.00787353515625, 1.0791015625, 1.15032958984375, 1.2215576171875, 1.29278564453125, 1.364013671875, 1.43524169921875, 1.5064697265625, 1.57769775390625, 1.64892578125, 1.72015380859375, 1.7913818359375, 1.86260986328125, 1.933837890625, 2.00506591796875, 2.0762939453125, 2.14752197265625, 2.21875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 6.0, 11.0, 4.0, 7.0, 18.0, 21.0, 19.0, 31.0, 53.0, 92.0, 564.0, 2863.0, 136.0, 66.0, 51.0, 23.0, 17.0, 26.0, 14.0, 5.0, 10.0, 8.0, 4.0, 0.0, 6.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3173828125, -0.30651092529296875, -0.2956390380859375, -0.28476715087890625, -0.273895263671875, -0.26302337646484375, -0.2521514892578125, -0.24127960205078125, -0.23040771484375, -0.21953582763671875, -0.2086639404296875, -0.19779205322265625, -0.186920166015625, -0.17604827880859375, -0.1651763916015625, -0.15430450439453125, -0.1434326171875, -0.13256072998046875, -0.1216888427734375, -0.11081695556640625, -0.099945068359375, -0.08907318115234375, -0.0782012939453125, -0.06732940673828125, -0.05645751953125, -0.04558563232421875, -0.0347137451171875, -0.02384185791015625, -0.012969970703125, -0.00209808349609375, 0.0087738037109375, 0.01964569091796875, 0.030517578125, 0.04138946533203125, 0.0522613525390625, 0.06313323974609375, 0.074005126953125, 0.08487701416015625, 0.0957489013671875, 0.10662078857421875, 0.11749267578125, 0.12836456298828125, 0.1392364501953125, 0.15010833740234375, 0.160980224609375, 0.17185211181640625, 0.1827239990234375, 0.19359588623046875, 0.2044677734375, 0.21533966064453125, 0.2262115478515625, 0.23708343505859375, 0.247955322265625, 0.25882720947265625, 0.2696990966796875, 0.28057098388671875, 0.29144287109375, 0.30231475830078125, 0.3131866455078125, 0.32405853271484375, 0.334930419921875, 0.34580230712890625, 0.3566741943359375, 0.36754608154296875, 0.37841796875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 25.0, 962.0, 25.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5877652168273926, -1.418749213218689, -1.2497332096099854, -1.0807172060012817, -0.9117012023925781, -0.7426851987838745, -0.5736691951751709, -0.4046531915664673, -0.23563718795776367, -0.06662118434906006, 0.10239481925964355, 0.27141082286834717, 0.4404268264770508, 0.6094428300857544, 0.778458833694458, 0.9474748373031616, 1.1164908409118652, 1.2855068445205688, 1.4545228481292725, 1.623538851737976, 1.7925548553466797, 1.9615708589553833, 2.130586862564087, 2.29960298538208, 2.468618869781494, 2.637634754180908, 2.8066508769989014, 2.9756669998168945, 3.1446828842163086, 3.3136987686157227, 3.482714891433716, 3.651731014251709, 3.8207473754882812, 3.9897632598876953, 4.158779144287109, 4.327795505523682, 4.496811389923096, 4.66582727432251, 4.834843635559082, 5.003859519958496, 5.17287540435791, 5.341891288757324, 5.510907173156738, 5.6799235343933105, 5.848939418792725, 6.017955303192139, 6.186971664428711, 6.355987548828125, 6.525003433227539, 6.694019317626953, 6.863035202026367, 7.0320515632629395, 7.2010674476623535, 7.370083332061768, 7.53909969329834, 7.708115577697754, 7.877131462097168, 8.046147346496582, 8.215163230895996, 8.38417911529541, 8.55319595336914, 8.722211837768555, 8.891227722167969, 9.060243606567383, 9.229259490966797]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 6.0, 5.0, 4.0, 5.0, 9.0, 20.0, 18.0, 37.0, 61.0, 56.0, 67.0, 111.0, 105.0, 107.0, 105.0, 84.0, 68.0, 41.0, 22.0, 17.0, 9.0, 11.0, 4.0, 2.0, 2.0, 4.0, 7.0, 3.0, 1.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1792802810668945, -1.1334666013717651, -1.0876529216766357, -1.041839361190796, -0.9960256218910217, -0.9502120018005371, -0.9043983221054077, -0.8585846424102783, -0.8127709627151489, -0.7669572830200195, -0.7211436629295349, -0.6753299832344055, -0.6295163035392761, -0.5837026834487915, -0.5378890037536621, -0.4920753240585327, -0.4462617039680481, -0.4004480540752411, -0.3546343743801117, -0.3088207244873047, -0.2630070447921753, -0.2171933948993683, -0.17137974500656128, -0.12556606531143188, -0.07975241541862488, -0.033938754349946976, 0.011874906718730927, 0.05768856406211853, 0.10350222885608673, 0.14931589365005493, 0.19512954354286194, 0.24094322323799133, 0.28675687313079834, 0.33257052302360535, 0.37838420271873474, 0.42419785261154175, 0.47001153230667114, 0.5158251523971558, 0.5616388320922852, 0.6074525117874146, 0.653266191482544, 0.6990798711776733, 0.744893491268158, 0.7907071709632874, 0.8365208506584167, 0.8823344707489014, 0.9281481504440308, 0.9739618301391602, 1.019775390625, 1.0655890703201294, 1.1114027500152588, 1.1572163105010986, 1.203029990196228, 1.2488436698913574, 1.2946573495864868, 1.3404710292816162, 1.3862847089767456, 1.432098388671875, 1.4779120683670044, 1.5237257480621338, 1.5695393085479736, 1.615352988243103, 1.6611666679382324, 1.7069803476333618, 1.7527940273284912]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 8.0, 10.0, 17.0, 26.0, 34.0, 56.0, 62.0, 118.0, 160.0, 260.0, 469.0, 835.0, 1582.0, 3547.0, 9843.0, 56111.0, 926437.0, 35009.0, 7851.0, 2933.0, 1348.0, 738.0, 391.0, 219.0, 151.0, 90.0, 63.0, 43.0, 41.0, 21.0, 14.0, 15.0, 12.0, 12.0, 5.0, 4.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.96533203125, -0.9372711181640625, -0.909210205078125, -0.8811492919921875, -0.85308837890625, -0.8250274658203125, -0.796966552734375, -0.7689056396484375, -0.7408447265625, -0.7127838134765625, -0.684722900390625, -0.6566619873046875, -0.62860107421875, -0.6005401611328125, -0.572479248046875, -0.5444183349609375, -0.516357421875, -0.4882965087890625, -0.460235595703125, -0.4321746826171875, -0.40411376953125, -0.3760528564453125, -0.347991943359375, -0.3199310302734375, -0.2918701171875, -0.2638092041015625, -0.235748291015625, -0.2076873779296875, -0.17962646484375, -0.1515655517578125, -0.123504638671875, -0.0954437255859375, -0.0673828125, -0.0393218994140625, -0.011260986328125, 0.0167999267578125, 0.04486083984375, 0.0729217529296875, 0.100982666015625, 0.1290435791015625, 0.1571044921875, 0.1851654052734375, 0.213226318359375, 0.2412872314453125, 0.26934814453125, 0.2974090576171875, 0.325469970703125, 0.3535308837890625, 0.381591796875, 0.4096527099609375, 0.437713623046875, 0.4657745361328125, 0.49383544921875, 0.5218963623046875, 0.549957275390625, 0.5780181884765625, 0.6060791015625, 0.6341400146484375, 0.662200927734375, 0.6902618408203125, 0.71832275390625, 0.7463836669921875, 0.774444580078125, 0.8025054931640625, 0.83056640625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 4.0, 5.0, 3.0, 6.0, 11.0, 7.0, 13.0, 10.0, 24.0, 59.0, 295.0, 374.0, 86.0, 20.0, 13.0, 21.0, 7.0, 10.0, 8.0, 9.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1527099609375, -0.1476287841796875, -0.142547607421875, -0.1374664306640625, -0.13238525390625, -0.1273040771484375, -0.122222900390625, -0.1171417236328125, -0.112060546875, -0.1069793701171875, -0.101898193359375, -0.0968170166015625, -0.09173583984375, -0.0866546630859375, -0.081573486328125, -0.0764923095703125, -0.0714111328125, -0.0663299560546875, -0.061248779296875, -0.0561676025390625, -0.05108642578125, -0.0460052490234375, -0.040924072265625, -0.0358428955078125, -0.03076171875, -0.0256805419921875, -0.020599365234375, -0.0155181884765625, -0.01043701171875, -0.0053558349609375, -0.000274658203125, 0.0048065185546875, 0.0098876953125, 0.0149688720703125, 0.020050048828125, 0.0251312255859375, 0.03021240234375, 0.0352935791015625, 0.040374755859375, 0.0454559326171875, 0.050537109375, 0.0556182861328125, 0.060699462890625, 0.0657806396484375, 0.07086181640625, 0.0759429931640625, 0.081024169921875, 0.0861053466796875, 0.0911865234375, 0.0962677001953125, 0.101348876953125, 0.1064300537109375, 0.11151123046875, 0.1165924072265625, 0.121673583984375, 0.1267547607421875, 0.1318359375, 0.1369171142578125, 0.141998291015625, 0.1470794677734375, 0.15216064453125, 0.1572418212890625, 0.162322998046875, 0.1674041748046875, 0.1724853515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 1.0, 15.0, 7.0, 15.0, 9.0, 16.0, 23.0, 27.0, 16.0, 21.0, 44.0, 60.0, 98.0, 125.0, 159.0, 258.0, 477.0, 1342.0, 7074.0, 362978.0, 663080.0, 9678.0, 1544.0, 520.0, 272.0, 168.0, 114.0, 101.0, 63.0, 45.0, 39.0, 31.0, 25.0, 12.0, 14.0, 21.0, 17.0, 8.0, 6.0, 8.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.890625, -0.860992431640625, -0.83135986328125, -0.801727294921875, -0.7720947265625, -0.742462158203125, -0.71282958984375, -0.683197021484375, -0.653564453125, -0.623931884765625, -0.59429931640625, -0.564666748046875, -0.5350341796875, -0.505401611328125, -0.47576904296875, -0.446136474609375, -0.41650390625, -0.386871337890625, -0.35723876953125, -0.327606201171875, -0.2979736328125, -0.268341064453125, -0.23870849609375, -0.209075927734375, -0.179443359375, -0.149810791015625, -0.12017822265625, -0.090545654296875, -0.0609130859375, -0.031280517578125, -0.00164794921875, 0.027984619140625, 0.0576171875, 0.087249755859375, 0.11688232421875, 0.146514892578125, 0.1761474609375, 0.205780029296875, 0.23541259765625, 0.265045166015625, 0.294677734375, 0.324310302734375, 0.35394287109375, 0.383575439453125, 0.4132080078125, 0.442840576171875, 0.47247314453125, 0.502105712890625, 0.53173828125, 0.561370849609375, 0.59100341796875, 0.620635986328125, 0.6502685546875, 0.679901123046875, 0.70953369140625, 0.739166259765625, 0.768798828125, 0.798431396484375, 0.82806396484375, 0.857696533203125, 0.8873291015625, 0.916961669921875, 0.94659423828125, 0.976226806640625, 1.005859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 5.0, 2.0, 2.0, 3.0, 5.0, 11.0, 12.0, 15.0, 10.0, 11.0, 19.0, 21.0, 9.0, 20.0, 26.0, 31.0, 31.0, 33.0, 37.0, 34.0, 41.0, 45.0, 42.0, 35.0, 41.0, 29.0, 45.0, 40.0, 40.0, 31.0, 17.0, 32.0, 30.0, 27.0, 28.0, 25.0, 21.0, 9.0, 9.0, 20.0, 15.0, 8.0, 5.0, 12.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.297119140625, -0.2871971130371094, -0.27727508544921875, -0.2673530578613281, -0.2574310302734375, -0.24750900268554688, -0.23758697509765625, -0.22766494750976562, -0.217742919921875, -0.20782089233398438, -0.19789886474609375, -0.18797683715820312, -0.1780548095703125, -0.16813278198242188, -0.15821075439453125, -0.14828872680664062, -0.13836669921875, -0.12844467163085938, -0.11852264404296875, -0.10860061645507812, -0.0986785888671875, -0.08875656127929688, -0.07883453369140625, -0.06891250610351562, -0.058990478515625, -0.049068450927734375, -0.03914642333984375, -0.029224395751953125, -0.0193023681640625, -0.009380340576171875, 0.00054168701171875, 0.010463714599609375, 0.0203857421875, 0.030307769775390625, 0.04022979736328125, 0.050151824951171875, 0.0600738525390625, 0.06999588012695312, 0.07991790771484375, 0.08983993530273438, 0.099761962890625, 0.10968399047851562, 0.11960601806640625, 0.12952804565429688, 0.1394500732421875, 0.14937210083007812, 0.15929412841796875, 0.16921615600585938, 0.17913818359375, 0.18906021118164062, 0.19898223876953125, 0.20890426635742188, 0.2188262939453125, 0.22874832153320312, 0.23867034912109375, 0.24859237670898438, 0.258514404296875, 0.2684364318847656, 0.27835845947265625, 0.2882804870605469, 0.2982025146484375, 0.3081245422363281, 0.31804656982421875, 0.3279685974121094, 0.337890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 2.0, 5.0, 4.0, 7.0, 14.0, 12.0, 13.0, 24.0, 39.0, 46.0, 98.0, 136.0, 280.0, 622.0, 1628.0, 5457.0, 30748.0, 703028.0, 281209.0, 18688.0, 4071.0, 1253.0, 532.0, 248.0, 125.0, 83.0, 56.0, 28.0, 22.0, 19.0, 18.0, 9.0, 11.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.193359375, -0.18811607360839844, -0.18287277221679688, -0.1776294708251953, -0.17238616943359375, -0.1671428680419922, -0.16189956665039062, -0.15665626525878906, -0.1514129638671875, -0.14616966247558594, -0.14092636108398438, -0.1356830596923828, -0.13043975830078125, -0.1251964569091797, -0.11995315551757812, -0.11470985412597656, -0.109466552734375, -0.10422325134277344, -0.09897994995117188, -0.09373664855957031, -0.08849334716796875, -0.08325004577636719, -0.07800674438476562, -0.07276344299316406, -0.0675201416015625, -0.06227684020996094, -0.057033538818359375, -0.05179023742675781, -0.04654693603515625, -0.04130363464355469, -0.036060333251953125, -0.030817031860351562, -0.02557373046875, -0.020330429077148438, -0.015087127685546875, -0.009843826293945312, -0.00460052490234375, 0.0006427764892578125, 0.005886077880859375, 0.011129379272460938, 0.0163726806640625, 0.021615982055664062, 0.026859283447265625, 0.03210258483886719, 0.03734588623046875, 0.04258918762207031, 0.047832489013671875, 0.05307579040527344, 0.058319091796875, 0.06356239318847656, 0.06880569458007812, 0.07404899597167969, 0.07929229736328125, 0.08453559875488281, 0.08977890014648438, 0.09502220153808594, 0.1002655029296875, 0.10550880432128906, 0.11075210571289062, 0.11599540710449219, 0.12123870849609375, 0.1264820098876953, 0.13172531127929688, 0.13696861267089844, 0.1422119140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 7.0, 11.0, 7.0, 15.0, 10.0, 15.0, 27.0, 49.0, 71.0, 140.0, 217.0, 159.0, 85.0, 48.0, 43.0, 25.0, 18.0, 15.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.568960189819336e-05, -2.497062087059021e-05, -2.425163984298706e-05, -2.353265881538391e-05, -2.2813677787780762e-05, -2.2094696760177612e-05, -2.1375715732574463e-05, -2.0656734704971313e-05, -1.9937753677368164e-05, -1.9218772649765015e-05, -1.8499791622161865e-05, -1.7780810594558716e-05, -1.7061829566955566e-05, -1.6342848539352417e-05, -1.5623867511749268e-05, -1.4904886484146118e-05, -1.4185905456542969e-05, -1.346692442893982e-05, -1.274794340133667e-05, -1.202896237373352e-05, -1.1309981346130371e-05, -1.0591000318527222e-05, -9.872019290924072e-06, -9.153038263320923e-06, -8.434057235717773e-06, -7.715076208114624e-06, -6.996095180511475e-06, -6.277114152908325e-06, -5.558133125305176e-06, -4.839152097702026e-06, -4.120171070098877e-06, -3.4011900424957275e-06, -2.682209014892578e-06, -1.9632279872894287e-06, -1.2442469596862793e-06, -5.252659320831299e-07, 1.9371509552001953e-07, 9.126961231231689e-07, 1.6316771507263184e-06, 2.3506581783294678e-06, 3.069639205932617e-06, 3.7886202335357666e-06, 4.507601261138916e-06, 5.2265822887420654e-06, 5.945563316345215e-06, 6.664544343948364e-06, 7.383525371551514e-06, 8.102506399154663e-06, 8.821487426757812e-06, 9.540468454360962e-06, 1.0259449481964111e-05, 1.097843050956726e-05, 1.169741153717041e-05, 1.241639256477356e-05, 1.3135373592376709e-05, 1.3854354619979858e-05, 1.4573335647583008e-05, 1.5292316675186157e-05, 1.6011297702789307e-05, 1.6730278730392456e-05, 1.7449259757995605e-05, 1.8168240785598755e-05, 1.8887221813201904e-05, 1.9606202840805054e-05, 2.0325183868408203e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 5.0, 4.0, 12.0, 10.0, 14.0, 23.0, 41.0, 74.0, 171.0, 506.0, 2802.0, 151250.0, 887201.0, 5301.0, 690.0, 208.0, 98.0, 45.0, 35.0, 21.0, 6.0, 5.0, 9.0, 5.0, 5.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.611328125, -0.595703125, -0.580078125, -0.564453125, -0.548828125, -0.533203125, -0.517578125, -0.501953125, -0.486328125, -0.470703125, -0.455078125, -0.439453125, -0.423828125, -0.408203125, -0.392578125, -0.376953125, -0.361328125, -0.345703125, -0.330078125, -0.314453125, -0.298828125, -0.283203125, -0.267578125, -0.251953125, -0.236328125, -0.220703125, -0.205078125, -0.189453125, -0.173828125, -0.158203125, -0.142578125, -0.126953125, -0.111328125, -0.095703125, -0.080078125, -0.064453125, -0.048828125, -0.033203125, -0.017578125, -0.001953125, 0.013671875, 0.029296875, 0.044921875, 0.060546875, 0.076171875, 0.091796875, 0.107421875, 0.123046875, 0.138671875, 0.154296875, 0.169921875, 0.185546875, 0.201171875, 0.216796875, 0.232421875, 0.248046875, 0.263671875, 0.279296875, 0.294921875, 0.310546875, 0.326171875, 0.341796875, 0.357421875, 0.373046875, 0.388671875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 2.0, 6.0, 6.0, 14.0, 12.0, 18.0, 27.0, 45.0, 69.0, 85.0, 126.0, 165.0, 128.0, 84.0, 49.0, 52.0, 37.0, 19.0, 18.0, 11.0, 5.0, 1.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.191162109375, -0.18642425537109375, -0.1816864013671875, -0.17694854736328125, -0.172210693359375, -0.16747283935546875, -0.1627349853515625, -0.15799713134765625, -0.15325927734375, -0.14852142333984375, -0.1437835693359375, -0.13904571533203125, -0.134307861328125, -0.12957000732421875, -0.1248321533203125, -0.12009429931640625, -0.1153564453125, -0.11061859130859375, -0.1058807373046875, -0.10114288330078125, -0.096405029296875, -0.09166717529296875, -0.0869293212890625, -0.08219146728515625, -0.07745361328125, -0.07271575927734375, -0.0679779052734375, -0.06324005126953125, -0.058502197265625, -0.05376434326171875, -0.0490264892578125, -0.04428863525390625, -0.03955078125, -0.03481292724609375, -0.0300750732421875, -0.02533721923828125, -0.020599365234375, -0.01586151123046875, -0.0111236572265625, -0.00638580322265625, -0.00164794921875, 0.00308990478515625, 0.0078277587890625, 0.01256561279296875, 0.017303466796875, 0.02204132080078125, 0.0267791748046875, 0.03151702880859375, 0.0362548828125, 0.04099273681640625, 0.0457305908203125, 0.05046844482421875, 0.055206298828125, 0.05994415283203125, 0.0646820068359375, 0.06941986083984375, 0.07415771484375, 0.07889556884765625, 0.0836334228515625, 0.08837127685546875, 0.093109130859375, 0.09784698486328125, 0.1025848388671875, 0.10732269287109375, 0.112060546875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 11.0, 84.0, 712.0, 173.0, 24.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.296865463256836, -12.075573921203613, -11.85428237915039, -11.632990837097168, -11.411699295043945, -11.190407752990723, -10.9691162109375, -10.747824668884277, -10.526533126831055, -10.305241584777832, -10.08395004272461, -9.862658500671387, -9.641366958618164, -9.420075416564941, -9.198783874511719, -8.977492332458496, -8.756200790405273, -8.53490924835205, -8.313617706298828, -8.092326164245605, -7.871034622192383, -7.64974308013916, -7.4284515380859375, -7.207159996032715, -6.98586893081665, -6.764577388763428, -6.543285846710205, -6.321994304656982, -6.10070276260376, -5.879411220550537, -5.6581196784973145, -5.436828136444092, -5.215536594390869, -4.9942450523376465, -4.772953510284424, -4.551661968231201, -4.3303704261779785, -4.109078884124756, -3.887787342071533, -3.6664958000183105, -3.445204257965088, -3.2239127159118652, -3.0026211738586426, -2.78132963180542, -2.5600380897521973, -2.3387465476989746, -2.117455005645752, -1.8961635828018188, -1.6748721599578857, -1.453580617904663, -1.2322890758514404, -1.0109975337982178, -0.7897060513496399, -0.568414568901062, -0.34712302684783936, -0.1258314847946167, 0.09546005725860596, 0.3167515993118286, 0.5380431413650513, 0.7593346238136292, 0.9806261658668518, 1.2019176483154297, 1.4232091903686523, 1.644500732421875, 1.8657922744750977]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 3.0, 11.0, 12.0, 15.0, 18.0, 18.0, 22.0, 28.0, 20.0, 37.0, 50.0, 61.0, 63.0, 58.0, 72.0, 48.0, 69.0, 58.0, 54.0, 42.0, 50.0, 36.0, 29.0, 24.0, 23.0, 22.0, 12.0, 11.0, 10.0, 8.0, 2.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.9163193702697754, -3.8081178665161133, -3.6999166011810303, -3.591715097427368, -3.483513832092285, -3.375312328338623, -3.267110824584961, -3.158909320831299, -3.050708055496216, -2.9425065517425537, -2.8343052864074707, -2.7261037826538086, -2.6179022789001465, -2.5097010135650635, -2.4014995098114014, -2.2932982444763184, -2.1850967407226562, -2.076895236968994, -1.9686939716339111, -1.860492467880249, -1.7522910833358765, -1.644089698791504, -1.5358881950378418, -1.4276868104934692, -1.3194854259490967, -1.2112840414047241, -1.1030826568603516, -0.9948811531066895, -0.8866797685623169, -0.7784783840179443, -0.670276939868927, -0.5620754957199097, -0.4538741111755371, -0.34567269682884216, -0.23747128248214722, -0.12926986813545227, -0.021068453788757324, 0.08713293075561523, 0.19533437490463257, 0.3035358190536499, 0.41173720359802246, 0.519938588142395, 0.6281400322914124, 0.7363414764404297, 0.8445428609848022, 0.9527442455291748, 1.060945749282837, 1.1691471338272095, 1.277348518371582, 1.3855499029159546, 1.4937512874603271, 1.6019527912139893, 1.7101541757583618, 1.8183555603027344, 1.9265570640563965, 2.0347585678100586, 2.1429598331451416, 2.2511613368988037, 2.3593626022338867, 2.467564105987549, 2.575765609741211, 2.683966875076294, 2.792168378829956, 2.900369644165039, 3.008571147918701]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 4.0, 6.0, 6.0, 16.0, 21.0, 39.0, 102.0, 515.0, 5791.0, 4183666.0, 3544.0, 387.0, 84.0, 23.0, 18.0, 19.0, 12.0, 12.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.490234375, -3.352996826171875, -3.21575927734375, -3.078521728515625, -2.9412841796875, -2.804046630859375, -2.66680908203125, -2.529571533203125, -2.392333984375, -2.255096435546875, -2.11785888671875, -1.980621337890625, -1.8433837890625, -1.706146240234375, -1.56890869140625, -1.431671142578125, -1.29443359375, -1.157196044921875, -1.01995849609375, -0.882720947265625, -0.7454833984375, -0.608245849609375, -0.47100830078125, -0.333770751953125, -0.196533203125, -0.059295654296875, 0.07794189453125, 0.215179443359375, 0.3524169921875, 0.489654541015625, 0.62689208984375, 0.764129638671875, 0.9013671875, 1.038604736328125, 1.17584228515625, 1.313079833984375, 1.4503173828125, 1.587554931640625, 1.72479248046875, 1.862030029296875, 1.999267578125, 2.136505126953125, 2.27374267578125, 2.410980224609375, 2.5482177734375, 2.685455322265625, 2.82269287109375, 2.959930419921875, 3.09716796875, 3.234405517578125, 3.37164306640625, 3.508880615234375, 3.6461181640625, 3.783355712890625, 3.92059326171875, 4.057830810546875, 4.195068359375, 4.332305908203125, 4.46954345703125, 4.606781005859375, 4.7440185546875, 4.881256103515625, 5.01849365234375, 5.155731201171875, 5.29296875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 3.0, 6.0, 6.0, 8.0, 15.0, 14.0, 19.0, 36.0, 118.0, 345.0, 248.0, 82.0, 32.0, 9.0, 11.0, 6.0, 8.0, 12.0, 7.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1424560546875, -0.13712501525878906, -0.13179397583007812, -0.1264629364013672, -0.12113189697265625, -0.11580085754394531, -0.11046981811523438, -0.10513877868652344, -0.0998077392578125, -0.09447669982910156, -0.08914566040039062, -0.08381462097167969, -0.07848358154296875, -0.07315254211425781, -0.06782150268554688, -0.06249046325683594, -0.057159423828125, -0.05182838439941406, -0.046497344970703125, -0.04116630554199219, -0.03583526611328125, -0.030504226684570312, -0.025173187255859375, -0.019842147827148438, -0.0145111083984375, -0.009180068969726562, -0.003849029541015625, 0.0014820098876953125, 0.00681304931640625, 0.012144088745117188, 0.017475128173828125, 0.022806167602539062, 0.02813720703125, 0.03346824645996094, 0.038799285888671875, 0.04413032531738281, 0.04946136474609375, 0.05479240417480469, 0.060123443603515625, 0.06545448303222656, 0.0707855224609375, 0.07611656188964844, 0.08144760131835938, 0.08677864074707031, 0.09210968017578125, 0.09744071960449219, 0.10277175903320312, 0.10810279846191406, 0.113433837890625, 0.11876487731933594, 0.12409591674804688, 0.1294269561767578, 0.13475799560546875, 0.1400890350341797, 0.14542007446289062, 0.15075111389160156, 0.1560821533203125, 0.16141319274902344, 0.16674423217773438, 0.1720752716064453, 0.17740631103515625, 0.1827373504638672, 0.18806838989257812, 0.19339942932128906, 0.19873046875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 5.0, 8.0, 10.0, 8.0, 18.0, 12.0, 26.0, 20.0, 68.0, 108.0, 255.0, 1000.0, 11580.0, 4123726.0, 54199.0, 2421.0, 415.0, 153.0, 95.0, 48.0, 26.0, 22.0, 11.0, 7.0, 6.0, 8.0, 2.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.1337890625, -1.0942535400390625, -1.054718017578125, -1.0151824951171875, -0.97564697265625, -0.9361114501953125, -0.896575927734375, -0.8570404052734375, -0.8175048828125, -0.7779693603515625, -0.738433837890625, -0.6988983154296875, -0.65936279296875, -0.6198272705078125, -0.580291748046875, -0.5407562255859375, -0.501220703125, -0.4616851806640625, -0.422149658203125, -0.3826141357421875, -0.34307861328125, -0.3035430908203125, -0.264007568359375, -0.2244720458984375, -0.1849365234375, -0.1454010009765625, -0.105865478515625, -0.0663299560546875, -0.02679443359375, 0.0127410888671875, 0.052276611328125, 0.0918121337890625, 0.13134765625, 0.1708831787109375, 0.210418701171875, 0.2499542236328125, 0.28948974609375, 0.3290252685546875, 0.368560791015625, 0.4080963134765625, 0.4476318359375, 0.4871673583984375, 0.526702880859375, 0.5662384033203125, 0.60577392578125, 0.6453094482421875, 0.684844970703125, 0.7243804931640625, 0.763916015625, 0.8034515380859375, 0.842987060546875, 0.8825225830078125, 0.92205810546875, 0.9615936279296875, 1.001129150390625, 1.0406646728515625, 1.0802001953125, 1.1197357177734375, 1.159271240234375, 1.1988067626953125, 1.23834228515625, 1.2778778076171875, 1.317413330078125, 1.3569488525390625, 1.396484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 10.0, 6.0, 6.0, 11.0, 12.0, 20.0, 30.0, 37.0, 107.0, 543.0, 2766.0, 308.0, 66.0, 33.0, 24.0, 14.0, 14.0, 6.0, 12.0, 6.0, 4.0, 5.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1854248046875, -0.17910385131835938, -0.17278289794921875, -0.16646194458007812, -0.1601409912109375, -0.15382003784179688, -0.14749908447265625, -0.14117813110351562, -0.134857177734375, -0.12853622436523438, -0.12221527099609375, -0.11589431762695312, -0.1095733642578125, -0.10325241088867188, -0.09693145751953125, -0.09061050415039062, -0.08428955078125, -0.07796859741210938, -0.07164764404296875, -0.06532669067382812, -0.0590057373046875, -0.052684783935546875, -0.04636383056640625, -0.040042877197265625, -0.033721923828125, -0.027400970458984375, -0.02108001708984375, -0.014759063720703125, -0.0084381103515625, -0.002117156982421875, 0.00420379638671875, 0.010524749755859375, 0.016845703125, 0.023166656494140625, 0.02948760986328125, 0.035808563232421875, 0.0421295166015625, 0.048450469970703125, 0.05477142333984375, 0.061092376708984375, 0.067413330078125, 0.07373428344726562, 0.08005523681640625, 0.08637619018554688, 0.0926971435546875, 0.09901809692382812, 0.10533905029296875, 0.11166000366210938, 0.11798095703125, 0.12430191040039062, 0.13062286376953125, 0.13694381713867188, 0.1432647705078125, 0.14958572387695312, 0.15590667724609375, 0.16222763061523438, 0.168548583984375, 0.17486953735351562, 0.18119049072265625, 0.18751144409179688, 0.1938323974609375, 0.20015335083007812, 0.20647430419921875, 0.21279525756835938, 0.2191162109375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 9.0, 804.0, 199.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5977959632873535, -0.4951344430446625, -0.39247292280197144, -0.2898114323616028, -0.18714991211891174, -0.0844883918762207, 0.01817309856414795, 0.12083464860916138, 0.22349613904953003, 0.32615765929222107, 0.4288191795349121, 0.5314806699752808, 0.6341421604156494, 0.7368037104606628, 0.8394652009010315, 0.9421267509460449, 1.0447882413864136, 1.1474497318267822, 1.2501112222671509, 1.3527727127075195, 1.4554343223571777, 1.5580958127975464, 1.660757303237915, 1.7634189128875732, 1.8660802841186523, 1.968741774559021, 2.0714032649993896, 2.174064874649048, 2.276726245880127, 2.379387855529785, 2.4820494651794434, 2.5847108364105225, 2.6873724460601807, 2.790034055709839, 2.892695426940918, 2.995357036590576, 3.0980184078216553, 3.2006800174713135, 3.3033413887023926, 3.406002998352051, 3.508664608001709, 3.611326217651367, 3.7139875888824463, 3.8166491985321045, 3.9193105697631836, 4.021972179412842, 4.1246337890625, 4.227295398712158, 4.329956531524658, 4.432618141174316, 4.535279750823975, 4.637940883636475, 4.740602493286133, 4.843264102935791, 4.945925712585449, 5.048587322235107, 5.151248931884766, 5.253910541534424, 5.356572151184082, 5.459233283996582, 5.56189489364624, 5.664556503295898, 5.767218112945557, 5.869879722595215, 5.972540855407715]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 5.0, 13.0, 9.0, 13.0, 14.0, 23.0, 21.0, 26.0, 48.0, 50.0, 52.0, 60.0, 58.0, 51.0, 73.0, 69.0, 62.0, 60.0, 54.0, 45.0, 35.0, 43.0, 22.0, 17.0, 10.0, 18.0, 7.0, 13.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6082558631896973, -0.5892598628997803, -0.5702638626098633, -0.5512679219245911, -0.5322719216346741, -0.5132759213447571, -0.4942799210548401, -0.4752839207649231, -0.4562879502773285, -0.4372919499874115, -0.4182959794998169, -0.3992999792098999, -0.3803039789199829, -0.3613080084323883, -0.3423120081424713, -0.3233160376548767, -0.3043200373649597, -0.2853240370750427, -0.2663280665874481, -0.24733206629753113, -0.22833608090877533, -0.20934009552001953, -0.19034409523010254, -0.17134810984134674, -0.15235212445259094, -0.13335613906383514, -0.11436014622449875, -0.09536415338516235, -0.07636816799640656, -0.05737218260765076, -0.03837618976831436, -0.019380196928977966, -0.00038421154022216797, 0.01861177757382393, 0.037607766687870026, 0.05660375580191612, 0.07559974491596222, 0.09459573030471802, 0.11359172314405441, 0.1325877159833908, 0.1515837013721466, 0.1705796867609024, 0.1895756721496582, 0.2085716724395752, 0.227567657828331, 0.2465636432170868, 0.2655596435070038, 0.2845556139945984, 0.3035516142845154, 0.3225476145744324, 0.341543585062027, 0.36053958535194397, 0.3795355558395386, 0.39853155612945557, 0.41752755641937256, 0.43652355670928955, 0.45551952719688416, 0.47451552748680115, 0.49351149797439575, 0.5125074982643127, 0.5315034985542297, 0.550499439239502, 0.569495439529419, 0.5884914398193359, 0.6074874401092529]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 2.0, 2.0, 9.0, 9.0, 18.0, 20.0, 42.0, 51.0, 111.0, 145.0, 293.0, 557.0, 1340.0, 3348.0, 10563.0, 53998.0, 896361.0, 64005.0, 11364.0, 3657.0, 1354.0, 584.0, 294.0, 142.0, 108.0, 47.0, 34.0, 26.0, 26.0, 14.0, 7.0, 8.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.400390625, -0.3852996826171875, -0.370208740234375, -0.3551177978515625, -0.34002685546875, -0.3249359130859375, -0.309844970703125, -0.2947540283203125, -0.2796630859375, -0.2645721435546875, -0.249481201171875, -0.2343902587890625, -0.21929931640625, -0.2042083740234375, -0.189117431640625, -0.1740264892578125, -0.158935546875, -0.1438446044921875, -0.128753662109375, -0.1136627197265625, -0.09857177734375, -0.0834808349609375, -0.068389892578125, -0.0532989501953125, -0.0382080078125, -0.0231170654296875, -0.008026123046875, 0.0070648193359375, 0.02215576171875, 0.0372467041015625, 0.052337646484375, 0.0674285888671875, 0.08251953125, 0.0976104736328125, 0.112701416015625, 0.1277923583984375, 0.14288330078125, 0.1579742431640625, 0.173065185546875, 0.1881561279296875, 0.2032470703125, 0.2183380126953125, 0.233428955078125, 0.2485198974609375, 0.26361083984375, 0.2787017822265625, 0.293792724609375, 0.3088836669921875, 0.323974609375, 0.3390655517578125, 0.354156494140625, 0.3692474365234375, 0.38433837890625, 0.3994293212890625, 0.414520263671875, 0.4296112060546875, 0.4447021484375, 0.4597930908203125, 0.474884033203125, 0.4899749755859375, 0.50506591796875, 0.5201568603515625, 0.535247802734375, 0.5503387451171875, 0.5654296875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 8.0, 6.0, 8.0, 12.0, 18.0, 14.0, 40.0, 122.0, 310.0, 261.0, 104.0, 28.0, 11.0, 12.0, 8.0, 8.0, 13.0, 7.0, 1.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1365966796875, -0.1314983367919922, -0.12639999389648438, -0.12130165100097656, -0.11620330810546875, -0.11110496520996094, -0.10600662231445312, -0.10090827941894531, -0.0958099365234375, -0.09071159362792969, -0.08561325073242188, -0.08051490783691406, -0.07541656494140625, -0.07031822204589844, -0.06521987915039062, -0.06012153625488281, -0.055023193359375, -0.04992485046386719, -0.044826507568359375, -0.03972816467285156, -0.03462982177734375, -0.029531478881835938, -0.024433135986328125, -0.019334793090820312, -0.0142364501953125, -0.009138107299804688, -0.004039764404296875, 0.0010585784912109375, 0.00615692138671875, 0.011255264282226562, 0.016353607177734375, 0.021451950073242188, 0.02655029296875, 0.03164863586425781, 0.036746978759765625, 0.04184532165527344, 0.04694366455078125, 0.05204200744628906, 0.057140350341796875, 0.06223869323730469, 0.0673370361328125, 0.07243537902832031, 0.07753372192382812, 0.08263206481933594, 0.08773040771484375, 0.09282875061035156, 0.09792709350585938, 0.10302543640136719, 0.108123779296875, 0.11322212219238281, 0.11832046508789062, 0.12341880798339844, 0.12851715087890625, 0.13361549377441406, 0.13871383666992188, 0.1438121795654297, 0.1489105224609375, 0.1540088653564453, 0.15910720825195312, 0.16420555114746094, 0.16930389404296875, 0.17440223693847656, 0.17950057983398438, 0.1845989227294922, 0.189697265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 10.0, 12.0, 14.0, 23.0, 37.0, 23.0, 46.0, 56.0, 57.0, 89.0, 86.0, 85.0, 116.0, 199.0, 240.0, 486.0, 1365.0, 7035.0, 269764.0, 750022.0, 14965.0, 1907.0, 651.0, 309.0, 205.0, 150.0, 78.0, 105.0, 71.0, 76.0, 52.0, 44.0, 26.0, 40.0, 36.0, 17.0, 11.0, 8.0, 5.0, 7.0, 9.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.56494140625, -0.54736328125, -0.52978515625, -0.51220703125, -0.49462890625, -0.47705078125, -0.45947265625, -0.44189453125, -0.42431640625, -0.40673828125, -0.38916015625, -0.37158203125, -0.35400390625, -0.33642578125, -0.31884765625, -0.30126953125, -0.28369140625, -0.26611328125, -0.24853515625, -0.23095703125, -0.21337890625, -0.19580078125, -0.17822265625, -0.16064453125, -0.14306640625, -0.12548828125, -0.10791015625, -0.09033203125, -0.07275390625, -0.05517578125, -0.03759765625, -0.02001953125, -0.00244140625, 0.01513671875, 0.03271484375, 0.05029296875, 0.06787109375, 0.08544921875, 0.10302734375, 0.12060546875, 0.13818359375, 0.15576171875, 0.17333984375, 0.19091796875, 0.20849609375, 0.22607421875, 0.24365234375, 0.26123046875, 0.27880859375, 0.29638671875, 0.31396484375, 0.33154296875, 0.34912109375, 0.36669921875, 0.38427734375, 0.40185546875, 0.41943359375, 0.43701171875, 0.45458984375, 0.47216796875, 0.48974609375, 0.50732421875, 0.52490234375, 0.54248046875, 0.56005859375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 7.0, 6.0, 9.0, 7.0, 15.0, 21.0, 26.0, 29.0, 28.0, 25.0, 18.0, 24.0, 36.0, 42.0, 42.0, 60.0, 48.0, 43.0, 43.0, 59.0, 38.0, 36.0, 58.0, 35.0, 36.0, 26.0, 21.0, 32.0, 23.0, 20.0, 21.0, 16.0, 11.0, 11.0, 12.0, 2.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.337158203125, -0.3266334533691406, -0.31610870361328125, -0.3055839538574219, -0.2950592041015625, -0.2845344543457031, -0.27400970458984375, -0.2634849548339844, -0.252960205078125, -0.24243545532226562, -0.23191070556640625, -0.22138595581054688, -0.2108612060546875, -0.20033645629882812, -0.18981170654296875, -0.17928695678710938, -0.16876220703125, -0.15823745727539062, -0.14771270751953125, -0.13718795776367188, -0.1266632080078125, -0.11613845825195312, -0.10561370849609375, -0.09508895874023438, -0.084564208984375, -0.07403945922851562, -0.06351470947265625, -0.052989959716796875, -0.0424652099609375, -0.031940460205078125, -0.02141571044921875, -0.010890960693359375, -0.0003662109375, 0.010158538818359375, 0.02068328857421875, 0.031208038330078125, 0.0417327880859375, 0.052257537841796875, 0.06278228759765625, 0.07330703735351562, 0.083831787109375, 0.09435653686523438, 0.10488128662109375, 0.11540603637695312, 0.1259307861328125, 0.13645553588867188, 0.14698028564453125, 0.15750503540039062, 0.16802978515625, 0.17855453491210938, 0.18907928466796875, 0.19960403442382812, 0.2101287841796875, 0.22065353393554688, 0.23117828369140625, 0.24170303344726562, 0.252227783203125, 0.2627525329589844, 0.27327728271484375, 0.2838020324707031, 0.2943267822265625, 0.3048515319824219, 0.31537628173828125, 0.3259010314941406, 0.33642578125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 6.0, 2.0, 1.0, 4.0, 3.0, 6.0, 13.0, 10.0, 10.0, 16.0, 18.0, 28.0, 49.0, 88.0, 156.0, 286.0, 702.0, 1808.0, 6031.0, 37368.0, 781837.0, 199807.0, 14823.0, 3410.0, 1092.0, 460.0, 217.0, 102.0, 61.0, 41.0, 24.0, 21.0, 22.0, 10.0, 7.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.174072265625, -0.16958332061767578, -0.16509437561035156, -0.16060543060302734, -0.15611648559570312, -0.1516275405883789, -0.1471385955810547, -0.14264965057373047, -0.13816070556640625, -0.13367176055908203, -0.1291828155517578, -0.1246938705444336, -0.12020492553710938, -0.11571598052978516, -0.11122703552246094, -0.10673809051513672, -0.1022491455078125, -0.09776020050048828, -0.09327125549316406, -0.08878231048583984, -0.08429336547851562, -0.0798044204711914, -0.07531547546386719, -0.07082653045654297, -0.06633758544921875, -0.06184864044189453, -0.05735969543457031, -0.052870750427246094, -0.048381805419921875, -0.043892860412597656, -0.03940391540527344, -0.03491497039794922, -0.030426025390625, -0.02593708038330078, -0.021448135375976562, -0.016959190368652344, -0.012470245361328125, -0.007981300354003906, -0.0034923553466796875, 0.0009965896606445312, 0.00548553466796875, 0.009974479675292969, 0.014463424682617188, 0.018952369689941406, 0.023441314697265625, 0.027930259704589844, 0.03241920471191406, 0.03690814971923828, 0.0413970947265625, 0.04588603973388672, 0.05037498474121094, 0.054863929748535156, 0.059352874755859375, 0.0638418197631836, 0.06833076477050781, 0.07281970977783203, 0.07730865478515625, 0.08179759979248047, 0.08628654479980469, 0.0907754898071289, 0.09526443481445312, 0.09975337982177734, 0.10424232482910156, 0.10873126983642578, 0.11322021484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 5.0, 5.0, 11.0, 18.0, 18.0, 27.0, 26.0, 55.0, 76.0, 170.0, 185.0, 145.0, 85.0, 41.0, 32.0, 16.0, 19.0, 15.0, 13.0, 9.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0265579223632812e-05, -1.9599683582782745e-05, -1.8933787941932678e-05, -1.826789230108261e-05, -1.7601996660232544e-05, -1.6936101019382477e-05, -1.627020537853241e-05, -1.5604309737682343e-05, -1.4938414096832275e-05, -1.4272518455982208e-05, -1.3606622815132141e-05, -1.2940727174282074e-05, -1.2274831533432007e-05, -1.160893589258194e-05, -1.0943040251731873e-05, -1.0277144610881805e-05, -9.611248970031738e-06, -8.945353329181671e-06, -8.279457688331604e-06, -7.613562047481537e-06, -6.94766640663147e-06, -6.281770765781403e-06, -5.6158751249313354e-06, -4.949979484081268e-06, -4.284083843231201e-06, -3.618188202381134e-06, -2.952292561531067e-06, -2.2863969206809998e-06, -1.6205012798309326e-06, -9.546056389808655e-07, -2.8870999813079834e-07, 3.771856427192688e-07, 1.043081283569336e-06, 1.708976924419403e-06, 2.3748725652694702e-06, 3.0407682061195374e-06, 3.7066638469696045e-06, 4.372559487819672e-06, 5.038455128669739e-06, 5.704350769519806e-06, 6.370246410369873e-06, 7.03614205121994e-06, 7.702037692070007e-06, 8.367933332920074e-06, 9.033828973770142e-06, 9.699724614620209e-06, 1.0365620255470276e-05, 1.1031515896320343e-05, 1.169741153717041e-05, 1.2363307178020477e-05, 1.3029202818870544e-05, 1.3695098459720612e-05, 1.4360994100570679e-05, 1.5026889741420746e-05, 1.5692785382270813e-05, 1.635868102312088e-05, 1.7024576663970947e-05, 1.7690472304821014e-05, 1.835636794567108e-05, 1.902226358652115e-05, 1.9688159227371216e-05, 2.0354054868221283e-05, 2.101995050907135e-05, 2.1685846149921417e-05, 2.2351741790771484e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 14.0, 20.0, 34.0, 51.0, 138.0, 390.0, 2260.0, 78859.0, 958303.0, 7222.0, 869.0, 207.0, 86.0, 38.0, 22.0, 8.0, 8.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.390380859375, -0.3782691955566406, -0.36615753173828125, -0.3540458679199219, -0.3419342041015625, -0.3298225402832031, -0.31771087646484375, -0.3055992126464844, -0.293487548828125, -0.2813758850097656, -0.26926422119140625, -0.2571525573730469, -0.2450408935546875, -0.23292922973632812, -0.22081756591796875, -0.20870590209960938, -0.19659423828125, -0.18448257446289062, -0.17237091064453125, -0.16025924682617188, -0.1481475830078125, -0.13603591918945312, -0.12392425537109375, -0.11181259155273438, -0.099700927734375, -0.08758926391601562, -0.07547760009765625, -0.06336593627929688, -0.0512542724609375, -0.039142608642578125, -0.02703094482421875, -0.014919281005859375, -0.0028076171875, 0.009304046630859375, 0.02141571044921875, 0.033527374267578125, 0.0456390380859375, 0.057750701904296875, 0.06986236572265625, 0.08197402954101562, 0.094085693359375, 0.10619735717773438, 0.11830902099609375, 0.13042068481445312, 0.1425323486328125, 0.15464401245117188, 0.16675567626953125, 0.17886734008789062, 0.19097900390625, 0.20309066772460938, 0.21520233154296875, 0.22731399536132812, 0.2394256591796875, 0.2515373229980469, 0.26364898681640625, 0.2757606506347656, 0.287872314453125, 0.2999839782714844, 0.31209564208984375, 0.3242073059082031, 0.3363189697265625, 0.3484306335449219, 0.36054229736328125, 0.3726539611816406, 0.384765625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 15.0, 31.0, 50.0, 73.0, 180.0, 244.0, 197.0, 97.0, 46.0, 26.0, 12.0, 10.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2196044921875, -0.213043212890625, -0.20648193359375, -0.199920654296875, -0.193359375, -0.186798095703125, -0.18023681640625, -0.173675537109375, -0.1671142578125, -0.160552978515625, -0.15399169921875, -0.147430419921875, -0.140869140625, -0.134307861328125, -0.12774658203125, -0.121185302734375, -0.1146240234375, -0.108062744140625, -0.10150146484375, -0.094940185546875, -0.08837890625, -0.081817626953125, -0.07525634765625, -0.068695068359375, -0.0621337890625, -0.055572509765625, -0.04901123046875, -0.042449951171875, -0.035888671875, -0.029327392578125, -0.02276611328125, -0.016204833984375, -0.0096435546875, -0.003082275390625, 0.00347900390625, 0.010040283203125, 0.0166015625, 0.023162841796875, 0.02972412109375, 0.036285400390625, 0.0428466796875, 0.049407958984375, 0.05596923828125, 0.062530517578125, 0.069091796875, 0.075653076171875, 0.08221435546875, 0.088775634765625, 0.0953369140625, 0.101898193359375, 0.10845947265625, 0.115020751953125, 0.12158203125, 0.128143310546875, 0.13470458984375, 0.141265869140625, 0.1478271484375, 0.154388427734375, 0.16094970703125, 0.167510986328125, 0.174072265625, 0.180633544921875, 0.18719482421875, 0.193756103515625, 0.2003173828125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 11.0, 257.0, 718.0, 24.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2328357696533203, -2.0331013202667236, -1.833366870880127, -1.6336325407028198, -1.4338980913162231, -1.2341636419296265, -1.0344293117523193, -0.8346948623657227, -0.634960412979126, -0.4352259933948517, -0.2354915738105774, -0.03575718402862549, 0.1639772653579712, 0.36371171474456787, 0.563446044921875, 0.7631804943084717, 0.9629149436950684, 1.162649393081665, 1.3623838424682617, 1.5621181726455688, 1.7618526220321655, 1.9615870714187622, 2.1613214015960693, 2.361055850982666, 2.5607903003692627, 2.7605247497558594, 2.960259199142456, 3.1599936485290527, 3.3597278594970703, 3.559462547302246, 3.7591967582702637, 3.9589312076568604, 4.158665657043457, 4.358399868011475, 4.55813455581665, 4.757868766784668, 4.957603454589844, 5.157337665557861, 5.357071876525879, 5.556806564331055, 5.7565412521362305, 5.956275463104248, 6.156010150909424, 6.355744361877441, 6.555479049682617, 6.755213260650635, 6.954947471618652, 7.154682159423828, 7.354416370391846, 7.554150581359863, 7.753885269165039, 7.953619480133057, 8.153353691101074, 8.35308837890625, 8.552823066711426, 8.752557754516602, 8.952291488647461, 9.152026176452637, 9.351759910583496, 9.551494598388672, 9.751229286193848, 9.950963973999023, 10.150697708129883, 10.350432395935059, 10.550167083740234]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 0.0, 12.0, 11.0, 16.0, 15.0, 16.0, 28.0, 25.0, 32.0, 41.0, 28.0, 50.0, 47.0, 43.0, 44.0, 53.0, 52.0, 59.0, 53.0, 55.0, 49.0, 58.0, 35.0, 34.0, 29.0, 25.0, 20.0, 15.0, 13.0, 7.0, 12.0, 8.0, 6.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0935630798339844, -2.021535873413086, -1.949508547782898, -1.8774813413619995, -1.8054540157318115, -1.733426809310913, -1.6613996028900146, -1.5893723964691162, -1.5173450708389282, -1.4453178644180298, -1.3732905387878418, -1.3012633323669434, -1.229236125946045, -1.157208800315857, -1.0851815938949585, -1.0131542682647705, -0.9411270618438721, -0.8690997958183289, -0.7970725297927856, -0.7250453233718872, -0.653018057346344, -0.5809907913208008, -0.5089635848999023, -0.43693631887435913, -0.3649090528488159, -0.2928817868232727, -0.22085455060005188, -0.14882729947566986, -0.07680004835128784, -0.004772782325744629, 0.0672544538974762, 0.13928169012069702, 0.21130895614624023, 0.28333622217178345, 0.3553634583950043, 0.4273906946182251, 0.4994179606437683, 0.5714452266693115, 0.64347243309021, 0.7154996991157532, 0.7875269651412964, 0.8595542311668396, 0.9315814971923828, 1.0036087036132812, 1.0756359100341797, 1.1476632356643677, 1.2196904420852661, 1.291717767715454, 1.3637449741363525, 1.435772180557251, 1.507799506187439, 1.5798267126083374, 1.6518540382385254, 1.7238812446594238, 1.7959084510803223, 1.8679356575012207, 1.9399629831314087, 2.0119903087615967, 2.084017515182495, 2.1560447216033936, 2.228071928024292, 2.3000993728637695, 2.372126579284668, 2.4441537857055664, 2.516180992126465]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 6.0, 7.0, 9.0, 11.0, 24.0, 30.0, 61.0, 89.0, 169.0, 341.0, 895.0, 3733.0, 359098.0, 3823270.0, 4652.0, 1026.0, 410.0, 187.0, 110.0, 60.0, 35.0, 23.0, 13.0, 3.0, 4.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5791015625, -0.553985595703125, -0.52886962890625, -0.503753662109375, -0.4786376953125, -0.453521728515625, -0.42840576171875, -0.403289794921875, -0.378173828125, -0.353057861328125, -0.32794189453125, -0.302825927734375, -0.2777099609375, -0.252593994140625, -0.22747802734375, -0.202362060546875, -0.17724609375, -0.152130126953125, -0.12701416015625, -0.101898193359375, -0.0767822265625, -0.051666259765625, -0.02655029296875, -0.001434326171875, 0.023681640625, 0.048797607421875, 0.07391357421875, 0.099029541015625, 0.1241455078125, 0.149261474609375, 0.17437744140625, 0.199493408203125, 0.224609375, 0.249725341796875, 0.27484130859375, 0.299957275390625, 0.3250732421875, 0.350189208984375, 0.37530517578125, 0.400421142578125, 0.425537109375, 0.450653076171875, 0.47576904296875, 0.500885009765625, 0.5260009765625, 0.551116943359375, 0.57623291015625, 0.601348876953125, 0.62646484375, 0.651580810546875, 0.67669677734375, 0.701812744140625, 0.7269287109375, 0.752044677734375, 0.77716064453125, 0.802276611328125, 0.827392578125, 0.852508544921875, 0.87762451171875, 0.902740478515625, 0.9278564453125, 0.952972412109375, 0.97808837890625, 1.003204345703125, 1.0283203125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 2.0, 5.0, 11.0, 8.0, 17.0, 10.0, 25.0, 67.0, 172.0, 298.0, 227.0, 68.0, 27.0, 15.0, 6.0, 10.0, 10.0, 7.0, 4.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1331787109375, -0.12815475463867188, -0.12313079833984375, -0.11810684204101562, -0.1130828857421875, -0.10805892944335938, -0.10303497314453125, -0.09801101684570312, -0.092987060546875, -0.08796310424804688, -0.08293914794921875, -0.07791519165039062, -0.0728912353515625, -0.06786727905273438, -0.06284332275390625, -0.057819366455078125, -0.05279541015625, -0.047771453857421875, -0.04274749755859375, -0.037723541259765625, -0.0326995849609375, -0.027675628662109375, -0.02265167236328125, -0.017627716064453125, -0.012603759765625, -0.007579803466796875, -0.00255584716796875, 0.002468109130859375, 0.0074920654296875, 0.012516021728515625, 0.01753997802734375, 0.022563934326171875, 0.027587890625, 0.032611846923828125, 0.03763580322265625, 0.042659759521484375, 0.0476837158203125, 0.052707672119140625, 0.05773162841796875, 0.06275558471679688, 0.067779541015625, 0.07280349731445312, 0.07782745361328125, 0.08285140991210938, 0.0878753662109375, 0.09289932250976562, 0.09792327880859375, 0.10294723510742188, 0.10797119140625, 0.11299514770507812, 0.11801910400390625, 0.12304306030273438, 0.1280670166015625, 0.13309097290039062, 0.13811492919921875, 0.14313888549804688, 0.148162841796875, 0.15318679809570312, 0.15821075439453125, 0.16323471069335938, 0.1682586669921875, 0.17328262329101562, 0.17830657958984375, 0.18333053588867188, 0.1883544921875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 12.0, 3.0, 5.0, 7.0, 5.0, 14.0, 24.0, 27.0, 27.0, 62.0, 156.0, 417.0, 1742.0, 17594.0, 4104652.0, 66106.0, 2582.0, 422.0, 189.0, 73.0, 41.0, 32.0, 21.0, 16.0, 10.0, 15.0, 8.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7158203125, -0.6968154907226562, -0.6778106689453125, -0.6588058471679688, -0.639801025390625, -0.6207962036132812, -0.6017913818359375, -0.5827865600585938, -0.56378173828125, -0.5447769165039062, -0.5257720947265625, -0.5067672729492188, -0.487762451171875, -0.46875762939453125, -0.4497528076171875, -0.43074798583984375, -0.4117431640625, -0.39273834228515625, -0.3737335205078125, -0.35472869873046875, -0.335723876953125, -0.31671905517578125, -0.2977142333984375, -0.27870941162109375, -0.25970458984375, -0.24069976806640625, -0.2216949462890625, -0.20269012451171875, -0.183685302734375, -0.16468048095703125, -0.1456756591796875, -0.12667083740234375, -0.107666015625, -0.08866119384765625, -0.0696563720703125, -0.05065155029296875, -0.031646728515625, -0.01264190673828125, 0.0063629150390625, 0.02536773681640625, 0.04437255859375, 0.06337738037109375, 0.0823822021484375, 0.10138702392578125, 0.120391845703125, 0.13939666748046875, 0.1584014892578125, 0.17740631103515625, 0.1964111328125, 0.21541595458984375, 0.2344207763671875, 0.25342559814453125, 0.272430419921875, 0.29143524169921875, 0.3104400634765625, 0.32944488525390625, 0.34844970703125, 0.36745452880859375, 0.3864593505859375, 0.40546417236328125, 0.424468994140625, 0.44347381591796875, 0.4624786376953125, 0.48148345947265625, 0.50048828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 3.0, 2.0, 8.0, 13.0, 10.0, 21.0, 42.0, 85.0, 482.0, 2703.0, 493.0, 112.0, 24.0, 14.0, 12.0, 11.0, 4.0, 6.0, 2.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1695556640625, -0.16526126861572266, -0.1609668731689453, -0.15667247772216797, -0.15237808227539062, -0.14808368682861328, -0.14378929138183594, -0.1394948959350586, -0.13520050048828125, -0.1309061050415039, -0.12661170959472656, -0.12231731414794922, -0.11802291870117188, -0.11372852325439453, -0.10943412780761719, -0.10513973236083984, -0.1008453369140625, -0.09655094146728516, -0.09225654602050781, -0.08796215057373047, -0.08366775512695312, -0.07937335968017578, -0.07507896423339844, -0.0707845687866211, -0.06649017333984375, -0.062195777893066406, -0.05790138244628906, -0.05360698699951172, -0.049312591552734375, -0.04501819610595703, -0.04072380065917969, -0.036429405212402344, -0.032135009765625, -0.027840614318847656, -0.023546218872070312, -0.01925182342529297, -0.014957427978515625, -0.010663032531738281, -0.0063686370849609375, -0.0020742416381835938, 0.00222015380859375, 0.006514549255371094, 0.010808944702148438, 0.015103340148925781, 0.019397735595703125, 0.02369213104248047, 0.027986526489257812, 0.032280921936035156, 0.0365753173828125, 0.040869712829589844, 0.04516410827636719, 0.04945850372314453, 0.053752899169921875, 0.05804729461669922, 0.06234169006347656, 0.0666360855102539, 0.07093048095703125, 0.0752248764038086, 0.07951927185058594, 0.08381366729736328, 0.08810806274414062, 0.09240245819091797, 0.09669685363769531, 0.10099124908447266, 0.10528564453125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 14.0, 723.0, 273.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5706811547279358, -0.4876716136932373, -0.4046620726585388, -0.32165253162384033, -0.23864299058914185, -0.15563344955444336, -0.07262390851974487, 0.010385632514953613, 0.0933951735496521, 0.17640471458435059, 0.2594142556190491, 0.34242379665374756, 0.42543333768844604, 0.5084428787231445, 0.591452419757843, 0.6744619607925415, 0.75747150182724, 0.8404810428619385, 0.923490583896637, 1.0065001249313354, 1.0895097255706787, 1.1725192070007324, 1.2555286884307861, 1.3385382890701294, 1.4215478897094727, 1.5045573711395264, 1.5875669717788696, 1.670576572418213, 1.7535860538482666, 1.8365955352783203, 1.9196051359176636, 2.002614736557007, 2.0856242179870605, 2.1686336994171143, 2.251643180847168, 2.334652900695801, 2.4176623821258545, 2.500671863555908, 2.583681583404541, 2.6666910648345947, 2.7497005462646484, 2.832710027694702, 2.915719509124756, 2.9987292289733887, 3.0817387104034424, 3.164748191833496, 3.247757911682129, 3.3307673931121826, 3.4137768745422363, 3.49678635597229, 3.5797958374023438, 3.6628055572509766, 3.7458150386810303, 3.828824520111084, 3.911834239959717, 3.9948437213897705, 4.077853202819824, 4.160862922668457, 4.243872165679932, 4.3268818855285645, 4.409891128540039, 4.492900848388672, 4.575910568237305, 4.658919811248779, 4.741929531097412]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 2.0, 3.0, 5.0, 6.0, 14.0, 12.0, 16.0, 26.0, 20.0, 34.0, 37.0, 41.0, 53.0, 58.0, 56.0, 56.0, 63.0, 54.0, 68.0, 60.0, 40.0, 55.0, 39.0, 42.0, 28.0, 28.0, 17.0, 22.0, 13.0, 10.0, 9.0, 5.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4249011278152466, -0.4135485589504242, -0.4021959602832794, -0.39084339141845703, -0.37949079275131226, -0.36813822388648987, -0.3567856550216675, -0.3454330563545227, -0.3340804874897003, -0.32272791862487793, -0.31137531995773315, -0.30002275109291077, -0.2886701822280884, -0.2773175835609436, -0.2659650146961212, -0.25461244583129883, -0.24325984716415405, -0.23190726339817047, -0.2205546796321869, -0.2092021107673645, -0.19784952700138092, -0.18649694323539734, -0.17514437437057495, -0.16379179060459137, -0.1524392068386078, -0.1410866230726242, -0.12973403930664062, -0.11838147044181824, -0.10702888667583466, -0.09567630290985107, -0.08432372659444809, -0.0729711502790451, -0.06161856651306152, -0.05026598647236824, -0.03891340643167496, -0.027560826390981674, -0.01620824635028839, -0.004855666309595108, 0.006496913731098175, 0.01784949004650116, 0.02920207381248474, 0.040554653853178024, 0.05190723389387131, 0.06325981020927429, 0.07461239397525787, 0.08596497774124146, 0.09731755405664444, 0.10867013037204742, 0.120022714138031, 0.1313752979040146, 0.14272788166999817, 0.15408045053482056, 0.16543303430080414, 0.17678561806678772, 0.1881381869316101, 0.1994907706975937, 0.21084335446357727, 0.22219593822956085, 0.23354852199554443, 0.24490109086036682, 0.2562536597251892, 0.267606258392334, 0.27895882725715637, 0.29031139612197876, 0.30166399478912354]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 8.0, 17.0, 18.0, 28.0, 38.0, 58.0, 96.0, 140.0, 210.0, 387.0, 714.0, 1433.0, 3057.0, 7167.0, 23034.0, 238978.0, 706289.0, 47269.0, 11282.0, 4136.0, 1962.0, 904.0, 512.0, 301.0, 177.0, 99.0, 77.0, 47.0, 26.0, 27.0, 13.0, 14.0, 6.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.25244140625, -0.24460411071777344, -0.23676681518554688, -0.2289295196533203, -0.22109222412109375, -0.2132549285888672, -0.20541763305664062, -0.19758033752441406, -0.1897430419921875, -0.18190574645996094, -0.17406845092773438, -0.1662311553955078, -0.15839385986328125, -0.1505565643310547, -0.14271926879882812, -0.13488197326660156, -0.127044677734375, -0.11920738220214844, -0.11137008666992188, -0.10353279113769531, -0.09569549560546875, -0.08785820007324219, -0.08002090454101562, -0.07218360900878906, -0.0643463134765625, -0.05650901794433594, -0.048671722412109375, -0.04083442687988281, -0.03299713134765625, -0.025159835815429688, -0.017322540283203125, -0.009485244750976562, -0.00164794921875, 0.0061893463134765625, 0.014026641845703125, 0.021863937377929688, 0.02970123291015625, 0.03753852844238281, 0.045375823974609375, 0.05321311950683594, 0.0610504150390625, 0.06888771057128906, 0.07672500610351562, 0.08456230163574219, 0.09239959716796875, 0.10023689270019531, 0.10807418823242188, 0.11591148376464844, 0.123748779296875, 0.13158607482910156, 0.13942337036132812, 0.1472606658935547, 0.15509796142578125, 0.1629352569580078, 0.17077255249023438, 0.17860984802246094, 0.1864471435546875, 0.19428443908691406, 0.20212173461914062, 0.2099590301513672, 0.21779632568359375, 0.2256336212158203, 0.23347091674804688, 0.24130821228027344, 0.2491455078125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 1.0, 5.0, 10.0, 7.0, 21.0, 6.0, 22.0, 56.0, 160.0, 295.0, 245.0, 77.0, 31.0, 12.0, 7.0, 12.0, 10.0, 5.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.128662109375, -0.12383079528808594, -0.11899948120117188, -0.11416816711425781, -0.10933685302734375, -0.10450553894042969, -0.09967422485351562, -0.09484291076660156, -0.0900115966796875, -0.08518028259277344, -0.08034896850585938, -0.07551765441894531, -0.07068634033203125, -0.06585502624511719, -0.061023712158203125, -0.05619239807128906, -0.051361083984375, -0.04652976989746094, -0.041698455810546875, -0.03686714172363281, -0.03203582763671875, -0.027204513549804688, -0.022373199462890625, -0.017541885375976562, -0.0127105712890625, -0.007879257202148438, -0.003047943115234375, 0.0017833709716796875, 0.00661468505859375, 0.011445999145507812, 0.016277313232421875, 0.021108627319335938, 0.02593994140625, 0.030771255493164062, 0.035602569580078125, 0.04043388366699219, 0.04526519775390625, 0.05009651184082031, 0.054927825927734375, 0.05975914001464844, 0.0645904541015625, 0.06942176818847656, 0.07425308227539062, 0.07908439636230469, 0.08391571044921875, 0.08874702453613281, 0.09357833862304688, 0.09840965270996094, 0.103240966796875, 0.10807228088378906, 0.11290359497070312, 0.11773490905761719, 0.12256622314453125, 0.1273975372314453, 0.13222885131835938, 0.13706016540527344, 0.1418914794921875, 0.14672279357910156, 0.15155410766601562, 0.1563854217529297, 0.16121673583984375, 0.1660480499267578, 0.17087936401367188, 0.17571067810058594, 0.1805419921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 14.0, 32.0, 25.0, 32.0, 28.0, 65.0, 71.0, 89.0, 103.0, 127.0, 199.0, 225.0, 424.0, 890.0, 3219.0, 37967.0, 890569.0, 106641.0, 4976.0, 1249.0, 492.0, 267.0, 184.0, 145.0, 110.0, 103.0, 78.0, 47.0, 45.0, 45.0, 29.0, 21.0, 9.0, 11.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38232421875, -0.369842529296875, -0.35736083984375, -0.344879150390625, -0.3323974609375, -0.319915771484375, -0.30743408203125, -0.294952392578125, -0.282470703125, -0.269989013671875, -0.25750732421875, -0.245025634765625, -0.2325439453125, -0.220062255859375, -0.20758056640625, -0.195098876953125, -0.1826171875, -0.170135498046875, -0.15765380859375, -0.145172119140625, -0.1326904296875, -0.120208740234375, -0.10772705078125, -0.095245361328125, -0.082763671875, -0.070281982421875, -0.05780029296875, -0.045318603515625, -0.0328369140625, -0.020355224609375, -0.00787353515625, 0.004608154296875, 0.01708984375, 0.029571533203125, 0.04205322265625, 0.054534912109375, 0.0670166015625, 0.079498291015625, 0.09197998046875, 0.104461669921875, 0.116943359375, 0.129425048828125, 0.14190673828125, 0.154388427734375, 0.1668701171875, 0.179351806640625, 0.19183349609375, 0.204315185546875, 0.216796875, 0.229278564453125, 0.24176025390625, 0.254241943359375, 0.2667236328125, 0.279205322265625, 0.29168701171875, 0.304168701171875, 0.316650390625, 0.329132080078125, 0.34161376953125, 0.354095458984375, 0.3665771484375, 0.379058837890625, 0.39154052734375, 0.404022216796875, 0.41650390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 9.0, 9.0, 4.0, 9.0, 9.0, 12.0, 11.0, 18.0, 10.0, 18.0, 16.0, 22.0, 27.0, 29.0, 32.0, 30.0, 24.0, 36.0, 46.0, 38.0, 36.0, 23.0, 37.0, 20.0, 42.0, 50.0, 28.0, 37.0, 27.0, 29.0, 35.0, 27.0, 18.0, 22.0, 23.0, 18.0, 14.0, 24.0, 9.0, 10.0, 9.0, 10.0, 8.0, 10.0, 9.0, 5.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.2235107421875, -0.21585655212402344, -0.20820236206054688, -0.2005481719970703, -0.19289398193359375, -0.1852397918701172, -0.17758560180664062, -0.16993141174316406, -0.1622772216796875, -0.15462303161621094, -0.14696884155273438, -0.1393146514892578, -0.13166046142578125, -0.12400627136230469, -0.11635208129882812, -0.10869789123535156, -0.101043701171875, -0.09338951110839844, -0.08573532104492188, -0.07808113098144531, -0.07042694091796875, -0.06277275085449219, -0.055118560791015625, -0.04746437072753906, -0.0398101806640625, -0.03215599060058594, -0.024501800537109375, -0.016847610473632812, -0.00919342041015625, -0.0015392303466796875, 0.006114959716796875, 0.013769149780273438, 0.02142333984375, 0.029077529907226562, 0.036731719970703125, 0.04438591003417969, 0.05204010009765625, 0.05969429016113281, 0.06734848022460938, 0.07500267028808594, 0.0826568603515625, 0.09031105041503906, 0.09796524047851562, 0.10561943054199219, 0.11327362060546875, 0.12092781066894531, 0.12858200073242188, 0.13623619079589844, 0.143890380859375, 0.15154457092285156, 0.15919876098632812, 0.1668529510498047, 0.17450714111328125, 0.1821613311767578, 0.18981552124023438, 0.19746971130371094, 0.2051239013671875, 0.21277809143066406, 0.22043228149414062, 0.2280864715576172, 0.23574066162109375, 0.2433948516845703, 0.2510490417480469, 0.25870323181152344, 0.266357421875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 8.0, 11.0, 14.0, 22.0, 46.0, 54.0, 82.0, 152.0, 298.0, 629.0, 1537.0, 4294.0, 16043.0, 152088.0, 792943.0, 64713.0, 10294.0, 3104.0, 1097.0, 497.0, 247.0, 153.0, 85.0, 45.0, 34.0, 14.0, 18.0, 8.0, 6.0, 5.0, 4.0, 5.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0777587890625, -0.07510948181152344, -0.07246017456054688, -0.06981086730957031, -0.06716156005859375, -0.06451225280761719, -0.061862945556640625, -0.05921363830566406, -0.0565643310546875, -0.05391502380371094, -0.051265716552734375, -0.04861640930175781, -0.04596710205078125, -0.04331779479980469, -0.040668487548828125, -0.03801918029785156, -0.035369873046875, -0.03272056579589844, -0.030071258544921875, -0.027421951293945312, -0.02477264404296875, -0.022123336791992188, -0.019474029541015625, -0.016824722290039062, -0.0141754150390625, -0.011526107788085938, -0.008876800537109375, -0.0062274932861328125, -0.00357818603515625, -0.0009288787841796875, 0.001720428466796875, 0.0043697357177734375, 0.00701904296875, 0.009668350219726562, 0.012317657470703125, 0.014966964721679688, 0.01761627197265625, 0.020265579223632812, 0.022914886474609375, 0.025564193725585938, 0.0282135009765625, 0.030862808227539062, 0.033512115478515625, 0.03616142272949219, 0.03881072998046875, 0.04146003723144531, 0.044109344482421875, 0.04675865173339844, 0.049407958984375, 0.05205726623535156, 0.054706573486328125, 0.05735588073730469, 0.06000518798828125, 0.06265449523925781, 0.06530380249023438, 0.06795310974121094, 0.0706024169921875, 0.07325172424316406, 0.07590103149414062, 0.07855033874511719, 0.08119964599609375, 0.08384895324707031, 0.08649826049804688, 0.08914756774902344, 0.091796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 11.0, 9.0, 15.0, 26.0, 23.0, 50.0, 72.0, 80.0, 116.0, 107.0, 122.0, 88.0, 81.0, 48.0, 25.0, 30.0, 23.0, 13.0, 5.0, 11.0, 4.0, 9.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.953975677490234e-06, -9.547919034957886e-06, -9.141862392425537e-06, -8.735805749893188e-06, -8.32974910736084e-06, -7.923692464828491e-06, -7.517635822296143e-06, -7.111579179763794e-06, -6.705522537231445e-06, -6.299465894699097e-06, -5.893409252166748e-06, -5.487352609634399e-06, -5.081295967102051e-06, -4.675239324569702e-06, -4.2691826820373535e-06, -3.863126039505005e-06, -3.4570693969726562e-06, -3.0510127544403076e-06, -2.644956111907959e-06, -2.2388994693756104e-06, -1.8328428268432617e-06, -1.426786184310913e-06, -1.0207295417785645e-06, -6.146728992462158e-07, -2.086162567138672e-07, 1.9744038581848145e-07, 6.034970283508301e-07, 1.0095536708831787e-06, 1.4156103134155273e-06, 1.821666955947876e-06, 2.2277235984802246e-06, 2.6337802410125732e-06, 3.039836883544922e-06, 3.4458935260772705e-06, 3.851950168609619e-06, 4.258006811141968e-06, 4.664063453674316e-06, 5.070120096206665e-06, 5.476176738739014e-06, 5.882233381271362e-06, 6.288290023803711e-06, 6.6943466663360596e-06, 7.100403308868408e-06, 7.506459951400757e-06, 7.912516593933105e-06, 8.318573236465454e-06, 8.724629878997803e-06, 9.130686521530151e-06, 9.5367431640625e-06, 9.942799806594849e-06, 1.0348856449127197e-05, 1.0754913091659546e-05, 1.1160969734191895e-05, 1.1567026376724243e-05, 1.1973083019256592e-05, 1.237913966178894e-05, 1.2785196304321289e-05, 1.3191252946853638e-05, 1.3597309589385986e-05, 1.4003366231918335e-05, 1.4409422874450684e-05, 1.4815479516983032e-05, 1.5221536159515381e-05, 1.562759280204773e-05, 1.6033649444580078e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 8.0, 11.0, 11.0, 21.0, 22.0, 22.0, 54.0, 79.0, 129.0, 206.0, 348.0, 699.0, 1510.0, 4514.0, 18324.0, 172801.0, 764736.0, 68580.0, 10916.0, 3134.0, 1101.0, 534.0, 290.0, 166.0, 119.0, 64.0, 50.0, 33.0, 15.0, 12.0, 12.0, 11.0, 4.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08599853515625, -0.08316326141357422, -0.08032798767089844, -0.07749271392822266, -0.07465744018554688, -0.0718221664428711, -0.06898689270019531, -0.06615161895751953, -0.06331634521484375, -0.06048107147216797, -0.05764579772949219, -0.054810523986816406, -0.051975250244140625, -0.049139976501464844, -0.04630470275878906, -0.04346942901611328, -0.0406341552734375, -0.03779888153076172, -0.03496360778808594, -0.032128334045410156, -0.029293060302734375, -0.026457786560058594, -0.023622512817382812, -0.02078723907470703, -0.01795196533203125, -0.015116691589355469, -0.012281417846679688, -0.009446144104003906, -0.006610870361328125, -0.0037755966186523438, -0.0009403228759765625, 0.0018949508666992188, 0.004730224609375, 0.007565498352050781, 0.010400772094726562, 0.013236045837402344, 0.016071319580078125, 0.018906593322753906, 0.021741867065429688, 0.02457714080810547, 0.02741241455078125, 0.03024768829345703, 0.03308296203613281, 0.035918235778808594, 0.038753509521484375, 0.041588783264160156, 0.04442405700683594, 0.04725933074951172, 0.0500946044921875, 0.05292987823486328, 0.05576515197753906, 0.058600425720214844, 0.061435699462890625, 0.0642709732055664, 0.06710624694824219, 0.06994152069091797, 0.07277679443359375, 0.07561206817626953, 0.07844734191894531, 0.0812826156616211, 0.08411788940429688, 0.08695316314697266, 0.08978843688964844, 0.09262371063232422, 0.095458984375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 11.0, 16.0, 19.0, 23.0, 27.0, 37.0, 57.0, 74.0, 107.0, 113.0, 131.0, 103.0, 79.0, 61.0, 39.0, 20.0, 16.0, 10.0, 11.0, 11.0, 5.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09417724609375, -0.09139823913574219, -0.08861923217773438, -0.08584022521972656, -0.08306121826171875, -0.08028221130371094, -0.07750320434570312, -0.07472419738769531, -0.0719451904296875, -0.06916618347167969, -0.06638717651367188, -0.06360816955566406, -0.06082916259765625, -0.05805015563964844, -0.055271148681640625, -0.05249214172363281, -0.049713134765625, -0.04693412780761719, -0.044155120849609375, -0.04137611389160156, -0.03859710693359375, -0.03581809997558594, -0.033039093017578125, -0.030260086059570312, -0.0274810791015625, -0.024702072143554688, -0.021923065185546875, -0.019144058227539062, -0.01636505126953125, -0.013586044311523438, -0.010807037353515625, -0.008028030395507812, -0.0052490234375, -0.0024700164794921875, 0.000308990478515625, 0.0030879974365234375, 0.00586700439453125, 0.008646011352539062, 0.011425018310546875, 0.014204025268554688, 0.0169830322265625, 0.019762039184570312, 0.022541046142578125, 0.025320053100585938, 0.02809906005859375, 0.030878067016601562, 0.033657073974609375, 0.03643608093261719, 0.039215087890625, 0.04199409484863281, 0.044773101806640625, 0.04755210876464844, 0.05033111572265625, 0.05311012268066406, 0.055889129638671875, 0.05866813659667969, 0.0614471435546875, 0.06422615051269531, 0.06700515747070312, 0.06978416442871094, 0.07256317138671875, 0.07534217834472656, 0.07812118530273438, 0.08090019226074219, 0.08367919921875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 17.0, 865.0, 124.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.909315586090088, -2.6805007457733154, -2.451686143875122, -2.2228713035583496, -1.9940565824508667, -1.7652418613433838, -1.5364270210266113, -1.3076122999191284, -1.0787975788116455, -0.8499828577041626, -0.6211680769920349, -0.3923532962799072, -0.16353857517242432, 0.0652761459350586, 0.29409098625183105, 0.522905707359314, 0.7517204284667969, 0.9805351495742798, 1.2093498706817627, 1.4381647109985352, 1.666979432106018, 1.895794153213501, 2.1246089935302734, 2.353423595428467, 2.5822384357452393, 2.8110532760620117, 3.039867877960205, 3.2686827182769775, 3.49749755859375, 3.7263121604919434, 3.955127000808716, 4.183941841125488, 4.41275691986084, 4.641571521759033, 4.870386600494385, 5.099201202392578, 5.3280158042907715, 5.556830406188965, 5.785645484924316, 6.01446008682251, 6.243274688720703, 6.4720892906188965, 6.700904369354248, 6.929718971252441, 7.158533573150635, 7.387348175048828, 7.61616325378418, 7.844977855682373, 8.073793411254883, 8.302608489990234, 8.53142261505127, 8.760237693786621, 8.989052772521973, 9.217866897583008, 9.44668197631836, 9.675497055053711, 9.904311180114746, 10.133126258850098, 10.361940383911133, 10.590755462646484, 10.819570541381836, 11.048384666442871, 11.277199745178223, 11.506014823913574, 11.73482894897461]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 7.0, 6.0, 5.0, 9.0, 17.0, 13.0, 12.0, 14.0, 22.0, 23.0, 31.0, 31.0, 22.0, 27.0, 40.0, 44.0, 37.0, 46.0, 42.0, 37.0, 47.0, 55.0, 38.0, 40.0, 40.0, 39.0, 34.0, 27.0, 37.0, 22.0, 28.0, 10.0, 13.0, 15.0, 11.0, 13.0, 7.0, 11.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.6813184022903442, -1.628021240234375, -1.5747239589691162, -1.521426796913147, -1.4681295156478882, -1.414832353591919, -1.3615350723266602, -1.308237910270691, -1.2549407482147217, -1.2016435861587524, -1.1483463048934937, -1.0950491428375244, -1.0417518615722656, -0.9884546995162964, -0.9351574778556824, -0.8818602561950684, -0.8285629749298096, -0.7752657532691956, -0.7219685316085815, -0.6686713695526123, -0.6153740882873535, -0.5620769262313843, -0.5087797045707703, -0.45548248291015625, -0.40218526124954224, -0.3488880395889282, -0.2955908179283142, -0.24229362607002258, -0.18899640440940857, -0.13569918274879456, -0.08240199089050293, -0.029104769229888916, 0.02419257164001465, 0.07748978585004807, 0.13078700006008148, 0.1840842068195343, 0.23738142848014832, 0.29067865014076233, 0.34397584199905396, 0.39727306365966797, 0.450570285320282, 0.503867506980896, 0.55716472864151, 0.610461950302124, 0.6637591123580933, 0.717056393623352, 0.7703535556793213, 0.8236507773399353, 0.8769479990005493, 0.9302452206611633, 0.9835424423217773, 1.0368396043777466, 1.0901368856430054, 1.1434340476989746, 1.1967313289642334, 1.2500284910202026, 1.3033256530761719, 1.3566228151321411, 1.4099200963974, 1.4632172584533691, 1.516514539718628, 1.5698117017745972, 1.6231088638305664, 1.6764061450958252, 1.729703426361084]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 9.0, 6.0, 10.0, 12.0, 23.0, 24.0, 45.0, 65.0, 126.0, 196.0, 607.0, 6010.0, 4161903.0, 23406.0, 1089.0, 363.0, 146.0, 98.0, 44.0, 34.0, 20.0, 12.0, 10.0, 4.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53662109375, -0.5185165405273438, -0.5004119873046875, -0.48230743408203125, -0.464202880859375, -0.44609832763671875, -0.4279937744140625, -0.40988922119140625, -0.39178466796875, -0.37368011474609375, -0.3555755615234375, -0.33747100830078125, -0.319366455078125, -0.30126190185546875, -0.2831573486328125, -0.26505279541015625, -0.2469482421875, -0.22884368896484375, -0.2107391357421875, -0.19263458251953125, -0.174530029296875, -0.15642547607421875, -0.1383209228515625, -0.12021636962890625, -0.10211181640625, -0.08400726318359375, -0.0659027099609375, -0.04779815673828125, -0.029693603515625, -0.01158905029296875, 0.0065155029296875, 0.02462005615234375, 0.042724609375, 0.06082916259765625, 0.0789337158203125, 0.09703826904296875, 0.115142822265625, 0.13324737548828125, 0.1513519287109375, 0.16945648193359375, 0.18756103515625, 0.20566558837890625, 0.2237701416015625, 0.24187469482421875, 0.259979248046875, 0.27808380126953125, 0.2961883544921875, 0.31429290771484375, 0.3323974609375, 0.35050201416015625, 0.3686065673828125, 0.38671112060546875, 0.404815673828125, 0.42292022705078125, 0.4410247802734375, 0.45912933349609375, 0.47723388671875, 0.49533843994140625, 0.5134429931640625, 0.5315475463867188, 0.549652099609375, 0.5677566528320312, 0.5858612060546875, 0.6039657592773438, 0.6220703125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 3.0, 5.0, 5.0, 4.0, 15.0, 18.0, 22.0, 47.0, 166.0, 277.0, 236.0, 104.0, 31.0, 16.0, 10.0, 7.0, 13.0, 6.0, 6.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1314697265625, -0.1267242431640625, -0.121978759765625, -0.1172332763671875, -0.11248779296875, -0.1077423095703125, -0.102996826171875, -0.0982513427734375, -0.093505859375, -0.0887603759765625, -0.084014892578125, -0.0792694091796875, -0.07452392578125, -0.0697784423828125, -0.065032958984375, -0.0602874755859375, -0.0555419921875, -0.0507965087890625, -0.046051025390625, -0.0413055419921875, -0.03656005859375, -0.0318145751953125, -0.027069091796875, -0.0223236083984375, -0.017578125, -0.0128326416015625, -0.008087158203125, -0.0033416748046875, 0.00140380859375, 0.0061492919921875, 0.010894775390625, 0.0156402587890625, 0.0203857421875, 0.0251312255859375, 0.029876708984375, 0.0346221923828125, 0.03936767578125, 0.0441131591796875, 0.048858642578125, 0.0536041259765625, 0.058349609375, 0.0630950927734375, 0.067840576171875, 0.0725860595703125, 0.07733154296875, 0.0820770263671875, 0.086822509765625, 0.0915679931640625, 0.0963134765625, 0.1010589599609375, 0.105804443359375, 0.1105499267578125, 0.11529541015625, 0.1200408935546875, 0.124786376953125, 0.1295318603515625, 0.13427734375, 0.1390228271484375, 0.143768310546875, 0.1485137939453125, 0.15325927734375, 0.1580047607421875, 0.162750244140625, 0.1674957275390625, 0.1722412109375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 9.0, 25.0, 38.0, 88.0, 200.0, 692.0, 4064.0, 76753.0, 4062328.0, 46317.0, 2920.0, 496.0, 173.0, 79.0, 28.0, 17.0, 6.0, 10.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22607421875, -0.21718978881835938, -0.20830535888671875, -0.19942092895507812, -0.1905364990234375, -0.18165206909179688, -0.17276763916015625, -0.16388320922851562, -0.154998779296875, -0.14611434936523438, -0.13722991943359375, -0.12834548950195312, -0.1194610595703125, -0.11057662963867188, -0.10169219970703125, -0.09280776977539062, -0.08392333984375, -0.07503890991210938, -0.06615447998046875, -0.057270050048828125, -0.0483856201171875, -0.039501190185546875, -0.03061676025390625, -0.021732330322265625, -0.012847900390625, -0.003963470458984375, 0.00492095947265625, 0.013805389404296875, 0.0226898193359375, 0.031574249267578125, 0.04045867919921875, 0.049343109130859375, 0.0582275390625, 0.06711196899414062, 0.07599639892578125, 0.08488082885742188, 0.0937652587890625, 0.10264968872070312, 0.11153411865234375, 0.12041854858398438, 0.129302978515625, 0.13818740844726562, 0.14707183837890625, 0.15595626831054688, 0.1648406982421875, 0.17372512817382812, 0.18260955810546875, 0.19149398803710938, 0.20037841796875, 0.20926284790039062, 0.21814727783203125, 0.22703170776367188, 0.2359161376953125, 0.24480056762695312, 0.25368499755859375, 0.2625694274902344, 0.271453857421875, 0.2803382873535156, 0.28922271728515625, 0.2981071472167969, 0.3069915771484375, 0.3158760070800781, 0.32476043701171875, 0.3336448669433594, 0.342529296875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 9.0, 14.0, 19.0, 40.0, 56.0, 158.0, 368.0, 2099.0, 872.0, 242.0, 100.0, 44.0, 19.0, 9.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08087158203125, -0.07873249053955078, -0.07659339904785156, -0.07445430755615234, -0.07231521606445312, -0.0701761245727539, -0.06803703308105469, -0.06589794158935547, -0.06375885009765625, -0.06161975860595703, -0.05948066711425781, -0.057341575622558594, -0.055202484130859375, -0.053063392639160156, -0.05092430114746094, -0.04878520965576172, -0.0466461181640625, -0.04450702667236328, -0.04236793518066406, -0.040228843688964844, -0.038089752197265625, -0.035950660705566406, -0.03381156921386719, -0.03167247772216797, -0.02953338623046875, -0.02739429473876953, -0.025255203247070312, -0.023116111755371094, -0.020977020263671875, -0.018837928771972656, -0.016698837280273438, -0.014559745788574219, -0.012420654296875, -0.010281562805175781, -0.008142471313476562, -0.006003379821777344, -0.003864288330078125, -0.0017251968383789062, 0.0004138946533203125, 0.0025529861450195312, 0.00469207763671875, 0.006831169128417969, 0.008970260620117188, 0.011109352111816406, 0.013248443603515625, 0.015387535095214844, 0.017526626586914062, 0.01966571807861328, 0.0218048095703125, 0.02394390106201172, 0.026082992553710938, 0.028222084045410156, 0.030361175537109375, 0.032500267028808594, 0.03463935852050781, 0.03677845001220703, 0.03891754150390625, 0.04105663299560547, 0.04319572448730469, 0.045334815979003906, 0.047473907470703125, 0.049612998962402344, 0.05175209045410156, 0.05389118194580078, 0.0560302734375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 10.0, 29.0, 200.0, 512.0, 223.0, 25.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48881155252456665, -0.47044065594673157, -0.4520697593688965, -0.433698832988739, -0.41532793641090393, -0.39695703983306885, -0.3785861134529114, -0.3602152168750763, -0.3418443202972412, -0.32347342371940613, -0.30510252714157104, -0.2867316007614136, -0.2683607041835785, -0.2499898076057434, -0.23161889612674713, -0.21324798464775085, -0.19487708806991577, -0.1765061914920807, -0.1581352800130844, -0.13976436853408813, -0.12139347195625305, -0.10302256792783737, -0.08465166389942169, -0.06628075242042542, -0.04790985584259033, -0.029538951814174652, -0.011168047785758972, 0.007202856242656708, 0.025573760271072388, 0.04394466429948807, 0.06231556832790375, 0.08068647980690002, 0.09905737638473511, 0.11742828041315079, 0.13579918444156647, 0.15417009592056274, 0.17254099249839783, 0.1909118890762329, 0.2092828005552292, 0.22765371203422546, 0.24602460861206055, 0.26439550518989563, 0.2827664017677307, 0.3011373281478882, 0.31950822472572327, 0.33787912130355835, 0.3562500476837158, 0.3746209442615509, 0.392991840839386, 0.41136273741722107, 0.42973363399505615, 0.4481045603752136, 0.4664754569530487, 0.4848463535308838, 0.5032172799110413, 0.5215882062911987, 0.5399590730667114, 0.5583299994468689, 0.5767008662223816, 0.5950717926025391, 0.6134426593780518, 0.6318135857582092, 0.6501845121383667, 0.6685553789138794, 0.6869263052940369]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 10.0, 18.0, 14.0, 19.0, 16.0, 27.0, 28.0, 37.0, 32.0, 32.0, 42.0, 41.0, 32.0, 49.0, 54.0, 46.0, 52.0, 49.0, 35.0, 42.0, 32.0, 35.0, 32.0, 40.0, 16.0, 29.0, 24.0, 13.0, 13.0, 20.0, 9.0, 13.0, 14.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.13406014442443848, -0.12983031570911407, -0.12560047209262848, -0.12137063592672348, -0.11714079976081848, -0.11291097104549408, -0.10868113487958908, -0.10445129871368408, -0.10022146254777908, -0.09599162638187408, -0.09176179021596909, -0.08753195405006409, -0.08330212533473969, -0.07907228171825409, -0.07484245300292969, -0.07061261683702469, -0.06638278067111969, -0.06215294450521469, -0.05792310833930969, -0.05369327589869499, -0.04946343973278999, -0.045233603566884995, -0.041003771126270294, -0.036773934960365295, -0.0325440987944603, -0.028314262628555298, -0.02408442832529545, -0.0198545940220356, -0.0156247578561306, -0.011394921690225601, -0.007165087386965752, -0.002935253083705902, 0.0012945830821990967, 0.005524418316781521, 0.009754253551363945, 0.01398408878594637, 0.018213924020528793, 0.022443760186433792, 0.02667359448969364, 0.03090342879295349, 0.03513326495885849, 0.03936310112476349, 0.04359293729066849, 0.04782276973128319, 0.05205260589718819, 0.056282442063093185, 0.060512274503707886, 0.06474211066961288, 0.06897194683551788, 0.07320178300142288, 0.07743161916732788, 0.08166145533323288, 0.08589129149913788, 0.09012112021446228, 0.09435095638036728, 0.09858079254627228, 0.10281062871217728, 0.10704046487808228, 0.11127030104398727, 0.11550013720989227, 0.11972996592521667, 0.12395980954170227, 0.12818963825702667, 0.13241946697235107, 0.13664931058883667]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 13.0, 15.0, 21.0, 41.0, 39.0, 68.0, 130.0, 206.0, 456.0, 996.0, 2410.0, 7187.0, 33949.0, 661382.0, 311137.0, 21532.0, 5384.0, 1955.0, 797.0, 359.0, 175.0, 93.0, 69.0, 50.0, 27.0, 19.0, 11.0, 7.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.253662109375, -0.24570465087890625, -0.2377471923828125, -0.22978973388671875, -0.221832275390625, -0.21387481689453125, -0.2059173583984375, -0.19795989990234375, -0.19000244140625, -0.18204498291015625, -0.1740875244140625, -0.16613006591796875, -0.158172607421875, -0.15021514892578125, -0.1422576904296875, -0.13430023193359375, -0.1263427734375, -0.11838531494140625, -0.1104278564453125, -0.10247039794921875, -0.094512939453125, -0.08655548095703125, -0.0785980224609375, -0.07064056396484375, -0.06268310546875, -0.05472564697265625, -0.0467681884765625, -0.03881072998046875, -0.030853271484375, -0.02289581298828125, -0.0149383544921875, -0.00698089599609375, 0.0009765625, 0.00893402099609375, 0.0168914794921875, 0.02484893798828125, 0.032806396484375, 0.04076385498046875, 0.0487213134765625, 0.05667877197265625, 0.06463623046875, 0.07259368896484375, 0.0805511474609375, 0.08850860595703125, 0.096466064453125, 0.10442352294921875, 0.1123809814453125, 0.12033843994140625, 0.1282958984375, 0.13625335693359375, 0.1442108154296875, 0.15216827392578125, 0.160125732421875, 0.16808319091796875, 0.1760406494140625, 0.18399810791015625, 0.19195556640625, 0.19991302490234375, 0.2078704833984375, 0.21582794189453125, 0.223785400390625, 0.23174285888671875, 0.2397003173828125, 0.24765777587890625, 0.255615234375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 3.0, 5.0, 6.0, 8.0, 13.0, 18.0, 22.0, 65.0, 189.0, 273.0, 223.0, 85.0, 23.0, 17.0, 12.0, 9.0, 10.0, 4.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12939453125, -0.12469482421875, -0.1199951171875, -0.11529541015625, -0.110595703125, -0.10589599609375, -0.1011962890625, -0.09649658203125, -0.091796875, -0.08709716796875, -0.0823974609375, -0.07769775390625, -0.072998046875, -0.06829833984375, -0.0635986328125, -0.05889892578125, -0.05419921875, -0.04949951171875, -0.0447998046875, -0.04010009765625, -0.035400390625, -0.03070068359375, -0.0260009765625, -0.02130126953125, -0.0166015625, -0.01190185546875, -0.0072021484375, -0.00250244140625, 0.002197265625, 0.00689697265625, 0.0115966796875, 0.01629638671875, 0.02099609375, 0.02569580078125, 0.0303955078125, 0.03509521484375, 0.039794921875, 0.04449462890625, 0.0491943359375, 0.05389404296875, 0.05859375, 0.06329345703125, 0.0679931640625, 0.07269287109375, 0.077392578125, 0.08209228515625, 0.0867919921875, 0.09149169921875, 0.09619140625, 0.10089111328125, 0.1055908203125, 0.11029052734375, 0.114990234375, 0.11968994140625, 0.1243896484375, 0.12908935546875, 0.1337890625, 0.13848876953125, 0.1431884765625, 0.14788818359375, 0.152587890625, 0.15728759765625, 0.1619873046875, 0.16668701171875, 0.17138671875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 6.0, 14.0, 6.0, 11.0, 14.0, 22.0, 20.0, 20.0, 28.0, 32.0, 55.0, 48.0, 64.0, 81.0, 88.0, 166.0, 179.0, 339.0, 517.0, 1112.0, 3158.0, 20822.0, 591249.0, 409450.0, 15675.0, 2702.0, 997.0, 506.0, 318.0, 193.0, 112.0, 100.0, 86.0, 57.0, 63.0, 53.0, 37.0, 29.0, 25.0, 25.0, 25.0, 11.0, 10.0, 9.0, 7.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.283203125, -0.27460479736328125, -0.2660064697265625, -0.25740814208984375, -0.248809814453125, -0.24021148681640625, -0.2316131591796875, -0.22301483154296875, -0.21441650390625, -0.20581817626953125, -0.1972198486328125, -0.18862152099609375, -0.180023193359375, -0.17142486572265625, -0.1628265380859375, -0.15422821044921875, -0.1456298828125, -0.13703155517578125, -0.1284332275390625, -0.11983489990234375, -0.111236572265625, -0.10263824462890625, -0.0940399169921875, -0.08544158935546875, -0.07684326171875, -0.06824493408203125, -0.0596466064453125, -0.05104827880859375, -0.042449951171875, -0.03385162353515625, -0.0252532958984375, -0.01665496826171875, -0.008056640625, 0.00054168701171875, 0.0091400146484375, 0.01773834228515625, 0.026336669921875, 0.03493499755859375, 0.0435333251953125, 0.05213165283203125, 0.06072998046875, 0.06932830810546875, 0.0779266357421875, 0.08652496337890625, 0.095123291015625, 0.10372161865234375, 0.1123199462890625, 0.12091827392578125, 0.1295166015625, 0.13811492919921875, 0.1467132568359375, 0.15531158447265625, 0.163909912109375, 0.17250823974609375, 0.1811065673828125, 0.18970489501953125, 0.19830322265625, 0.20690155029296875, 0.2154998779296875, 0.22409820556640625, 0.232696533203125, 0.24129486083984375, 0.2498931884765625, 0.25849151611328125, 0.26708984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 5.0, 15.0, 17.0, 14.0, 13.0, 13.0, 21.0, 18.0, 25.0, 25.0, 33.0, 42.0, 40.0, 42.0, 40.0, 48.0, 42.0, 34.0, 51.0, 49.0, 47.0, 49.0, 39.0, 32.0, 23.0, 32.0, 30.0, 24.0, 27.0, 24.0, 14.0, 14.0, 12.0, 9.0, 10.0, 6.0, 2.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.326416015625, -0.31809425354003906, -0.3097724914550781, -0.3014507293701172, -0.29312896728515625, -0.2848072052001953, -0.2764854431152344, -0.26816368103027344, -0.2598419189453125, -0.25152015686035156, -0.24319839477539062, -0.2348766326904297, -0.22655487060546875, -0.2182331085205078, -0.20991134643554688, -0.20158958435058594, -0.193267822265625, -0.18494606018066406, -0.17662429809570312, -0.1683025360107422, -0.15998077392578125, -0.1516590118408203, -0.14333724975585938, -0.13501548767089844, -0.1266937255859375, -0.11837196350097656, -0.11005020141601562, -0.10172843933105469, -0.09340667724609375, -0.08508491516113281, -0.07676315307617188, -0.06844139099121094, -0.06011962890625, -0.05179786682128906, -0.043476104736328125, -0.03515434265136719, -0.02683258056640625, -0.018510818481445312, -0.010189056396484375, -0.0018672943115234375, 0.0064544677734375, 0.014776229858398438, 0.023097991943359375, 0.03141975402832031, 0.03974151611328125, 0.04806327819824219, 0.056385040283203125, 0.06470680236816406, 0.073028564453125, 0.08135032653808594, 0.08967208862304688, 0.09799385070800781, 0.10631561279296875, 0.11463737487792969, 0.12295913696289062, 0.13128089904785156, 0.1396026611328125, 0.14792442321777344, 0.15624618530273438, 0.1645679473876953, 0.17288970947265625, 0.1812114715576172, 0.18953323364257812, 0.19785499572753906, 0.2061767578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 2.0, 4.0, 11.0, 10.0, 12.0, 17.0, 23.0, 30.0, 37.0, 67.0, 106.0, 122.0, 243.0, 551.0, 1307.0, 3582.0, 14247.0, 169160.0, 811649.0, 36368.0, 7079.0, 2132.0, 859.0, 410.0, 201.0, 121.0, 67.0, 43.0, 23.0, 18.0, 18.0, 13.0, 6.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08673095703125, -0.08386421203613281, -0.08099746704101562, -0.07813072204589844, -0.07526397705078125, -0.07239723205566406, -0.06953048706054688, -0.06666374206542969, -0.0637969970703125, -0.06093025207519531, -0.058063507080078125, -0.05519676208496094, -0.05233001708984375, -0.04946327209472656, -0.046596527099609375, -0.04372978210449219, -0.040863037109375, -0.03799629211425781, -0.035129547119140625, -0.03226280212402344, -0.02939605712890625, -0.026529312133789062, -0.023662567138671875, -0.020795822143554688, -0.0179290771484375, -0.015062332153320312, -0.012195587158203125, -0.009328842163085938, -0.00646209716796875, -0.0035953521728515625, -0.000728607177734375, 0.0021381378173828125, 0.0050048828125, 0.007871627807617188, 0.010738372802734375, 0.013605117797851562, 0.01647186279296875, 0.019338607788085938, 0.022205352783203125, 0.025072097778320312, 0.0279388427734375, 0.030805587768554688, 0.033672332763671875, 0.03653907775878906, 0.03940582275390625, 0.04227256774902344, 0.045139312744140625, 0.04800605773925781, 0.050872802734375, 0.05373954772949219, 0.056606292724609375, 0.05947303771972656, 0.06233978271484375, 0.06520652770996094, 0.06807327270507812, 0.07094001770019531, 0.0738067626953125, 0.07667350769042969, 0.07954025268554688, 0.08240699768066406, 0.08527374267578125, 0.08814048767089844, 0.09100723266601562, 0.09387397766113281, 0.09674072265625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 9.0, 5.0, 8.0, 15.0, 38.0, 76.0, 129.0, 257.0, 190.0, 136.0, 56.0, 30.0, 11.0, 9.0, 14.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6808509826660156e-05, -1.6130506992340088e-05, -1.545250415802002e-05, -1.4774501323699951e-05, -1.4096498489379883e-05, -1.3418495655059814e-05, -1.2740492820739746e-05, -1.2062489986419678e-05, -1.138448715209961e-05, -1.0706484317779541e-05, -1.0028481483459473e-05, -9.350478649139404e-06, -8.672475814819336e-06, -7.994472980499268e-06, -7.316470146179199e-06, -6.638467311859131e-06, -5.9604644775390625e-06, -5.282461643218994e-06, -4.604458808898926e-06, -3.926455974578857e-06, -3.248453140258789e-06, -2.5704503059387207e-06, -1.8924474716186523e-06, -1.214444637298584e-06, -5.364418029785156e-07, 1.4156103134155273e-07, 8.195638656616211e-07, 1.4975666999816895e-06, 2.175569534301758e-06, 2.853572368621826e-06, 3.5315752029418945e-06, 4.209578037261963e-06, 4.887580871582031e-06, 5.5655837059021e-06, 6.243586540222168e-06, 6.921589374542236e-06, 7.599592208862305e-06, 8.277595043182373e-06, 8.955597877502441e-06, 9.63360071182251e-06, 1.0311603546142578e-05, 1.0989606380462646e-05, 1.1667609214782715e-05, 1.2345612049102783e-05, 1.3023614883422852e-05, 1.370161771774292e-05, 1.4379620552062988e-05, 1.5057623386383057e-05, 1.5735626220703125e-05, 1.6413629055023193e-05, 1.7091631889343262e-05, 1.776963472366333e-05, 1.84476375579834e-05, 1.9125640392303467e-05, 1.9803643226623535e-05, 2.0481646060943604e-05, 2.1159648895263672e-05, 2.183765172958374e-05, 2.251565456390381e-05, 2.3193657398223877e-05, 2.3871660232543945e-05, 2.4549663066864014e-05, 2.5227665901184082e-05, 2.590566873550415e-05, 2.658367156982422e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 9.0, 5.0, 4.0, 7.0, 11.0, 7.0, 14.0, 14.0, 13.0, 18.0, 29.0, 48.0, 64.0, 123.0, 204.0, 324.0, 632.0, 1488.0, 4218.0, 16477.0, 310267.0, 682828.0, 23062.0, 5095.0, 1861.0, 765.0, 360.0, 214.0, 125.0, 83.0, 49.0, 38.0, 22.0, 12.0, 15.0, 12.0, 14.0, 2.0, 6.0, 3.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.123291015625, -0.1196746826171875, -0.116058349609375, -0.1124420166015625, -0.10882568359375, -0.1052093505859375, -0.101593017578125, -0.0979766845703125, -0.0943603515625, -0.0907440185546875, -0.087127685546875, -0.0835113525390625, -0.07989501953125, -0.0762786865234375, -0.072662353515625, -0.0690460205078125, -0.0654296875, -0.0618133544921875, -0.058197021484375, -0.0545806884765625, -0.05096435546875, -0.0473480224609375, -0.043731689453125, -0.0401153564453125, -0.0364990234375, -0.0328826904296875, -0.029266357421875, -0.0256500244140625, -0.02203369140625, -0.0184173583984375, -0.014801025390625, -0.0111846923828125, -0.007568359375, -0.0039520263671875, -0.000335693359375, 0.0032806396484375, 0.00689697265625, 0.0105133056640625, 0.014129638671875, 0.0177459716796875, 0.0213623046875, 0.0249786376953125, 0.028594970703125, 0.0322113037109375, 0.03582763671875, 0.0394439697265625, 0.043060302734375, 0.0466766357421875, 0.05029296875, 0.0539093017578125, 0.057525634765625, 0.0611419677734375, 0.06475830078125, 0.0683746337890625, 0.071990966796875, 0.0756072998046875, 0.0792236328125, 0.0828399658203125, 0.086456298828125, 0.0900726318359375, 0.09368896484375, 0.0973052978515625, 0.100921630859375, 0.1045379638671875, 0.108154296875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 3.0, 2.0, 4.0, 7.0, 9.0, 15.0, 24.0, 33.0, 52.0, 100.0, 146.0, 170.0, 138.0, 100.0, 66.0, 44.0, 24.0, 17.0, 13.0, 7.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11541748046875, -0.11208629608154297, -0.10875511169433594, -0.1054239273071289, -0.10209274291992188, -0.09876155853271484, -0.09543037414550781, -0.09209918975830078, -0.08876800537109375, -0.08543682098388672, -0.08210563659667969, -0.07877445220947266, -0.07544326782226562, -0.0721120834350586, -0.06878089904785156, -0.06544971466064453, -0.0621185302734375, -0.05878734588623047, -0.05545616149902344, -0.052124977111816406, -0.048793792724609375, -0.045462608337402344, -0.04213142395019531, -0.03880023956298828, -0.03546905517578125, -0.03213787078857422, -0.028806686401367188, -0.025475502014160156, -0.022144317626953125, -0.018813133239746094, -0.015481948852539062, -0.012150764465332031, -0.008819580078125, -0.005488395690917969, -0.0021572113037109375, 0.0011739730834960938, 0.004505157470703125, 0.007836341857910156, 0.011167526245117188, 0.014498710632324219, 0.01782989501953125, 0.02116107940673828, 0.024492263793945312, 0.027823448181152344, 0.031154632568359375, 0.034485816955566406, 0.03781700134277344, 0.04114818572998047, 0.0444793701171875, 0.04781055450439453, 0.05114173889160156, 0.054472923278808594, 0.057804107666015625, 0.061135292053222656, 0.06446647644042969, 0.06779766082763672, 0.07112884521484375, 0.07446002960205078, 0.07779121398925781, 0.08112239837646484, 0.08445358276367188, 0.0877847671508789, 0.09111595153808594, 0.09444713592529297, 0.0977783203125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 5.0, 24.0, 674.0, 285.0, 17.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9732828736305237, -0.8057948350906372, -0.6383068561553955, -0.47081881761550903, -0.30333077907562256, -0.13584274053573608, 0.031645238399505615, 0.19913333654403687, 0.36662131547927856, 0.534109354019165, 0.7015973329544067, 0.8690853714942932, 1.0365734100341797, 1.204061508178711, 1.371549367904663, 1.5390374660491943, 1.7065255641937256, 1.8740135431289673, 2.041501522064209, 2.2089896202087402, 2.3764777183532715, 2.5439658164978027, 2.711453676223755, 2.878941774368286, 3.0464296340942383, 3.2139177322387695, 3.3814055919647217, 3.548893690109253, 3.716381788253784, 3.8838696479797363, 4.051357746124268, 4.218845844268799, 4.38633394241333, 4.553822040557861, 4.721310138702393, 4.888797760009766, 5.056285858154297, 5.223773956298828, 5.391262054443359, 5.558750152587891, 5.726238250732422, 5.893726348876953, 6.061214447021484, 6.228702545166016, 6.396190166473389, 6.56367826461792, 6.731166362762451, 6.898654460906982, 7.0661420822143555, 7.233630180358887, 7.401118278503418, 7.568606376647949, 7.736093997955322, 7.9035820960998535, 8.071069717407227, 8.238557815551758, 8.406046867370605, 8.573534965515137, 8.741023063659668, 8.9085111618042, 9.07599925994873, 9.243487358093262, 9.410974502563477, 9.578462600708008, 9.745950698852539]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 5.0, 8.0, 7.0, 8.0, 11.0, 14.0, 15.0, 20.0, 22.0, 18.0, 15.0, 37.0, 34.0, 29.0, 42.0, 33.0, 50.0, 45.0, 45.0, 49.0, 35.0, 45.0, 43.0, 42.0, 43.0, 33.0, 35.0, 34.0, 26.0, 23.0, 20.0, 19.0, 19.0, 19.0, 12.0, 8.0, 9.0, 6.0, 3.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.5177534818649292, -1.4698368310928345, -1.4219202995300293, -1.3740036487579346, -1.3260871171951294, -1.2781704664230347, -1.2302539348602295, -1.1823372840881348, -1.1344207525253296, -1.0865041017532349, -1.0385875701904297, -0.9906709790229797, -0.9427543878555298, -0.8948377966880798, -0.8469212055206299, -0.7990045547485352, -0.7510879635810852, -0.7031713724136353, -0.6552547812461853, -0.6073381900787354, -0.5594215989112854, -0.5115050077438354, -0.4635883867740631, -0.41567179560661316, -0.3677552044391632, -0.31983861327171326, -0.2719220221042633, -0.22400541603565216, -0.1760888248682022, -0.12817223370075226, -0.08025562763214111, -0.03233903646469116, 0.015577554702758789, 0.06349414587020874, 0.11141074448823929, 0.15932734310626984, 0.2072439342737198, 0.25516051054000854, 0.3030771315097809, 0.35099372267723083, 0.3989103138446808, 0.44682690501213074, 0.4947434961795807, 0.542660117149353, 0.590576708316803, 0.6384932994842529, 0.6864098906517029, 0.7343264818191528, 0.7822430729866028, 0.8301596641540527, 0.8780762553215027, 0.9259928464889526, 0.9739094376564026, 1.0218260288238525, 1.0697426795959473, 1.1176592111587524, 1.1655758619308472, 1.213492512702942, 1.261409044265747, 1.3093256950378418, 1.357242226600647, 1.4051588773727417, 1.4530754089355469, 1.5009920597076416, 1.5489085912704468]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 4.0, 2.0, 10.0, 11.0, 6.0, 27.0, 34.0, 41.0, 76.0, 136.0, 299.0, 753.0, 3385.0, 122140.0, 4049103.0, 15699.0, 1534.0, 522.0, 242.0, 114.0, 54.0, 29.0, 18.0, 13.0, 10.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.320068359375, -0.30913543701171875, -0.2982025146484375, -0.28726959228515625, -0.276336669921875, -0.26540374755859375, -0.2544708251953125, -0.24353790283203125, -0.23260498046875, -0.22167205810546875, -0.2107391357421875, -0.19980621337890625, -0.188873291015625, -0.17794036865234375, -0.1670074462890625, -0.15607452392578125, -0.1451416015625, -0.13420867919921875, -0.1232757568359375, -0.11234283447265625, -0.101409912109375, -0.09047698974609375, -0.0795440673828125, -0.06861114501953125, -0.05767822265625, -0.04674530029296875, -0.0358123779296875, -0.02487945556640625, -0.013946533203125, -0.00301361083984375, 0.0079193115234375, 0.01885223388671875, 0.02978515625, 0.04071807861328125, 0.0516510009765625, 0.06258392333984375, 0.073516845703125, 0.08444976806640625, 0.0953826904296875, 0.10631561279296875, 0.11724853515625, 0.12818145751953125, 0.1391143798828125, 0.15004730224609375, 0.160980224609375, 0.17191314697265625, 0.1828460693359375, 0.19377899169921875, 0.2047119140625, 0.21564483642578125, 0.2265777587890625, 0.23751068115234375, 0.248443603515625, 0.25937652587890625, 0.2703094482421875, 0.28124237060546875, 0.29217529296875, 0.30310821533203125, 0.3140411376953125, 0.32497406005859375, 0.335906982421875, 0.34683990478515625, 0.3577728271484375, 0.36870574951171875, 0.379638671875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 6.0, 20.0, 20.0, 49.0, 153.0, 248.0, 249.0, 118.0, 45.0, 22.0, 12.0, 11.0, 7.0, 9.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1304931640625, -0.1258087158203125, -0.121124267578125, -0.1164398193359375, -0.11175537109375, -0.1070709228515625, -0.102386474609375, -0.0977020263671875, -0.093017578125, -0.0883331298828125, -0.083648681640625, -0.0789642333984375, -0.07427978515625, -0.0695953369140625, -0.064910888671875, -0.0602264404296875, -0.0555419921875, -0.0508575439453125, -0.046173095703125, -0.0414886474609375, -0.03680419921875, -0.0321197509765625, -0.027435302734375, -0.0227508544921875, -0.01806640625, -0.0133819580078125, -0.008697509765625, -0.0040130615234375, 0.00067138671875, 0.0053558349609375, 0.010040283203125, 0.0147247314453125, 0.0194091796875, 0.0240936279296875, 0.028778076171875, 0.0334625244140625, 0.03814697265625, 0.0428314208984375, 0.047515869140625, 0.0522003173828125, 0.056884765625, 0.0615692138671875, 0.066253662109375, 0.0709381103515625, 0.07562255859375, 0.0803070068359375, 0.084991455078125, 0.0896759033203125, 0.0943603515625, 0.0990447998046875, 0.103729248046875, 0.1084136962890625, 0.11309814453125, 0.1177825927734375, 0.122467041015625, 0.1271514892578125, 0.1318359375, 0.1365203857421875, 0.141204833984375, 0.1458892822265625, 0.15057373046875, 0.1552581787109375, 0.159942626953125, 0.1646270751953125, 0.1693115234375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 10.0, 11.0, 21.0, 69.0, 158.0, 838.0, 12915.0, 4163371.0, 15687.0, 904.0, 163.0, 69.0, 29.0, 12.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50341796875, -0.4857635498046875, -0.468109130859375, -0.4504547119140625, -0.43280029296875, -0.4151458740234375, -0.397491455078125, -0.3798370361328125, -0.3621826171875, -0.3445281982421875, -0.326873779296875, -0.3092193603515625, -0.29156494140625, -0.2739105224609375, -0.256256103515625, -0.2386016845703125, -0.220947265625, -0.2032928466796875, -0.185638427734375, -0.1679840087890625, -0.15032958984375, -0.1326751708984375, -0.115020751953125, -0.0973663330078125, -0.0797119140625, -0.0620574951171875, -0.044403076171875, -0.0267486572265625, -0.00909423828125, 0.0085601806640625, 0.026214599609375, 0.0438690185546875, 0.0615234375, 0.0791778564453125, 0.096832275390625, 0.1144866943359375, 0.13214111328125, 0.1497955322265625, 0.167449951171875, 0.1851043701171875, 0.2027587890625, 0.2204132080078125, 0.238067626953125, 0.2557220458984375, 0.27337646484375, 0.2910308837890625, 0.308685302734375, 0.3263397216796875, 0.343994140625, 0.3616485595703125, 0.379302978515625, 0.3969573974609375, 0.41461181640625, 0.4322662353515625, 0.449920654296875, 0.4675750732421875, 0.4852294921875, 0.5028839111328125, 0.520538330078125, 0.5381927490234375, 0.55584716796875, 0.5735015869140625, 0.591156005859375, 0.6088104248046875, 0.62646484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 11.0, 23.0, 55.0, 314.0, 1911.0, 1375.0, 271.0, 66.0, 21.0, 14.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2156982421875, -0.2101573944091797, -0.20461654663085938, -0.19907569885253906, -0.19353485107421875, -0.18799400329589844, -0.18245315551757812, -0.1769123077392578, -0.1713714599609375, -0.1658306121826172, -0.16028976440429688, -0.15474891662597656, -0.14920806884765625, -0.14366722106933594, -0.13812637329101562, -0.1325855255126953, -0.127044677734375, -0.12150382995605469, -0.11596298217773438, -0.11042213439941406, -0.10488128662109375, -0.09934043884277344, -0.09379959106445312, -0.08825874328613281, -0.0827178955078125, -0.07717704772949219, -0.07163619995117188, -0.06609535217285156, -0.06055450439453125, -0.05501365661621094, -0.049472808837890625, -0.04393196105957031, -0.03839111328125, -0.03285026550292969, -0.027309417724609375, -0.021768569946289062, -0.01622772216796875, -0.010686874389648438, -0.005146026611328125, 0.0003948211669921875, 0.0059356689453125, 0.011476516723632812, 0.017017364501953125, 0.022558212280273438, 0.02809906005859375, 0.03363990783691406, 0.039180755615234375, 0.04472160339355469, 0.050262451171875, 0.05580329895019531, 0.061344146728515625, 0.06688499450683594, 0.07242584228515625, 0.07796669006347656, 0.08350753784179688, 0.08904838562011719, 0.0945892333984375, 0.10013008117675781, 0.10567092895507812, 0.11121177673339844, 0.11675262451171875, 0.12229347229003906, 0.12783432006835938, 0.1333751678466797, 0.138916015625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 87.0, 535.0, 344.0, 30.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.327150583267212, -1.2938041687011719, -1.2604578733444214, -1.2271114587783813, -1.1937651634216309, -1.1604187488555908, -1.1270723342895508, -1.0937260389328003, -1.0603796243667603, -1.0270332098007202, -0.9936869144439697, -0.9603404998779297, -0.9269941449165344, -0.8936477899551392, -0.8603013753890991, -0.8269550204277039, -0.7936086654663086, -0.7602623105049133, -0.7269159555435181, -0.693569540977478, -0.6602231860160828, -0.6268768310546875, -0.5935304164886475, -0.5601840615272522, -0.5268377065658569, -0.49349135160446167, -0.460144966840744, -0.42679858207702637, -0.3934522271156311, -0.36010587215423584, -0.3267594873905182, -0.29341310262680054, -0.2600668668746948, -0.22672049701213837, -0.1933741271495819, -0.16002775728702545, -0.126681387424469, -0.09333501756191254, -0.05998864769935608, -0.02664227783679962, 0.006704092025756836, 0.04005046188831329, 0.07339683175086975, 0.10674320161342621, 0.14008957147598267, 0.17343594133853912, 0.20678231120109558, 0.24012868106365204, 0.2734750509262085, 0.30682140588760376, 0.3401677906513214, 0.37351417541503906, 0.4068605303764343, 0.4402068853378296, 0.47355327010154724, 0.5068996548652649, 0.5402460098266602, 0.5735923647880554, 0.6069387197494507, 0.6402851343154907, 0.673631489276886, 0.7069778442382812, 0.7403242588043213, 0.7736706137657166, 0.8070169687271118]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 16.0, 19.0, 23.0, 27.0, 40.0, 44.0, 57.0, 65.0, 85.0, 86.0, 87.0, 81.0, 70.0, 70.0, 54.0, 50.0, 37.0, 35.0, 16.0, 23.0, 9.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3746042847633362, -0.3614467680454254, -0.34828925132751465, -0.3351317346096039, -0.3219742178916931, -0.30881667137145996, -0.2956591844558716, -0.2825016379356384, -0.26934412121772766, -0.2561866044998169, -0.24302908778190613, -0.22987157106399536, -0.2167140394449234, -0.20355652272701263, -0.19039900600910187, -0.1772414743900299, -0.16408397257328033, -0.15092645585536957, -0.1377689391374588, -0.12461141496896744, -0.11145389080047607, -0.09829637408256531, -0.08513885736465454, -0.07198133319616318, -0.05882381647825241, -0.045666296035051346, -0.03250877559185028, -0.019351258873939514, -0.006193738430738449, 0.006963782012462616, 0.020121298730373383, 0.033278822898864746, 0.04643633961677551, 0.05959386005997658, 0.07275138050317764, 0.08590889722108841, 0.09906642138957977, 0.11222393810749054, 0.1253814548254013, 0.13853898644447327, 0.15169650316238403, 0.1648540198802948, 0.17801153659820557, 0.19116905331611633, 0.2043265849351883, 0.21748410165309906, 0.23064161837100983, 0.2437991499900818, 0.25695663690567017, 0.27011415362358093, 0.2832716703414917, 0.29642918705940247, 0.30958670377731323, 0.3227442502975464, 0.33590173721313477, 0.3490592837333679, 0.3622168004512787, 0.37537431716918945, 0.3885318338871002, 0.401689350605011, 0.41484686732292175, 0.4280043840408325, 0.4411619305610657, 0.45431944727897644, 0.4674769639968872]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 8.0, 14.0, 16.0, 12.0, 20.0, 28.0, 33.0, 49.0, 50.0, 95.0, 124.0, 203.0, 346.0, 533.0, 963.0, 1852.0, 3677.0, 8785.0, 29467.0, 200742.0, 675228.0, 95510.0, 17939.0, 6506.0, 2758.0, 1416.0, 786.0, 476.0, 282.0, 183.0, 129.0, 90.0, 64.0, 43.0, 37.0, 22.0, 13.0, 9.0, 11.0, 7.0, 6.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.16259765625, -0.15771865844726562, -0.15283966064453125, -0.14796066284179688, -0.1430816650390625, -0.13820266723632812, -0.13332366943359375, -0.12844467163085938, -0.123565673828125, -0.11868667602539062, -0.11380767822265625, -0.10892868041992188, -0.1040496826171875, -0.09917068481445312, -0.09429168701171875, -0.08941268920898438, -0.08453369140625, -0.07965469360351562, -0.07477569580078125, -0.06989669799804688, -0.0650177001953125, -0.060138702392578125, -0.05525970458984375, -0.050380706787109375, -0.045501708984375, -0.040622711181640625, -0.03574371337890625, -0.030864715576171875, -0.0259857177734375, -0.021106719970703125, -0.01622772216796875, -0.011348724365234375, -0.0064697265625, -0.001590728759765625, 0.00328826904296875, 0.008167266845703125, 0.0130462646484375, 0.017925262451171875, 0.02280426025390625, 0.027683258056640625, 0.032562255859375, 0.037441253662109375, 0.04232025146484375, 0.047199249267578125, 0.0520782470703125, 0.056957244873046875, 0.06183624267578125, 0.06671524047851562, 0.07159423828125, 0.07647323608398438, 0.08135223388671875, 0.08623123168945312, 0.0911102294921875, 0.09598922729492188, 0.10086822509765625, 0.10574722290039062, 0.110626220703125, 0.11550521850585938, 0.12038421630859375, 0.12526321411132812, 0.1301422119140625, 0.13502120971679688, 0.13990020751953125, 0.14477920532226562, 0.149658203125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 3.0, 9.0, 9.0, 6.0, 18.0, 21.0, 63.0, 160.0, 252.0, 236.0, 114.0, 38.0, 20.0, 14.0, 7.0, 6.0, 10.0, 8.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1259765625, -0.12143516540527344, -0.11689376831054688, -0.11235237121582031, -0.10781097412109375, -0.10326957702636719, -0.09872817993164062, -0.09418678283691406, -0.0896453857421875, -0.08510398864746094, -0.08056259155273438, -0.07602119445800781, -0.07147979736328125, -0.06693840026855469, -0.062397003173828125, -0.05785560607910156, -0.053314208984375, -0.04877281188964844, -0.044231414794921875, -0.03969001770019531, -0.03514862060546875, -0.030607223510742188, -0.026065826416015625, -0.021524429321289062, -0.0169830322265625, -0.012441635131835938, -0.007900238037109375, -0.0033588409423828125, 0.00118255615234375, 0.0057239532470703125, 0.010265350341796875, 0.014806747436523438, 0.01934814453125, 0.023889541625976562, 0.028430938720703125, 0.03297233581542969, 0.03751373291015625, 0.04205513000488281, 0.046596527099609375, 0.05113792419433594, 0.0556793212890625, 0.06022071838378906, 0.06476211547851562, 0.06930351257324219, 0.07384490966796875, 0.07838630676269531, 0.08292770385742188, 0.08746910095214844, 0.092010498046875, 0.09655189514160156, 0.10109329223632812, 0.10563468933105469, 0.11017608642578125, 0.11471748352050781, 0.11925888061523438, 0.12380027770996094, 0.1283416748046875, 0.13288307189941406, 0.13742446899414062, 0.1419658660888672, 0.14650726318359375, 0.1510486602783203, 0.15559005737304688, 0.16013145446777344, 0.1646728515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 4.0, 7.0, 5.0, 8.0, 10.0, 16.0, 14.0, 18.0, 37.0, 25.0, 35.0, 47.0, 54.0, 76.0, 90.0, 114.0, 173.0, 236.0, 384.0, 802.0, 2247.0, 17118.0, 546279.0, 462386.0, 14203.0, 2022.0, 792.0, 397.0, 235.0, 170.0, 122.0, 87.0, 62.0, 57.0, 44.0, 42.0, 24.0, 18.0, 31.0, 15.0, 11.0, 15.0, 10.0, 5.0, 1.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.25927734375, -0.25141334533691406, -0.24354934692382812, -0.2356853485107422, -0.22782135009765625, -0.2199573516845703, -0.21209335327148438, -0.20422935485839844, -0.1963653564453125, -0.18850135803222656, -0.18063735961914062, -0.1727733612060547, -0.16490936279296875, -0.1570453643798828, -0.14918136596679688, -0.14131736755371094, -0.133453369140625, -0.12558937072753906, -0.11772537231445312, -0.10986137390136719, -0.10199737548828125, -0.09413337707519531, -0.08626937866210938, -0.07840538024902344, -0.0705413818359375, -0.06267738342285156, -0.054813385009765625, -0.04694938659667969, -0.03908538818359375, -0.031221389770507812, -0.023357391357421875, -0.015493392944335938, -0.00762939453125, 0.0002346038818359375, 0.008098602294921875, 0.015962600708007812, 0.02382659912109375, 0.03169059753417969, 0.039554595947265625, 0.04741859436035156, 0.0552825927734375, 0.06314659118652344, 0.07101058959960938, 0.07887458801269531, 0.08673858642578125, 0.09460258483886719, 0.10246658325195312, 0.11033058166503906, 0.118194580078125, 0.12605857849121094, 0.13392257690429688, 0.1417865753173828, 0.14965057373046875, 0.1575145721435547, 0.16537857055664062, 0.17324256896972656, 0.1811065673828125, 0.18897056579589844, 0.19683456420898438, 0.2046985626220703, 0.21256256103515625, 0.2204265594482422, 0.22829055786132812, 0.23615455627441406, 0.2440185546875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 4.0, 9.0, 8.0, 4.0, 9.0, 13.0, 12.0, 20.0, 29.0, 25.0, 15.0, 43.0, 33.0, 32.0, 28.0, 40.0, 40.0, 35.0, 54.0, 46.0, 40.0, 36.0, 29.0, 36.0, 37.0, 30.0, 37.0, 25.0, 35.0, 21.0, 23.0, 19.0, 23.0, 18.0, 10.0, 10.0, 10.0, 11.0, 9.0, 12.0, 3.0, 6.0, 2.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.232421875, -0.22567176818847656, -0.21892166137695312, -0.2121715545654297, -0.20542144775390625, -0.1986713409423828, -0.19192123413085938, -0.18517112731933594, -0.1784210205078125, -0.17167091369628906, -0.16492080688476562, -0.1581707000732422, -0.15142059326171875, -0.1446704864501953, -0.13792037963867188, -0.13117027282714844, -0.124420166015625, -0.11767005920410156, -0.11091995239257812, -0.10416984558105469, -0.09741973876953125, -0.09066963195800781, -0.08391952514648438, -0.07716941833496094, -0.0704193115234375, -0.06366920471191406, -0.056919097900390625, -0.05016899108886719, -0.04341888427734375, -0.03666877746582031, -0.029918670654296875, -0.023168563842773438, -0.01641845703125, -0.009668350219726562, -0.002918243408203125, 0.0038318634033203125, 0.01058197021484375, 0.017332077026367188, 0.024082183837890625, 0.030832290649414062, 0.0375823974609375, 0.04433250427246094, 0.051082611083984375, 0.05783271789550781, 0.06458282470703125, 0.07133293151855469, 0.07808303833007812, 0.08483314514160156, 0.091583251953125, 0.09833335876464844, 0.10508346557617188, 0.11183357238769531, 0.11858367919921875, 0.1253337860107422, 0.13208389282226562, 0.13883399963378906, 0.1455841064453125, 0.15233421325683594, 0.15908432006835938, 0.1658344268798828, 0.17258453369140625, 0.1793346405029297, 0.18608474731445312, 0.19283485412597656, 0.1995849609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 5.0, 3.0, 9.0, 14.0, 16.0, 36.0, 42.0, 72.0, 158.0, 273.0, 570.0, 1483.0, 5102.0, 26812.0, 298745.0, 661540.0, 43229.0, 7081.0, 1912.0, 712.0, 312.0, 181.0, 96.0, 46.0, 33.0, 24.0, 21.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0753173828125, -0.0730428695678711, -0.07076835632324219, -0.06849384307861328, -0.06621932983398438, -0.06394481658935547, -0.06167030334472656, -0.059395790100097656, -0.05712127685546875, -0.054846763610839844, -0.05257225036621094, -0.05029773712158203, -0.048023223876953125, -0.04574871063232422, -0.04347419738769531, -0.041199684143066406, -0.0389251708984375, -0.036650657653808594, -0.03437614440917969, -0.03210163116455078, -0.029827117919921875, -0.02755260467529297, -0.025278091430664062, -0.023003578186035156, -0.02072906494140625, -0.018454551696777344, -0.016180038452148438, -0.013905525207519531, -0.011631011962890625, -0.009356498718261719, -0.0070819854736328125, -0.004807472229003906, -0.002532958984375, -0.00025844573974609375, 0.0020160675048828125, 0.004290580749511719, 0.006565093994140625, 0.008839607238769531, 0.011114120483398438, 0.013388633728027344, 0.01566314697265625, 0.017937660217285156, 0.020212173461914062, 0.02248668670654297, 0.024761199951171875, 0.02703571319580078, 0.029310226440429688, 0.031584739685058594, 0.0338592529296875, 0.036133766174316406, 0.03840827941894531, 0.04068279266357422, 0.042957305908203125, 0.04523181915283203, 0.04750633239746094, 0.049780845642089844, 0.05205535888671875, 0.054329872131347656, 0.05660438537597656, 0.05887889862060547, 0.061153411865234375, 0.06342792510986328, 0.06570243835449219, 0.0679769515991211, 0.07025146484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 10.0, 7.0, 18.0, 12.0, 24.0, 23.0, 33.0, 50.0, 59.0, 91.0, 127.0, 121.0, 110.0, 96.0, 47.0, 51.0, 20.0, 18.0, 18.0, 9.0, 13.0, 7.0, 12.0, 5.0, 2.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.52346420288086e-06, -8.184462785720825e-06, -7.845461368560791e-06, -7.506459951400757e-06, -7.167458534240723e-06, -6.8284571170806885e-06, -6.489455699920654e-06, -6.15045428276062e-06, -5.811452865600586e-06, -5.472451448440552e-06, -5.133450031280518e-06, -4.794448614120483e-06, -4.455447196960449e-06, -4.116445779800415e-06, -3.777444362640381e-06, -3.4384429454803467e-06, -3.0994415283203125e-06, -2.7604401111602783e-06, -2.421438694000244e-06, -2.08243727684021e-06, -1.7434358596801758e-06, -1.4044344425201416e-06, -1.0654330253601074e-06, -7.264316082000732e-07, -3.8743019104003906e-07, -4.842877388000488e-08, 2.905726432800293e-07, 6.295740604400635e-07, 9.685754776000977e-07, 1.3075768947601318e-06, 1.646578311920166e-06, 1.9855797290802e-06, 2.3245811462402344e-06, 2.6635825634002686e-06, 3.0025839805603027e-06, 3.341585397720337e-06, 3.680586814880371e-06, 4.019588232040405e-06, 4.3585896492004395e-06, 4.697591066360474e-06, 5.036592483520508e-06, 5.375593900680542e-06, 5.714595317840576e-06, 6.05359673500061e-06, 6.3925981521606445e-06, 6.731599569320679e-06, 7.070600986480713e-06, 7.409602403640747e-06, 7.748603820800781e-06, 8.087605237960815e-06, 8.42660665512085e-06, 8.765608072280884e-06, 9.104609489440918e-06, 9.443610906600952e-06, 9.782612323760986e-06, 1.012161374092102e-05, 1.0460615158081055e-05, 1.0799616575241089e-05, 1.1138617992401123e-05, 1.1477619409561157e-05, 1.1816620826721191e-05, 1.2155622243881226e-05, 1.249462366104126e-05, 1.2833625078201294e-05, 1.3172626495361328e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 8.0, 5.0, 6.0, 4.0, 10.0, 14.0, 24.0, 25.0, 31.0, 42.0, 85.0, 130.0, 201.0, 378.0, 741.0, 1581.0, 4577.0, 18520.0, 137943.0, 783431.0, 81452.0, 12993.0, 3561.0, 1303.0, 635.0, 305.0, 192.0, 111.0, 77.0, 44.0, 26.0, 24.0, 19.0, 15.0, 9.0, 5.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.0765380859375, -0.07431221008300781, -0.07208633422851562, -0.06986045837402344, -0.06763458251953125, -0.06540870666503906, -0.06318283081054688, -0.06095695495605469, -0.0587310791015625, -0.05650520324707031, -0.054279327392578125, -0.05205345153808594, -0.04982757568359375, -0.04760169982910156, -0.045375823974609375, -0.04314994812011719, -0.040924072265625, -0.03869819641113281, -0.036472320556640625, -0.03424644470214844, -0.03202056884765625, -0.029794692993164062, -0.027568817138671875, -0.025342941284179688, -0.0231170654296875, -0.020891189575195312, -0.018665313720703125, -0.016439437866210938, -0.01421356201171875, -0.011987686157226562, -0.009761810302734375, -0.0075359344482421875, -0.00531005859375, -0.0030841827392578125, -0.000858306884765625, 0.0013675689697265625, 0.00359344482421875, 0.0058193206787109375, 0.008045196533203125, 0.010271072387695312, 0.0124969482421875, 0.014722824096679688, 0.016948699951171875, 0.019174575805664062, 0.02140045166015625, 0.023626327514648438, 0.025852203369140625, 0.028078079223632812, 0.030303955078125, 0.03252983093261719, 0.034755706787109375, 0.03698158264160156, 0.03920745849609375, 0.04143333435058594, 0.043659210205078125, 0.04588508605957031, 0.0481109619140625, 0.05033683776855469, 0.052562713623046875, 0.05478858947753906, 0.05701446533203125, 0.05924034118652344, 0.061466217041015625, 0.06369209289550781, 0.06591796875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 7.0, 8.0, 16.0, 26.0, 31.0, 27.0, 53.0, 84.0, 126.0, 180.0, 144.0, 85.0, 63.0, 49.0, 22.0, 22.0, 9.0, 9.0, 6.0, 7.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.09649658203125, -0.09412670135498047, -0.09175682067871094, -0.0893869400024414, -0.08701705932617188, -0.08464717864990234, -0.08227729797363281, -0.07990741729736328, -0.07753753662109375, -0.07516765594482422, -0.07279777526855469, -0.07042789459228516, -0.06805801391601562, -0.0656881332397461, -0.06331825256347656, -0.06094837188720703, -0.0585784912109375, -0.05620861053466797, -0.05383872985839844, -0.051468849182128906, -0.049098968505859375, -0.046729087829589844, -0.04435920715332031, -0.04198932647705078, -0.03961944580078125, -0.03724956512451172, -0.03487968444824219, -0.032509803771972656, -0.030139923095703125, -0.027770042419433594, -0.025400161743164062, -0.02303028106689453, -0.020660400390625, -0.01829051971435547, -0.015920639038085938, -0.013550758361816406, -0.011180877685546875, -0.008810997009277344, -0.0064411163330078125, -0.004071235656738281, -0.00170135498046875, 0.0006685256958007812, 0.0030384063720703125, 0.005408287048339844, 0.007778167724609375, 0.010148048400878906, 0.012517929077148438, 0.014887809753417969, 0.0172576904296875, 0.01962757110595703, 0.021997451782226562, 0.024367332458496094, 0.026737213134765625, 0.029107093811035156, 0.03147697448730469, 0.03384685516357422, 0.03621673583984375, 0.03858661651611328, 0.04095649719238281, 0.043326377868652344, 0.045696258544921875, 0.048066139221191406, 0.05043601989746094, 0.05280590057373047, 0.05517578125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 7.0, 15.0, 53.0, 199.0, 403.0, 229.0, 67.0, 20.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1133036613464355, -1.0641229152679443, -1.0149421691894531, -0.9657613635063171, -0.9165806174278259, -0.8673998117446899, -0.8182190656661987, -0.7690383195877075, -0.7198575735092163, -0.6706768274307251, -0.6214960217475891, -0.5723152756690979, -0.5231345295906067, -0.4739537537097931, -0.4247729778289795, -0.3755922317504883, -0.3264114260673523, -0.2772306501865387, -0.22804990410804749, -0.1788691282272339, -0.12968836724758148, -0.08050760626792908, -0.03132683038711548, 0.017853915691375732, 0.06703469157218933, 0.11621545255184174, 0.16539621353149414, 0.21457698941230774, 0.26375776529312134, 0.31293851137161255, 0.36211928725242615, 0.41130003333091736, 0.46048080921173096, 0.5096615552902222, 0.5588423609733582, 0.6080231070518494, 0.6572038531303406, 0.7063846588134766, 0.7555654048919678, 0.804746150970459, 0.8539268970489502, 0.9031076431274414, 0.9522884488105774, 1.0014691352844238, 1.0506500005722046, 1.0998307466506958, 1.149011492729187, 1.1981922388076782, 1.247373104095459, 1.2965538501739502, 1.3457345962524414, 1.3949153423309326, 1.4440962076187134, 1.4932769536972046, 1.5424576997756958, 1.591638445854187, 1.6408191919326782, 1.6899999380111694, 1.7391806840896606, 1.7883615493774414, 1.8375422954559326, 1.8867230415344238, 1.935903787612915, 1.9850845336914062, 2.0342652797698975]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 2.0, 6.0, 4.0, 7.0, 7.0, 20.0, 21.0, 20.0, 26.0, 20.0, 29.0, 34.0, 45.0, 45.0, 48.0, 42.0, 50.0, 49.0, 63.0, 61.0, 51.0, 45.0, 49.0, 35.0, 36.0, 30.0, 27.0, 23.0, 15.0, 13.0, 17.0, 12.0, 4.0, 9.0, 9.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0], "bins": [-1.693314552307129, -1.6472734212875366, -1.6012322902679443, -1.5551912784576416, -1.5091501474380493, -1.463109016418457, -1.4170678853988647, -1.3710267543792725, -1.3249857425689697, -1.2789446115493774, -1.2329034805297852, -1.1868624687194824, -1.1408213376998901, -1.0947802066802979, -1.0487390756607056, -1.0026979446411133, -0.9566568732261658, -0.9106157422065735, -0.864574670791626, -0.8185335397720337, -0.7724924683570862, -0.7264513373374939, -0.6804102659225464, -0.6343691349029541, -0.5883280038833618, -0.5422868728637695, -0.496245801448822, -0.45020467042922974, -0.4041635990142822, -0.35812246799468994, -0.31208136677742004, -0.26604026556015015, -0.21999919414520264, -0.17395809292793274, -0.12791699171066284, -0.08187587559223175, -0.03583477437496185, 0.010206326842308044, 0.056247442960739136, 0.10228854417800903, 0.14832964539527893, 0.19437074661254883, 0.24041184782981873, 0.2864529490470886, 0.3324940800666809, 0.3785351514816284, 0.4245762825012207, 0.4706173837184906, 0.5166584849357605, 0.5626996159553528, 0.6087406873703003, 0.6547818183898926, 0.7008228898048401, 0.7468640208244324, 0.7929050922393799, 0.8389462232589722, 0.8849873542785645, 0.9310284852981567, 0.9770695567131042, 1.0231106281280518, 1.069151759147644, 1.1151928901672363, 1.1612340211868286, 1.207275152206421, 1.2533161640167236]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 8.0, 4.0, 12.0, 3.0, 7.0, 13.0, 26.0, 43.0, 34.0, 99.0, 175.0, 405.0, 1386.0, 9916.0, 3658255.0, 514460.0, 7524.0, 1116.0, 353.0, 177.0, 102.0, 63.0, 24.0, 29.0, 15.0, 15.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2286376953125, -0.22124671936035156, -0.21385574340820312, -0.2064647674560547, -0.19907379150390625, -0.1916828155517578, -0.18429183959960938, -0.17690086364746094, -0.1695098876953125, -0.16211891174316406, -0.15472793579101562, -0.1473369598388672, -0.13994598388671875, -0.1325550079345703, -0.12516403198242188, -0.11777305603027344, -0.110382080078125, -0.10299110412597656, -0.09560012817382812, -0.08820915222167969, -0.08081817626953125, -0.07342720031738281, -0.06603622436523438, -0.05864524841308594, -0.0512542724609375, -0.04386329650878906, -0.036472320556640625, -0.029081344604492188, -0.02169036865234375, -0.014299392700195312, -0.006908416748046875, 0.0004825592041015625, 0.00787353515625, 0.015264511108398438, 0.022655487060546875, 0.030046463012695312, 0.03743743896484375, 0.04482841491699219, 0.052219390869140625, 0.05961036682128906, 0.0670013427734375, 0.07439231872558594, 0.08178329467773438, 0.08917427062988281, 0.09656524658203125, 0.10395622253417969, 0.11134719848632812, 0.11873817443847656, 0.126129150390625, 0.13352012634277344, 0.14091110229492188, 0.1483020782470703, 0.15569305419921875, 0.1630840301513672, 0.17047500610351562, 0.17786598205566406, 0.1852569580078125, 0.19264793395996094, 0.20003890991210938, 0.2074298858642578, 0.21482086181640625, 0.2222118377685547, 0.22960281372070312, 0.23699378967285156, 0.244384765625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 1.0, 8.0, 7.0, 9.0, 11.0, 16.0, 36.0, 107.0, 190.0, 273.0, 189.0, 61.0, 36.0, 15.0, 12.0, 6.0, 10.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.128662109375, -0.12412071228027344, -0.11957931518554688, -0.11503791809082031, -0.11049652099609375, -0.10595512390136719, -0.10141372680664062, -0.09687232971191406, -0.0923309326171875, -0.08778953552246094, -0.08324813842773438, -0.07870674133300781, -0.07416534423828125, -0.06962394714355469, -0.06508255004882812, -0.06054115295410156, -0.055999755859375, -0.05145835876464844, -0.046916961669921875, -0.04237556457519531, -0.03783416748046875, -0.03329277038574219, -0.028751373291015625, -0.024209976196289062, -0.0196685791015625, -0.015127182006835938, -0.010585784912109375, -0.0060443878173828125, -0.00150299072265625, 0.0030384063720703125, 0.007579803466796875, 0.012121200561523438, 0.01666259765625, 0.021203994750976562, 0.025745391845703125, 0.030286788940429688, 0.03482818603515625, 0.03936958312988281, 0.043910980224609375, 0.04845237731933594, 0.0529937744140625, 0.05753517150878906, 0.062076568603515625, 0.06661796569824219, 0.07115936279296875, 0.07570075988769531, 0.08024215698242188, 0.08478355407714844, 0.089324951171875, 0.09386634826660156, 0.09840774536132812, 0.10294914245605469, 0.10749053955078125, 0.11203193664550781, 0.11657333374023438, 0.12111473083496094, 0.1256561279296875, 0.13019752502441406, 0.13473892211914062, 0.1392803192138672, 0.14382171630859375, 0.1483631134033203, 0.15290451049804688, 0.15744590759277344, 0.1619873046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 9.0, 44.0, 70.0, 264.0, 1790.0, 32927.0, 4076474.0, 79475.0, 2649.0, 389.0, 105.0, 41.0, 14.0, 10.0, 6.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29638671875, -0.2882881164550781, -0.28018951416015625, -0.2720909118652344, -0.2639923095703125, -0.2558937072753906, -0.24779510498046875, -0.23969650268554688, -0.231597900390625, -0.22349929809570312, -0.21540069580078125, -0.20730209350585938, -0.1992034912109375, -0.19110488891601562, -0.18300628662109375, -0.17490768432617188, -0.16680908203125, -0.15871047973632812, -0.15061187744140625, -0.14251327514648438, -0.1344146728515625, -0.12631607055664062, -0.11821746826171875, -0.11011886596679688, -0.102020263671875, -0.09392166137695312, -0.08582305908203125, -0.07772445678710938, -0.0696258544921875, -0.061527252197265625, -0.05342864990234375, -0.045330047607421875, -0.0372314453125, -0.029132843017578125, -0.02103424072265625, -0.012935638427734375, -0.0048370361328125, 0.003261566162109375, 0.01136016845703125, 0.019458770751953125, 0.027557373046875, 0.035655975341796875, 0.04375457763671875, 0.051853179931640625, 0.0599517822265625, 0.06805038452148438, 0.07614898681640625, 0.08424758911132812, 0.09234619140625, 0.10044479370117188, 0.10854339599609375, 0.11664199829101562, 0.1247406005859375, 0.13283920288085938, 0.14093780517578125, 0.14903640747070312, 0.157135009765625, 0.16523361206054688, 0.17333221435546875, 0.18143081665039062, 0.1895294189453125, 0.19762802124023438, 0.20572662353515625, 0.21382522583007812, 0.221923828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 17.0, 25.0, 44.0, 113.0, 335.0, 2317.0, 807.0, 254.0, 89.0, 37.0, 23.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0645751953125, -0.062073707580566406, -0.05957221984863281, -0.05707073211669922, -0.054569244384765625, -0.05206775665283203, -0.04956626892089844, -0.047064781188964844, -0.04456329345703125, -0.042061805725097656, -0.03956031799316406, -0.03705883026123047, -0.034557342529296875, -0.03205585479736328, -0.029554367065429688, -0.027052879333496094, -0.0245513916015625, -0.022049903869628906, -0.019548416137695312, -0.01704692840576172, -0.014545440673828125, -0.012043952941894531, -0.009542465209960938, -0.007040977478027344, -0.00453948974609375, -0.0020380020141601562, 0.0004634857177734375, 0.0029649734497070312, 0.005466461181640625, 0.007967948913574219, 0.010469436645507812, 0.012970924377441406, 0.015472412109375, 0.017973899841308594, 0.020475387573242188, 0.02297687530517578, 0.025478363037109375, 0.02797985076904297, 0.030481338500976562, 0.032982826232910156, 0.03548431396484375, 0.037985801696777344, 0.04048728942871094, 0.04298877716064453, 0.045490264892578125, 0.04799175262451172, 0.05049324035644531, 0.052994728088378906, 0.0554962158203125, 0.057997703552246094, 0.06049919128417969, 0.06300067901611328, 0.06550216674804688, 0.06800365447998047, 0.07050514221191406, 0.07300662994384766, 0.07550811767578125, 0.07800960540771484, 0.08051109313964844, 0.08301258087158203, 0.08551406860351562, 0.08801555633544922, 0.09051704406738281, 0.0930185317993164, 0.09552001953125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 5.0, 27.0, 85.0, 246.0, 412.0, 172.0, 43.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3954436182975769, -0.38095805048942566, -0.3664724826812744, -0.35198691487312317, -0.3375013470649719, -0.3230157792568207, -0.30853021144866943, -0.2940446734428406, -0.27955907583236694, -0.2650735080242157, -0.25058794021606445, -0.2361023724079132, -0.22161680459976196, -0.20713123679161072, -0.19264568388462067, -0.17816011607646942, -0.16367456316947937, -0.14918899536132812, -0.13470342755317688, -0.12021786719560623, -0.10573229938745499, -0.09124673157930374, -0.0767611712217331, -0.06227560341358185, -0.0477900356054306, -0.03330446779727936, -0.01881890371441841, -0.004333339631557465, 0.01015222817659378, 0.024637795984745026, 0.039123356342315674, 0.05360892415046692, 0.06809449195861816, 0.08258005976676941, 0.09706562757492065, 0.1115511879324913, 0.12603676319122314, 0.1405223309993744, 0.15500788390636444, 0.16949345171451569, 0.18397901952266693, 0.19846458733081818, 0.21295015513896942, 0.22743570804595947, 0.24192127585411072, 0.25640684366226196, 0.2708924114704132, 0.28537797927856445, 0.2998635470867157, 0.31434911489486694, 0.3288346827030182, 0.34332025051116943, 0.3578058183193207, 0.3722913861274719, 0.3867769241333008, 0.4012625217437744, 0.41574805974960327, 0.4302336275577545, 0.44471919536590576, 0.459204763174057, 0.47369033098220825, 0.4881758987903595, 0.5026614665985107, 0.5171470046043396, 0.5316326022148132]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 9.0, 11.0, 15.0, 18.0, 27.0, 30.0, 42.0, 49.0, 52.0, 52.0, 68.0, 58.0, 65.0, 73.0, 65.0, 65.0, 56.0, 39.0, 37.0, 33.0, 34.0, 21.0, 22.0, 17.0, 14.0, 7.0, 9.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1941661238670349, -0.18874065577983856, -0.1833151876926422, -0.17788971960544586, -0.1724642515182495, -0.16703878343105316, -0.1616133153438568, -0.15618786215782166, -0.1507623791694641, -0.14533691108226776, -0.1399114429950714, -0.13448597490787506, -0.1290605068206787, -0.12363503873348236, -0.11820957809686661, -0.11278411000967026, -0.1073586493730545, -0.10193318128585815, -0.0965077131986618, -0.09108224511146545, -0.0856567770242691, -0.08023130893707275, -0.074805848300457, -0.06938038021326065, -0.0639549121260643, -0.05852944403886795, -0.0531039759516716, -0.04767851158976555, -0.0422530435025692, -0.03682757541537285, -0.0314021110534668, -0.025976642966270447, -0.020551174879074097, -0.015125707723200321, -0.009700240567326546, -0.004274774342775345, 0.0011506937444210052, 0.006576161831617355, 0.012001626193523407, 0.017427094280719757, 0.022852562367916107, 0.028278030455112457, 0.03370349854230881, 0.03912896290421486, 0.04455443099141121, 0.04997989907860756, 0.05540536344051361, 0.06083083152770996, 0.06625629961490631, 0.07168176770210266, 0.07710723578929901, 0.08253270387649536, 0.08795817196369171, 0.09338364005088806, 0.09880910068750381, 0.10423456877470016, 0.10966003686189651, 0.11508550494909286, 0.12051097303628922, 0.12593643367290497, 0.13136190176010132, 0.13678736984729767, 0.14221283793449402, 0.14763830602169037, 0.15306377410888672]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 5.0, 8.0, 18.0, 18.0, 26.0, 39.0, 51.0, 58.0, 102.0, 124.0, 222.0, 319.0, 492.0, 866.0, 1784.0, 3880.0, 10240.0, 36888.0, 224650.0, 637680.0, 98311.0, 19938.0, 6523.0, 2866.0, 1402.0, 751.0, 404.0, 244.0, 201.0, 130.0, 90.0, 50.0, 45.0, 34.0, 27.0, 8.0, 15.0, 12.0, 10.0, 3.0, 2.0, 4.0, 4.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.1422119140625, -0.13829326629638672, -0.13437461853027344, -0.13045597076416016, -0.12653732299804688, -0.1226186752319336, -0.11870002746582031, -0.11478137969970703, -0.11086273193359375, -0.10694408416748047, -0.10302543640136719, -0.0991067886352539, -0.09518814086914062, -0.09126949310302734, -0.08735084533691406, -0.08343219757080078, -0.0795135498046875, -0.07559490203857422, -0.07167625427246094, -0.06775760650634766, -0.06383895874023438, -0.059920310974121094, -0.05600166320800781, -0.05208301544189453, -0.04816436767578125, -0.04424571990966797, -0.04032707214355469, -0.036408424377441406, -0.032489776611328125, -0.028571128845214844, -0.024652481079101562, -0.02073383331298828, -0.016815185546875, -0.012896537780761719, -0.008977890014648438, -0.005059242248535156, -0.001140594482421875, 0.0027780532836914062, 0.0066967010498046875, 0.010615348815917969, 0.01453399658203125, 0.01845264434814453, 0.022371292114257812, 0.026289939880371094, 0.030208587646484375, 0.034127235412597656, 0.03804588317871094, 0.04196453094482422, 0.0458831787109375, 0.04980182647705078, 0.05372047424316406, 0.057639122009277344, 0.061557769775390625, 0.0654764175415039, 0.06939506530761719, 0.07331371307373047, 0.07723236083984375, 0.08115100860595703, 0.08506965637207031, 0.0889883041381836, 0.09290695190429688, 0.09682559967041016, 0.10074424743652344, 0.10466289520263672, 0.10858154296875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 7.0, 10.0, 6.0, 11.0, 17.0, 27.0, 109.0, 182.0, 269.0, 189.0, 82.0, 33.0, 15.0, 11.0, 5.0, 12.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1287841796875, -0.12425041198730469, -0.11971664428710938, -0.11518287658691406, -0.11064910888671875, -0.10611534118652344, -0.10158157348632812, -0.09704780578613281, -0.0925140380859375, -0.08798027038574219, -0.08344650268554688, -0.07891273498535156, -0.07437896728515625, -0.06984519958496094, -0.06531143188476562, -0.06077766418457031, -0.056243896484375, -0.05171012878417969, -0.047176361083984375, -0.04264259338378906, -0.03810882568359375, -0.03357505798339844, -0.029041290283203125, -0.024507522583007812, -0.0199737548828125, -0.015439987182617188, -0.010906219482421875, -0.0063724517822265625, -0.00183868408203125, 0.0026950836181640625, 0.007228851318359375, 0.011762619018554688, 0.01629638671875, 0.020830154418945312, 0.025363922119140625, 0.029897689819335938, 0.03443145751953125, 0.03896522521972656, 0.043498992919921875, 0.04803276062011719, 0.0525665283203125, 0.05710029602050781, 0.061634063720703125, 0.06616783142089844, 0.07070159912109375, 0.07523536682128906, 0.07976913452148438, 0.08430290222167969, 0.088836669921875, 0.09337043762207031, 0.09790420532226562, 0.10243797302246094, 0.10697174072265625, 0.11150550842285156, 0.11603927612304688, 0.12057304382324219, 0.1251068115234375, 0.1296405792236328, 0.13417434692382812, 0.13870811462402344, 0.14324188232421875, 0.14777565002441406, 0.15230941772460938, 0.1568431854248047, 0.161376953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 5.0, 14.0, 10.0, 23.0, 20.0, 18.0, 32.0, 36.0, 44.0, 53.0, 71.0, 79.0, 89.0, 140.0, 192.0, 322.0, 566.0, 1243.0, 4248.0, 71258.0, 908901.0, 54485.0, 3846.0, 1163.0, 530.0, 298.0, 189.0, 122.0, 95.0, 95.0, 71.0, 53.0, 54.0, 30.0, 27.0, 31.0, 18.0, 16.0, 12.0, 12.0, 9.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.2607421875, -0.25295066833496094, -0.24515914916992188, -0.2373676300048828, -0.22957611083984375, -0.2217845916748047, -0.21399307250976562, -0.20620155334472656, -0.1984100341796875, -0.19061851501464844, -0.18282699584960938, -0.1750354766845703, -0.16724395751953125, -0.1594524383544922, -0.15166091918945312, -0.14386940002441406, -0.136077880859375, -0.12828636169433594, -0.12049484252929688, -0.11270332336425781, -0.10491180419921875, -0.09712028503417969, -0.08932876586914062, -0.08153724670410156, -0.0737457275390625, -0.06595420837402344, -0.058162689208984375, -0.05037117004394531, -0.04257965087890625, -0.03478813171386719, -0.026996612548828125, -0.019205093383789062, -0.01141357421875, -0.0036220550537109375, 0.004169464111328125, 0.011960983276367188, 0.01975250244140625, 0.027544021606445312, 0.035335540771484375, 0.04312705993652344, 0.0509185791015625, 0.05871009826660156, 0.06650161743164062, 0.07429313659667969, 0.08208465576171875, 0.08987617492675781, 0.09766769409179688, 0.10545921325683594, 0.113250732421875, 0.12104225158691406, 0.12883377075195312, 0.1366252899169922, 0.14441680908203125, 0.1522083282470703, 0.15999984741210938, 0.16779136657714844, 0.1755828857421875, 0.18337440490722656, 0.19116592407226562, 0.1989574432373047, 0.20674896240234375, 0.2145404815673828, 0.22233200073242188, 0.23012351989746094, 0.2379150390625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 7.0, 7.0, 7.0, 8.0, 8.0, 18.0, 15.0, 18.0, 11.0, 30.0, 22.0, 24.0, 28.0, 31.0, 37.0, 44.0, 35.0, 42.0, 39.0, 34.0, 44.0, 35.0, 45.0, 32.0, 36.0, 39.0, 38.0, 42.0, 24.0, 19.0, 24.0, 22.0, 29.0, 18.0, 15.0, 12.0, 11.0, 10.0, 9.0, 13.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.217529296875, -0.2109394073486328, -0.20434951782226562, -0.19775962829589844, -0.19116973876953125, -0.18457984924316406, -0.17798995971679688, -0.1714000701904297, -0.1648101806640625, -0.1582202911376953, -0.15163040161132812, -0.14504051208496094, -0.13845062255859375, -0.13186073303222656, -0.12527084350585938, -0.11868095397949219, -0.112091064453125, -0.10550117492675781, -0.09891128540039062, -0.09232139587402344, -0.08573150634765625, -0.07914161682128906, -0.07255172729492188, -0.06596183776855469, -0.0593719482421875, -0.05278205871582031, -0.046192169189453125, -0.03960227966308594, -0.03301239013671875, -0.026422500610351562, -0.019832611083984375, -0.013242721557617188, -0.00665283203125, -6.29425048828125e-05, 0.006526947021484375, 0.013116836547851562, 0.01970672607421875, 0.026296615600585938, 0.032886505126953125, 0.03947639465332031, 0.0460662841796875, 0.05265617370605469, 0.059246063232421875, 0.06583595275878906, 0.07242584228515625, 0.07901573181152344, 0.08560562133789062, 0.09219551086425781, 0.098785400390625, 0.10537528991699219, 0.11196517944335938, 0.11855506896972656, 0.12514495849609375, 0.13173484802246094, 0.13832473754882812, 0.1449146270751953, 0.1515045166015625, 0.1580944061279297, 0.16468429565429688, 0.17127418518066406, 0.17786407470703125, 0.18445396423339844, 0.19104385375976562, 0.1976337432861328, 0.2042236328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 18.0, 14.0, 17.0, 27.0, 59.0, 81.0, 115.0, 177.0, 327.0, 626.0, 1409.0, 3867.0, 12870.0, 64822.0, 675488.0, 246966.0, 29757.0, 7298.0, 2461.0, 998.0, 468.0, 257.0, 141.0, 91.0, 55.0, 31.0, 34.0, 19.0, 9.0, 7.0, 9.0, 5.0, 6.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.05230712890625, -0.050711631774902344, -0.04911613464355469, -0.04752063751220703, -0.045925140380859375, -0.04432964324951172, -0.04273414611816406, -0.041138648986816406, -0.03954315185546875, -0.037947654724121094, -0.03635215759277344, -0.03475666046142578, -0.033161163330078125, -0.03156566619873047, -0.029970169067382812, -0.028374671936035156, -0.0267791748046875, -0.025183677673339844, -0.023588180541992188, -0.02199268341064453, -0.020397186279296875, -0.01880168914794922, -0.017206192016601562, -0.015610694885253906, -0.01401519775390625, -0.012419700622558594, -0.010824203491210938, -0.009228706359863281, -0.007633209228515625, -0.006037712097167969, -0.0044422149658203125, -0.0028467178344726562, -0.001251220703125, 0.00034427642822265625, 0.0019397735595703125, 0.0035352706909179688, 0.005130767822265625, 0.006726264953613281, 0.008321762084960938, 0.009917259216308594, 0.01151275634765625, 0.013108253479003906, 0.014703750610351562, 0.01629924774169922, 0.017894744873046875, 0.01949024200439453, 0.021085739135742188, 0.022681236267089844, 0.0242767333984375, 0.025872230529785156, 0.027467727661132812, 0.02906322479248047, 0.030658721923828125, 0.03225421905517578, 0.03384971618652344, 0.035445213317871094, 0.03704071044921875, 0.038636207580566406, 0.04023170471191406, 0.04182720184326172, 0.043422698974609375, 0.04501819610595703, 0.04661369323730469, 0.048209190368652344, 0.0498046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 9.0, 9.0, 18.0, 22.0, 38.0, 92.0, 141.0, 214.0, 195.0, 113.0, 56.0, 31.0, 14.0, 17.0, 11.0, 3.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8835067749023438e-05, -1.8259510397911072e-05, -1.7683953046798706e-05, -1.710839569568634e-05, -1.6532838344573975e-05, -1.595728099346161e-05, -1.5381723642349243e-05, -1.4806166291236877e-05, -1.4230608940124512e-05, -1.3655051589012146e-05, -1.307949423789978e-05, -1.2503936886787415e-05, -1.1928379535675049e-05, -1.1352822184562683e-05, -1.0777264833450317e-05, -1.0201707482337952e-05, -9.626150131225586e-06, -9.05059278011322e-06, -8.475035429000854e-06, -7.899478077888489e-06, -7.323920726776123e-06, -6.748363375663757e-06, -6.172806024551392e-06, -5.597248673439026e-06, -5.02169132232666e-06, -4.4461339712142944e-06, -3.870576620101929e-06, -3.295019268989563e-06, -2.7194619178771973e-06, -2.1439045667648315e-06, -1.5683472156524658e-06, -9.927898645401e-07, -4.172325134277344e-07, 1.5832483768463135e-07, 7.338821887969971e-07, 1.3094395399093628e-06, 1.8849968910217285e-06, 2.4605542421340942e-06, 3.03611159324646e-06, 3.6116689443588257e-06, 4.187226295471191e-06, 4.762783646583557e-06, 5.338340997695923e-06, 5.9138983488082886e-06, 6.489455699920654e-06, 7.06501305103302e-06, 7.640570402145386e-06, 8.216127753257751e-06, 8.791685104370117e-06, 9.367242455482483e-06, 9.942799806594849e-06, 1.0518357157707214e-05, 1.109391450881958e-05, 1.1669471859931946e-05, 1.2245029211044312e-05, 1.2820586562156677e-05, 1.3396143913269043e-05, 1.3971701264381409e-05, 1.4547258615493774e-05, 1.512281596660614e-05, 1.5698373317718506e-05, 1.627393066883087e-05, 1.6849488019943237e-05, 1.7425045371055603e-05, 1.800060272216797e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 4.0, 4.0, 4.0, 8.0, 17.0, 26.0, 43.0, 61.0, 95.0, 201.0, 398.0, 1064.0, 3545.0, 21744.0, 551554.0, 444494.0, 19856.0, 3569.0, 1001.0, 412.0, 187.0, 101.0, 63.0, 31.0, 30.0, 15.0, 10.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0921630859375, -0.08945083618164062, -0.08673858642578125, -0.08402633666992188, -0.0813140869140625, -0.07860183715820312, -0.07588958740234375, -0.07317733764648438, -0.070465087890625, -0.06775283813476562, -0.06504058837890625, -0.062328338623046875, -0.0596160888671875, -0.056903839111328125, -0.05419158935546875, -0.051479339599609375, -0.04876708984375, -0.046054840087890625, -0.04334259033203125, -0.040630340576171875, -0.0379180908203125, -0.035205841064453125, -0.03249359130859375, -0.029781341552734375, -0.027069091796875, -0.024356842041015625, -0.02164459228515625, -0.018932342529296875, -0.0162200927734375, -0.013507843017578125, -0.01079559326171875, -0.008083343505859375, -0.00537109375, -0.002658843994140625, 5.340576171875e-05, 0.002765655517578125, 0.0054779052734375, 0.008190155029296875, 0.01090240478515625, 0.013614654541015625, 0.016326904296875, 0.019039154052734375, 0.02175140380859375, 0.024463653564453125, 0.0271759033203125, 0.029888153076171875, 0.03260040283203125, 0.035312652587890625, 0.03802490234375, 0.040737152099609375, 0.04344940185546875, 0.046161651611328125, 0.0488739013671875, 0.051586151123046875, 0.05429840087890625, 0.057010650634765625, 0.059722900390625, 0.062435150146484375, 0.06514739990234375, 0.06785964965820312, 0.0705718994140625, 0.07328414916992188, 0.07599639892578125, 0.07870864868164062, 0.0814208984375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 8.0, 10.0, 20.0, 21.0, 30.0, 49.0, 61.0, 92.0, 92.0, 95.0, 111.0, 97.0, 80.0, 58.0, 38.0, 28.0, 34.0, 17.0, 13.0, 8.0, 8.0, 9.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041748046875, -0.04001331329345703, -0.03827857971191406, -0.036543846130371094, -0.034809112548828125, -0.033074378967285156, -0.03133964538574219, -0.02960491180419922, -0.02787017822265625, -0.02613544464111328, -0.024400711059570312, -0.022665977478027344, -0.020931243896484375, -0.019196510314941406, -0.017461776733398438, -0.01572704315185547, -0.0139923095703125, -0.012257575988769531, -0.010522842407226562, -0.008788108825683594, -0.007053375244140625, -0.005318641662597656, -0.0035839080810546875, -0.0018491744995117188, -0.00011444091796875, 0.0016202926635742188, 0.0033550262451171875, 0.005089759826660156, 0.006824493408203125, 0.008559226989746094, 0.010293960571289062, 0.012028694152832031, 0.013763427734375, 0.015498161315917969, 0.017232894897460938, 0.018967628479003906, 0.020702362060546875, 0.022437095642089844, 0.024171829223632812, 0.02590656280517578, 0.02764129638671875, 0.02937602996826172, 0.031110763549804688, 0.032845497131347656, 0.034580230712890625, 0.036314964294433594, 0.03804969787597656, 0.03978443145751953, 0.0415191650390625, 0.04325389862060547, 0.04498863220214844, 0.046723365783691406, 0.048458099365234375, 0.050192832946777344, 0.05192756652832031, 0.05366230010986328, 0.05539703369140625, 0.05713176727294922, 0.05886650085449219, 0.060601234436035156, 0.062335968017578125, 0.0640707015991211, 0.06580543518066406, 0.06754016876220703, 0.06927490234375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 9.0, 32.0, 60.0, 141.0, 259.0, 264.0, 124.0, 57.0, 20.0, 10.0, 7.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8826207518577576, -0.8521865606307983, -0.8217523694038391, -0.7913181781768799, -0.7608839273452759, -0.7304497361183167, -0.7000155448913574, -0.6695813536643982, -0.639147162437439, -0.6087129712104797, -0.5782787799835205, -0.5478445291519165, -0.5174103379249573, -0.48697614669799805, -0.4565419554710388, -0.4261077642440796, -0.3956735134124756, -0.36523932218551636, -0.33480510115623474, -0.3043709099292755, -0.2739366888999939, -0.24350249767303467, -0.21306830644607544, -0.18263410031795502, -0.1521998941898346, -0.12176568806171417, -0.09133148938417435, -0.06089729070663452, -0.0304630845785141, -2.8878450393676758e-05, 0.030405312776565552, 0.060839518904685974, 0.09127366542816162, 0.12170787155628204, 0.15214207768440247, 0.1825762689113617, 0.21301047503948212, 0.24344468116760254, 0.27387887239456177, 0.304313063621521, 0.3347472846508026, 0.36518147587776184, 0.39561569690704346, 0.4260498881340027, 0.4564840793609619, 0.48691830039024353, 0.5173524618148804, 0.5477867126464844, 0.5782209038734436, 0.6086550951004028, 0.6390892863273621, 0.6695234775543213, 0.6999577283859253, 0.7303919196128845, 0.7608261108398438, 0.791260302066803, 0.8216944932937622, 0.8521286845207214, 0.8825628757476807, 0.9129971265792847, 0.9434313178062439, 0.9738655090332031, 1.0042996406555176, 1.0347338914871216, 1.0651681423187256]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 8.0, 3.0, 8.0, 9.0, 13.0, 13.0, 7.0, 17.0, 16.0, 19.0, 18.0, 25.0, 20.0, 27.0, 32.0, 38.0, 31.0, 60.0, 45.0, 42.0, 47.0, 40.0, 36.0, 40.0, 36.0, 36.0, 39.0, 27.0, 36.0, 23.0, 27.0, 26.0, 25.0, 23.0, 19.0, 13.0, 10.0, 9.0, 10.0, 7.0, 2.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.2642877101898193, -1.2248338460922241, -1.185379981994629, -1.1459261178970337, -1.1064722537994385, -1.0670185089111328, -1.0275646448135376, -0.9881107807159424, -0.9486569166183472, -0.909203052520752, -0.8697491884231567, -0.8302953839302063, -0.7908415198326111, -0.7513876557350159, -0.7119338512420654, -0.6724799871444702, -0.633026123046875, -0.5935722589492798, -0.5541183948516846, -0.5146645903587341, -0.4752107262611389, -0.4357568621635437, -0.3963030278682709, -0.35684919357299805, -0.31739532947540283, -0.2779414653778076, -0.2384876310825348, -0.19903378188610077, -0.15957993268966675, -0.12012608349323273, -0.0806722342967987, -0.04121840000152588, -0.0017644166946411133, 0.03768943250179291, 0.07714328169822693, 0.11659713089466095, 0.15605098009109497, 0.195504829287529, 0.234958678483963, 0.27441251277923584, 0.31386637687683105, 0.35332024097442627, 0.3927740752696991, 0.4322279095649719, 0.47168177366256714, 0.5111356377601624, 0.5505894422531128, 0.590043306350708, 0.6294971704483032, 0.6689510345458984, 0.7084048986434937, 0.7478587031364441, 0.7873125672340393, 0.8267664313316345, 0.866220235824585, 0.9056740999221802, 0.9451279640197754, 0.9845818281173706, 1.0240356922149658, 1.063489556312561, 1.1029434204101562, 1.142397165298462, 1.1818510293960571, 1.2213048934936523, 1.2607587575912476]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 1.0, 10.0, 11.0, 14.0, 6.0, 18.0, 32.0, 41.0, 105.0, 341.0, 4208.0, 4148399.0, 39851.0, 877.0, 174.0, 64.0, 37.0, 23.0, 21.0, 13.0, 8.0, 8.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.431884765625, -0.41782379150390625, -0.4037628173828125, -0.38970184326171875, -0.375640869140625, -0.36157989501953125, -0.3475189208984375, -0.33345794677734375, -0.31939697265625, -0.30533599853515625, -0.2912750244140625, -0.27721405029296875, -0.263153076171875, -0.24909210205078125, -0.2350311279296875, -0.22097015380859375, -0.2069091796875, -0.19284820556640625, -0.1787872314453125, -0.16472625732421875, -0.150665283203125, -0.13660430908203125, -0.1225433349609375, -0.10848236083984375, -0.09442138671875, -0.08036041259765625, -0.0662994384765625, -0.05223846435546875, -0.038177490234375, -0.02411651611328125, -0.0100555419921875, 0.00400543212890625, 0.01806640625, 0.03212738037109375, 0.0461883544921875, 0.06024932861328125, 0.074310302734375, 0.08837127685546875, 0.1024322509765625, 0.11649322509765625, 0.13055419921875, 0.14461517333984375, 0.1586761474609375, 0.17273712158203125, 0.186798095703125, 0.20085906982421875, 0.2149200439453125, 0.22898101806640625, 0.2430419921875, 0.25710296630859375, 0.2711639404296875, 0.28522491455078125, 0.299285888671875, 0.31334686279296875, 0.3274078369140625, 0.34146881103515625, 0.35552978515625, 0.36959075927734375, 0.3836517333984375, 0.39771270751953125, 0.411773681640625, 0.42583465576171875, 0.4398956298828125, 0.45395660400390625, 0.468017578125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 1.0, 1.0, 4.0, 5.0, 15.0, 11.0, 13.0, 30.0, 96.0, 187.0, 260.0, 201.0, 84.0, 30.0, 23.0, 11.0, 8.0, 10.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1290283203125, -0.12449836730957031, -0.11996841430664062, -0.11543846130371094, -0.11090850830078125, -0.10637855529785156, -0.10184860229492188, -0.09731864929199219, -0.0927886962890625, -0.08825874328613281, -0.08372879028320312, -0.07919883728027344, -0.07466888427734375, -0.07013893127441406, -0.06560897827148438, -0.06107902526855469, -0.056549072265625, -0.05201911926269531, -0.047489166259765625, -0.04295921325683594, -0.03842926025390625, -0.03389930725097656, -0.029369354248046875, -0.024839401245117188, -0.0203094482421875, -0.015779495239257812, -0.011249542236328125, -0.0067195892333984375, -0.00218963623046875, 0.0023403167724609375, 0.006870269775390625, 0.011400222778320312, 0.01593017578125, 0.020460128784179688, 0.024990081787109375, 0.029520034790039062, 0.03404998779296875, 0.03857994079589844, 0.043109893798828125, 0.04763984680175781, 0.0521697998046875, 0.05669975280761719, 0.061229705810546875, 0.06575965881347656, 0.07028961181640625, 0.07481956481933594, 0.07934951782226562, 0.08387947082519531, 0.088409423828125, 0.09293937683105469, 0.09746932983398438, 0.10199928283691406, 0.10652923583984375, 0.11105918884277344, 0.11558914184570312, 0.12011909484863281, 0.1246490478515625, 0.1291790008544922, 0.13370895385742188, 0.13823890686035156, 0.14276885986328125, 0.14729881286621094, 0.15182876586914062, 0.1563587188720703, 0.160888671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 10.0, 10.0, 18.0, 41.0, 63.0, 89.0, 203.0, 404.0, 895.0, 1931.0, 5915.0, 25661.0, 194190.0, 3628444.0, 291037.0, 33834.0, 7209.0, 2417.0, 947.0, 456.0, 221.0, 109.0, 57.0, 32.0, 24.0, 14.0, 10.0, 8.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.10223388671875, -0.09943866729736328, -0.09664344787597656, -0.09384822845458984, -0.09105300903320312, -0.0882577896118164, -0.08546257019042969, -0.08266735076904297, -0.07987213134765625, -0.07707691192626953, -0.07428169250488281, -0.0714864730834961, -0.06869125366210938, -0.06589603424072266, -0.06310081481933594, -0.06030559539794922, -0.0575103759765625, -0.05471515655517578, -0.05191993713378906, -0.049124717712402344, -0.046329498291015625, -0.043534278869628906, -0.04073905944824219, -0.03794384002685547, -0.03514862060546875, -0.03235340118408203, -0.029558181762695312, -0.026762962341308594, -0.023967742919921875, -0.021172523498535156, -0.018377304077148438, -0.015582084655761719, -0.012786865234375, -0.009991645812988281, -0.0071964263916015625, -0.004401206970214844, -0.001605987548828125, 0.0011892318725585938, 0.0039844512939453125, 0.006779670715332031, 0.00957489013671875, 0.012370109558105469, 0.015165328979492188, 0.017960548400878906, 0.020755767822265625, 0.023550987243652344, 0.026346206665039062, 0.02914142608642578, 0.0319366455078125, 0.03473186492919922, 0.03752708435058594, 0.040322303771972656, 0.043117523193359375, 0.045912742614746094, 0.04870796203613281, 0.05150318145751953, 0.05429840087890625, 0.05709362030029297, 0.05988883972167969, 0.0626840591430664, 0.06547927856445312, 0.06827449798583984, 0.07106971740722656, 0.07386493682861328, 0.07666015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 11.0, 9.0, 12.0, 20.0, 45.0, 66.0, 97.0, 121.0, 207.0, 362.0, 1589.0, 664.0, 309.0, 188.0, 119.0, 68.0, 58.0, 30.0, 30.0, 17.0, 15.0, 7.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.036468505859375, -0.035282135009765625, -0.03409576416015625, -0.032909393310546875, -0.0317230224609375, -0.030536651611328125, -0.02935028076171875, -0.028163909912109375, -0.0269775390625, -0.025791168212890625, -0.02460479736328125, -0.023418426513671875, -0.0222320556640625, -0.021045684814453125, -0.01985931396484375, -0.018672943115234375, -0.017486572265625, -0.016300201416015625, -0.01511383056640625, -0.013927459716796875, -0.0127410888671875, -0.011554718017578125, -0.01036834716796875, -0.009181976318359375, -0.00799560546875, -0.006809234619140625, -0.00562286376953125, -0.004436492919921875, -0.0032501220703125, -0.002063751220703125, -0.00087738037109375, 0.000308990478515625, 0.001495361328125, 0.002681732177734375, 0.00386810302734375, 0.005054473876953125, 0.0062408447265625, 0.007427215576171875, 0.00861358642578125, 0.009799957275390625, 0.010986328125, 0.012172698974609375, 0.01335906982421875, 0.014545440673828125, 0.0157318115234375, 0.016918182373046875, 0.01810455322265625, 0.019290924072265625, 0.020477294921875, 0.021663665771484375, 0.02285003662109375, 0.024036407470703125, 0.0252227783203125, 0.026409149169921875, 0.02759552001953125, 0.028781890869140625, 0.02996826171875, 0.031154632568359375, 0.03234100341796875, 0.033527374267578125, 0.0347137451171875, 0.035900115966796875, 0.03708648681640625, 0.038272857666015625, 0.039459228515625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 8.0, 76.0, 548.0, 339.0, 27.0, 8.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16194187104701996, -0.133729487657547, -0.10551711916923523, -0.07730473577976227, -0.049092359840869904, -0.02087998390197754, 0.007332399487495422, 0.03554476797580719, 0.06375715136528015, 0.09196952730417252, 0.12018190324306488, 0.14839428663253784, 0.1766066551208496, 0.20481903851032257, 0.23303142189979553, 0.2612437903881073, 0.28945618867874146, 0.3176685571670532, 0.3458809554576874, 0.37409332394599915, 0.4023056924343109, 0.43051809072494507, 0.45873045921325684, 0.4869428277015686, 0.5151551961898804, 0.5433675646781921, 0.5715799331665039, 0.5997923612594604, 0.6280047297477722, 0.656217098236084, 0.6844294667243958, 0.7126418352127075, 0.7408542037010193, 0.769066572189331, 0.7972789406776428, 0.8254913091659546, 0.8537037372589111, 0.8819161057472229, 0.9101284742355347, 0.9383408427238464, 0.9665532112121582, 0.99476557970047, 1.0229779481887817, 1.0511903762817383, 1.0794026851654053, 1.1076151132583618, 1.1358275413513184, 1.1640398502349854, 1.192252278327942, 1.2204647064208984, 1.2486770153045654, 1.276889443397522, 1.305101752281189, 1.3333141803741455, 1.3615264892578125, 1.389738917350769, 1.417951226234436, 1.4461636543273926, 1.4743759632110596, 1.5025883913040161, 1.530800700187683, 1.5590131282806396, 1.5872254371643066, 1.6154378652572632, 1.6436502933502197]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 4.0, 7.0, 8.0, 6.0, 14.0, 18.0, 18.0, 19.0, 23.0, 31.0, 29.0, 38.0, 23.0, 36.0, 42.0, 40.0, 46.0, 41.0, 46.0, 42.0, 40.0, 47.0, 29.0, 36.0, 34.0, 36.0, 37.0, 20.0, 30.0, 28.0, 18.0, 22.0, 19.0, 19.0, 7.0, 16.0, 9.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.11557602882385254, -0.11183465272188187, -0.1080932691693306, -0.10435189306735992, -0.10061050951480865, -0.09686913341283798, -0.09312775731086731, -0.08938637375831604, -0.08564499765634537, -0.0819036215543747, -0.07816223800182343, -0.07442086189985275, -0.07067948579788208, -0.06693810224533081, -0.06319672614336014, -0.05945534631609917, -0.055713966488838196, -0.051972586661577225, -0.048231206834316254, -0.04448983073234558, -0.04074845090508461, -0.03700707107782364, -0.033265694975852966, -0.029524315148591995, -0.025782935321331024, -0.022041555494070053, -0.01830017752945423, -0.014558798633515835, -0.010817419737577438, -0.007076039910316467, -0.0033346619457006454, 0.0004067160189151764, 0.0041480958461761475, 0.007889474742114544, 0.01163085363805294, 0.015372232533991337, 0.019113611429929733, 0.022854991257190704, 0.026596369221806526, 0.030337747186422348, 0.03407912701368332, 0.03782050684094429, 0.04156188666820526, 0.045303262770175934, 0.049044642597436905, 0.052786022424697876, 0.05652739852666855, 0.06026877835392952, 0.06401015818119049, 0.06775153428316116, 0.07149291783571243, 0.0752342939376831, 0.07897567749023438, 0.08271705359220505, 0.08645842969417572, 0.09019981324672699, 0.09394118934869766, 0.09768256545066833, 0.1014239490032196, 0.10516532510519028, 0.10890670120716095, 0.11264808475971222, 0.11638946086168289, 0.12013083696365356, 0.12387222051620483]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 4.0, 12.0, 16.0, 20.0, 30.0, 65.0, 103.0, 172.0, 308.0, 669.0, 1691.0, 5921.0, 44961.0, 880958.0, 100018.0, 9577.0, 2312.0, 885.0, 378.0, 169.0, 109.0, 54.0, 39.0, 25.0, 21.0, 11.0, 3.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1927490234375, -0.1855144500732422, -0.17827987670898438, -0.17104530334472656, -0.16381072998046875, -0.15657615661621094, -0.14934158325195312, -0.1421070098876953, -0.1348724365234375, -0.1276378631591797, -0.12040328979492188, -0.11316871643066406, -0.10593414306640625, -0.09869956970214844, -0.09146499633789062, -0.08423042297363281, -0.076995849609375, -0.06976127624511719, -0.06252670288085938, -0.05529212951660156, -0.04805755615234375, -0.04082298278808594, -0.033588409423828125, -0.026353836059570312, -0.0191192626953125, -0.011884689331054688, -0.004650115966796875, 0.0025844573974609375, 0.00981903076171875, 0.017053604125976562, 0.024288177490234375, 0.03152275085449219, 0.03875732421875, 0.04599189758300781, 0.053226470947265625, 0.06046104431152344, 0.06769561767578125, 0.07493019104003906, 0.08216476440429688, 0.08939933776855469, 0.0966339111328125, 0.10386848449707031, 0.11110305786132812, 0.11833763122558594, 0.12557220458984375, 0.13280677795410156, 0.14004135131835938, 0.1472759246826172, 0.154510498046875, 0.1617450714111328, 0.16897964477539062, 0.17621421813964844, 0.18344879150390625, 0.19068336486816406, 0.19791793823242188, 0.2051525115966797, 0.2123870849609375, 0.2196216583251953, 0.22685623168945312, 0.23409080505371094, 0.24132537841796875, 0.24855995178222656, 0.2557945251464844, 0.2630290985107422, 0.270263671875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 1.0, 2.0, 4.0, 4.0, 15.0, 9.0, 18.0, 29.0, 80.0, 194.0, 256.0, 201.0, 96.0, 27.0, 24.0, 12.0, 7.0, 8.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12841796875, -0.12391471862792969, -0.11941146850585938, -0.11490821838378906, -0.11040496826171875, -0.10590171813964844, -0.10139846801757812, -0.09689521789550781, -0.0923919677734375, -0.08788871765136719, -0.08338546752929688, -0.07888221740722656, -0.07437896728515625, -0.06987571716308594, -0.06537246704101562, -0.06086921691894531, -0.056365966796875, -0.05186271667480469, -0.047359466552734375, -0.04285621643066406, -0.03835296630859375, -0.03384971618652344, -0.029346466064453125, -0.024843215942382812, -0.0203399658203125, -0.015836715698242188, -0.011333465576171875, -0.0068302154541015625, -0.00232696533203125, 0.0021762847900390625, 0.006679534912109375, 0.011182785034179688, 0.01568603515625, 0.020189285278320312, 0.024692535400390625, 0.029195785522460938, 0.03369903564453125, 0.03820228576660156, 0.042705535888671875, 0.04720878601074219, 0.0517120361328125, 0.05621528625488281, 0.060718536376953125, 0.06522178649902344, 0.06972503662109375, 0.07422828674316406, 0.07873153686523438, 0.08323478698730469, 0.087738037109375, 0.09224128723144531, 0.09674453735351562, 0.10124778747558594, 0.10575103759765625, 0.11025428771972656, 0.11475753784179688, 0.11926078796386719, 0.1237640380859375, 0.1282672882080078, 0.13277053833007812, 0.13727378845214844, 0.14177703857421875, 0.14628028869628906, 0.15078353881835938, 0.1552867889404297, 0.1597900390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 9.0, 9.0, 3.0, 13.0, 24.0, 18.0, 28.0, 43.0, 39.0, 55.0, 92.0, 118.0, 176.0, 248.0, 380.0, 747.0, 1865.0, 8625.0, 120433.0, 827099.0, 78377.0, 6646.0, 1617.0, 693.0, 350.0, 227.0, 151.0, 120.0, 88.0, 65.0, 50.0, 31.0, 32.0, 21.0, 13.0, 14.0, 10.0, 14.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12237548828125, -0.11774539947509766, -0.11311531066894531, -0.10848522186279297, -0.10385513305664062, -0.09922504425048828, -0.09459495544433594, -0.0899648666381836, -0.08533477783203125, -0.0807046890258789, -0.07607460021972656, -0.07144451141357422, -0.06681442260742188, -0.06218433380126953, -0.05755424499511719, -0.052924156188964844, -0.0482940673828125, -0.043663978576660156, -0.03903388977050781, -0.03440380096435547, -0.029773712158203125, -0.02514362335205078, -0.020513534545898438, -0.015883445739746094, -0.01125335693359375, -0.006623268127441406, -0.0019931793212890625, 0.0026369094848632812, 0.007266998291015625, 0.011897087097167969, 0.016527175903320312, 0.021157264709472656, 0.025787353515625, 0.030417442321777344, 0.03504753112792969, 0.03967761993408203, 0.044307708740234375, 0.04893779754638672, 0.05356788635253906, 0.058197975158691406, 0.06282806396484375, 0.0674581527709961, 0.07208824157714844, 0.07671833038330078, 0.08134841918945312, 0.08597850799560547, 0.09060859680175781, 0.09523868560791016, 0.0998687744140625, 0.10449886322021484, 0.10912895202636719, 0.11375904083251953, 0.11838912963867188, 0.12301921844482422, 0.12764930725097656, 0.1322793960571289, 0.13690948486328125, 0.1415395736694336, 0.14616966247558594, 0.15079975128173828, 0.15542984008789062, 0.16005992889404297, 0.1646900177001953, 0.16932010650634766, 0.1739501953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 10.0, 4.0, 5.0, 11.0, 12.0, 12.0, 16.0, 17.0, 24.0, 19.0, 19.0, 31.0, 16.0, 28.0, 27.0, 32.0, 38.0, 41.0, 32.0, 34.0, 46.0, 33.0, 37.0, 32.0, 42.0, 38.0, 29.0, 41.0, 32.0, 33.0, 17.0, 27.0, 36.0, 16.0, 16.0, 12.0, 15.0, 8.0, 12.0, 13.0, 10.0, 9.0, 5.0, 3.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.2015380859375, -0.19568634033203125, -0.1898345947265625, -0.18398284912109375, -0.178131103515625, -0.17227935791015625, -0.1664276123046875, -0.16057586669921875, -0.15472412109375, -0.14887237548828125, -0.1430206298828125, -0.13716888427734375, -0.131317138671875, -0.12546539306640625, -0.1196136474609375, -0.11376190185546875, -0.10791015625, -0.10205841064453125, -0.0962066650390625, -0.09035491943359375, -0.084503173828125, -0.07865142822265625, -0.0727996826171875, -0.06694793701171875, -0.06109619140625, -0.05524444580078125, -0.0493927001953125, -0.04354095458984375, -0.037689208984375, -0.03183746337890625, -0.0259857177734375, -0.02013397216796875, -0.0142822265625, -0.00843048095703125, -0.0025787353515625, 0.00327301025390625, 0.009124755859375, 0.01497650146484375, 0.0208282470703125, 0.02667999267578125, 0.03253173828125, 0.03838348388671875, 0.0442352294921875, 0.05008697509765625, 0.055938720703125, 0.06179046630859375, 0.0676422119140625, 0.07349395751953125, 0.079345703125, 0.08519744873046875, 0.0910491943359375, 0.09690093994140625, 0.102752685546875, 0.10860443115234375, 0.1144561767578125, 0.12030792236328125, 0.12615966796875, 0.13201141357421875, 0.1378631591796875, 0.14371490478515625, 0.149566650390625, 0.15541839599609375, 0.1612701416015625, 0.16712188720703125, 0.1729736328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 4.0, 12.0, 11.0, 14.0, 22.0, 39.0, 62.0, 82.0, 150.0, 239.0, 417.0, 853.0, 2209.0, 6639.0, 27953.0, 178850.0, 769373.0, 46235.0, 10108.0, 2925.0, 1067.0, 550.0, 292.0, 164.0, 85.0, 58.0, 38.0, 31.0, 21.0, 18.0, 13.0, 3.0, 3.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05987548828125, -0.05817222595214844, -0.056468963623046875, -0.05476570129394531, -0.05306243896484375, -0.05135917663574219, -0.049655914306640625, -0.04795265197753906, -0.0462493896484375, -0.04454612731933594, -0.042842864990234375, -0.04113960266113281, -0.03943634033203125, -0.03773307800292969, -0.036029815673828125, -0.03432655334472656, -0.032623291015625, -0.030920028686523438, -0.029216766357421875, -0.027513504028320312, -0.02581024169921875, -0.024106979370117188, -0.022403717041015625, -0.020700454711914062, -0.0189971923828125, -0.017293930053710938, -0.015590667724609375, -0.013887405395507812, -0.01218414306640625, -0.010480880737304688, -0.008777618408203125, -0.0070743560791015625, -0.00537109375, -0.0036678314208984375, -0.001964569091796875, -0.0002613067626953125, 0.00144195556640625, 0.0031452178955078125, 0.004848480224609375, 0.0065517425537109375, 0.0082550048828125, 0.009958267211914062, 0.011661529541015625, 0.013364791870117188, 0.01506805419921875, 0.016771316528320312, 0.018474578857421875, 0.020177841186523438, 0.021881103515625, 0.023584365844726562, 0.025287628173828125, 0.026990890502929688, 0.02869415283203125, 0.030397415161132812, 0.032100677490234375, 0.03380393981933594, 0.0355072021484375, 0.03721046447753906, 0.038913726806640625, 0.04061698913574219, 0.04232025146484375, 0.04402351379394531, 0.045726776123046875, 0.04743003845214844, 0.04913330078125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 9.0, 4.0, 13.0, 5.0, 10.0, 22.0, 30.0, 57.0, 111.0, 152.0, 186.0, 140.0, 88.0, 55.0, 44.0, 11.0, 8.0, 12.0, 8.0, 11.0, 7.0, 4.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5974044799804688e-05, -1.556985080242157e-05, -1.5165656805038452e-05, -1.4761462807655334e-05, -1.4357268810272217e-05, -1.3953074812889099e-05, -1.3548880815505981e-05, -1.3144686818122864e-05, -1.2740492820739746e-05, -1.2336298823356628e-05, -1.193210482597351e-05, -1.1527910828590393e-05, -1.1123716831207275e-05, -1.0719522833824158e-05, -1.031532883644104e-05, -9.911134839057922e-06, -9.506940841674805e-06, -9.102746844291687e-06, -8.69855284690857e-06, -8.294358849525452e-06, -7.890164852142334e-06, -7.485970854759216e-06, -7.081776857376099e-06, -6.677582859992981e-06, -6.273388862609863e-06, -5.869194865226746e-06, -5.465000867843628e-06, -5.06080687046051e-06, -4.656612873077393e-06, -4.252418875694275e-06, -3.848224878311157e-06, -3.4440308809280396e-06, -3.039836883544922e-06, -2.635642886161804e-06, -2.2314488887786865e-06, -1.8272548913955688e-06, -1.4230608940124512e-06, -1.0188668966293335e-06, -6.146728992462158e-07, -2.1047890186309814e-07, 1.9371509552001953e-07, 5.979090929031372e-07, 1.0021030902862549e-06, 1.4062970876693726e-06, 1.8104910850524902e-06, 2.214685082435608e-06, 2.6188790798187256e-06, 3.0230730772018433e-06, 3.427267074584961e-06, 3.831461071968079e-06, 4.235655069351196e-06, 4.639849066734314e-06, 5.044043064117432e-06, 5.448237061500549e-06, 5.852431058883667e-06, 6.256625056266785e-06, 6.660819053649902e-06, 7.06501305103302e-06, 7.469207048416138e-06, 7.873401045799255e-06, 8.277595043182373e-06, 8.68178904056549e-06, 9.085983037948608e-06, 9.490177035331726e-06, 9.894371032714844e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 10.0, 10.0, 16.0, 23.0, 33.0, 54.0, 69.0, 90.0, 177.0, 313.0, 489.0, 1054.0, 2917.0, 10110.0, 52153.0, 836752.0, 117651.0, 18779.0, 4678.0, 1567.0, 705.0, 309.0, 209.0, 116.0, 74.0, 61.0, 46.0, 36.0, 19.0, 17.0, 7.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0665283203125, -0.064361572265625, -0.06219482421875, -0.060028076171875, -0.057861328125, -0.055694580078125, -0.05352783203125, -0.051361083984375, -0.0491943359375, -0.047027587890625, -0.04486083984375, -0.042694091796875, -0.04052734375, -0.038360595703125, -0.03619384765625, -0.034027099609375, -0.0318603515625, -0.029693603515625, -0.02752685546875, -0.025360107421875, -0.023193359375, -0.021026611328125, -0.01885986328125, -0.016693115234375, -0.0145263671875, -0.012359619140625, -0.01019287109375, -0.008026123046875, -0.005859375, -0.003692626953125, -0.00152587890625, 0.000640869140625, 0.0028076171875, 0.004974365234375, 0.00714111328125, 0.009307861328125, 0.011474609375, 0.013641357421875, 0.01580810546875, 0.017974853515625, 0.0201416015625, 0.022308349609375, 0.02447509765625, 0.026641845703125, 0.02880859375, 0.030975341796875, 0.03314208984375, 0.035308837890625, 0.0374755859375, 0.039642333984375, 0.04180908203125, 0.043975830078125, 0.046142578125, 0.048309326171875, 0.05047607421875, 0.052642822265625, 0.0548095703125, 0.056976318359375, 0.05914306640625, 0.061309814453125, 0.0634765625, 0.065643310546875, 0.06781005859375, 0.069976806640625, 0.0721435546875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 10.0, 11.0, 7.0, 8.0, 9.0, 15.0, 13.0, 28.0, 21.0, 29.0, 67.0, 155.0, 234.0, 150.0, 52.0, 30.0, 24.0, 15.0, 16.0, 17.0, 5.0, 14.0, 6.0, 11.0, 3.0, 10.0, 9.0, 5.0, 2.0, 6.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.055450439453125, -0.05356645584106445, -0.051682472229003906, -0.04979848861694336, -0.04791450500488281, -0.046030521392822266, -0.04414653778076172, -0.04226255416870117, -0.040378570556640625, -0.03849458694458008, -0.03661060333251953, -0.034726619720458984, -0.03284263610839844, -0.03095865249633789, -0.029074668884277344, -0.027190685272216797, -0.02530670166015625, -0.023422718048095703, -0.021538734436035156, -0.01965475082397461, -0.017770767211914062, -0.015886783599853516, -0.014002799987792969, -0.012118816375732422, -0.010234832763671875, -0.008350849151611328, -0.006466865539550781, -0.004582881927490234, -0.0026988983154296875, -0.0008149147033691406, 0.0010690689086914062, 0.002953052520751953, 0.0048370361328125, 0.006721019744873047, 0.008605003356933594, 0.01048898696899414, 0.012372970581054688, 0.014256954193115234, 0.01614093780517578, 0.018024921417236328, 0.019908905029296875, 0.021792888641357422, 0.02367687225341797, 0.025560855865478516, 0.027444839477539062, 0.02932882308959961, 0.031212806701660156, 0.0330967903137207, 0.03498077392578125, 0.0368647575378418, 0.038748741149902344, 0.04063272476196289, 0.04251670837402344, 0.044400691986083984, 0.04628467559814453, 0.04816865921020508, 0.050052642822265625, 0.05193662643432617, 0.05382061004638672, 0.055704593658447266, 0.05758857727050781, 0.05947256088256836, 0.061356544494628906, 0.06324052810668945, 0.06512451171875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 12.0, 139.0, 778.0, 68.0, 11.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5541019439697266, -2.4397695064544678, -2.325437068939209, -2.21110463142395, -2.0967721939086914, -1.9824398756027222, -1.8681074380874634, -1.7537751197814941, -1.6394426822662354, -1.5251102447509766, -1.4107778072357178, -1.296445369720459, -1.1821130514144897, -1.067780613899231, -0.9534481763839722, -0.8391157984733582, -0.7247833013534546, -0.6104508638381958, -0.4961184859275818, -0.381786048412323, -0.2674536406993866, -0.1531212329864502, -0.038788795471191406, 0.07554358243942261, 0.1898760199546814, 0.3042084276676178, 0.4185408353805542, 0.532873272895813, 0.6472057104110718, 0.7615380883216858, 0.8758705258369446, 0.9902029037475586, 1.1045353412628174, 1.2188677787780762, 1.333200216293335, 1.4475326538085938, 1.561864972114563, 1.6761974096298218, 1.7905298471450806, 1.9048621654510498, 2.0191946029663086, 2.1335270404815674, 2.247859477996826, 2.362191915512085, 2.4765243530273438, 2.5908565521240234, 2.7051892280578613, 2.819521427154541, 2.933854103088379, 3.0481865406036377, 3.1625189781188965, 3.2768514156341553, 3.391183853149414, 3.5055160522460938, 3.6198487281799316, 3.7341809272766113, 3.84851336479187, 3.962845802307129, 4.077178001403809, 4.1915106773376465, 4.305842876434326, 4.420175552368164, 4.534507751464844, 4.648840427398682, 4.763172626495361]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 5.0, 3.0, 6.0, 5.0, 5.0, 17.0, 11.0, 19.0, 20.0, 15.0, 25.0, 20.0, 26.0, 30.0, 29.0, 44.0, 32.0, 36.0, 39.0, 40.0, 54.0, 44.0, 49.0, 38.0, 44.0, 42.0, 34.0, 36.0, 29.0, 33.0, 19.0, 24.0, 28.0, 12.0, 15.0, 12.0, 6.0, 9.0, 8.0, 7.0, 5.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.0003173351287842, -0.9699167013168335, -0.9395160675048828, -0.9091154336929321, -0.8787147998809814, -0.8483141660690308, -0.8179135322570801, -0.7875128984451294, -0.7571122646331787, -0.726711630821228, -0.6963109970092773, -0.6659103631973267, -0.635509729385376, -0.6051090955734253, -0.5747084617614746, -0.5443078279495239, -0.513907253742218, -0.48350661993026733, -0.45310598611831665, -0.42270535230636597, -0.3923047184944153, -0.3619040846824646, -0.3315034806728363, -0.3011028468608856, -0.27070221304893494, -0.24030157923698425, -0.20990094542503357, -0.17950032651424408, -0.1490996927022934, -0.11869905889034271, -0.08829843997955322, -0.05789780616760254, -0.02749711275100708, 0.002903517335653305, 0.03330414742231369, 0.06370477378368378, 0.09410540759563446, 0.12450604140758514, 0.15490666031837463, 0.18530729413032532, 0.215707927942276, 0.24610856175422668, 0.27650919556617737, 0.30690979957580566, 0.33731043338775635, 0.36771106719970703, 0.3981117010116577, 0.4285123348236084, 0.4589129686355591, 0.48931360244750977, 0.5197142362594604, 0.5501148700714111, 0.5805155038833618, 0.6109161376953125, 0.6413167715072632, 0.6717174053192139, 0.7021180391311646, 0.7325186729431152, 0.7629193067550659, 0.7933199405670166, 0.8237205743789673, 0.854121208190918, 0.8845218420028687, 0.9149224758148193, 0.9453230500221252]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 1.0, 6.0, 1.0, 3.0, 9.0, 10.0, 15.0, 16.0, 41.0, 192.0, 5710.0, 4187191.0, 897.0, 107.0, 30.0, 12.0, 10.0, 10.0, 8.0, 7.0, 6.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89306640625, -0.8626022338867188, -0.8321380615234375, -0.8016738891601562, -0.771209716796875, -0.7407455444335938, -0.7102813720703125, -0.6798171997070312, -0.64935302734375, -0.6188888549804688, -0.5884246826171875, -0.5579605102539062, -0.527496337890625, -0.49703216552734375, -0.4665679931640625, -0.43610382080078125, -0.4056396484375, -0.37517547607421875, -0.3447113037109375, -0.31424713134765625, -0.283782958984375, -0.25331878662109375, -0.2228546142578125, -0.19239044189453125, -0.16192626953125, -0.13146209716796875, -0.1009979248046875, -0.07053375244140625, -0.040069580078125, -0.00960540771484375, 0.0208587646484375, 0.05132293701171875, 0.081787109375, 0.11225128173828125, 0.1427154541015625, 0.17317962646484375, 0.203643798828125, 0.23410797119140625, 0.2645721435546875, 0.29503631591796875, 0.32550048828125, 0.35596466064453125, 0.3864288330078125, 0.41689300537109375, 0.447357177734375, 0.47782135009765625, 0.5082855224609375, 0.5387496948242188, 0.5692138671875, 0.5996780395507812, 0.6301422119140625, 0.6606063842773438, 0.691070556640625, 0.7215347290039062, 0.7519989013671875, 0.7824630737304688, 0.81292724609375, 0.8433914184570312, 0.8738555908203125, 0.9043197631835938, 0.934783935546875, 0.9652481079101562, 0.9957122802734375, 1.0261764526367188, 1.056640625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 2.0, 2.0, 5.0, 12.0, 10.0, 16.0, 29.0, 73.0, 168.0, 240.0, 224.0, 117.0, 37.0, 22.0, 12.0, 9.0, 6.0, 11.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12890625, -0.12441062927246094, -0.11991500854492188, -0.11541938781738281, -0.11092376708984375, -0.10642814636230469, -0.10193252563476562, -0.09743690490722656, -0.0929412841796875, -0.08844566345214844, -0.08395004272460938, -0.07945442199707031, -0.07495880126953125, -0.07046318054199219, -0.06596755981445312, -0.06147193908691406, -0.056976318359375, -0.05248069763183594, -0.047985076904296875, -0.04348945617675781, -0.03899383544921875, -0.03449821472167969, -0.030002593994140625, -0.025506973266601562, -0.0210113525390625, -0.016515731811523438, -0.012020111083984375, -0.0075244903564453125, -0.00302886962890625, 0.0014667510986328125, 0.005962371826171875, 0.010457992553710938, 0.01495361328125, 0.019449234008789062, 0.023944854736328125, 0.028440475463867188, 0.03293609619140625, 0.03743171691894531, 0.041927337646484375, 0.04642295837402344, 0.0509185791015625, 0.05541419982910156, 0.059909820556640625, 0.06440544128417969, 0.06890106201171875, 0.07339668273925781, 0.07789230346679688, 0.08238792419433594, 0.086883544921875, 0.09137916564941406, 0.09587478637695312, 0.10037040710449219, 0.10486602783203125, 0.10936164855957031, 0.11385726928710938, 0.11835289001464844, 0.1228485107421875, 0.12734413146972656, 0.13183975219726562, 0.1363353729248047, 0.14083099365234375, 0.1453266143798828, 0.14982223510742188, 0.15431785583496094, 0.1588134765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 14.0, 27.0, 55.0, 121.0, 378.0, 1175.0, 5557.0, 44650.0, 3614194.0, 501758.0, 21924.0, 3243.0, 788.0, 235.0, 83.0, 48.0, 13.0, 9.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12646484375, -0.12175559997558594, -0.11704635620117188, -0.11233711242675781, -0.10762786865234375, -0.10291862487792969, -0.09820938110351562, -0.09350013732910156, -0.0887908935546875, -0.08408164978027344, -0.07937240600585938, -0.07466316223144531, -0.06995391845703125, -0.06524467468261719, -0.060535430908203125, -0.05582618713378906, -0.051116943359375, -0.04640769958496094, -0.041698455810546875, -0.03698921203613281, -0.03227996826171875, -0.027570724487304688, -0.022861480712890625, -0.018152236938476562, -0.0134429931640625, -0.008733749389648438, -0.004024505615234375, 0.0006847381591796875, 0.00539398193359375, 0.010103225708007812, 0.014812469482421875, 0.019521713256835938, 0.02423095703125, 0.028940200805664062, 0.033649444580078125, 0.03835868835449219, 0.04306793212890625, 0.04777717590332031, 0.052486419677734375, 0.05719566345214844, 0.0619049072265625, 0.06661415100097656, 0.07132339477539062, 0.07603263854980469, 0.08074188232421875, 0.08545112609863281, 0.09016036987304688, 0.09486961364746094, 0.099578857421875, 0.10428810119628906, 0.10899734497070312, 0.11370658874511719, 0.11841583251953125, 0.12312507629394531, 0.12783432006835938, 0.13254356384277344, 0.1372528076171875, 0.14196205139160156, 0.14667129516601562, 0.1513805389404297, 0.15608978271484375, 0.1607990264892578, 0.16550827026367188, 0.17021751403808594, 0.1749267578125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 3.0, 9.0, 11.0, 9.0, 17.0, 33.0, 52.0, 83.0, 140.0, 235.0, 655.0, 2050.0, 341.0, 180.0, 86.0, 52.0, 32.0, 29.0, 18.0, 15.0, 8.0, 5.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05609130859375, -0.05469703674316406, -0.053302764892578125, -0.05190849304199219, -0.05051422119140625, -0.04911994934082031, -0.047725677490234375, -0.04633140563964844, -0.0449371337890625, -0.04354286193847656, -0.042148590087890625, -0.04075431823730469, -0.03936004638671875, -0.03796577453613281, -0.036571502685546875, -0.03517723083496094, -0.033782958984375, -0.03238868713378906, -0.030994415283203125, -0.029600143432617188, -0.02820587158203125, -0.026811599731445312, -0.025417327880859375, -0.024023056030273438, -0.0226287841796875, -0.021234512329101562, -0.019840240478515625, -0.018445968627929688, -0.01705169677734375, -0.015657424926757812, -0.014263153076171875, -0.012868881225585938, -0.011474609375, -0.010080337524414062, -0.008686065673828125, -0.0072917938232421875, -0.00589752197265625, -0.0045032501220703125, -0.003108978271484375, -0.0017147064208984375, -0.0003204345703125, 0.0010738372802734375, 0.002468109130859375, 0.0038623809814453125, 0.00525665283203125, 0.0066509246826171875, 0.008045196533203125, 0.009439468383789062, 0.010833740234375, 0.012228012084960938, 0.013622283935546875, 0.015016555786132812, 0.01641082763671875, 0.017805099487304688, 0.019199371337890625, 0.020593643188476562, 0.0219879150390625, 0.023382186889648438, 0.024776458740234375, 0.026170730590820312, 0.02756500244140625, 0.028959274291992188, 0.030353546142578125, 0.03174781799316406, 0.03314208984375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 13.0, 24.0, 74.0, 150.0, 260.0, 261.0, 126.0, 56.0, 17.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5612211227416992, -0.5504186749458313, -0.5396162867546082, -0.5288138389587402, -0.5180113911628723, -0.5072090029716492, -0.49640655517578125, -0.48560410737991333, -0.4748016893863678, -0.46399927139282227, -0.45319682359695435, -0.4423944056034088, -0.4315919876098633, -0.42078953981399536, -0.40998712182044983, -0.3991847038269043, -0.3883822560310364, -0.37757983803749084, -0.3667773902416229, -0.3559749722480774, -0.3451725244522095, -0.33437010645866394, -0.3235676884651184, -0.3127652406692505, -0.30196282267570496, -0.2911604046821594, -0.2803579568862915, -0.26955553889274597, -0.25875312089920044, -0.24795067310333252, -0.237148255109787, -0.22634582221508026, -0.21554335951805115, -0.20474092662334442, -0.1939384937286377, -0.18313607573509216, -0.17233364284038544, -0.1615312099456787, -0.15072879195213318, -0.13992635905742645, -0.12912392616271973, -0.118321493268013, -0.10751906782388687, -0.09671664237976074, -0.08591420948505402, -0.07511177659034729, -0.06430935114622116, -0.05350692570209503, -0.042704492807388306, -0.03190206363797188, -0.02109963446855545, -0.010297205299139023, 0.0005052238702774048, 0.011307653039693832, 0.02211008220911026, 0.03291250765323639, 0.043714940547943115, 0.05451736971735954, 0.06531979888677597, 0.0761222243309021, 0.08692465722560883, 0.09772709012031555, 0.10852951556444168, 0.11933194100856781, 0.13013437390327454]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 3.0, 5.0, 7.0, 6.0, 14.0, 9.0, 14.0, 20.0, 14.0, 27.0, 29.0, 21.0, 26.0, 32.0, 38.0, 42.0, 37.0, 43.0, 44.0, 43.0, 48.0, 43.0, 40.0, 48.0, 48.0, 38.0, 29.0, 37.0, 32.0, 22.0, 12.0, 22.0, 24.0, 18.0, 12.0, 15.0, 13.0, 11.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10800290107727051, -0.10456464439630508, -0.10112638771533966, -0.09768813848495483, -0.09424988180398941, -0.09081162512302399, -0.08737337589263916, -0.08393511921167374, -0.08049686253070831, -0.07705860584974289, -0.07362034916877747, -0.07018209993839264, -0.06674384325742722, -0.06330558657646179, -0.05986733362078667, -0.05642908066511154, -0.05299082398414612, -0.049552567303180695, -0.04611431434750557, -0.042676061391830444, -0.03923780471086502, -0.0357995480298996, -0.03236129507422447, -0.028923040255904198, -0.025484785437583923, -0.02204653061926365, -0.018608275800943375, -0.0151700209826231, -0.011731766164302826, -0.008293511345982552, -0.004855256527662277, -0.0014170017093420029, 0.0020212531089782715, 0.005459507927298546, 0.00889776274561882, 0.012336017563939095, 0.01577427238225937, 0.019212527200579643, 0.022650782018899918, 0.026089036837220192, 0.029527291655540466, 0.03296554833650589, 0.036403801292181015, 0.03984205424785614, 0.043280310928821564, 0.04671856760978699, 0.05015682056546211, 0.05359507352113724, 0.05703333020210266, 0.060471586883068085, 0.06390984356403351, 0.06734809279441833, 0.07078634947538376, 0.07422460615634918, 0.07766285538673401, 0.08110111206769943, 0.08453936874866486, 0.08797762542963028, 0.0914158821105957, 0.09485413134098053, 0.09829238802194595, 0.10173064470291138, 0.1051688939332962, 0.10860715061426163, 0.11204540729522705]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 6.0, 5.0, 11.0, 25.0, 20.0, 30.0, 65.0, 86.0, 124.0, 245.0, 482.0, 898.0, 2093.0, 6632.0, 30876.0, 299466.0, 645917.0, 47571.0, 8958.0, 2687.0, 1141.0, 497.0, 252.0, 188.0, 99.0, 69.0, 29.0, 29.0, 20.0, 11.0, 10.0, 6.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.147216796875, -0.1431407928466797, -0.13906478881835938, -0.13498878479003906, -0.13091278076171875, -0.12683677673339844, -0.12276077270507812, -0.11868476867675781, -0.1146087646484375, -0.11053276062011719, -0.10645675659179688, -0.10238075256347656, -0.09830474853515625, -0.09422874450683594, -0.09015274047851562, -0.08607673645019531, -0.082000732421875, -0.07792472839355469, -0.07384872436523438, -0.06977272033691406, -0.06569671630859375, -0.06162071228027344, -0.057544708251953125, -0.05346870422363281, -0.0493927001953125, -0.04531669616699219, -0.041240692138671875, -0.03716468811035156, -0.03308868408203125, -0.029012680053710938, -0.024936676025390625, -0.020860671997070312, -0.01678466796875, -0.012708663940429688, -0.008632659912109375, -0.0045566558837890625, -0.00048065185546875, 0.0035953521728515625, 0.007671356201171875, 0.011747360229492188, 0.0158233642578125, 0.019899368286132812, 0.023975372314453125, 0.028051376342773438, 0.03212738037109375, 0.03620338439941406, 0.040279388427734375, 0.04435539245605469, 0.048431396484375, 0.05250740051269531, 0.056583404541015625, 0.06065940856933594, 0.06473541259765625, 0.06881141662597656, 0.07288742065429688, 0.07696342468261719, 0.0810394287109375, 0.08511543273925781, 0.08919143676757812, 0.09326744079589844, 0.09734344482421875, 0.10141944885253906, 0.10549545288085938, 0.10957145690917969, 0.1136474609375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 2.0, 0.0, 5.0, 6.0, 10.0, 10.0, 19.0, 29.0, 68.0, 169.0, 246.0, 206.0, 122.0, 47.0, 20.0, 11.0, 9.0, 9.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1275634765625, -0.12311553955078125, -0.1186676025390625, -0.11421966552734375, -0.109771728515625, -0.10532379150390625, -0.1008758544921875, -0.09642791748046875, -0.09197998046875, -0.08753204345703125, -0.0830841064453125, -0.07863616943359375, -0.074188232421875, -0.06974029541015625, -0.0652923583984375, -0.06084442138671875, -0.056396484375, -0.05194854736328125, -0.0475006103515625, -0.04305267333984375, -0.038604736328125, -0.03415679931640625, -0.0297088623046875, -0.02526092529296875, -0.02081298828125, -0.01636505126953125, -0.0119171142578125, -0.00746917724609375, -0.003021240234375, 0.00142669677734375, 0.0058746337890625, 0.01032257080078125, 0.0147705078125, 0.01921844482421875, 0.0236663818359375, 0.02811431884765625, 0.032562255859375, 0.03701019287109375, 0.0414581298828125, 0.04590606689453125, 0.05035400390625, 0.05480194091796875, 0.0592498779296875, 0.06369781494140625, 0.068145751953125, 0.07259368896484375, 0.0770416259765625, 0.08148956298828125, 0.0859375, 0.09038543701171875, 0.0948333740234375, 0.09928131103515625, 0.103729248046875, 0.10817718505859375, 0.1126251220703125, 0.11707305908203125, 0.12152099609375, 0.12596893310546875, 0.1304168701171875, 0.13486480712890625, 0.139312744140625, 0.14376068115234375, 0.1482086181640625, 0.15265655517578125, 0.1571044921875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 7.0, 14.0, 6.0, 7.0, 13.0, 14.0, 27.0, 29.0, 38.0, 44.0, 64.0, 77.0, 94.0, 179.0, 245.0, 367.0, 705.0, 1749.0, 6974.0, 46168.0, 498185.0, 442503.0, 41257.0, 6280.0, 1594.0, 664.0, 404.0, 216.0, 163.0, 117.0, 73.0, 58.0, 52.0, 42.0, 29.0, 20.0, 8.0, 18.0, 16.0, 8.0, 6.0, 4.0, 6.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10888671875, -0.1052541732788086, -0.10162162780761719, -0.09798908233642578, -0.09435653686523438, -0.09072399139404297, -0.08709144592285156, -0.08345890045166016, -0.07982635498046875, -0.07619380950927734, -0.07256126403808594, -0.06892871856689453, -0.06529617309570312, -0.06166362762451172, -0.05803108215332031, -0.054398536682128906, -0.0507659912109375, -0.047133445739746094, -0.04350090026855469, -0.03986835479736328, -0.036235809326171875, -0.03260326385498047, -0.028970718383789062, -0.025338172912597656, -0.02170562744140625, -0.018073081970214844, -0.014440536499023438, -0.010807991027832031, -0.007175445556640625, -0.0035429000854492188, 8.96453857421875e-05, 0.0037221908569335938, 0.007354736328125, 0.010987281799316406, 0.014619827270507812, 0.01825237274169922, 0.021884918212890625, 0.02551746368408203, 0.029150009155273438, 0.032782554626464844, 0.03641510009765625, 0.040047645568847656, 0.04368019104003906, 0.04731273651123047, 0.050945281982421875, 0.05457782745361328, 0.05821037292480469, 0.061842918395996094, 0.0654754638671875, 0.0691080093383789, 0.07274055480957031, 0.07637310028076172, 0.08000564575195312, 0.08363819122314453, 0.08727073669433594, 0.09090328216552734, 0.09453582763671875, 0.09816837310791016, 0.10180091857910156, 0.10543346405029297, 0.10906600952148438, 0.11269855499267578, 0.11633110046386719, 0.1199636459350586, 0.12359619140625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 11.0, 4.0, 4.0, 8.0, 9.0, 12.0, 13.0, 14.0, 18.0, 12.0, 17.0, 33.0, 33.0, 38.0, 39.0, 38.0, 43.0, 47.0, 46.0, 38.0, 36.0, 39.0, 47.0, 30.0, 39.0, 32.0, 30.0, 33.0, 22.0, 34.0, 28.0, 24.0, 25.0, 21.0, 9.0, 16.0, 11.0, 8.0, 3.0, 9.0, 2.0, 4.0, 8.0, 0.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.185546875, -0.17955970764160156, -0.17357254028320312, -0.1675853729248047, -0.16159820556640625, -0.1556110382080078, -0.14962387084960938, -0.14363670349121094, -0.1376495361328125, -0.13166236877441406, -0.12567520141601562, -0.11968803405761719, -0.11370086669921875, -0.10771369934082031, -0.10172653198242188, -0.09573936462402344, -0.089752197265625, -0.08376502990722656, -0.07777786254882812, -0.07179069519042969, -0.06580352783203125, -0.05981636047363281, -0.053829193115234375, -0.04784202575683594, -0.0418548583984375, -0.03586769104003906, -0.029880523681640625, -0.023893356323242188, -0.01790618896484375, -0.011919021606445312, -0.005931854248046875, 5.53131103515625e-05, 0.00604248046875, 0.012029647827148438, 0.018016815185546875, 0.024003982543945312, 0.02999114990234375, 0.03597831726074219, 0.041965484619140625, 0.04795265197753906, 0.0539398193359375, 0.05992698669433594, 0.06591415405273438, 0.07190132141113281, 0.07788848876953125, 0.08387565612792969, 0.08986282348632812, 0.09584999084472656, 0.101837158203125, 0.10782432556152344, 0.11381149291992188, 0.11979866027832031, 0.12578582763671875, 0.1317729949951172, 0.13776016235351562, 0.14374732971191406, 0.1497344970703125, 0.15572166442871094, 0.16170883178710938, 0.1676959991455078, 0.17368316650390625, 0.1796703338623047, 0.18565750122070312, 0.19164466857910156, 0.1976318359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 7.0, 2.0, 3.0, 6.0, 10.0, 6.0, 22.0, 25.0, 24.0, 52.0, 66.0, 126.0, 207.0, 401.0, 777.0, 2015.0, 5728.0, 18295.0, 65147.0, 751391.0, 155255.0, 33347.0, 9872.0, 3253.0, 1241.0, 528.0, 268.0, 176.0, 88.0, 58.0, 44.0, 43.0, 19.0, 11.0, 12.0, 13.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035980224609375, -0.03491401672363281, -0.033847808837890625, -0.03278160095214844, -0.03171539306640625, -0.030649185180664062, -0.029582977294921875, -0.028516769409179688, -0.0274505615234375, -0.026384353637695312, -0.025318145751953125, -0.024251937866210938, -0.02318572998046875, -0.022119522094726562, -0.021053314208984375, -0.019987106323242188, -0.0189208984375, -0.017854690551757812, -0.016788482666015625, -0.015722274780273438, -0.01465606689453125, -0.013589859008789062, -0.012523651123046875, -0.011457443237304688, -0.0103912353515625, -0.009325027465820312, -0.008258819580078125, -0.0071926116943359375, -0.00612640380859375, -0.0050601959228515625, -0.003993988037109375, -0.0029277801513671875, -0.001861572265625, -0.0007953643798828125, 0.000270843505859375, 0.0013370513916015625, 0.00240325927734375, 0.0034694671630859375, 0.004535675048828125, 0.0056018829345703125, 0.0066680908203125, 0.0077342987060546875, 0.008800506591796875, 0.009866714477539062, 0.01093292236328125, 0.011999130249023438, 0.013065338134765625, 0.014131546020507812, 0.01519775390625, 0.016263961791992188, 0.017330169677734375, 0.018396377563476562, 0.01946258544921875, 0.020528793334960938, 0.021595001220703125, 0.022661209106445312, 0.0237274169921875, 0.024793624877929688, 0.025859832763671875, 0.026926040649414062, 0.02799224853515625, 0.029058456420898438, 0.030124664306640625, 0.031190872192382812, 0.032257080078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 8.0, 7.0, 8.0, 12.0, 7.0, 7.0, 22.0, 19.0, 48.0, 62.0, 108.0, 132.0, 123.0, 137.0, 92.0, 51.0, 39.0, 29.0, 24.0, 5.0, 11.0, 9.0, 6.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.357929229736328e-06, -9.085983037948608e-06, -8.814036846160889e-06, -8.542090654373169e-06, -8.27014446258545e-06, -7.99819827079773e-06, -7.72625207901001e-06, -7.45430588722229e-06, -7.18235969543457e-06, -6.910413503646851e-06, -6.638467311859131e-06, -6.366521120071411e-06, -6.094574928283691e-06, -5.822628736495972e-06, -5.550682544708252e-06, -5.278736352920532e-06, -5.0067901611328125e-06, -4.734843969345093e-06, -4.462897777557373e-06, -4.190951585769653e-06, -3.919005393981934e-06, -3.647059202194214e-06, -3.375113010406494e-06, -3.1031668186187744e-06, -2.8312206268310547e-06, -2.559274435043335e-06, -2.2873282432556152e-06, -2.0153820514678955e-06, -1.7434358596801758e-06, -1.471489667892456e-06, -1.1995434761047363e-06, -9.275972843170166e-07, -6.556510925292969e-07, -3.8370490074157715e-07, -1.1175870895385742e-07, 1.601874828338623e-07, 4.3213367462158203e-07, 7.040798664093018e-07, 9.760260581970215e-07, 1.2479722499847412e-06, 1.519918441772461e-06, 1.7918646335601807e-06, 2.0638108253479004e-06, 2.33575701713562e-06, 2.60770320892334e-06, 2.8796494007110596e-06, 3.1515955924987793e-06, 3.423541784286499e-06, 3.6954879760742188e-06, 3.9674341678619385e-06, 4.239380359649658e-06, 4.511326551437378e-06, 4.783272743225098e-06, 5.055218935012817e-06, 5.327165126800537e-06, 5.599111318588257e-06, 5.8710575103759766e-06, 6.143003702163696e-06, 6.414949893951416e-06, 6.686896085739136e-06, 6.9588422775268555e-06, 7.230788469314575e-06, 7.502734661102295e-06, 7.774680852890015e-06, 8.046627044677734e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 7.0, 7.0, 4.0, 13.0, 16.0, 14.0, 27.0, 39.0, 43.0, 55.0, 95.0, 159.0, 230.0, 403.0, 752.0, 1439.0, 3662.0, 10760.0, 39579.0, 401239.0, 530059.0, 41534.0, 11237.0, 3736.0, 1529.0, 705.0, 438.0, 253.0, 170.0, 112.0, 64.0, 45.0, 36.0, 24.0, 15.0, 15.0, 11.0, 7.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.045318603515625, -0.04402446746826172, -0.04273033142089844, -0.041436195373535156, -0.040142059326171875, -0.038847923278808594, -0.03755378723144531, -0.03625965118408203, -0.03496551513671875, -0.03367137908935547, -0.03237724304199219, -0.031083106994628906, -0.029788970947265625, -0.028494834899902344, -0.027200698852539062, -0.02590656280517578, -0.0246124267578125, -0.02331829071044922, -0.022024154663085938, -0.020730018615722656, -0.019435882568359375, -0.018141746520996094, -0.016847610473632812, -0.015553474426269531, -0.01425933837890625, -0.012965202331542969, -0.011671066284179688, -0.010376930236816406, -0.009082794189453125, -0.007788658142089844, -0.0064945220947265625, -0.005200386047363281, -0.00390625, -0.0026121139526367188, -0.0013179779052734375, -2.384185791015625e-05, 0.001270294189453125, 0.0025644302368164062, 0.0038585662841796875, 0.005152702331542969, 0.00644683837890625, 0.007740974426269531, 0.009035110473632812, 0.010329246520996094, 0.011623382568359375, 0.012917518615722656, 0.014211654663085938, 0.015505790710449219, 0.0167999267578125, 0.01809406280517578, 0.019388198852539062, 0.020682334899902344, 0.021976470947265625, 0.023270606994628906, 0.024564743041992188, 0.02585887908935547, 0.02715301513671875, 0.02844715118408203, 0.029741287231445312, 0.031035423278808594, 0.032329559326171875, 0.033623695373535156, 0.03491783142089844, 0.03621196746826172, 0.037506103515625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 9.0, 7.0, 4.0, 7.0, 9.0, 5.0, 16.0, 25.0, 22.0, 39.0, 37.0, 64.0, 105.0, 132.0, 147.0, 103.0, 77.0, 45.0, 27.0, 35.0, 16.0, 12.0, 10.0, 15.0, 6.0, 6.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.04986572265625, -0.0484461784362793, -0.047026634216308594, -0.04560708999633789, -0.04418754577636719, -0.042768001556396484, -0.04134845733642578, -0.03992891311645508, -0.038509368896484375, -0.03708982467651367, -0.03567028045654297, -0.034250736236572266, -0.03283119201660156, -0.03141164779663086, -0.029992103576660156, -0.028572559356689453, -0.02715301513671875, -0.025733470916748047, -0.024313926696777344, -0.02289438247680664, -0.021474838256835938, -0.020055294036865234, -0.01863574981689453, -0.017216205596923828, -0.015796661376953125, -0.014377117156982422, -0.012957572937011719, -0.011538028717041016, -0.010118484497070312, -0.00869894027709961, -0.007279396057128906, -0.005859851837158203, -0.0044403076171875, -0.003020763397216797, -0.0016012191772460938, -0.00018167495727539062, 0.0012378692626953125, 0.0026574134826660156, 0.004076957702636719, 0.005496501922607422, 0.006916046142578125, 0.008335590362548828, 0.009755134582519531, 0.011174678802490234, 0.012594223022460938, 0.01401376724243164, 0.015433311462402344, 0.016852855682373047, 0.01827239990234375, 0.019691944122314453, 0.021111488342285156, 0.02253103256225586, 0.023950576782226562, 0.025370121002197266, 0.02678966522216797, 0.028209209442138672, 0.029628753662109375, 0.031048297882080078, 0.03246784210205078, 0.033887386322021484, 0.03530693054199219, 0.03672647476196289, 0.038146018981933594, 0.0395655632019043, 0.040985107421875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 11.0, 317.0, 683.0, 5.0, 2.0, 2.0], "bins": [-11.232830047607422, -11.04603385925293, -10.859237670898438, -10.672442436218262, -10.48564624786377, -10.298850059509277, -10.112053871154785, -9.92525863647461, -9.738462448120117, -9.551666259765625, -9.364870071411133, -9.178074836730957, -8.991278648376465, -8.804482460021973, -8.61768627166748, -8.430891036987305, -8.244094848632812, -8.05729866027832, -7.870502948760986, -7.683706760406494, -7.49691104888916, -7.310114860534668, -7.123319149017334, -6.936522960662842, -6.74972677230835, -6.562930583953857, -6.376134872436523, -6.189338684082031, -6.002542972564697, -5.815746784210205, -5.628951072692871, -5.442154884338379, -5.255359172821045, -5.068562984466553, -4.881767272949219, -4.694971084594727, -4.508175373077393, -4.3213791847229, -4.134583473205566, -3.947787284851074, -3.7609915733337402, -3.574195623397827, -3.387399673461914, -3.200603723526001, -3.013807773590088, -2.827011823654175, -2.6402158737182617, -2.4534196853637695, -2.2666237354278564, -2.0798277854919434, -1.8930318355560303, -1.7062358856201172, -1.519439935684204, -1.332643985748291, -1.1458479166030884, -0.9590519666671753, -0.7722560167312622, -0.5854600667953491, -0.39866408705711365, -0.21186810731887817, -0.025072157382965088, 0.161723792552948, 0.34851980209350586, 0.535315752029419, 0.722111701965332]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 3.0, 2.0, 13.0, 6.0, 17.0, 19.0, 18.0, 16.0, 25.0, 37.0, 28.0, 40.0, 51.0, 43.0, 41.0, 38.0, 41.0, 33.0, 50.0, 37.0, 47.0, 45.0, 40.0, 39.0, 38.0, 36.0, 29.0, 28.0, 25.0, 19.0, 13.0, 16.0, 6.0, 13.0, 12.0, 7.0, 6.0, 8.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9799671769142151, -0.9492667317390442, -0.9185662865638733, -0.8878658413887024, -0.8571653962135315, -0.8264649510383606, -0.7957645654678345, -0.7650641202926636, -0.7343636751174927, -0.7036632299423218, -0.6729627847671509, -0.64226233959198, -0.6115618944168091, -0.5808614492416382, -0.5501610040664673, -0.5194605588912964, -0.4887601137161255, -0.4580596685409546, -0.4273592233657837, -0.3966587781906128, -0.3659583330154419, -0.335257887840271, -0.3045574724674225, -0.2738570272922516, -0.2431565821170807, -0.2124561369419098, -0.1817556917667389, -0.1510552614927292, -0.12035481631755829, -0.08965437114238739, -0.058953940868377686, -0.028253495693206787, 0.002446889877319336, 0.033147331327199936, 0.06384777277708054, 0.09454821050167084, 0.12524865567684174, 0.15594910085201263, 0.18664953112602234, 0.21734997630119324, 0.24805042147636414, 0.27875086665153503, 0.30945131182670593, 0.34015172719955444, 0.37085217237472534, 0.40155261754989624, 0.43225306272506714, 0.46295350790023804, 0.49365395307540894, 0.5243543982505798, 0.5550548434257507, 0.5857552886009216, 0.6164557337760925, 0.6471561789512634, 0.6778565645217896, 0.7085570096969604, 0.7392574548721313, 0.7699579000473022, 0.8006583452224731, 0.831358790397644, 0.8620592355728149, 0.8927596807479858, 0.9234601259231567, 0.9541605710983276, 0.9848610162734985]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 7.0, 9.0, 7.0, 12.0, 13.0, 8.0, 25.0, 119.0, 24291.0, 4169471.0, 196.0, 36.0, 22.0, 15.0, 12.0, 10.0, 6.0, 5.0, 6.0, 7.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.646484375, -1.591796875, -1.537109375, -1.482421875, -1.427734375, -1.373046875, -1.318359375, -1.263671875, -1.208984375, -1.154296875, -1.099609375, -1.044921875, -0.990234375, -0.935546875, -0.880859375, -0.826171875, -0.771484375, -0.716796875, -0.662109375, -0.607421875, -0.552734375, -0.498046875, -0.443359375, -0.388671875, -0.333984375, -0.279296875, -0.224609375, -0.169921875, -0.115234375, -0.060546875, -0.005859375, 0.048828125, 0.103515625, 0.158203125, 0.212890625, 0.267578125, 0.322265625, 0.376953125, 0.431640625, 0.486328125, 0.541015625, 0.595703125, 0.650390625, 0.705078125, 0.759765625, 0.814453125, 0.869140625, 0.923828125, 0.978515625, 1.033203125, 1.087890625, 1.142578125, 1.197265625, 1.251953125, 1.306640625, 1.361328125, 1.416015625, 1.470703125, 1.525390625, 1.580078125, 1.634765625, 1.689453125, 1.744140625, 1.798828125, 1.853515625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 1.0, 6.0, 9.0, 16.0, 18.0, 28.0, 64.0, 183.0, 243.0, 198.0, 119.0, 54.0, 21.0, 7.0, 12.0, 9.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12841796875, -0.12394142150878906, -0.11946487426757812, -0.11498832702636719, -0.11051177978515625, -0.10603523254394531, -0.10155868530273438, -0.09708213806152344, -0.0926055908203125, -0.08812904357910156, -0.08365249633789062, -0.07917594909667969, -0.07469940185546875, -0.07022285461425781, -0.06574630737304688, -0.06126976013183594, -0.056793212890625, -0.05231666564941406, -0.047840118408203125, -0.04336357116699219, -0.03888702392578125, -0.03441047668457031, -0.029933929443359375, -0.025457382202148438, -0.0209808349609375, -0.016504287719726562, -0.012027740478515625, -0.0075511932373046875, -0.00307464599609375, 0.0014019012451171875, 0.005878448486328125, 0.010354995727539062, 0.01483154296875, 0.019308090209960938, 0.023784637451171875, 0.028261184692382812, 0.03273773193359375, 0.03721427917480469, 0.041690826416015625, 0.04616737365722656, 0.0506439208984375, 0.05512046813964844, 0.059597015380859375, 0.06407356262207031, 0.06855010986328125, 0.07302665710449219, 0.07750320434570312, 0.08197975158691406, 0.086456298828125, 0.09093284606933594, 0.09540939331054688, 0.09988594055175781, 0.10436248779296875, 0.10883903503417969, 0.11331558227539062, 0.11779212951660156, 0.1222686767578125, 0.12674522399902344, 0.13122177124023438, 0.1356983184814453, 0.14017486572265625, 0.1446514129638672, 0.14912796020507812, 0.15360450744628906, 0.1580810546875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 19.0, 31.0, 67.0, 97.0, 162.0, 310.0, 548.0, 1115.0, 2623.0, 7604.0, 28534.0, 181671.0, 3668709.0, 253224.0, 35193.0, 8688.0, 2974.0, 1275.0, 642.0, 366.0, 185.0, 96.0, 55.0, 28.0, 17.0, 12.0, 14.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.11968994140625, -0.11641693115234375, -0.1131439208984375, -0.10987091064453125, -0.106597900390625, -0.10332489013671875, -0.1000518798828125, -0.09677886962890625, -0.093505859375, -0.09023284912109375, -0.0869598388671875, -0.08368682861328125, -0.080413818359375, -0.07714080810546875, -0.0738677978515625, -0.07059478759765625, -0.06732177734375, -0.06404876708984375, -0.0607757568359375, -0.05750274658203125, -0.054229736328125, -0.05095672607421875, -0.0476837158203125, -0.04441070556640625, -0.0411376953125, -0.03786468505859375, -0.0345916748046875, -0.03131866455078125, -0.028045654296875, -0.02477264404296875, -0.0214996337890625, -0.01822662353515625, -0.01495361328125, -0.01168060302734375, -0.0084075927734375, -0.00513458251953125, -0.001861572265625, 0.00141143798828125, 0.0046844482421875, 0.00795745849609375, 0.01123046875, 0.01450347900390625, 0.0177764892578125, 0.02104949951171875, 0.024322509765625, 0.02759552001953125, 0.0308685302734375, 0.03414154052734375, 0.03741455078125, 0.04068756103515625, 0.0439605712890625, 0.04723358154296875, 0.050506591796875, 0.05377960205078125, 0.0570526123046875, 0.06032562255859375, 0.0635986328125, 0.06687164306640625, 0.0701446533203125, 0.07341766357421875, 0.076690673828125, 0.07996368408203125, 0.0832366943359375, 0.08650970458984375, 0.08978271484375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 6.0, 10.0, 17.0, 27.0, 24.0, 50.0, 44.0, 77.0, 123.0, 234.0, 790.0, 1939.0, 278.0, 173.0, 99.0, 58.0, 32.0, 23.0, 18.0, 14.0, 6.0, 10.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038330078125, -0.03705739974975586, -0.03578472137451172, -0.03451204299926758, -0.03323936462402344, -0.0319666862487793, -0.030694007873535156, -0.029421329498291016, -0.028148651123046875, -0.026875972747802734, -0.025603294372558594, -0.024330615997314453, -0.023057937622070312, -0.021785259246826172, -0.02051258087158203, -0.01923990249633789, -0.01796722412109375, -0.01669454574584961, -0.015421867370605469, -0.014149188995361328, -0.012876510620117188, -0.011603832244873047, -0.010331153869628906, -0.009058475494384766, -0.007785797119140625, -0.006513118743896484, -0.005240440368652344, -0.003967761993408203, -0.0026950836181640625, -0.0014224052429199219, -0.00014972686767578125, 0.0011229515075683594, 0.0023956298828125, 0.0036683082580566406, 0.004940986633300781, 0.006213665008544922, 0.0074863433837890625, 0.008759021759033203, 0.010031700134277344, 0.011304378509521484, 0.012577056884765625, 0.013849735260009766, 0.015122413635253906, 0.016395092010498047, 0.017667770385742188, 0.018940448760986328, 0.02021312713623047, 0.02148580551147461, 0.02275848388671875, 0.02403116226196289, 0.02530384063720703, 0.026576519012451172, 0.027849197387695312, 0.029121875762939453, 0.030394554138183594, 0.031667232513427734, 0.032939910888671875, 0.034212589263916016, 0.035485267639160156, 0.0367579460144043, 0.03803062438964844, 0.03930330276489258, 0.04057598114013672, 0.04184865951538086, 0.043121337890625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 5.0, 7.0, 29.0, 174.0, 500.0, 240.0, 40.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1107993125915527, -1.0869327783584595, -1.0630662441253662, -1.0391998291015625, -1.0153332948684692, -0.991466760635376, -0.9676002264022827, -0.9437336921691895, -0.9198671579360962, -0.8960006237030029, -0.8721341490745544, -0.8482676148414612, -0.8244010806083679, -0.8005346059799194, -0.7766680717468262, -0.7528015375137329, -0.7289350628852844, -0.7050685286521912, -0.6812020540237427, -0.6573355197906494, -0.6334689855575562, -0.6096024513244629, -0.5857359766960144, -0.5618694424629211, -0.5380029678344727, -0.5141364336013794, -0.4902699291706085, -0.46640342473983765, -0.4425368905067444, -0.4186703860759735, -0.39480388164520264, -0.3709373474121094, -0.3470707833766937, -0.32320427894592285, -0.2993377447128296, -0.2754712402820587, -0.25160473585128784, -0.22773820161819458, -0.2038716971874237, -0.18000517785549164, -0.15613865852355957, -0.1322721391916275, -0.10840562731027603, -0.08453911542892456, -0.06067259609699249, -0.036806076765060425, -0.01293957233428955, 0.010926946997642517, 0.034793466329574585, 0.058659981936216354, 0.08252649754285812, 0.1063930094242096, 0.13025952875614166, 0.15412604808807373, 0.1779925525188446, 0.20185907185077667, 0.22572559118270874, 0.2495921105146408, 0.2734586298465729, 0.29732513427734375, 0.321191668510437, 0.3450581729412079, 0.36892467737197876, 0.392791211605072, 0.4166577160358429]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 10.0, 4.0, 3.0, 13.0, 14.0, 10.0, 14.0, 13.0, 12.0, 18.0, 15.0, 35.0, 20.0, 33.0, 25.0, 27.0, 37.0, 41.0, 33.0, 41.0, 39.0, 47.0, 37.0, 44.0, 32.0, 34.0, 36.0, 35.0, 21.0, 30.0, 27.0, 31.0, 22.0, 14.0, 17.0, 13.0, 16.0, 21.0, 16.0, 14.0, 10.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.10096240043640137, -0.0977456271648407, -0.09452885389328003, -0.09131207317113876, -0.0880952998995781, -0.08487852662801743, -0.08166174590587616, -0.07844497263431549, -0.07522819936275482, -0.07201142609119415, -0.06879465281963348, -0.06557787209749222, -0.06236109882593155, -0.05914432555437088, -0.05592754855751991, -0.052710771560668945, -0.049493998289108276, -0.04627722501754761, -0.04306044802069664, -0.03984367102384567, -0.036626897752285004, -0.033410124480724335, -0.030193347483873367, -0.02697657234966755, -0.02375979721546173, -0.020543022081255913, -0.017326246947050095, -0.014109471812844276, -0.010892696678638458, -0.00767592154443264, -0.004459146410226822, -0.0012423712760210037, 0.0019744038581848145, 0.005191178992390633, 0.00840795412659645, 0.011624729260802269, 0.014841504395008087, 0.018058279529213905, 0.021275054663419724, 0.02449182979762554, 0.02770860493183136, 0.030925380066037178, 0.034142155200242996, 0.037358932197093964, 0.04057570546865463, 0.0437924787402153, 0.04700925573706627, 0.050226032733917236, 0.053442806005477905, 0.056659579277038574, 0.05987635627388954, 0.06309313327074051, 0.06630990654230118, 0.06952667981386185, 0.07274346053600311, 0.07596023380756378, 0.07917700707912445, 0.08239378035068512, 0.08561055362224579, 0.08882733434438705, 0.09204410761594772, 0.09526088088750839, 0.09847766160964966, 0.10169443488121033, 0.104911208152771]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 10.0, 9.0, 17.0, 12.0, 31.0, 33.0, 45.0, 58.0, 102.0, 122.0, 187.0, 299.0, 513.0, 829.0, 1673.0, 3682.0, 9564.0, 36823.0, 224283.0, 623425.0, 112638.0, 21683.0, 6553.0, 2745.0, 1287.0, 725.0, 411.0, 261.0, 167.0, 105.0, 81.0, 53.0, 40.0, 29.0, 13.0, 13.0, 15.0, 8.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1312255859375, -0.12689781188964844, -0.12257003784179688, -0.11824226379394531, -0.11391448974609375, -0.10958671569824219, -0.10525894165039062, -0.10093116760253906, -0.0966033935546875, -0.09227561950683594, -0.08794784545898438, -0.08362007141113281, -0.07929229736328125, -0.07496452331542969, -0.07063674926757812, -0.06630897521972656, -0.061981201171875, -0.05765342712402344, -0.053325653076171875, -0.04899787902832031, -0.04467010498046875, -0.04034233093261719, -0.036014556884765625, -0.03168678283691406, -0.0273590087890625, -0.023031234741210938, -0.018703460693359375, -0.014375686645507812, -0.01004791259765625, -0.0057201385498046875, -0.001392364501953125, 0.0029354095458984375, 0.00726318359375, 0.011590957641601562, 0.015918731689453125, 0.020246505737304688, 0.02457427978515625, 0.028902053833007812, 0.033229827880859375, 0.03755760192871094, 0.0418853759765625, 0.04621315002441406, 0.050540924072265625, 0.05486869812011719, 0.05919647216796875, 0.06352424621582031, 0.06785202026367188, 0.07217979431152344, 0.076507568359375, 0.08083534240722656, 0.08516311645507812, 0.08949089050292969, 0.09381866455078125, 0.09814643859863281, 0.10247421264648438, 0.10680198669433594, 0.1111297607421875, 0.11545753479003906, 0.11978530883789062, 0.12411308288574219, 0.12844085693359375, 0.1327686309814453, 0.13709640502929688, 0.14142417907714844, 0.145751953125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 1.0, 6.0, 8.0, 13.0, 19.0, 25.0, 70.0, 154.0, 229.0, 215.0, 124.0, 64.0, 29.0, 10.0, 11.0, 7.0, 8.0, 3.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12841796875, -0.12396430969238281, -0.11951065063476562, -0.11505699157714844, -0.11060333251953125, -0.10614967346191406, -0.10169601440429688, -0.09724235534667969, -0.0927886962890625, -0.08833503723144531, -0.08388137817382812, -0.07942771911621094, -0.07497406005859375, -0.07052040100097656, -0.06606674194335938, -0.06161308288574219, -0.057159423828125, -0.05270576477050781, -0.048252105712890625, -0.04379844665527344, -0.03934478759765625, -0.03489112854003906, -0.030437469482421875, -0.025983810424804688, -0.0215301513671875, -0.017076492309570312, -0.012622833251953125, -0.008169174194335938, -0.00371551513671875, 0.0007381439208984375, 0.005191802978515625, 0.009645462036132812, 0.01409912109375, 0.018552780151367188, 0.023006439208984375, 0.027460098266601562, 0.03191375732421875, 0.03636741638183594, 0.040821075439453125, 0.04527473449707031, 0.0497283935546875, 0.05418205261230469, 0.058635711669921875, 0.06308937072753906, 0.06754302978515625, 0.07199668884277344, 0.07645034790039062, 0.08090400695800781, 0.085357666015625, 0.08981132507324219, 0.09426498413085938, 0.09871864318847656, 0.10317230224609375, 0.10762596130371094, 0.11207962036132812, 0.11653327941894531, 0.1209869384765625, 0.1254405975341797, 0.12989425659179688, 0.13434791564941406, 0.13880157470703125, 0.14325523376464844, 0.14770889282226562, 0.1521625518798828, 0.1566162109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 8.0, 10.0, 16.0, 16.0, 19.0, 25.0, 45.0, 59.0, 90.0, 130.0, 223.0, 379.0, 711.0, 1893.0, 16006.0, 816541.0, 204691.0, 5098.0, 1227.0, 513.0, 270.0, 181.0, 100.0, 77.0, 67.0, 38.0, 23.0, 18.0, 19.0, 9.0, 11.0, 8.0, 6.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.314697265625, -0.3053855895996094, -0.29607391357421875, -0.2867622375488281, -0.2774505615234375, -0.2681388854980469, -0.25882720947265625, -0.24951553344726562, -0.240203857421875, -0.23089218139648438, -0.22158050537109375, -0.21226882934570312, -0.2029571533203125, -0.19364547729492188, -0.18433380126953125, -0.17502212524414062, -0.16571044921875, -0.15639877319335938, -0.14708709716796875, -0.13777542114257812, -0.1284637451171875, -0.11915206909179688, -0.10984039306640625, -0.10052871704101562, -0.091217041015625, -0.08190536499023438, -0.07259368896484375, -0.06328201293945312, -0.0539703369140625, -0.044658660888671875, -0.03534698486328125, -0.026035308837890625, -0.0167236328125, -0.007411956787109375, 0.00189971923828125, 0.011211395263671875, 0.0205230712890625, 0.029834747314453125, 0.03914642333984375, 0.048458099365234375, 0.057769775390625, 0.06708145141601562, 0.07639312744140625, 0.08570480346679688, 0.0950164794921875, 0.10432815551757812, 0.11363983154296875, 0.12295150756835938, 0.13226318359375, 0.14157485961914062, 0.15088653564453125, 0.16019821166992188, 0.1695098876953125, 0.17882156372070312, 0.18813323974609375, 0.19744491577148438, 0.206756591796875, 0.21606826782226562, 0.22537994384765625, 0.23469161987304688, 0.2440032958984375, 0.2533149719238281, 0.26262664794921875, 0.2719383239746094, 0.28125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 2.0, 5.0, 6.0, 11.0, 9.0, 17.0, 20.0, 17.0, 34.0, 24.0, 27.0, 18.0, 37.0, 35.0, 34.0, 37.0, 49.0, 41.0, 47.0, 48.0, 52.0, 38.0, 40.0, 33.0, 32.0, 40.0, 31.0, 21.0, 34.0, 20.0, 17.0, 25.0, 21.0, 11.0, 12.0, 15.0, 5.0, 6.0, 6.0, 7.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.2369384765625, -0.23050308227539062, -0.22406768798828125, -0.21763229370117188, -0.2111968994140625, -0.20476150512695312, -0.19832611083984375, -0.19189071655273438, -0.185455322265625, -0.17901992797851562, -0.17258453369140625, -0.16614913940429688, -0.1597137451171875, -0.15327835083007812, -0.14684295654296875, -0.14040756225585938, -0.13397216796875, -0.12753677368164062, -0.12110137939453125, -0.11466598510742188, -0.1082305908203125, -0.10179519653320312, -0.09535980224609375, -0.08892440795898438, -0.082489013671875, -0.07605361938476562, -0.06961822509765625, -0.06318283081054688, -0.0567474365234375, -0.050312042236328125, -0.04387664794921875, -0.037441253662109375, -0.031005859375, -0.024570465087890625, -0.01813507080078125, -0.011699676513671875, -0.0052642822265625, 0.001171112060546875, 0.00760650634765625, 0.014041900634765625, 0.020477294921875, 0.026912689208984375, 0.03334808349609375, 0.039783477783203125, 0.0462188720703125, 0.052654266357421875, 0.05908966064453125, 0.06552505493164062, 0.07196044921875, 0.07839584350585938, 0.08483123779296875, 0.09126663208007812, 0.0977020263671875, 0.10413742065429688, 0.11057281494140625, 0.11700820922851562, 0.123443603515625, 0.12987899780273438, 0.13631439208984375, 0.14274978637695312, 0.1491851806640625, 0.15562057495117188, 0.16205596923828125, 0.16849136352539062, 0.1749267578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 11.0, 10.0, 12.0, 21.0, 30.0, 41.0, 67.0, 102.0, 196.0, 375.0, 848.0, 2412.0, 9202.0, 54092.0, 762712.0, 192191.0, 19129.0, 4409.0, 1398.0, 573.0, 280.0, 131.0, 108.0, 68.0, 33.0, 26.0, 14.0, 15.0, 16.0, 6.0, 5.0, 6.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.06640625, -0.06409549713134766, -0.06178474426269531, -0.05947399139404297, -0.057163238525390625, -0.05485248565673828, -0.05254173278808594, -0.050230979919433594, -0.04792022705078125, -0.045609474182128906, -0.04329872131347656, -0.04098796844482422, -0.038677215576171875, -0.03636646270751953, -0.03405570983886719, -0.031744956970214844, -0.0294342041015625, -0.027123451232910156, -0.024812698364257812, -0.02250194549560547, -0.020191192626953125, -0.01788043975830078, -0.015569686889648438, -0.013258934020996094, -0.01094818115234375, -0.008637428283691406, -0.0063266754150390625, -0.004015922546386719, -0.001705169677734375, 0.0006055831909179688, 0.0029163360595703125, 0.005227088928222656, 0.007537841796875, 0.009848594665527344, 0.012159347534179688, 0.014470100402832031, 0.016780853271484375, 0.01909160614013672, 0.021402359008789062, 0.023713111877441406, 0.02602386474609375, 0.028334617614746094, 0.030645370483398438, 0.03295612335205078, 0.035266876220703125, 0.03757762908935547, 0.03988838195800781, 0.042199134826660156, 0.0445098876953125, 0.046820640563964844, 0.04913139343261719, 0.05144214630126953, 0.053752899169921875, 0.05606365203857422, 0.05837440490722656, 0.060685157775878906, 0.06299591064453125, 0.0653066635131836, 0.06761741638183594, 0.06992816925048828, 0.07223892211914062, 0.07454967498779297, 0.07686042785644531, 0.07917118072509766, 0.08148193359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 10.0, 8.0, 17.0, 21.0, 30.0, 75.0, 116.0, 173.0, 176.0, 121.0, 95.0, 41.0, 31.0, 22.0, 12.0, 7.0, 5.0, 8.0, 3.0, 5.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.5556812286376953e-05, -1.5004537999629974e-05, -1.4452263712882996e-05, -1.3899989426136017e-05, -1.3347715139389038e-05, -1.279544085264206e-05, -1.224316656589508e-05, -1.1690892279148102e-05, -1.1138617992401123e-05, -1.0586343705654144e-05, -1.0034069418907166e-05, -9.481795132160187e-06, -8.929520845413208e-06, -8.37724655866623e-06, -7.82497227191925e-06, -7.272697985172272e-06, -6.720423698425293e-06, -6.168149411678314e-06, -5.6158751249313354e-06, -5.063600838184357e-06, -4.511326551437378e-06, -3.959052264690399e-06, -3.4067779779434204e-06, -2.8545036911964417e-06, -2.302229404449463e-06, -1.7499551177024841e-06, -1.1976808309555054e-06, -6.454065442085266e-07, -9.313225746154785e-08, 4.591420292854309e-07, 1.0114163160324097e-06, 1.5636906027793884e-06, 2.115964889526367e-06, 2.668239176273346e-06, 3.2205134630203247e-06, 3.7727877497673035e-06, 4.325062036514282e-06, 4.877336323261261e-06, 5.42961061000824e-06, 5.9818848967552185e-06, 6.534159183502197e-06, 7.086433470249176e-06, 7.638707756996155e-06, 8.190982043743134e-06, 8.743256330490112e-06, 9.295530617237091e-06, 9.84780490398407e-06, 1.0400079190731049e-05, 1.0952353477478027e-05, 1.1504627764225006e-05, 1.2056902050971985e-05, 1.2609176337718964e-05, 1.3161450624465942e-05, 1.3713724911212921e-05, 1.42659991979599e-05, 1.4818273484706879e-05, 1.5370547771453857e-05, 1.5922822058200836e-05, 1.6475096344947815e-05, 1.7027370631694794e-05, 1.7579644918441772e-05, 1.813191920518875e-05, 1.868419349193573e-05, 1.923646777868271e-05, 1.9788742065429688e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 9.0, 7.0, 14.0, 19.0, 35.0, 64.0, 89.0, 138.0, 275.0, 512.0, 1363.0, 5115.0, 32513.0, 704583.0, 279616.0, 18677.0, 3339.0, 1120.0, 452.0, 235.0, 152.0, 82.0, 38.0, 28.0, 32.0, 23.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.107177734375, -0.10401344299316406, -0.10084915161132812, -0.09768486022949219, -0.09452056884765625, -0.09135627746582031, -0.08819198608398438, -0.08502769470214844, -0.0818634033203125, -0.07869911193847656, -0.07553482055664062, -0.07237052917480469, -0.06920623779296875, -0.06604194641113281, -0.06287765502929688, -0.05971336364746094, -0.056549072265625, -0.05338478088378906, -0.050220489501953125, -0.04705619812011719, -0.04389190673828125, -0.04072761535644531, -0.037563323974609375, -0.03439903259277344, -0.0312347412109375, -0.028070449829101562, -0.024906158447265625, -0.021741867065429688, -0.01857757568359375, -0.015413284301757812, -0.012248992919921875, -0.009084701538085938, -0.00592041015625, -0.0027561187744140625, 0.000408172607421875, 0.0035724639892578125, 0.00673675537109375, 0.009901046752929688, 0.013065338134765625, 0.016229629516601562, 0.0193939208984375, 0.022558212280273438, 0.025722503662109375, 0.028886795043945312, 0.03205108642578125, 0.03521537780761719, 0.038379669189453125, 0.04154396057128906, 0.044708251953125, 0.04787254333496094, 0.051036834716796875, 0.05420112609863281, 0.05736541748046875, 0.06052970886230469, 0.06369400024414062, 0.06685829162597656, 0.0700225830078125, 0.07318687438964844, 0.07635116577148438, 0.07951545715332031, 0.08267974853515625, 0.08584403991699219, 0.08900833129882812, 0.09217262268066406, 0.0953369140625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 5.0, 6.0, 6.0, 12.0, 15.0, 19.0, 29.0, 45.0, 57.0, 63.0, 87.0, 97.0, 128.0, 118.0, 94.0, 71.0, 35.0, 30.0, 21.0, 17.0, 14.0, 3.0, 5.0, 10.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051483154296875, -0.049364566802978516, -0.04724597930908203, -0.04512739181518555, -0.04300880432128906, -0.04089021682739258, -0.038771629333496094, -0.03665304183959961, -0.034534454345703125, -0.03241586685180664, -0.030297279357910156, -0.028178691864013672, -0.026060104370117188, -0.023941516876220703, -0.02182292938232422, -0.019704341888427734, -0.01758575439453125, -0.015467166900634766, -0.013348579406738281, -0.011229991912841797, -0.009111404418945312, -0.006992816925048828, -0.004874229431152344, -0.0027556419372558594, -0.000637054443359375, 0.0014815330505371094, 0.0036001205444335938, 0.005718708038330078, 0.007837295532226562, 0.009955883026123047, 0.012074470520019531, 0.014193058013916016, 0.0163116455078125, 0.018430233001708984, 0.02054882049560547, 0.022667407989501953, 0.024785995483398438, 0.026904582977294922, 0.029023170471191406, 0.03114175796508789, 0.033260345458984375, 0.03537893295288086, 0.037497520446777344, 0.03961610794067383, 0.04173469543457031, 0.0438532829284668, 0.04597187042236328, 0.048090457916259766, 0.05020904541015625, 0.052327632904052734, 0.05444622039794922, 0.0565648078918457, 0.05868339538574219, 0.06080198287963867, 0.06292057037353516, 0.06503915786743164, 0.06715774536132812, 0.06927633285522461, 0.0713949203491211, 0.07351350784301758, 0.07563209533691406, 0.07775068283081055, 0.07986927032470703, 0.08198785781860352, 0.0841064453125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 9.0, 30.0, 101.0, 285.0, 348.0, 162.0, 44.0, 8.0, 5.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4760022163391113, -1.4173980951309204, -1.358794093132019, -1.3001899719238281, -1.2415859699249268, -1.1829818487167358, -1.124377727508545, -1.0657737255096436, -1.0071697235107422, -0.948565661907196, -0.8899616003036499, -0.831357479095459, -0.7727534770965576, -0.7141493558883667, -0.6555452942848206, -0.5969412326812744, -0.5383371114730835, -0.47973304986953735, -0.4211289882659912, -0.3625248968601227, -0.30392083525657654, -0.2453167736530304, -0.18671268224716187, -0.12810862064361572, -0.06950455904006958, -0.01090048998594284, 0.0477035790681839, 0.10630765557289124, 0.16491171717643738, 0.22351577877998352, 0.28211987018585205, 0.3407239317893982, 0.39932799339294434, 0.4579320549964905, 0.5165361166000366, 0.5751402378082275, 0.6337442398071289, 0.6923483610153198, 0.750952422618866, 0.8095564842224121, 0.8681605458259583, 0.9267646074295044, 0.9853686690330505, 1.0439727306365967, 1.1025768518447876, 1.161180853843689, 1.2197849750518799, 1.2783889770507812, 1.3369930982589722, 1.395597219467163, 1.4542012214660645, 1.5128053426742554, 1.5714093446731567, 1.6300134658813477, 1.688617467880249, 1.74722158908844, 1.8058257102966309, 1.8644298315048218, 1.9230338335037231, 1.981637954711914, 2.0402419567108154, 2.098845958709717, 2.1574501991271973, 2.2160542011260986, 2.274658203125]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 4.0, 5.0, 15.0, 18.0, 17.0, 22.0, 30.0, 27.0, 30.0, 27.0, 21.0, 32.0, 34.0, 47.0, 46.0, 45.0, 48.0, 62.0, 59.0, 34.0, 37.0, 41.0, 34.0, 42.0, 30.0, 31.0, 21.0, 20.0, 10.0, 20.0, 13.0, 14.0, 8.0, 5.0, 7.0, 3.0, 7.0, 6.0, 8.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.124292254447937, -1.0891640186309814, -1.0540356636047363, -1.0189074277877808, -0.9837791323661804, -0.9486508369445801, -0.9135226011276245, -0.8783943057060242, -0.8432660102844238, -0.8081377148628235, -0.7730094194412231, -0.7378811836242676, -0.7027528882026672, -0.6676245927810669, -0.6324963569641113, -0.597368061542511, -0.5622397661209106, -0.5271114706993103, -0.49198320508003235, -0.4568549394607544, -0.42172664403915405, -0.3865983486175537, -0.35147008299827576, -0.3163418173789978, -0.28121352195739746, -0.2460852414369583, -0.21095696091651917, -0.17582868039608002, -0.14070039987564087, -0.10557211935520172, -0.07044383883476257, -0.035315558314323425, -0.00018715858459472656, 0.03494112193584442, 0.07006940245628357, 0.10519768297672272, 0.14032596349716187, 0.175454244017601, 0.21058252453804016, 0.2457108050584793, 0.28083908557891846, 0.3159673810005188, 0.35109564661979675, 0.3862239122390747, 0.42135220766067505, 0.4564805030822754, 0.49160876870155334, 0.5267370343208313, 0.5618653297424316, 0.596993625164032, 0.6321219205856323, 0.6672501564025879, 0.7023784518241882, 0.7375067472457886, 0.7726349830627441, 0.8077632784843445, 0.8428915739059448, 0.8780198693275452, 0.9131481647491455, 0.9482764005661011, 0.9834046959877014, 1.0185329914093018, 1.0536612272262573, 1.0887895822525024, 1.123917818069458]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 4.0, 12.0, 13.0, 20.0, 38.0, 39.0, 79.0, 126.0, 220.0, 472.0, 1394.0, 6543.0, 79268.0, 4018983.0, 77771.0, 6876.0, 1383.0, 495.0, 220.0, 124.0, 75.0, 38.0, 29.0, 18.0, 11.0, 4.0, 11.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1640625, -0.15850067138671875, -0.1529388427734375, -0.14737701416015625, -0.141815185546875, -0.13625335693359375, -0.1306915283203125, -0.12512969970703125, -0.11956787109375, -0.11400604248046875, -0.1084442138671875, -0.10288238525390625, -0.097320556640625, -0.09175872802734375, -0.0861968994140625, -0.08063507080078125, -0.0750732421875, -0.06951141357421875, -0.0639495849609375, -0.05838775634765625, -0.052825927734375, -0.04726409912109375, -0.0417022705078125, -0.03614044189453125, -0.03057861328125, -0.02501678466796875, -0.0194549560546875, -0.01389312744140625, -0.008331298828125, -0.00276947021484375, 0.0027923583984375, 0.00835418701171875, 0.013916015625, 0.01947784423828125, 0.0250396728515625, 0.03060150146484375, 0.036163330078125, 0.04172515869140625, 0.0472869873046875, 0.05284881591796875, 0.05841064453125, 0.06397247314453125, 0.0695343017578125, 0.07509613037109375, 0.080657958984375, 0.08621978759765625, 0.0917816162109375, 0.09734344482421875, 0.1029052734375, 0.10846710205078125, 0.1140289306640625, 0.11959075927734375, 0.125152587890625, 0.13071441650390625, 0.1362762451171875, 0.14183807373046875, 0.14739990234375, 0.15296173095703125, 0.1585235595703125, 0.16408538818359375, 0.169647216796875, 0.17520904541015625, 0.1807708740234375, 0.18633270263671875, 0.19189453125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 5.0, 6.0, 9.0, 19.0, 16.0, 69.0, 116.0, 221.0, 231.0, 150.0, 78.0, 29.0, 20.0, 8.0, 8.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13037109375, -0.12589073181152344, -0.12141036987304688, -0.11693000793457031, -0.11244964599609375, -0.10796928405761719, -0.10348892211914062, -0.09900856018066406, -0.0945281982421875, -0.09004783630371094, -0.08556747436523438, -0.08108711242675781, -0.07660675048828125, -0.07212638854980469, -0.06764602661132812, -0.06316566467285156, -0.058685302734375, -0.05420494079589844, -0.049724578857421875, -0.04524421691894531, -0.04076385498046875, -0.03628349304199219, -0.031803131103515625, -0.027322769165039062, -0.0228424072265625, -0.018362045288085938, -0.013881683349609375, -0.009401321411132812, -0.00492095947265625, -0.0004405975341796875, 0.004039764404296875, 0.008520126342773438, 0.01300048828125, 0.017480850219726562, 0.021961212158203125, 0.026441574096679688, 0.03092193603515625, 0.03540229797363281, 0.039882659912109375, 0.04436302185058594, 0.0488433837890625, 0.05332374572753906, 0.057804107666015625, 0.06228446960449219, 0.06676483154296875, 0.07124519348144531, 0.07572555541992188, 0.08020591735839844, 0.084686279296875, 0.08916664123535156, 0.09364700317382812, 0.09812736511230469, 0.10260772705078125, 0.10708808898925781, 0.11156845092773438, 0.11604881286621094, 0.1205291748046875, 0.12500953674316406, 0.12948989868164062, 0.1339702606201172, 0.13845062255859375, 0.1429309844970703, 0.14741134643554688, 0.15189170837402344, 0.1563720703125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 4.0, 15.0, 23.0, 50.0, 101.0, 160.0, 315.0, 621.0, 1324.0, 3002.0, 8849.0, 36460.0, 346227.0, 3658107.0, 111288.0, 18482.0, 5402.0, 2019.0, 909.0, 450.0, 215.0, 109.0, 62.0, 43.0, 13.0, 16.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.135009765625, -0.13118362426757812, -0.12735748291015625, -0.12353134155273438, -0.1197052001953125, -0.11587905883789062, -0.11205291748046875, -0.10822677612304688, -0.104400634765625, -0.10057449340820312, -0.09674835205078125, -0.09292221069335938, -0.0890960693359375, -0.08526992797851562, -0.08144378662109375, -0.07761764526367188, -0.07379150390625, -0.06996536254882812, -0.06613922119140625, -0.062313079833984375, -0.0584869384765625, -0.054660797119140625, -0.05083465576171875, -0.047008514404296875, -0.043182373046875, -0.039356231689453125, -0.03553009033203125, -0.031703948974609375, -0.0278778076171875, -0.024051666259765625, -0.02022552490234375, -0.016399383544921875, -0.0125732421875, -0.008747100830078125, -0.00492095947265625, -0.001094818115234375, 0.0027313232421875, 0.006557464599609375, 0.01038360595703125, 0.014209747314453125, 0.018035888671875, 0.021862030029296875, 0.02568817138671875, 0.029514312744140625, 0.0333404541015625, 0.037166595458984375, 0.04099273681640625, 0.044818878173828125, 0.04864501953125, 0.052471160888671875, 0.05629730224609375, 0.060123443603515625, 0.0639495849609375, 0.06777572631835938, 0.07160186767578125, 0.07542800903320312, 0.079254150390625, 0.08308029174804688, 0.08690643310546875, 0.09073257446289062, 0.0945587158203125, 0.09838485717773438, 0.10221099853515625, 0.10603713989257812, 0.10986328125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 3.0, 13.0, 9.0, 15.0, 27.0, 30.0, 51.0, 69.0, 110.0, 229.0, 492.0, 2127.0, 408.0, 159.0, 103.0, 55.0, 41.0, 20.0, 33.0, 20.0, 10.0, 8.0, 2.0, 7.0, 1.0, 4.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04974365234375, -0.04820871353149414, -0.04667377471923828, -0.04513883590698242, -0.04360389709472656, -0.0420689582824707, -0.040534019470214844, -0.038999080657958984, -0.037464141845703125, -0.035929203033447266, -0.034394264221191406, -0.03285932540893555, -0.03132438659667969, -0.029789447784423828, -0.02825450897216797, -0.02671957015991211, -0.02518463134765625, -0.02364969253540039, -0.02211475372314453, -0.020579814910888672, -0.019044876098632812, -0.017509937286376953, -0.015974998474121094, -0.014440059661865234, -0.012905120849609375, -0.011370182037353516, -0.009835243225097656, -0.008300304412841797, -0.0067653656005859375, -0.005230426788330078, -0.0036954879760742188, -0.0021605491638183594, -0.0006256103515625, 0.0009093284606933594, 0.0024442672729492188, 0.003979206085205078, 0.0055141448974609375, 0.007049083709716797, 0.008584022521972656, 0.010118961334228516, 0.011653900146484375, 0.013188838958740234, 0.014723777770996094, 0.016258716583251953, 0.017793655395507812, 0.019328594207763672, 0.02086353302001953, 0.02239847183227539, 0.02393341064453125, 0.02546834945678711, 0.02700328826904297, 0.028538227081298828, 0.030073165893554688, 0.03160810470581055, 0.033143043518066406, 0.034677982330322266, 0.036212921142578125, 0.037747859954833984, 0.039282798767089844, 0.0408177375793457, 0.04235267639160156, 0.04388761520385742, 0.04542255401611328, 0.04695749282836914, 0.048492431640625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 9.0, 20.0, 49.0, 117.0, 284.0, 306.0, 160.0, 41.0, 10.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33423781394958496, -0.3136671781539917, -0.2930965721607208, -0.27252593636512756, -0.2519553303718567, -0.23138469457626343, -0.21081405878067017, -0.1902434378862381, -0.16967281699180603, -0.14910219609737396, -0.1285315752029419, -0.10796093940734863, -0.08739031851291656, -0.0668196976184845, -0.04624906927347183, -0.025678440928459167, -0.0051078200340271, 0.015462804585695267, 0.03603342920541763, 0.05660405382514, 0.07717467844486237, 0.09774529933929443, 0.1183159276843071, 0.13888655602931976, 0.15945717692375183, 0.1800277978181839, 0.20059841871261597, 0.22116905450820923, 0.2417396754026413, 0.26231029629707336, 0.2828809320926666, 0.3034515380859375, 0.32402217388153076, 0.344592809677124, 0.3651634156703949, 0.38573405146598816, 0.40630465745925903, 0.4268752932548523, 0.44744592905044556, 0.4680165648460388, 0.4885871708393097, 0.5091577768325806, 0.5297284126281738, 0.5502990484237671, 0.5708696842193604, 0.5914403200149536, 0.6120108962059021, 0.6325815320014954, 0.6531521677970886, 0.6737228035926819, 0.6942934393882751, 0.7148640155792236, 0.7354346513748169, 0.7560052871704102, 0.7765759229660034, 0.7971465587615967, 0.8177171945571899, 0.8382878303527832, 0.8588584661483765, 0.879429042339325, 0.8999996781349182, 0.9205703139305115, 0.9411409497261047, 0.961711585521698, 0.9822821617126465]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 5.0, 2.0, 9.0, 4.0, 11.0, 12.0, 11.0, 14.0, 15.0, 19.0, 24.0, 27.0, 25.0, 40.0, 27.0, 22.0, 39.0, 33.0, 33.0, 34.0, 36.0, 57.0, 32.0, 40.0, 42.0, 31.0, 38.0, 31.0, 33.0, 40.0, 33.0, 23.0, 27.0, 21.0, 11.0, 16.0, 15.0, 15.0, 16.0, 9.0, 6.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1309802532196045, -0.12680184841156006, -0.12262345850467682, -0.11844506114721298, -0.11426666378974915, -0.11008826643228531, -0.10590986907482147, -0.10173147171735764, -0.0975530743598938, -0.09337467700242996, -0.08919627964496613, -0.08501788228750229, -0.08083948493003845, -0.07666108757257462, -0.07248269021511078, -0.06830429285764694, -0.0641258955001831, -0.05994749814271927, -0.05576910078525543, -0.051590703427791595, -0.04741230607032776, -0.04323390871286392, -0.039055511355400085, -0.03487711399793625, -0.030698716640472412, -0.026520319283008575, -0.02234192192554474, -0.018163524568080902, -0.013985127210617065, -0.009806729853153229, -0.005628332495689392, -0.0014499351382255554, 0.0027284622192382812, 0.006906859576702118, 0.011085256934165955, 0.015263654291629791, 0.019442051649093628, 0.023620449006557465, 0.0277988463640213, 0.03197724372148514, 0.036155641078948975, 0.04033403843641281, 0.04451243579387665, 0.048690833151340485, 0.05286923050880432, 0.05704762786626816, 0.061226025223731995, 0.06540442258119583, 0.06958281993865967, 0.0737612172961235, 0.07793961465358734, 0.08211801201105118, 0.08629640936851501, 0.09047480672597885, 0.09465320408344269, 0.09883160144090652, 0.10300999879837036, 0.1071883961558342, 0.11136679351329803, 0.11554519087076187, 0.11972358822822571, 0.12390198558568954, 0.12808038294315338, 0.13225877285003662, 0.13643717765808105]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 6.0, 10.0, 13.0, 28.0, 54.0, 69.0, 149.0, 208.0, 448.0, 966.0, 2478.0, 9549.0, 81217.0, 813399.0, 122772.0, 12037.0, 2984.0, 1041.0, 493.0, 255.0, 149.0, 77.0, 38.0, 45.0, 19.0, 14.0, 4.0, 7.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.19921875, -0.19345664978027344, -0.18769454956054688, -0.1819324493408203, -0.17617034912109375, -0.1704082489013672, -0.16464614868164062, -0.15888404846191406, -0.1531219482421875, -0.14735984802246094, -0.14159774780273438, -0.1358356475830078, -0.13007354736328125, -0.12431144714355469, -0.11854934692382812, -0.11278724670410156, -0.107025146484375, -0.10126304626464844, -0.09550094604492188, -0.08973884582519531, -0.08397674560546875, -0.07821464538574219, -0.07245254516601562, -0.06669044494628906, -0.0609283447265625, -0.05516624450683594, -0.049404144287109375, -0.04364204406738281, -0.03787994384765625, -0.03211784362792969, -0.026355743408203125, -0.020593643188476562, -0.01483154296875, -0.009069442749023438, -0.003307342529296875, 0.0024547576904296875, 0.00821685791015625, 0.013978958129882812, 0.019741058349609375, 0.025503158569335938, 0.0312652587890625, 0.03702735900878906, 0.042789459228515625, 0.04855155944824219, 0.05431365966796875, 0.06007575988769531, 0.06583786010742188, 0.07159996032714844, 0.077362060546875, 0.08312416076660156, 0.08888626098632812, 0.09464836120605469, 0.10041046142578125, 0.10617256164550781, 0.11193466186523438, 0.11769676208496094, 0.1234588623046875, 0.12922096252441406, 0.13498306274414062, 0.1407451629638672, 0.14650726318359375, 0.1522693634033203, 0.15803146362304688, 0.16379356384277344, 0.1695556640625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 2.0, 9.0, 12.0, 16.0, 20.0, 64.0, 129.0, 216.0, 217.0, 158.0, 73.0, 35.0, 12.0, 15.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1298828125, -0.12541961669921875, -0.1209564208984375, -0.11649322509765625, -0.112030029296875, -0.10756683349609375, -0.1031036376953125, -0.09864044189453125, -0.09417724609375, -0.08971405029296875, -0.0852508544921875, -0.08078765869140625, -0.076324462890625, -0.07186126708984375, -0.0673980712890625, -0.06293487548828125, -0.0584716796875, -0.05400848388671875, -0.0495452880859375, -0.04508209228515625, -0.040618896484375, -0.03615570068359375, -0.0316925048828125, -0.02722930908203125, -0.02276611328125, -0.01830291748046875, -0.0138397216796875, -0.00937652587890625, -0.004913330078125, -0.00045013427734375, 0.0040130615234375, 0.00847625732421875, 0.012939453125, 0.01740264892578125, 0.0218658447265625, 0.02632904052734375, 0.030792236328125, 0.03525543212890625, 0.0397186279296875, 0.04418182373046875, 0.04864501953125, 0.05310821533203125, 0.0575714111328125, 0.06203460693359375, 0.066497802734375, 0.07096099853515625, 0.0754241943359375, 0.07988739013671875, 0.0843505859375, 0.08881378173828125, 0.0932769775390625, 0.09774017333984375, 0.102203369140625, 0.10666656494140625, 0.1111297607421875, 0.11559295654296875, 0.12005615234375, 0.12451934814453125, 0.1289825439453125, 0.13344573974609375, 0.137908935546875, 0.14237213134765625, 0.1468353271484375, 0.15129852294921875, 0.15576171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 8.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 10.0, 10.0, 10.0, 17.0, 26.0, 23.0, 46.0, 47.0, 67.0, 112.0, 110.0, 247.0, 518.0, 1332.0, 6186.0, 120447.0, 871739.0, 42213.0, 3412.0, 903.0, 388.0, 193.0, 118.0, 74.0, 54.0, 57.0, 35.0, 30.0, 24.0, 12.0, 16.0, 12.0, 10.0, 9.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.2264404296875, -0.22021102905273438, -0.21398162841796875, -0.20775222778320312, -0.2015228271484375, -0.19529342651367188, -0.18906402587890625, -0.18283462524414062, -0.176605224609375, -0.17037582397460938, -0.16414642333984375, -0.15791702270507812, -0.1516876220703125, -0.14545822143554688, -0.13922882080078125, -0.13299942016601562, -0.12677001953125, -0.12054061889648438, -0.11431121826171875, -0.10808181762695312, -0.1018524169921875, -0.09562301635742188, -0.08939361572265625, -0.08316421508789062, -0.076934814453125, -0.07070541381835938, -0.06447601318359375, -0.058246612548828125, -0.0520172119140625, -0.045787811279296875, -0.03955841064453125, -0.033329010009765625, -0.027099609375, -0.020870208740234375, -0.01464080810546875, -0.008411407470703125, -0.0021820068359375, 0.004047393798828125, 0.01027679443359375, 0.016506195068359375, 0.022735595703125, 0.028964996337890625, 0.03519439697265625, 0.041423797607421875, 0.0476531982421875, 0.053882598876953125, 0.06011199951171875, 0.06634140014648438, 0.07257080078125, 0.07880020141601562, 0.08502960205078125, 0.09125900268554688, 0.0974884033203125, 0.10371780395507812, 0.10994720458984375, 0.11617660522460938, 0.122406005859375, 0.12863540649414062, 0.13486480712890625, 0.14109420776367188, 0.1473236083984375, 0.15355300903320312, 0.15978240966796875, 0.16601181030273438, 0.1722412109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 9.0, 8.0, 16.0, 18.0, 25.0, 23.0, 22.0, 21.0, 25.0, 29.0, 33.0, 39.0, 37.0, 46.0, 38.0, 39.0, 57.0, 48.0, 37.0, 27.0, 50.0, 30.0, 41.0, 28.0, 31.0, 29.0, 26.0, 20.0, 19.0, 19.0, 17.0, 18.0, 12.0, 6.0, 7.0, 6.0, 4.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.2034912109375, -0.19748878479003906, -0.19148635864257812, -0.1854839324951172, -0.17948150634765625, -0.1734790802001953, -0.16747665405273438, -0.16147422790527344, -0.1554718017578125, -0.14946937561035156, -0.14346694946289062, -0.1374645233154297, -0.13146209716796875, -0.1254596710205078, -0.11945724487304688, -0.11345481872558594, -0.107452392578125, -0.10144996643066406, -0.09544754028320312, -0.08944511413574219, -0.08344268798828125, -0.07744026184082031, -0.07143783569335938, -0.06543540954589844, -0.0594329833984375, -0.05343055725097656, -0.047428131103515625, -0.04142570495605469, -0.03542327880859375, -0.029420852661132812, -0.023418426513671875, -0.017416000366210938, -0.01141357421875, -0.0054111480712890625, 0.000591278076171875, 0.0065937042236328125, 0.01259613037109375, 0.018598556518554688, 0.024600982666015625, 0.030603408813476562, 0.0366058349609375, 0.04260826110839844, 0.048610687255859375, 0.05461311340332031, 0.06061553955078125, 0.06661796569824219, 0.07262039184570312, 0.07862281799316406, 0.084625244140625, 0.09062767028808594, 0.09663009643554688, 0.10263252258300781, 0.10863494873046875, 0.11463737487792969, 0.12063980102539062, 0.12664222717285156, 0.1326446533203125, 0.13864707946777344, 0.14464950561523438, 0.1506519317626953, 0.15665435791015625, 0.1626567840576172, 0.16865921020507812, 0.17466163635253906, 0.1806640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 8.0, 6.0, 14.0, 24.0, 26.0, 23.0, 47.0, 56.0, 99.0, 152.0, 299.0, 570.0, 1378.0, 3474.0, 10603.0, 44366.0, 433330.0, 488107.0, 48352.0, 11048.0, 3752.0, 1377.0, 616.0, 301.0, 149.0, 109.0, 60.0, 38.0, 38.0, 31.0, 20.0, 15.0, 18.0, 9.0, 6.0, 9.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.049713134765625, -0.048207759857177734, -0.04670238494873047, -0.0451970100402832, -0.04369163513183594, -0.04218626022338867, -0.040680885314941406, -0.03917551040649414, -0.037670135498046875, -0.03616476058959961, -0.034659385681152344, -0.03315401077270508, -0.03164863586425781, -0.030143260955810547, -0.02863788604736328, -0.027132511138916016, -0.02562713623046875, -0.024121761322021484, -0.02261638641357422, -0.021111011505126953, -0.019605636596679688, -0.018100261688232422, -0.016594886779785156, -0.01508951187133789, -0.013584136962890625, -0.01207876205444336, -0.010573387145996094, -0.009068012237548828, -0.0075626373291015625, -0.006057262420654297, -0.004551887512207031, -0.0030465126037597656, -0.0015411376953125, -3.5762786865234375e-05, 0.0014696121215820312, 0.002974987030029297, 0.0044803619384765625, 0.005985736846923828, 0.007491111755371094, 0.00899648666381836, 0.010501861572265625, 0.01200723648071289, 0.013512611389160156, 0.015017986297607422, 0.016523361206054688, 0.018028736114501953, 0.01953411102294922, 0.021039485931396484, 0.02254486083984375, 0.024050235748291016, 0.02555561065673828, 0.027060985565185547, 0.028566360473632812, 0.030071735382080078, 0.031577110290527344, 0.03308248519897461, 0.034587860107421875, 0.03609323501586914, 0.037598609924316406, 0.03910398483276367, 0.04060935974121094, 0.0421147346496582, 0.04362010955810547, 0.045125484466552734, 0.046630859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 5.0, 4.0, 2.0, 3.0, 3.0, 6.0, 9.0, 6.0, 12.0, 24.0, 20.0, 35.0, 36.0, 32.0, 80.0, 95.0, 114.0, 111.0, 94.0, 83.0, 57.0, 45.0, 34.0, 28.0, 12.0, 16.0, 8.0, 4.0, 8.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.049041748046875e-05, -1.0190531611442566e-05, -9.890645742416382e-06, -9.590759873390198e-06, -9.290874004364014e-06, -8.99098813533783e-06, -8.691102266311646e-06, -8.391216397285461e-06, -8.091330528259277e-06, -7.791444659233093e-06, -7.491558790206909e-06, -7.191672921180725e-06, -6.891787052154541e-06, -6.591901183128357e-06, -6.292015314102173e-06, -5.992129445075989e-06, -5.692243576049805e-06, -5.392357707023621e-06, -5.0924718379974365e-06, -4.7925859689712524e-06, -4.492700099945068e-06, -4.192814230918884e-06, -3.8929283618927e-06, -3.593042492866516e-06, -3.293156623840332e-06, -2.993270754814148e-06, -2.693384885787964e-06, -2.3934990167617798e-06, -2.0936131477355957e-06, -1.7937272787094116e-06, -1.4938414096832275e-06, -1.1939555406570435e-06, -8.940696716308594e-07, -5.941838026046753e-07, -2.942979335784912e-07, 5.587935447692871e-09, 3.0547380447387695e-07, 6.05359673500061e-07, 9.052455425262451e-07, 1.2051314115524292e-06, 1.5050172805786133e-06, 1.8049031496047974e-06, 2.1047890186309814e-06, 2.4046748876571655e-06, 2.7045607566833496e-06, 3.0044466257095337e-06, 3.3043324947357178e-06, 3.604218363761902e-06, 3.904104232788086e-06, 4.20399010181427e-06, 4.503875970840454e-06, 4.803761839866638e-06, 5.103647708892822e-06, 5.403533577919006e-06, 5.7034194469451904e-06, 6.0033053159713745e-06, 6.303191184997559e-06, 6.603077054023743e-06, 6.902962923049927e-06, 7.202848792076111e-06, 7.502734661102295e-06, 7.802620530128479e-06, 8.102506399154663e-06, 8.402392268180847e-06, 8.702278137207031e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 4.0, 18.0, 34.0, 44.0, 94.0, 177.0, 451.0, 1546.0, 7173.0, 83555.0, 908736.0, 40053.0, 4807.0, 1136.0, 415.0, 130.0, 62.0, 39.0, 24.0, 16.0, 11.0, 7.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12225341796875, -0.11889362335205078, -0.11553382873535156, -0.11217403411865234, -0.10881423950195312, -0.1054544448852539, -0.10209465026855469, -0.09873485565185547, -0.09537506103515625, -0.09201526641845703, -0.08865547180175781, -0.0852956771850586, -0.08193588256835938, -0.07857608795166016, -0.07521629333496094, -0.07185649871826172, -0.0684967041015625, -0.06513690948486328, -0.06177711486816406, -0.058417320251464844, -0.055057525634765625, -0.051697731018066406, -0.04833793640136719, -0.04497814178466797, -0.04161834716796875, -0.03825855255126953, -0.03489875793457031, -0.031538963317871094, -0.028179168701171875, -0.024819374084472656, -0.021459579467773438, -0.01809978485107422, -0.014739990234375, -0.011380195617675781, -0.008020401000976562, -0.004660606384277344, -0.001300811767578125, 0.0020589828491210938, 0.0054187774658203125, 0.008778572082519531, 0.01213836669921875, 0.015498161315917969, 0.018857955932617188, 0.022217750549316406, 0.025577545166015625, 0.028937339782714844, 0.03229713439941406, 0.03565692901611328, 0.0390167236328125, 0.04237651824951172, 0.04573631286621094, 0.049096107482910156, 0.052455902099609375, 0.055815696716308594, 0.05917549133300781, 0.06253528594970703, 0.06589508056640625, 0.06925487518310547, 0.07261466979980469, 0.0759744644165039, 0.07933425903320312, 0.08269405364990234, 0.08605384826660156, 0.08941364288330078, 0.0927734375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 15.0, 15.0, 44.0, 57.0, 113.0, 206.0, 239.0, 139.0, 66.0, 51.0, 22.0, 19.0, 12.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12548828125, -0.12220191955566406, -0.11891555786132812, -0.11562919616699219, -0.11234283447265625, -0.10905647277832031, -0.10577011108398438, -0.10248374938964844, -0.0991973876953125, -0.09591102600097656, -0.09262466430664062, -0.08933830261230469, -0.08605194091796875, -0.08276557922363281, -0.07947921752929688, -0.07619285583496094, -0.072906494140625, -0.06962013244628906, -0.06633377075195312, -0.06304740905761719, -0.05976104736328125, -0.05647468566894531, -0.053188323974609375, -0.04990196228027344, -0.0466156005859375, -0.04332923889160156, -0.040042877197265625, -0.03675651550292969, -0.03347015380859375, -0.030183792114257812, -0.026897430419921875, -0.023611068725585938, -0.02032470703125, -0.017038345336914062, -0.013751983642578125, -0.010465621948242188, -0.00717926025390625, -0.0038928985595703125, -0.000606536865234375, 0.0026798248291015625, 0.0059661865234375, 0.009252548217773438, 0.012538909912109375, 0.015825271606445312, 0.01911163330078125, 0.022397994995117188, 0.025684356689453125, 0.028970718383789062, 0.032257080078125, 0.03554344177246094, 0.038829803466796875, 0.04211616516113281, 0.04540252685546875, 0.04868888854980469, 0.051975250244140625, 0.05526161193847656, 0.0585479736328125, 0.06183433532714844, 0.06512069702148438, 0.06840705871582031, 0.07169342041015625, 0.07497978210449219, 0.07826614379882812, 0.08155250549316406, 0.0848388671875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 129.0, 855.0, 22.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8728519678115845, -1.6714962720870972, -1.4701405763626099, -1.2687848806381226, -1.0674291849136353, -0.866073489189148, -0.6647177934646606, -0.46336209774017334, -0.26200640201568604, -0.06065070629119873, 0.14070498943328857, 0.3420606851577759, 0.5434163808822632, 0.7447720766067505, 0.9461277723312378, 1.147483468055725, 1.3488391637802124, 1.5501948595046997, 1.751550555229187, 1.9529062509536743, 2.154262065887451, 2.3556175231933594, 2.556973457336426, 2.758328914642334, 2.9596848487854004, 3.1610405445098877, 3.362396240234375, 3.5637519359588623, 3.7651076316833496, 3.966463327407837, 4.167819023132324, 4.369174957275391, 4.570529937744141, 4.771885871887207, 4.973241329193115, 5.174596786499023, 5.37595272064209, 5.577308654785156, 5.7786641120910645, 5.980019569396973, 6.181375503540039, 6.3827314376831055, 6.584086894989014, 6.785442352294922, 6.986798286437988, 7.188154220581055, 7.389509677886963, 7.590865135192871, 7.7922210693359375, 7.993577003479004, 8.19493293762207, 8.39628791809082, 8.597643852233887, 8.798999786376953, 9.000354766845703, 9.20171070098877, 9.403066635131836, 9.604422569274902, 9.805778503417969, 10.007133483886719, 10.208489418029785, 10.409845352172852, 10.611200332641602, 10.812556266784668, 11.013912200927734]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 3.0, 6.0, 4.0, 6.0, 7.0, 11.0, 13.0, 8.0, 15.0, 27.0, 19.0, 20.0, 26.0, 29.0, 27.0, 36.0, 40.0, 45.0, 40.0, 38.0, 38.0, 42.0, 46.0, 43.0, 34.0, 47.0, 33.0, 29.0, 43.0, 28.0, 38.0, 33.0, 24.0, 13.0, 20.0, 12.0, 6.0, 12.0, 4.0, 10.0, 9.0, 3.0, 4.0, 5.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9678308367729187, -0.9374896287918091, -0.9071483612060547, -0.8768071532249451, -0.8464658856391907, -0.816124677658081, -0.7857834100723267, -0.755442202091217, -0.7251009941101074, -0.6947597861289978, -0.6644185185432434, -0.6340773105621338, -0.6037360429763794, -0.5733948349952698, -0.5430536270141602, -0.5127123594284058, -0.48237109184265137, -0.45202985405921936, -0.42168861627578735, -0.39134740829467773, -0.36100614070892334, -0.3306649327278137, -0.3003236949443817, -0.2699824571609497, -0.2396412193775177, -0.2092999815940857, -0.1789587438106537, -0.14861752092838287, -0.11827628314495087, -0.08793504536151886, -0.05759382247924805, -0.02725258469581604, 0.003088712692260742, 0.03342994675040245, 0.06377118080854416, 0.09411241114139557, 0.12445364892482758, 0.15479488670825958, 0.1851361095905304, 0.2154773473739624, 0.2458185851573944, 0.2761598229408264, 0.3065010607242584, 0.33684229850769043, 0.36718350648880005, 0.39752477407455444, 0.42786598205566406, 0.45820721983909607, 0.4885484576225281, 0.5188896656036377, 0.5492309331893921, 0.5795721411705017, 0.6099134087562561, 0.6402546167373657, 0.6705958843231201, 0.7009370923042297, 0.7312783002853394, 0.761619508266449, 0.7919607758522034, 0.822301983833313, 0.8526432514190674, 0.882984459400177, 0.9133256673812866, 0.943666934967041, 0.9740082025527954]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 4.0, 4.0, 8.0, 4.0, 5.0, 6.0, 11.0, 15.0, 26.0, 33.0, 59.0, 129.0, 272.0, 600.0, 1441.0, 4157.0, 14717.0, 228267.0, 3919925.0, 17094.0, 4518.0, 1658.0, 634.0, 339.0, 152.0, 78.0, 51.0, 26.0, 11.0, 9.0, 7.0, 7.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.17138671875, -0.16649627685546875, -0.1616058349609375, -0.15671539306640625, -0.151824951171875, -0.14693450927734375, -0.1420440673828125, -0.13715362548828125, -0.13226318359375, -0.12737274169921875, -0.1224822998046875, -0.11759185791015625, -0.112701416015625, -0.10781097412109375, -0.1029205322265625, -0.09803009033203125, -0.0931396484375, -0.08824920654296875, -0.0833587646484375, -0.07846832275390625, -0.073577880859375, -0.06868743896484375, -0.0637969970703125, -0.05890655517578125, -0.05401611328125, -0.04912567138671875, -0.0442352294921875, -0.03934478759765625, -0.034454345703125, -0.02956390380859375, -0.0246734619140625, -0.01978302001953125, -0.014892578125, -0.01000213623046875, -0.0051116943359375, -0.00022125244140625, 0.004669189453125, 0.00955963134765625, 0.0144500732421875, 0.01934051513671875, 0.02423095703125, 0.02912139892578125, 0.0340118408203125, 0.03890228271484375, 0.043792724609375, 0.04868316650390625, 0.0535736083984375, 0.05846405029296875, 0.0633544921875, 0.06824493408203125, 0.0731353759765625, 0.07802581787109375, 0.082916259765625, 0.08780670166015625, 0.0926971435546875, 0.09758758544921875, 0.10247802734375, 0.10736846923828125, 0.1122589111328125, 0.11714935302734375, 0.122039794921875, 0.12693023681640625, 0.1318206787109375, 0.13671112060546875, 0.1416015625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 10.0, 20.0, 21.0, 74.0, 144.0, 219.0, 221.0, 126.0, 79.0, 27.0, 21.0, 9.0, 7.0, 7.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1298828125, -0.125396728515625, -0.12091064453125, -0.116424560546875, -0.1119384765625, -0.107452392578125, -0.10296630859375, -0.098480224609375, -0.093994140625, -0.089508056640625, -0.08502197265625, -0.080535888671875, -0.0760498046875, -0.071563720703125, -0.06707763671875, -0.062591552734375, -0.05810546875, -0.053619384765625, -0.04913330078125, -0.044647216796875, -0.0401611328125, -0.035675048828125, -0.03118896484375, -0.026702880859375, -0.022216796875, -0.017730712890625, -0.01324462890625, -0.008758544921875, -0.0042724609375, 0.000213623046875, 0.00469970703125, 0.009185791015625, 0.013671875, 0.018157958984375, 0.02264404296875, 0.027130126953125, 0.0316162109375, 0.036102294921875, 0.04058837890625, 0.045074462890625, 0.049560546875, 0.054046630859375, 0.05853271484375, 0.063018798828125, 0.0675048828125, 0.071990966796875, 0.07647705078125, 0.080963134765625, 0.08544921875, 0.089935302734375, 0.09442138671875, 0.098907470703125, 0.1033935546875, 0.107879638671875, 0.11236572265625, 0.116851806640625, 0.121337890625, 0.125823974609375, 0.13031005859375, 0.134796142578125, 0.1392822265625, 0.143768310546875, 0.14825439453125, 0.152740478515625, 0.1572265625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 10.0, 7.0, 10.0, 25.0, 23.0, 44.0, 61.0, 114.0, 175.0, 296.0, 405.0, 764.0, 1402.0, 3074.0, 10813.0, 306358.0, 3851066.0, 12774.0, 3227.0, 1488.0, 872.0, 475.0, 302.0, 160.0, 113.0, 77.0, 52.0, 34.0, 19.0, 15.0, 12.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255126953125, -0.24602890014648438, -0.23693084716796875, -0.22783279418945312, -0.2187347412109375, -0.20963668823242188, -0.20053863525390625, -0.19144058227539062, -0.182342529296875, -0.17324447631835938, -0.16414642333984375, -0.15504837036132812, -0.1459503173828125, -0.13685226440429688, -0.12775421142578125, -0.11865615844726562, -0.10955810546875, -0.10046005249023438, -0.09136199951171875, -0.08226394653320312, -0.0731658935546875, -0.06406784057617188, -0.05496978759765625, -0.045871734619140625, -0.036773681640625, -0.027675628662109375, -0.01857757568359375, -0.009479522705078125, -0.0003814697265625, 0.008716583251953125, 0.01781463623046875, 0.026912689208984375, 0.0360107421875, 0.045108795166015625, 0.05420684814453125, 0.06330490112304688, 0.0724029541015625, 0.08150100708007812, 0.09059906005859375, 0.09969711303710938, 0.108795166015625, 0.11789321899414062, 0.12699127197265625, 0.13608932495117188, 0.1451873779296875, 0.15428543090820312, 0.16338348388671875, 0.17248153686523438, 0.18157958984375, 0.19067764282226562, 0.19977569580078125, 0.20887374877929688, 0.2179718017578125, 0.22706985473632812, 0.23616790771484375, 0.24526596069335938, 0.254364013671875, 0.2634620666503906, 0.27256011962890625, 0.2816581726074219, 0.2907562255859375, 0.2998542785644531, 0.30895233154296875, 0.3180503845214844, 0.3271484375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 22.0, 23.0, 38.0, 96.0, 622.0, 3069.0, 88.0, 45.0, 24.0, 16.0, 8.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03662109375, -0.035314083099365234, -0.03400707244873047, -0.0327000617980957, -0.03139305114746094, -0.030086040496826172, -0.028779029846191406, -0.02747201919555664, -0.026165008544921875, -0.02485799789428711, -0.023550987243652344, -0.022243976593017578, -0.020936965942382812, -0.019629955291748047, -0.01832294464111328, -0.017015933990478516, -0.01570892333984375, -0.014401912689208984, -0.013094902038574219, -0.011787891387939453, -0.010480880737304688, -0.009173870086669922, -0.007866859436035156, -0.006559848785400391, -0.005252838134765625, -0.003945827484130859, -0.0026388168334960938, -0.0013318061828613281, -2.47955322265625e-05, 0.0012822151184082031, 0.0025892257690429688, 0.0038962364196777344, 0.0052032470703125, 0.006510257720947266, 0.007817268371582031, 0.009124279022216797, 0.010431289672851562, 0.011738300323486328, 0.013045310974121094, 0.01435232162475586, 0.015659332275390625, 0.01696634292602539, 0.018273353576660156, 0.019580364227294922, 0.020887374877929688, 0.022194385528564453, 0.02350139617919922, 0.024808406829833984, 0.02611541748046875, 0.027422428131103516, 0.02872943878173828, 0.030036449432373047, 0.03134346008300781, 0.03265047073364258, 0.033957481384277344, 0.03526449203491211, 0.036571502685546875, 0.03787851333618164, 0.039185523986816406, 0.04049253463745117, 0.04179954528808594, 0.0431065559387207, 0.04441356658935547, 0.045720577239990234, 0.047027587890625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 15.0, 18.0, 27.0, 82.0, 143.0, 212.0, 225.0, 140.0, 72.0, 34.0, 11.0, 10.0, 10.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36155495047569275, -0.35292932391166687, -0.344303697347641, -0.3356780707836151, -0.32705244421958923, -0.31842681765556335, -0.3098011910915375, -0.3011755347251892, -0.29254990816116333, -0.28392428159713745, -0.2752986550331116, -0.2666730284690857, -0.2580474019050598, -0.24942177534103394, -0.24079613387584686, -0.23217050731182098, -0.2235448956489563, -0.21491926908493042, -0.20629364252090454, -0.19766801595687866, -0.18904238939285278, -0.1804167628288269, -0.17179112136363983, -0.16316549479961395, -0.15453986823558807, -0.1459142416715622, -0.13728861510753632, -0.12866298854351044, -0.12003735452890396, -0.11141172796487808, -0.1027860939502716, -0.09416046738624573, -0.08553485572338104, -0.07690922915935516, -0.06828360259532928, -0.05965796858072281, -0.05103234201669693, -0.04240671545267105, -0.033781085163354874, -0.025155454874038696, -0.016529828310012817, -0.00790419988334179, 0.0007214285433292389, 0.009347056970000267, 0.017972685396671295, 0.026598311960697174, 0.03522394225001335, 0.04384957253932953, 0.05247519910335541, 0.06110082566738129, 0.06972645223140717, 0.07835208624601364, 0.08697771281003952, 0.0956033393740654, 0.10422897338867188, 0.11285459995269775, 0.12148022651672363, 0.1301058530807495, 0.1387314796447754, 0.14735710620880127, 0.15598273277282715, 0.16460835933685303, 0.1732340008020401, 0.18185962736606598, 0.19048525393009186]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 1.0, 7.0, 16.0, 4.0, 4.0, 9.0, 8.0, 11.0, 17.0, 17.0, 22.0, 22.0, 24.0, 28.0, 28.0, 41.0, 27.0, 43.0, 46.0, 39.0, 34.0, 30.0, 34.0, 41.0, 40.0, 41.0, 35.0, 26.0, 36.0, 33.0, 33.0, 28.0, 31.0, 21.0, 18.0, 10.0, 19.0, 19.0, 10.0, 6.0, 14.0, 4.0, 5.0, 4.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06788229942321777, -0.06577342748641968, -0.06366455554962158, -0.06155569106340408, -0.05944681912660599, -0.05733794718980789, -0.055229078978300095, -0.0531202107667923, -0.0510113388299942, -0.048902466893196106, -0.04679359868168831, -0.04468473047018051, -0.042575858533382416, -0.04046698659658432, -0.03835811838507652, -0.036249250173568726, -0.03414037823677063, -0.032031506299972534, -0.029922638088464737, -0.02781376801431179, -0.025704897940158844, -0.023596027866005898, -0.02148715779185295, -0.019378287717700005, -0.017269417643547058, -0.015160547569394112, -0.013051677495241165, -0.010942807421088219, -0.008833937346935272, -0.006725067272782326, -0.004616197198629379, -0.002507327124476433, -0.00039845705032348633, 0.0017104130238294601, 0.0038192830979824066, 0.005928153172135353, 0.0080370232462883, 0.010145893320441246, 0.012254763394594193, 0.014363633468747139, 0.016472503542900085, 0.018581373617053032, 0.02069024369120598, 0.022799113765358925, 0.02490798383951187, 0.027016853913664818, 0.029125723987817764, 0.03123459406197071, 0.03334346413612366, 0.03545233607292175, 0.03756120428442955, 0.03967007249593735, 0.04177894443273544, 0.04388781636953354, 0.045996684581041336, 0.04810555279254913, 0.05021442472934723, 0.052323296666145325, 0.05443216487765312, 0.05654103308916092, 0.058649905025959015, 0.06075877696275711, 0.06286764144897461, 0.0649765133857727, 0.0670853853225708]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 16.0, 23.0, 28.0, 59.0, 68.0, 130.0, 222.0, 476.0, 1064.0, 3149.0, 15241.0, 187999.0, 756856.0, 71324.0, 8163.0, 2060.0, 813.0, 423.0, 160.0, 89.0, 61.0, 42.0, 30.0, 16.0, 17.0, 13.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2039794921875, -0.19820594787597656, -0.19243240356445312, -0.1866588592529297, -0.18088531494140625, -0.1751117706298828, -0.16933822631835938, -0.16356468200683594, -0.1577911376953125, -0.15201759338378906, -0.14624404907226562, -0.1404705047607422, -0.13469696044921875, -0.1289234161376953, -0.12314987182617188, -0.11737632751464844, -0.111602783203125, -0.10582923889160156, -0.10005569458007812, -0.09428215026855469, -0.08850860595703125, -0.08273506164550781, -0.07696151733398438, -0.07118797302246094, -0.0654144287109375, -0.05964088439941406, -0.053867340087890625, -0.04809379577636719, -0.04232025146484375, -0.03654670715332031, -0.030773162841796875, -0.024999618530273438, -0.01922607421875, -0.013452529907226562, -0.007678985595703125, -0.0019054412841796875, 0.00386810302734375, 0.009641647338867188, 0.015415191650390625, 0.021188735961914062, 0.0269622802734375, 0.03273582458496094, 0.038509368896484375, 0.04428291320800781, 0.05005645751953125, 0.05583000183105469, 0.061603546142578125, 0.06737709045410156, 0.073150634765625, 0.07892417907714844, 0.08469772338867188, 0.09047126770019531, 0.09624481201171875, 0.10201835632324219, 0.10779190063476562, 0.11356544494628906, 0.1193389892578125, 0.12511253356933594, 0.13088607788085938, 0.1366596221923828, 0.14243316650390625, 0.1482067108154297, 0.15398025512695312, 0.15975379943847656, 0.16552734375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 4.0, 7.0, 9.0, 23.0, 33.0, 78.0, 160.0, 195.0, 189.0, 135.0, 88.0, 32.0, 15.0, 14.0, 6.0, 6.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1302490234375, -0.12574386596679688, -0.12123870849609375, -0.11673355102539062, -0.1122283935546875, -0.10772323608398438, -0.10321807861328125, -0.09871292114257812, -0.094207763671875, -0.08970260620117188, -0.08519744873046875, -0.08069229125976562, -0.0761871337890625, -0.07168197631835938, -0.06717681884765625, -0.06267166137695312, -0.05816650390625, -0.053661346435546875, -0.04915618896484375, -0.044651031494140625, -0.0401458740234375, -0.035640716552734375, -0.03113555908203125, -0.026630401611328125, -0.022125244140625, -0.017620086669921875, -0.01311492919921875, -0.008609771728515625, -0.0041046142578125, 0.000400543212890625, 0.00490570068359375, 0.009410858154296875, 0.013916015625, 0.018421173095703125, 0.02292633056640625, 0.027431488037109375, 0.0319366455078125, 0.036441802978515625, 0.04094696044921875, 0.045452117919921875, 0.049957275390625, 0.054462432861328125, 0.05896759033203125, 0.06347274780273438, 0.0679779052734375, 0.07248306274414062, 0.07698822021484375, 0.08149337768554688, 0.08599853515625, 0.09050369262695312, 0.09500885009765625, 0.09951400756835938, 0.1040191650390625, 0.10852432250976562, 0.11302947998046875, 0.11753463745117188, 0.122039794921875, 0.12654495239257812, 0.13105010986328125, 0.13555526733398438, 0.1400604248046875, 0.14456558227539062, 0.14907073974609375, 0.15357589721679688, 0.1580810546875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 8.0, 2.0, 4.0, 8.0, 11.0, 15.0, 7.0, 25.0, 20.0, 29.0, 39.0, 52.0, 70.0, 105.0, 136.0, 261.0, 497.0, 945.0, 3206.0, 37961.0, 802301.0, 191638.0, 8088.0, 1479.0, 632.0, 345.0, 195.0, 116.0, 94.0, 65.0, 50.0, 33.0, 31.0, 18.0, 11.0, 8.0, 6.0, 11.0, 4.0, 10.0, 13.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.202392578125, -0.19639205932617188, -0.19039154052734375, -0.18439102172851562, -0.1783905029296875, -0.17238998413085938, -0.16638946533203125, -0.16038894653320312, -0.154388427734375, -0.14838790893554688, -0.14238739013671875, -0.13638687133789062, -0.1303863525390625, -0.12438583374023438, -0.11838531494140625, -0.11238479614257812, -0.10638427734375, -0.10038375854492188, -0.09438323974609375, -0.08838272094726562, -0.0823822021484375, -0.07638168334960938, -0.07038116455078125, -0.06438064575195312, -0.058380126953125, -0.052379608154296875, -0.04637908935546875, -0.040378570556640625, -0.0343780517578125, -0.028377532958984375, -0.02237701416015625, -0.016376495361328125, -0.0103759765625, -0.004375457763671875, 0.00162506103515625, 0.007625579833984375, 0.0136260986328125, 0.019626617431640625, 0.02562713623046875, 0.031627655029296875, 0.037628173828125, 0.043628692626953125, 0.04962921142578125, 0.055629730224609375, 0.0616302490234375, 0.06763076782226562, 0.07363128662109375, 0.07963180541992188, 0.08563232421875, 0.09163284301757812, 0.09763336181640625, 0.10363388061523438, 0.1096343994140625, 0.11563491821289062, 0.12163543701171875, 0.12763595581054688, 0.133636474609375, 0.13963699340820312, 0.14563751220703125, 0.15163803100585938, 0.1576385498046875, 0.16363906860351562, 0.16963958740234375, 0.17564010620117188, 0.181640625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 10.0, 7.0, 8.0, 13.0, 10.0, 16.0, 19.0, 19.0, 18.0, 27.0, 40.0, 31.0, 22.0, 33.0, 44.0, 35.0, 49.0, 39.0, 44.0, 38.0, 51.0, 33.0, 53.0, 46.0, 30.0, 41.0, 26.0, 35.0, 22.0, 21.0, 21.0, 14.0, 18.0, 15.0, 7.0, 10.0, 6.0, 8.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2021484375, -0.19599151611328125, -0.1898345947265625, -0.18367767333984375, -0.177520751953125, -0.17136383056640625, -0.1652069091796875, -0.15904998779296875, -0.15289306640625, -0.14673614501953125, -0.1405792236328125, -0.13442230224609375, -0.128265380859375, -0.12210845947265625, -0.1159515380859375, -0.10979461669921875, -0.1036376953125, -0.09748077392578125, -0.0913238525390625, -0.08516693115234375, -0.079010009765625, -0.07285308837890625, -0.0666961669921875, -0.06053924560546875, -0.05438232421875, -0.04822540283203125, -0.0420684814453125, -0.03591156005859375, -0.029754638671875, -0.02359771728515625, -0.0174407958984375, -0.01128387451171875, -0.005126953125, 0.00102996826171875, 0.0071868896484375, 0.01334381103515625, 0.019500732421875, 0.02565765380859375, 0.0318145751953125, 0.03797149658203125, 0.04412841796875, 0.05028533935546875, 0.0564422607421875, 0.06259918212890625, 0.068756103515625, 0.07491302490234375, 0.0810699462890625, 0.08722686767578125, 0.0933837890625, 0.09954071044921875, 0.1056976318359375, 0.11185455322265625, 0.118011474609375, 0.12416839599609375, 0.1303253173828125, 0.13648223876953125, 0.14263916015625, 0.14879608154296875, 0.1549530029296875, 0.16110992431640625, 0.167266845703125, 0.17342376708984375, 0.1795806884765625, 0.18573760986328125, 0.19189453125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 5.0, 8.0, 16.0, 18.0, 43.0, 50.0, 71.0, 132.0, 229.0, 508.0, 1094.0, 2771.0, 11426.0, 266220.0, 738220.0, 20977.0, 3999.0, 1465.0, 604.0, 295.0, 148.0, 90.0, 60.0, 25.0, 22.0, 20.0, 15.0, 5.0, 2.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06658935546875, -0.0642232894897461, -0.06185722351074219, -0.05949115753173828, -0.057125091552734375, -0.05475902557373047, -0.05239295959472656, -0.050026893615722656, -0.04766082763671875, -0.045294761657714844, -0.04292869567871094, -0.04056262969970703, -0.038196563720703125, -0.03583049774169922, -0.03346443176269531, -0.031098365783691406, -0.0287322998046875, -0.026366233825683594, -0.024000167846679688, -0.02163410186767578, -0.019268035888671875, -0.01690196990966797, -0.014535903930664062, -0.012169837951660156, -0.00980377197265625, -0.007437705993652344, -0.0050716400146484375, -0.0027055740356445312, -0.000339508056640625, 0.0020265579223632812, 0.0043926239013671875, 0.006758689880371094, 0.009124755859375, 0.011490821838378906, 0.013856887817382812, 0.01622295379638672, 0.018589019775390625, 0.02095508575439453, 0.023321151733398438, 0.025687217712402344, 0.02805328369140625, 0.030419349670410156, 0.03278541564941406, 0.03515148162841797, 0.037517547607421875, 0.03988361358642578, 0.04224967956542969, 0.044615745544433594, 0.0469818115234375, 0.049347877502441406, 0.05171394348144531, 0.05408000946044922, 0.056446075439453125, 0.05881214141845703, 0.06117820739746094, 0.06354427337646484, 0.06591033935546875, 0.06827640533447266, 0.07064247131347656, 0.07300853729248047, 0.07537460327148438, 0.07774066925048828, 0.08010673522949219, 0.0824728012084961, 0.0848388671875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 25.0, 59.0, 120.0, 283.0, 256.0, 163.0, 55.0, 21.0, 11.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1425228118896484e-05, -4.057958722114563e-05, -3.9733946323394775e-05, -3.888830542564392e-05, -3.8042664527893066e-05, -3.719702363014221e-05, -3.635138273239136e-05, -3.55057418346405e-05, -3.466010093688965e-05, -3.3814460039138794e-05, -3.296881914138794e-05, -3.2123178243637085e-05, -3.127753734588623e-05, -3.0431896448135376e-05, -2.958625555038452e-05, -2.8740614652633667e-05, -2.7894973754882812e-05, -2.7049332857131958e-05, -2.6203691959381104e-05, -2.535805106163025e-05, -2.4512410163879395e-05, -2.366676926612854e-05, -2.2821128368377686e-05, -2.197548747062683e-05, -2.1129846572875977e-05, -2.0284205675125122e-05, -1.9438564777374268e-05, -1.8592923879623413e-05, -1.774728298187256e-05, -1.6901642084121704e-05, -1.605600118637085e-05, -1.5210360288619995e-05, -1.436471939086914e-05, -1.3519078493118286e-05, -1.2673437595367432e-05, -1.1827796697616577e-05, -1.0982155799865723e-05, -1.0136514902114868e-05, -9.290874004364014e-06, -8.44523310661316e-06, -7.599592208862305e-06, -6.75395131111145e-06, -5.908310413360596e-06, -5.062669515609741e-06, -4.217028617858887e-06, -3.3713877201080322e-06, -2.5257468223571777e-06, -1.6801059246063232e-06, -8.344650268554688e-07, 1.1175870895385742e-08, 8.568167686462402e-07, 1.7024576663970947e-06, 2.5480985641479492e-06, 3.3937394618988037e-06, 4.239380359649658e-06, 5.085021257400513e-06, 5.930662155151367e-06, 6.776303052902222e-06, 7.621943950653076e-06, 8.46758484840393e-06, 9.313225746154785e-06, 1.015886664390564e-05, 1.1004507541656494e-05, 1.1850148439407349e-05, 1.2695789337158203e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 7.0, 12.0, 11.0, 17.0, 25.0, 33.0, 54.0, 86.0, 118.0, 180.0, 322.0, 611.0, 1368.0, 3516.0, 15830.0, 248643.0, 727886.0, 40039.0, 6015.0, 1851.0, 809.0, 407.0, 246.0, 150.0, 103.0, 62.0, 46.0, 28.0, 24.0, 17.0, 9.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06915283203125, -0.06713104248046875, -0.0651092529296875, -0.06308746337890625, -0.061065673828125, -0.05904388427734375, -0.0570220947265625, -0.05500030517578125, -0.052978515625, -0.05095672607421875, -0.0489349365234375, -0.04691314697265625, -0.044891357421875, -0.04286956787109375, -0.0408477783203125, -0.03882598876953125, -0.03680419921875, -0.03478240966796875, -0.0327606201171875, -0.03073883056640625, -0.028717041015625, -0.02669525146484375, -0.0246734619140625, -0.02265167236328125, -0.0206298828125, -0.01860809326171875, -0.0165863037109375, -0.01456451416015625, -0.012542724609375, -0.01052093505859375, -0.0084991455078125, -0.00647735595703125, -0.00445556640625, -0.00243377685546875, -0.0004119873046875, 0.00160980224609375, 0.003631591796875, 0.00565338134765625, 0.0076751708984375, 0.00969696044921875, 0.01171875, 0.01374053955078125, 0.0157623291015625, 0.01778411865234375, 0.019805908203125, 0.02182769775390625, 0.0238494873046875, 0.02587127685546875, 0.02789306640625, 0.02991485595703125, 0.0319366455078125, 0.03395843505859375, 0.035980224609375, 0.03800201416015625, 0.0400238037109375, 0.04204559326171875, 0.0440673828125, 0.04608917236328125, 0.0481109619140625, 0.05013275146484375, 0.052154541015625, 0.05417633056640625, 0.0561981201171875, 0.05821990966796875, 0.06024169921875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 0.0, 4.0, 5.0, 8.0, 8.0, 7.0, 9.0, 12.0, 11.0, 21.0, 29.0, 26.0, 37.0, 46.0, 60.0, 65.0, 59.0, 57.0, 75.0, 73.0, 76.0, 58.0, 49.0, 38.0, 30.0, 25.0, 21.0, 17.0, 20.0, 12.0, 11.0, 11.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.034942626953125, -0.03388500213623047, -0.03282737731933594, -0.031769752502441406, -0.030712127685546875, -0.029654502868652344, -0.028596878051757812, -0.02753925323486328, -0.02648162841796875, -0.02542400360107422, -0.024366378784179688, -0.023308753967285156, -0.022251129150390625, -0.021193504333496094, -0.020135879516601562, -0.01907825469970703, -0.0180206298828125, -0.01696300506591797, -0.015905380249023438, -0.014847755432128906, -0.013790130615234375, -0.012732505798339844, -0.011674880981445312, -0.010617256164550781, -0.00955963134765625, -0.008502006530761719, -0.0074443817138671875, -0.006386756896972656, -0.005329132080078125, -0.004271507263183594, -0.0032138824462890625, -0.0021562576293945312, -0.0010986328125, -4.100799560546875e-05, 0.0010166168212890625, 0.0020742416381835938, 0.003131866455078125, 0.004189491271972656, 0.0052471160888671875, 0.006304740905761719, 0.00736236572265625, 0.008419990539550781, 0.009477615356445312, 0.010535240173339844, 0.011592864990234375, 0.012650489807128906, 0.013708114624023438, 0.014765739440917969, 0.0158233642578125, 0.01688098907470703, 0.017938613891601562, 0.018996238708496094, 0.020053863525390625, 0.021111488342285156, 0.022169113159179688, 0.02322673797607422, 0.02428436279296875, 0.02534198760986328, 0.026399612426757812, 0.027457237243652344, 0.028514862060546875, 0.029572486877441406, 0.030630111694335938, 0.03168773651123047, 0.032745361328125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 21.0, 65.0, 207.0, 357.0, 243.0, 81.0, 22.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0293564796447754, -1.9689313173294067, -1.9085060358047485, -1.8480808734893799, -1.7876555919647217, -1.727230429649353, -1.6668052673339844, -1.6063799858093262, -1.545954704284668, -1.4855295419692993, -1.4251042604446411, -1.3646790981292725, -1.3042538166046143, -1.2438286542892456, -1.183403491973877, -1.1229782104492188, -1.06255304813385, -1.0021278858184814, -0.9417026042938232, -0.8812774419784546, -0.8208521604537964, -0.7604269981384277, -0.7000017762184143, -0.6395765542984009, -0.5791513323783875, -0.518726110458374, -0.4583008885383606, -0.39787569642066956, -0.33745047450065613, -0.2770252525806427, -0.21660006046295166, -0.15617483854293823, -0.0957496166229248, -0.035324402153491974, 0.025100812315940857, 0.08552601933479309, 0.14595124125480652, 0.20637646317481995, 0.266801655292511, 0.3272268772125244, 0.38765209913253784, 0.44807732105255127, 0.5085025429725647, 0.5689277648925781, 0.6293529272079468, 0.689778208732605, 0.7502033710479736, 0.8106285929679871, 0.8710538148880005, 0.9314790368080139, 0.9919042587280273, 1.052329421043396, 1.1127547025680542, 1.1731798648834229, 1.233605146408081, 1.2940303087234497, 1.3544554710388184, 1.414880633354187, 1.4753059148788452, 1.5357310771942139, 1.596156358718872, 1.6565815210342407, 1.7170066833496094, 1.7774319648742676, 1.8378572463989258]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 8.0, 12.0, 6.0, 7.0, 9.0, 17.0, 19.0, 9.0, 20.0, 18.0, 24.0, 27.0, 33.0, 33.0, 33.0, 46.0, 49.0, 42.0, 49.0, 45.0, 52.0, 57.0, 41.0, 44.0, 41.0, 30.0, 38.0, 36.0, 19.0, 13.0, 18.0, 17.0, 12.0, 26.0, 8.0, 4.0, 7.0, 11.0, 4.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.940723717212677, -0.9100852012634277, -0.8794466257095337, -0.8488081097602844, -0.8181695342063904, -0.7875310182571411, -0.7568924427032471, -0.7262539267539978, -0.6956154108047485, -0.6649768948554993, -0.6343383193016052, -0.603699803352356, -0.5730612277984619, -0.5424227118492126, -0.5117841958999634, -0.48114562034606934, -0.4505070447921753, -0.41986849904060364, -0.389229953289032, -0.3585914373397827, -0.32795286178588867, -0.2973143458366394, -0.26667580008506775, -0.2360372543334961, -0.20539870858192444, -0.17476016283035278, -0.14412161707878113, -0.11348308622837067, -0.08284454047679901, -0.052205994725227356, -0.021567463874816895, 0.00907108187675476, 0.03970968723297119, 0.07034823298454285, 0.1009867712855339, 0.13162530958652496, 0.16226385533809662, 0.19290240108966827, 0.22354093194007874, 0.2541794776916504, 0.28481802344322205, 0.3154565691947937, 0.34609511494636536, 0.376733660697937, 0.4073721766471863, 0.4380107522010803, 0.4686492681503296, 0.49928781390190125, 0.5299263596534729, 0.5605648756027222, 0.5912034511566162, 0.6218419671058655, 0.6524805426597595, 0.6831190586090088, 0.7137576341629028, 0.7443961501121521, 0.7750346660614014, 0.8056731820106506, 0.8363117575645447, 0.866950273513794, 0.897588849067688, 0.9282273650169373, 0.9588658809661865, 0.9895044565200806, 1.0201430320739746]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 4.0, 6.0, 6.0, 14.0, 22.0, 38.0, 66.0, 107.0, 179.0, 298.0, 609.0, 1149.0, 2335.0, 5673.0, 20931.0, 4067665.0, 76207.0, 11430.0, 3896.0, 1663.0, 862.0, 470.0, 267.0, 141.0, 79.0, 62.0, 36.0, 23.0, 13.0, 9.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12188720703125, -0.11828041076660156, -0.11467361450195312, -0.11106681823730469, -0.10746002197265625, -0.10385322570800781, -0.10024642944335938, -0.09663963317871094, -0.0930328369140625, -0.08942604064941406, -0.08581924438476562, -0.08221244812011719, -0.07860565185546875, -0.07499885559082031, -0.07139205932617188, -0.06778526306152344, -0.064178466796875, -0.06057167053222656, -0.056964874267578125, -0.05335807800292969, -0.04975128173828125, -0.04614448547363281, -0.042537689208984375, -0.03893089294433594, -0.0353240966796875, -0.03171730041503906, -0.028110504150390625, -0.024503707885742188, -0.02089691162109375, -0.017290115356445312, -0.013683319091796875, -0.010076522827148438, -0.0064697265625, -0.0028629302978515625, 0.000743865966796875, 0.0043506622314453125, 0.00795745849609375, 0.011564254760742188, 0.015171051025390625, 0.018777847290039062, 0.0223846435546875, 0.025991439819335938, 0.029598236083984375, 0.03320503234863281, 0.03681182861328125, 0.04041862487792969, 0.044025421142578125, 0.04763221740722656, 0.051239013671875, 0.05484580993652344, 0.058452606201171875, 0.06205940246582031, 0.06566619873046875, 0.06927299499511719, 0.07287979125976562, 0.07648658752441406, 0.0800933837890625, 0.08370018005371094, 0.08730697631835938, 0.09091377258300781, 0.09452056884765625, 0.09812736511230469, 0.10173416137695312, 0.10534095764160156, 0.10894775390625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 7.0, 13.0, 11.0, 40.0, 78.0, 156.0, 182.0, 203.0, 145.0, 76.0, 40.0, 15.0, 14.0, 4.0, 10.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1302490234375, -0.1257476806640625, -0.121246337890625, -0.1167449951171875, -0.11224365234375, -0.1077423095703125, -0.103240966796875, -0.0987396240234375, -0.09423828125, -0.0897369384765625, -0.085235595703125, -0.0807342529296875, -0.07623291015625, -0.0717315673828125, -0.067230224609375, -0.0627288818359375, -0.0582275390625, -0.0537261962890625, -0.049224853515625, -0.0447235107421875, -0.04022216796875, -0.0357208251953125, -0.031219482421875, -0.0267181396484375, -0.022216796875, -0.0177154541015625, -0.013214111328125, -0.0087127685546875, -0.00421142578125, 0.0002899169921875, 0.004791259765625, 0.0092926025390625, 0.0137939453125, 0.0182952880859375, 0.022796630859375, 0.0272979736328125, 0.03179931640625, 0.0363006591796875, 0.040802001953125, 0.0453033447265625, 0.0498046875, 0.0543060302734375, 0.058807373046875, 0.0633087158203125, 0.06781005859375, 0.0723114013671875, 0.076812744140625, 0.0813140869140625, 0.0858154296875, 0.0903167724609375, 0.094818115234375, 0.0993194580078125, 0.10382080078125, 0.1083221435546875, 0.112823486328125, 0.1173248291015625, 0.121826171875, 0.1263275146484375, 0.130828857421875, 0.1353302001953125, 0.13983154296875, 0.1443328857421875, 0.148834228515625, 0.1533355712890625, 0.1578369140625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 9.0, 10.0, 12.0, 15.0, 30.0, 28.0, 23.0, 44.0, 76.0, 108.0, 150.0, 202.0, 313.0, 519.0, 801.0, 1468.0, 2826.0, 7123.0, 31738.0, 4055663.0, 73639.0, 11125.0, 3852.0, 1765.0, 941.0, 587.0, 368.0, 239.0, 198.0, 114.0, 82.0, 48.0, 44.0, 29.0, 32.0, 19.0, 12.0, 8.0, 6.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1666259765625, -0.16167831420898438, -0.15673065185546875, -0.15178298950195312, -0.1468353271484375, -0.14188766479492188, -0.13694000244140625, -0.13199234008789062, -0.127044677734375, -0.12209701538085938, -0.11714935302734375, -0.11220169067382812, -0.1072540283203125, -0.10230636596679688, -0.09735870361328125, -0.09241104125976562, -0.08746337890625, -0.08251571655273438, -0.07756805419921875, -0.07262039184570312, -0.0676727294921875, -0.06272506713867188, -0.05777740478515625, -0.052829742431640625, -0.047882080078125, -0.042934417724609375, -0.03798675537109375, -0.033039093017578125, -0.0280914306640625, -0.023143768310546875, -0.01819610595703125, -0.013248443603515625, -0.00830078125, -0.003353118896484375, 0.00159454345703125, 0.006542205810546875, 0.0114898681640625, 0.016437530517578125, 0.02138519287109375, 0.026332855224609375, 0.031280517578125, 0.036228179931640625, 0.04117584228515625, 0.046123504638671875, 0.0510711669921875, 0.056018829345703125, 0.06096649169921875, 0.06591415405273438, 0.07086181640625, 0.07580947875976562, 0.08075714111328125, 0.08570480346679688, 0.0906524658203125, 0.09560012817382812, 0.10054779052734375, 0.10549545288085938, 0.110443115234375, 0.11539077758789062, 0.12033843994140625, 0.12528610229492188, 0.1302337646484375, 0.13518142700195312, 0.14012908935546875, 0.14507675170898438, 0.1500244140625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 12.0, 15.0, 21.0, 56.0, 164.0, 3641.0, 74.0, 32.0, 19.0, 11.0, 5.0, 8.0, 4.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0394287109375, -0.03807878494262695, -0.036728858947753906, -0.03537893295288086, -0.03402900695800781, -0.032679080963134766, -0.03132915496826172, -0.029979228973388672, -0.028629302978515625, -0.027279376983642578, -0.02592945098876953, -0.024579524993896484, -0.023229598999023438, -0.02187967300415039, -0.020529747009277344, -0.019179821014404297, -0.01782989501953125, -0.016479969024658203, -0.015130043029785156, -0.01378011703491211, -0.012430191040039062, -0.011080265045166016, -0.009730339050292969, -0.008380413055419922, -0.007030487060546875, -0.005680561065673828, -0.004330635070800781, -0.0029807090759277344, -0.0016307830810546875, -0.0002808570861816406, 0.0010690689086914062, 0.002418994903564453, 0.0037689208984375, 0.005118846893310547, 0.006468772888183594, 0.00781869888305664, 0.009168624877929688, 0.010518550872802734, 0.011868476867675781, 0.013218402862548828, 0.014568328857421875, 0.015918254852294922, 0.01726818084716797, 0.018618106842041016, 0.019968032836914062, 0.02131795883178711, 0.022667884826660156, 0.024017810821533203, 0.02536773681640625, 0.026717662811279297, 0.028067588806152344, 0.02941751480102539, 0.030767440795898438, 0.032117366790771484, 0.03346729278564453, 0.03481721878051758, 0.036167144775390625, 0.03751707077026367, 0.03886699676513672, 0.040216922760009766, 0.04156684875488281, 0.04291677474975586, 0.044266700744628906, 0.04561662673950195, 0.046966552734375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 8.0, 15.0, 18.0, 20.0, 35.0, 57.0, 87.0, 105.0, 127.0, 117.0, 97.0, 88.0, 61.0, 49.0, 30.0, 24.0, 15.0, 14.0, 8.0, 4.0, 4.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08543664216995239, -0.08130544424057007, -0.07717424631118774, -0.07304304838180542, -0.0689118504524231, -0.06478065252304077, -0.060649458318948746, -0.05651826038956642, -0.0523870624601841, -0.04825586453080177, -0.04412466660141945, -0.03999347239732742, -0.0358622744679451, -0.031731076538562775, -0.02759987860918045, -0.023468680679798126, -0.019337482750415802, -0.015206284821033478, -0.011075087822973728, -0.006943890824913979, -0.0028126928955316544, 0.0013185050338506699, 0.005449701100587845, 0.009580899029970169, 0.013712096959352493, 0.017843294888734818, 0.02197449281811714, 0.026105688884854317, 0.03023688681423664, 0.034368082880973816, 0.03849928081035614, 0.042630478739738464, 0.04676167666912079, 0.05089287459850311, 0.05502407252788544, 0.05915527045726776, 0.06328646838665009, 0.06741766631603241, 0.07154886424541473, 0.07568006217479706, 0.07981126010417938, 0.0839424580335617, 0.08807365596294403, 0.09220485389232635, 0.09633605182170868, 0.100467249751091, 0.10459844768047333, 0.10872964560985565, 0.11286083608865738, 0.1169920340180397, 0.12112323194742203, 0.12525442242622375, 0.12938562035560608, 0.1335168182849884, 0.13764801621437073, 0.14177921414375305, 0.14591041207313538, 0.1500416100025177, 0.15417280793190002, 0.15830400586128235, 0.16243520379066467, 0.166566401720047, 0.17069759964942932, 0.17482879757881165, 0.17895999550819397]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 1.0, 7.0, 5.0, 4.0, 6.0, 11.0, 5.0, 7.0, 10.0, 19.0, 19.0, 17.0, 19.0, 29.0, 24.0, 27.0, 28.0, 37.0, 37.0, 34.0, 49.0, 37.0, 42.0, 32.0, 42.0, 35.0, 30.0, 37.0, 39.0, 36.0, 32.0, 23.0, 17.0, 33.0, 22.0, 31.0, 15.0, 21.0, 13.0, 24.0, 11.0, 10.0, 9.0, 6.0, 3.0, 2.0, 8.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05700498819351196, -0.05497797578573227, -0.052950967103242874, -0.05092395842075348, -0.048896946012973785, -0.04686993360519409, -0.0448429249227047, -0.0428159162402153, -0.04078890383243561, -0.038761891424655914, -0.03673488274216652, -0.034707874059677124, -0.03268086165189743, -0.030653851106762886, -0.02862684056162834, -0.026599830016493797, -0.024572819471359253, -0.02254580892622471, -0.020518798381090164, -0.01849178783595562, -0.016464777290821075, -0.014437766745686531, -0.012410756200551987, -0.010383745655417442, -0.008356735110282898, -0.006329724565148354, -0.004302714020013809, -0.002275703474879265, -0.00024869292974472046, 0.001778317615389824, 0.0038053281605243683, 0.005832338705658913, 0.007859349250793457, 0.009886359795928001, 0.011913370341062546, 0.01394038088619709, 0.015967391431331635, 0.01799440197646618, 0.020021412521600723, 0.022048423066735268, 0.024075433611869812, 0.026102444157004356, 0.0281294547021389, 0.030156465247273445, 0.03218347579240799, 0.03421048820018768, 0.03623749688267708, 0.03826450556516647, 0.04029151797294617, 0.04231853038072586, 0.044345539063215256, 0.04637254774570465, 0.048399560153484344, 0.05042657256126404, 0.05245358124375343, 0.05448058992624283, 0.05650760233402252, 0.058534614741802216, 0.06056162342429161, 0.062588632106781, 0.0646156445145607, 0.0666426569223404, 0.06866966187953949, 0.07069667428731918, 0.07272368669509888]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 1.0, 19.0, 22.0, 39.0, 61.0, 146.0, 331.0, 886.0, 3224.0, 26065.0, 848568.0, 159440.0, 7200.0, 1545.0, 529.0, 239.0, 104.0, 54.0, 24.0, 21.0, 12.0, 4.0, 2.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306396484375, -0.2964286804199219, -0.28646087646484375, -0.2764930725097656, -0.2665252685546875, -0.2565574645996094, -0.24658966064453125, -0.23662185668945312, -0.226654052734375, -0.21668624877929688, -0.20671844482421875, -0.19675064086914062, -0.1867828369140625, -0.17681503295898438, -0.16684722900390625, -0.15687942504882812, -0.14691162109375, -0.13694381713867188, -0.12697601318359375, -0.11700820922851562, -0.1070404052734375, -0.09707260131835938, -0.08710479736328125, -0.07713699340820312, -0.067169189453125, -0.057201385498046875, -0.04723358154296875, -0.037265777587890625, -0.0272979736328125, -0.017330169677734375, -0.00736236572265625, 0.002605438232421875, 0.0125732421875, 0.022541046142578125, 0.03250885009765625, 0.042476654052734375, 0.0524444580078125, 0.062412261962890625, 0.07238006591796875, 0.08234786987304688, 0.092315673828125, 0.10228347778320312, 0.11225128173828125, 0.12221908569335938, 0.1321868896484375, 0.14215469360351562, 0.15212249755859375, 0.16209030151367188, 0.17205810546875, 0.18202590942382812, 0.19199371337890625, 0.20196151733398438, 0.2119293212890625, 0.22189712524414062, 0.23186492919921875, 0.24183273315429688, 0.251800537109375, 0.2617683410644531, 0.27173614501953125, 0.2817039489746094, 0.2916717529296875, 0.3016395568847656, 0.31160736083984375, 0.3215751647949219, 0.33154296875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 11.0, 18.0, 42.0, 82.0, 149.0, 162.0, 197.0, 146.0, 89.0, 46.0, 15.0, 14.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1307373046875, -0.12623023986816406, -0.12172317504882812, -0.11721611022949219, -0.11270904541015625, -0.10820198059082031, -0.10369491577148438, -0.09918785095214844, -0.0946807861328125, -0.09017372131347656, -0.08566665649414062, -0.08115959167480469, -0.07665252685546875, -0.07214546203613281, -0.06763839721679688, -0.06313133239746094, -0.058624267578125, -0.05411720275878906, -0.049610137939453125, -0.04510307312011719, -0.04059600830078125, -0.03608894348144531, -0.031581878662109375, -0.027074813842773438, -0.0225677490234375, -0.018060684204101562, -0.013553619384765625, -0.009046554565429688, -0.00453948974609375, -3.24249267578125e-05, 0.004474639892578125, 0.008981704711914062, 0.01348876953125, 0.017995834350585938, 0.022502899169921875, 0.027009963989257812, 0.03151702880859375, 0.03602409362792969, 0.040531158447265625, 0.04503822326660156, 0.0495452880859375, 0.05405235290527344, 0.058559417724609375, 0.06306648254394531, 0.06757354736328125, 0.07208061218261719, 0.07658767700195312, 0.08109474182128906, 0.085601806640625, 0.09010887145996094, 0.09461593627929688, 0.09912300109863281, 0.10363006591796875, 0.10813713073730469, 0.11264419555664062, 0.11715126037597656, 0.1216583251953125, 0.12616539001464844, 0.13067245483398438, 0.1351795196533203, 0.13968658447265625, 0.1441936492919922, 0.14870071411132812, 0.15320777893066406, 0.15771484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 3.0, 6.0, 5.0, 14.0, 14.0, 18.0, 16.0, 30.0, 41.0, 43.0, 53.0, 80.0, 113.0, 146.0, 277.0, 481.0, 1006.0, 2676.0, 20019.0, 748233.0, 262887.0, 8649.0, 1848.0, 761.0, 417.0, 241.0, 134.0, 83.0, 58.0, 48.0, 36.0, 24.0, 18.0, 14.0, 17.0, 4.0, 12.0, 7.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.250244140625, -0.24306106567382812, -0.23587799072265625, -0.22869491577148438, -0.2215118408203125, -0.21432876586914062, -0.20714569091796875, -0.19996261596679688, -0.192779541015625, -0.18559646606445312, -0.17841339111328125, -0.17123031616210938, -0.1640472412109375, -0.15686416625976562, -0.14968109130859375, -0.14249801635742188, -0.13531494140625, -0.12813186645507812, -0.12094879150390625, -0.11376571655273438, -0.1065826416015625, -0.09939956665039062, -0.09221649169921875, -0.08503341674804688, -0.077850341796875, -0.07066726684570312, -0.06348419189453125, -0.056301116943359375, -0.0491180419921875, -0.041934967041015625, -0.03475189208984375, -0.027568817138671875, -0.0203857421875, -0.013202667236328125, -0.00601959228515625, 0.001163482666015625, 0.0083465576171875, 0.015529632568359375, 0.02271270751953125, 0.029895782470703125, 0.037078857421875, 0.044261932373046875, 0.05144500732421875, 0.058628082275390625, 0.0658111572265625, 0.07299423217773438, 0.08017730712890625, 0.08736038208007812, 0.09454345703125, 0.10172653198242188, 0.10890960693359375, 0.11609268188476562, 0.1232757568359375, 0.13045883178710938, 0.13764190673828125, 0.14482498168945312, 0.152008056640625, 0.15919113159179688, 0.16637420654296875, 0.17355728149414062, 0.1807403564453125, 0.18792343139648438, 0.19510650634765625, 0.20228958129882812, 0.20947265625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 8.0, 9.0, 7.0, 14.0, 12.0, 23.0, 26.0, 29.0, 23.0, 37.0, 40.0, 47.0, 36.0, 49.0, 41.0, 44.0, 42.0, 43.0, 33.0, 55.0, 36.0, 42.0, 50.0, 36.0, 27.0, 24.0, 29.0, 11.0, 11.0, 16.0, 19.0, 19.0, 8.0, 9.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1973876953125, -0.19134140014648438, -0.18529510498046875, -0.17924880981445312, -0.1732025146484375, -0.16715621948242188, -0.16110992431640625, -0.15506362915039062, -0.149017333984375, -0.14297103881835938, -0.13692474365234375, -0.13087844848632812, -0.1248321533203125, -0.11878585815429688, -0.11273956298828125, -0.10669326782226562, -0.10064697265625, -0.09460067749023438, -0.08855438232421875, -0.08250808715820312, -0.0764617919921875, -0.07041549682617188, -0.06436920166015625, -0.058322906494140625, -0.052276611328125, -0.046230316162109375, -0.04018402099609375, -0.034137725830078125, -0.0280914306640625, -0.022045135498046875, -0.01599884033203125, -0.009952545166015625, -0.00390625, 0.002140045166015625, 0.00818634033203125, 0.014232635498046875, 0.0202789306640625, 0.026325225830078125, 0.03237152099609375, 0.038417816162109375, 0.044464111328125, 0.050510406494140625, 0.05655670166015625, 0.06260299682617188, 0.0686492919921875, 0.07469558715820312, 0.08074188232421875, 0.08678817749023438, 0.09283447265625, 0.09888076782226562, 0.10492706298828125, 0.11097335815429688, 0.1170196533203125, 0.12306594848632812, 0.12911224365234375, 0.13515853881835938, 0.141204833984375, 0.14725112915039062, 0.15329742431640625, 0.15934371948242188, 0.1653900146484375, 0.17143630981445312, 0.17748260498046875, 0.18352890014648438, 0.1895751953125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 9.0, 13.0, 12.0, 19.0, 40.0, 58.0, 86.0, 162.0, 354.0, 817.0, 4050.0, 99543.0, 921743.0, 18671.0, 1844.0, 532.0, 211.0, 131.0, 85.0, 62.0, 21.0, 23.0, 19.0, 8.0, 7.0, 6.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1134033203125, -0.10953140258789062, -0.10565948486328125, -0.10178756713867188, -0.0979156494140625, -0.09404373168945312, -0.09017181396484375, -0.08629989624023438, -0.082427978515625, -0.07855606079101562, -0.07468414306640625, -0.07081222534179688, -0.0669403076171875, -0.06306838989257812, -0.05919647216796875, -0.055324554443359375, -0.05145263671875, -0.047580718994140625, -0.04370880126953125, -0.039836883544921875, -0.0359649658203125, -0.032093048095703125, -0.02822113037109375, -0.024349212646484375, -0.020477294921875, -0.016605377197265625, -0.01273345947265625, -0.008861541748046875, -0.0049896240234375, -0.001117706298828125, 0.00275421142578125, 0.006626129150390625, 0.010498046875, 0.014369964599609375, 0.01824188232421875, 0.022113800048828125, 0.0259857177734375, 0.029857635498046875, 0.03372955322265625, 0.037601470947265625, 0.041473388671875, 0.045345306396484375, 0.04921722412109375, 0.053089141845703125, 0.0569610595703125, 0.060832977294921875, 0.06470489501953125, 0.06857681274414062, 0.07244873046875, 0.07632064819335938, 0.08019256591796875, 0.08406448364257812, 0.0879364013671875, 0.09180831909179688, 0.09568023681640625, 0.09955215454101562, 0.103424072265625, 0.10729598999023438, 0.11116790771484375, 0.11503982543945312, 0.1189117431640625, 0.12278366088867188, 0.12665557861328125, 0.13052749633789062, 0.1343994140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 3.0, 2.0, 8.0, 8.0, 11.0, 11.0, 16.0, 21.0, 32.0, 38.0, 45.0, 48.0, 62.0, 81.0, 87.0, 80.0, 80.0, 59.0, 48.0, 59.0, 42.0, 33.0, 33.0, 20.0, 12.0, 11.0, 16.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.059906005859375e-06, -8.804723620414734e-06, -8.549541234970093e-06, -8.294358849525452e-06, -8.03917646408081e-06, -7.78399407863617e-06, -7.528811693191528e-06, -7.273629307746887e-06, -7.018446922302246e-06, -6.763264536857605e-06, -6.508082151412964e-06, -6.252899765968323e-06, -5.997717380523682e-06, -5.7425349950790405e-06, -5.487352609634399e-06, -5.232170224189758e-06, -4.976987838745117e-06, -4.721805453300476e-06, -4.466623067855835e-06, -4.211440682411194e-06, -3.956258296966553e-06, -3.7010759115219116e-06, -3.4458935260772705e-06, -3.1907111406326294e-06, -2.9355287551879883e-06, -2.680346369743347e-06, -2.425163984298706e-06, -2.169981598854065e-06, -1.914799213409424e-06, -1.6596168279647827e-06, -1.4044344425201416e-06, -1.1492520570755005e-06, -8.940696716308594e-07, -6.388872861862183e-07, -3.8370490074157715e-07, -1.2852251529693604e-07, 1.2665987014770508e-07, 3.818422555923462e-07, 6.370246410369873e-07, 8.922070264816284e-07, 1.1473894119262695e-06, 1.4025717973709106e-06, 1.6577541828155518e-06, 1.912936568260193e-06, 2.168118953704834e-06, 2.423301339149475e-06, 2.678483724594116e-06, 2.9336661100387573e-06, 3.1888484954833984e-06, 3.4440308809280396e-06, 3.6992132663726807e-06, 3.954395651817322e-06, 4.209578037261963e-06, 4.464760422706604e-06, 4.719942808151245e-06, 4.975125193595886e-06, 5.230307579040527e-06, 5.4854899644851685e-06, 5.7406723499298096e-06, 5.995854735374451e-06, 6.251037120819092e-06, 6.506219506263733e-06, 6.761401891708374e-06, 7.016584277153015e-06, 7.271766662597656e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 12.0, 26.0, 20.0, 46.0, 104.0, 259.0, 591.0, 2122.0, 18897.0, 943204.0, 77915.0, 3799.0, 882.0, 350.0, 144.0, 73.0, 44.0, 21.0, 8.0, 5.0, 3.0, 3.0, 4.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1494140625, -0.1446971893310547, -0.13998031616210938, -0.13526344299316406, -0.13054656982421875, -0.12582969665527344, -0.12111282348632812, -0.11639595031738281, -0.1116790771484375, -0.10696220397949219, -0.10224533081054688, -0.09752845764160156, -0.09281158447265625, -0.08809471130371094, -0.08337783813476562, -0.07866096496582031, -0.073944091796875, -0.06922721862792969, -0.06451034545898438, -0.05979347229003906, -0.05507659912109375, -0.05035972595214844, -0.045642852783203125, -0.04092597961425781, -0.0362091064453125, -0.03149223327636719, -0.026775360107421875, -0.022058486938476562, -0.01734161376953125, -0.012624740600585938, -0.007907867431640625, -0.0031909942626953125, 0.00152587890625, 0.0062427520751953125, 0.010959625244140625, 0.015676498413085938, 0.02039337158203125, 0.025110244750976562, 0.029827117919921875, 0.03454399108886719, 0.0392608642578125, 0.04397773742675781, 0.048694610595703125, 0.05341148376464844, 0.05812835693359375, 0.06284523010253906, 0.06756210327148438, 0.07227897644042969, 0.076995849609375, 0.08171272277832031, 0.08642959594726562, 0.09114646911621094, 0.09586334228515625, 0.10058021545410156, 0.10529708862304688, 0.11001396179199219, 0.1147308349609375, 0.11944770812988281, 0.12416458129882812, 0.12888145446777344, 0.13359832763671875, 0.13831520080566406, 0.14303207397460938, 0.1477489471435547, 0.1524658203125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 6.0, 9.0, 18.0, 19.0, 47.0, 109.0, 221.0, 262.0, 173.0, 69.0, 28.0, 16.0, 10.0, 2.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.24169921875, -0.23678970336914062, -0.23188018798828125, -0.22697067260742188, -0.2220611572265625, -0.21715164184570312, -0.21224212646484375, -0.20733261108398438, -0.202423095703125, -0.19751358032226562, -0.19260406494140625, -0.18769454956054688, -0.1827850341796875, -0.17787551879882812, -0.17296600341796875, -0.16805648803710938, -0.16314697265625, -0.15823745727539062, -0.15332794189453125, -0.14841842651367188, -0.1435089111328125, -0.13859939575195312, -0.13368988037109375, -0.12878036499023438, -0.123870849609375, -0.11896133422851562, -0.11405181884765625, -0.10914230346679688, -0.1042327880859375, -0.09932327270507812, -0.09441375732421875, -0.08950424194335938, -0.0845947265625, -0.07968521118164062, -0.07477569580078125, -0.06986618041992188, -0.0649566650390625, -0.060047149658203125, -0.05513763427734375, -0.050228118896484375, -0.045318603515625, -0.040409088134765625, -0.03549957275390625, -0.030590057373046875, -0.0256805419921875, -0.020771026611328125, -0.01586151123046875, -0.010951995849609375, -0.00604248046875, -0.001132965087890625, 0.00377655029296875, 0.008686065673828125, 0.0135955810546875, 0.018505096435546875, 0.02341461181640625, 0.028324127197265625, 0.033233642578125, 0.038143157958984375, 0.04305267333984375, 0.047962188720703125, 0.0528717041015625, 0.057781219482421875, 0.06269073486328125, 0.06760025024414062, 0.072509765625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 25.0, 151.0, 347.0, 337.0, 100.0, 27.0, 11.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2232409715652466, -1.1460566520690918, -1.0688724517822266, -0.9916881918907166, -0.9145039319992065, -0.8373196721076965, -0.7601354122161865, -0.6829511523246765, -0.6057668924331665, -0.5285826325416565, -0.4513983726501465, -0.3742141127586365, -0.29702985286712646, -0.21984559297561646, -0.14266133308410645, -0.06547707319259644, 0.011707186698913574, 0.08889144659042358, 0.1660757064819336, 0.2432599663734436, 0.3204442262649536, 0.3976284861564636, 0.47481274604797363, 0.5519970059394836, 0.6291812658309937, 0.7063655257225037, 0.7835497856140137, 0.8607340455055237, 0.9379183053970337, 1.0151026248931885, 1.0922868251800537, 1.169471025466919, 1.2466554641723633, 1.3238396644592285, 1.4010239839553833, 1.478208303451538, 1.5553925037384033, 1.6325767040252686, 1.7097610235214233, 1.7869453430175781, 1.8641295433044434, 1.9413137435913086, 2.018497943878174, 2.095682382583618, 2.1728665828704834, 2.2500507831573486, 2.327235221862793, 2.404419422149658, 2.4816036224365234, 2.5587878227233887, 2.635972023010254, 2.7131564617156982, 2.7903406620025635, 2.8675248622894287, 2.944709300994873, 3.0218935012817383, 3.0990777015686035, 3.1762619018554688, 3.253446102142334, 3.3306305408477783, 3.4078147411346436, 3.484998941421509, 3.562183380126953, 3.6393675804138184, 3.7165517807006836]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 2.0, 6.0, 5.0, 5.0, 18.0, 18.0, 15.0, 17.0, 16.0, 23.0, 33.0, 27.0, 33.0, 36.0, 38.0, 48.0, 60.0, 49.0, 35.0, 55.0, 51.0, 40.0, 48.0, 43.0, 34.0, 39.0, 26.0, 32.0, 20.0, 20.0, 23.0, 13.0, 9.0, 7.0, 9.0, 8.0, 12.0, 4.0, 8.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8718730807304382, -0.8419447541236877, -0.8120164275169373, -0.782088041305542, -0.7521597146987915, -0.722231388092041, -0.6923030614852905, -0.66237473487854, -0.6324464082717896, -0.6025180816650391, -0.5725897550582886, -0.5426614284515381, -0.5127330422401428, -0.48280471563339233, -0.45287638902664185, -0.42294806241989136, -0.3930196762084961, -0.3630913496017456, -0.33316299319267273, -0.30323466658592224, -0.27330631017684937, -0.24337798357009888, -0.2134496569633484, -0.1835213154554367, -0.15359297394752502, -0.12366463243961334, -0.09373629838228226, -0.06380796432495117, -0.03387962281703949, -0.003951281309127808, 0.02597704529762268, 0.05590538680553436, 0.08583378791809082, 0.1157621294260025, 0.14569047093391418, 0.17561879754066467, 0.20554713904857635, 0.23547548055648804, 0.2654038071632385, 0.295332133769989, 0.3252604901790619, 0.3551888167858124, 0.38511717319488525, 0.41504549980163574, 0.44497382640838623, 0.4749021828174591, 0.5048304796218872, 0.5347588658332825, 0.564687192440033, 0.5946155190467834, 0.6245438456535339, 0.6544722318649292, 0.6844005584716797, 0.7143288850784302, 0.7442572116851807, 0.7741855382919312, 0.8041138648986816, 0.8340421915054321, 0.8639705181121826, 0.8938988447189331, 0.9238272309303284, 0.9537555575370789, 0.9836838841438293, 1.0136122703552246, 1.043540596961975]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 10.0, 14.0, 21.0, 28.0, 30.0, 72.0, 118.0, 182.0, 281.0, 583.0, 1205.0, 2943.0, 8987.0, 43848.0, 4101456.0, 23843.0, 6382.0, 2209.0, 975.0, 435.0, 258.0, 138.0, 111.0, 52.0, 36.0, 17.0, 18.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.141845703125, -0.13771533966064453, -0.13358497619628906, -0.1294546127319336, -0.12532424926757812, -0.12119388580322266, -0.11706352233886719, -0.11293315887451172, -0.10880279541015625, -0.10467243194580078, -0.10054206848144531, -0.09641170501708984, -0.09228134155273438, -0.0881509780883789, -0.08402061462402344, -0.07989025115966797, -0.0757598876953125, -0.07162952423095703, -0.06749916076660156, -0.0633687973022461, -0.059238433837890625, -0.055108070373535156, -0.05097770690917969, -0.04684734344482422, -0.04271697998046875, -0.03858661651611328, -0.03445625305175781, -0.030325889587402344, -0.026195526123046875, -0.022065162658691406, -0.017934799194335938, -0.013804435729980469, -0.009674072265625, -0.005543708801269531, -0.0014133453369140625, 0.0027170181274414062, 0.006847381591796875, 0.010977745056152344, 0.015108108520507812, 0.01923847198486328, 0.02336883544921875, 0.02749919891357422, 0.03162956237792969, 0.035759925842285156, 0.039890289306640625, 0.044020652770996094, 0.04815101623535156, 0.05228137969970703, 0.0564117431640625, 0.06054210662841797, 0.06467247009277344, 0.0688028335571289, 0.07293319702148438, 0.07706356048583984, 0.08119392395019531, 0.08532428741455078, 0.08945465087890625, 0.09358501434326172, 0.09771537780761719, 0.10184574127197266, 0.10597610473632812, 0.1101064682006836, 0.11423683166503906, 0.11836719512939453, 0.12249755859375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 12.0, 24.0, 41.0, 84.0, 151.0, 153.0, 206.0, 127.0, 95.0, 52.0, 14.0, 12.0, 10.0, 7.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.131103515625, -0.12658309936523438, -0.12206268310546875, -0.11754226684570312, -0.1130218505859375, -0.10850143432617188, -0.10398101806640625, -0.09946060180664062, -0.094940185546875, -0.09041976928710938, -0.08589935302734375, -0.08137893676757812, -0.0768585205078125, -0.07233810424804688, -0.06781768798828125, -0.06329727172851562, -0.05877685546875, -0.054256439208984375, -0.04973602294921875, -0.045215606689453125, -0.0406951904296875, -0.036174774169921875, -0.03165435791015625, -0.027133941650390625, -0.022613525390625, -0.018093109130859375, -0.01357269287109375, -0.009052276611328125, -0.0045318603515625, -1.1444091796875e-05, 0.00450897216796875, 0.009029388427734375, 0.0135498046875, 0.018070220947265625, 0.02259063720703125, 0.027111053466796875, 0.0316314697265625, 0.036151885986328125, 0.04067230224609375, 0.045192718505859375, 0.049713134765625, 0.054233551025390625, 0.05875396728515625, 0.06327438354492188, 0.0677947998046875, 0.07231521606445312, 0.07683563232421875, 0.08135604858398438, 0.08587646484375, 0.09039688110351562, 0.09491729736328125, 0.09943771362304688, 0.1039581298828125, 0.10847854614257812, 0.11299896240234375, 0.11751937866210938, 0.122039794921875, 0.12656021118164062, 0.13108062744140625, 0.13560104370117188, 0.1401214599609375, 0.14464187622070312, 0.14916229248046875, 0.15368270874023438, 0.158203125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 4.0, 12.0, 9.0, 20.0, 30.0, 36.0, 69.0, 77.0, 137.0, 162.0, 230.0, 306.0, 499.0, 885.0, 1346.0, 2388.0, 4807.0, 11203.0, 39259.0, 4060094.0, 48513.0, 12389.0, 5164.0, 2588.0, 1474.0, 888.0, 551.0, 325.0, 219.0, 168.0, 101.0, 79.0, 63.0, 64.0, 44.0, 18.0, 14.0, 11.0, 8.0, 9.0, 5.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.14599609375, -0.1415119171142578, -0.13702774047851562, -0.13254356384277344, -0.12805938720703125, -0.12357521057128906, -0.11909103393554688, -0.11460685729980469, -0.1101226806640625, -0.10563850402832031, -0.10115432739257812, -0.09667015075683594, -0.09218597412109375, -0.08770179748535156, -0.08321762084960938, -0.07873344421386719, -0.074249267578125, -0.06976509094238281, -0.06528091430664062, -0.06079673767089844, -0.05631256103515625, -0.05182838439941406, -0.047344207763671875, -0.04286003112792969, -0.0383758544921875, -0.03389167785644531, -0.029407501220703125, -0.024923324584960938, -0.02043914794921875, -0.015954971313476562, -0.011470794677734375, -0.0069866180419921875, -0.00250244140625, 0.0019817352294921875, 0.006465911865234375, 0.010950088500976562, 0.01543426513671875, 0.019918441772460938, 0.024402618408203125, 0.028886795043945312, 0.0333709716796875, 0.03785514831542969, 0.042339324951171875, 0.04682350158691406, 0.05130767822265625, 0.05579185485839844, 0.060276031494140625, 0.06476020812988281, 0.069244384765625, 0.07372856140136719, 0.07821273803710938, 0.08269691467285156, 0.08718109130859375, 0.09166526794433594, 0.09614944458007812, 0.10063362121582031, 0.1051177978515625, 0.10960197448730469, 0.11408615112304688, 0.11857032775878906, 0.12305450439453125, 0.12753868103027344, 0.13202285766601562, 0.1365070343017578, 0.1409912109375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 5.0, 10.0, 5.0, 7.0, 10.0, 14.0, 22.0, 38.0, 92.0, 3733.0, 61.0, 23.0, 14.0, 10.0, 7.0, 3.0, 3.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027984619140625, -0.02688455581665039, -0.02578449249267578, -0.024684429168701172, -0.023584365844726562, -0.022484302520751953, -0.021384239196777344, -0.020284175872802734, -0.019184112548828125, -0.018084049224853516, -0.016983985900878906, -0.015883922576904297, -0.014783859252929688, -0.013683795928955078, -0.012583732604980469, -0.01148366928100586, -0.01038360595703125, -0.00928354263305664, -0.008183479309082031, -0.007083415985107422, -0.0059833526611328125, -0.004883289337158203, -0.0037832260131835938, -0.0026831626892089844, -0.001583099365234375, -0.0004830360412597656, 0.0006170272827148438, 0.0017170906066894531, 0.0028171539306640625, 0.003917217254638672, 0.005017280578613281, 0.006117343902587891, 0.0072174072265625, 0.00831747055053711, 0.009417533874511719, 0.010517597198486328, 0.011617660522460938, 0.012717723846435547, 0.013817787170410156, 0.014917850494384766, 0.016017913818359375, 0.017117977142333984, 0.018218040466308594, 0.019318103790283203, 0.020418167114257812, 0.021518230438232422, 0.02261829376220703, 0.02371835708618164, 0.02481842041015625, 0.02591848373413086, 0.02701854705810547, 0.028118610382080078, 0.029218673706054688, 0.030318737030029297, 0.031418800354003906, 0.032518863677978516, 0.033618927001953125, 0.034718990325927734, 0.035819053649902344, 0.03691911697387695, 0.03801918029785156, 0.03911924362182617, 0.04021930694580078, 0.04131937026977539, 0.04241943359375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 5.0, 4.0, 8.0, 18.0, 26.0, 68.0, 77.0, 89.0, 136.0, 153.0, 146.0, 78.0, 72.0, 46.0, 25.0, 19.0, 9.0, 7.0, 6.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1490519791841507, -0.14411598443984985, -0.13917997479438782, -0.13424398005008698, -0.12930798530578613, -0.1243719831109047, -0.11943598091602325, -0.11449998617172241, -0.10956399142742157, -0.10462798923254013, -0.09969199448823929, -0.09475599229335785, -0.089819997549057, -0.08488399535417557, -0.07994799315929413, -0.07501199841499329, -0.07007599622011185, -0.06513999402523041, -0.060203999280929565, -0.055267997086048126, -0.050332002341747284, -0.045396000146865845, -0.040460001677274704, -0.03552400320768356, -0.030588004738092422, -0.025652006268501282, -0.02071600779891014, -0.01578000746667385, -0.01084400899708271, -0.0059080105274915695, -0.0009720101952552795, 0.003963988274335861, 0.008899986743927002, 0.013835985213518143, 0.018771983683109283, 0.023707984015345573, 0.028643982484936714, 0.033579982817173004, 0.038515981286764145, 0.043451979756355286, 0.048387978225946426, 0.05332397669553757, 0.05825997516512871, 0.06319597363471985, 0.06813197582960129, 0.07306797057390213, 0.07800397276878357, 0.08293996751308441, 0.08787596970796585, 0.09281197190284729, 0.09774796664714813, 0.10268396884202957, 0.10761996358633041, 0.11255596578121185, 0.1174919605255127, 0.12242796272039413, 0.12736396491527557, 0.13229995965957642, 0.13723596930503845, 0.1421719640493393, 0.14710795879364014, 0.15204395353794098, 0.15697996318340302, 0.16191595792770386, 0.1668519526720047]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 5.0, 8.0, 13.0, 12.0, 15.0, 11.0, 26.0, 26.0, 29.0, 26.0, 35.0, 35.0, 48.0, 43.0, 56.0, 37.0, 48.0, 54.0, 40.0, 48.0, 49.0, 44.0, 43.0, 33.0, 33.0, 35.0, 30.0, 17.0, 22.0, 17.0, 11.0, 11.0, 8.0, 7.0, 9.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07425451278686523, -0.071880042552948, -0.06950556486845016, -0.06713109463453293, -0.0647566169500351, -0.06238214671611786, -0.06000767648220062, -0.05763320252299309, -0.05525872856378555, -0.05288425460457802, -0.05050978064537048, -0.04813531041145325, -0.04576083645224571, -0.04338636249303818, -0.04101189225912094, -0.038637418299913406, -0.03626294434070587, -0.03388847038149834, -0.0315139964222908, -0.029139526188373566, -0.02676505222916603, -0.024390578269958496, -0.02201610617339611, -0.019641634076833725, -0.01726716011762619, -0.01489268708974123, -0.01251821406185627, -0.01014374103397131, -0.0077692680060863495, -0.005394794978201389, -0.003020321950316429, -0.0006458498537540436, 0.0017286241054534912, 0.004103097133338451, 0.0064775701612234116, 0.008852043189108372, 0.011226516216993332, 0.013600989244878292, 0.015975462272763252, 0.018349934369325638, 0.020724408328533173, 0.023098882287740707, 0.025473354384303093, 0.02784782648086548, 0.030222300440073013, 0.03259677439928055, 0.034971244633197784, 0.03734571859240532, 0.039720192551612854, 0.04209466651082039, 0.044469140470027924, 0.04684361070394516, 0.049218084663152695, 0.05159255862236023, 0.053967028856277466, 0.056341502815485, 0.058715976774692535, 0.06109045073390007, 0.0634649246931076, 0.06583939492702484, 0.06821386516094208, 0.07058834284543991, 0.07296281307935715, 0.07533729076385498, 0.07771176099777222]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 9.0, 7.0, 8.0, 14.0, 37.0, 76.0, 213.0, 883.0, 5974.0, 542430.0, 491918.0, 5726.0, 885.0, 199.0, 78.0, 23.0, 16.0, 16.0, 14.0, 7.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.470703125, -0.45685577392578125, -0.4430084228515625, -0.42916107177734375, -0.415313720703125, -0.40146636962890625, -0.3876190185546875, -0.37377166748046875, -0.35992431640625, -0.34607696533203125, -0.3322296142578125, -0.31838226318359375, -0.304534912109375, -0.29068756103515625, -0.2768402099609375, -0.26299285888671875, -0.2491455078125, -0.23529815673828125, -0.2214508056640625, -0.20760345458984375, -0.193756103515625, -0.17990875244140625, -0.1660614013671875, -0.15221405029296875, -0.13836669921875, -0.12451934814453125, -0.1106719970703125, -0.09682464599609375, -0.082977294921875, -0.06912994384765625, -0.0552825927734375, -0.04143524169921875, -0.027587890625, -0.01374053955078125, 0.0001068115234375, 0.01395416259765625, 0.027801513671875, 0.04164886474609375, 0.0554962158203125, 0.06934356689453125, 0.08319091796875, 0.09703826904296875, 0.1108856201171875, 0.12473297119140625, 0.138580322265625, 0.15242767333984375, 0.1662750244140625, 0.18012237548828125, 0.1939697265625, 0.20781707763671875, 0.2216644287109375, 0.23551177978515625, 0.249359130859375, 0.26320648193359375, 0.2770538330078125, 0.29090118408203125, 0.30474853515625, 0.31859588623046875, 0.3324432373046875, 0.34629058837890625, 0.360137939453125, 0.37398529052734375, 0.3878326416015625, 0.40167999267578125, 0.41552734375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 9.0, 32.0, 30.0, 95.0, 136.0, 160.0, 171.0, 151.0, 80.0, 65.0, 32.0, 10.0, 7.0, 5.0, 9.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.132080078125, -0.12754440307617188, -0.12300872802734375, -0.11847305297851562, -0.1139373779296875, -0.10940170288085938, -0.10486602783203125, -0.10033035278320312, -0.095794677734375, -0.09125900268554688, -0.08672332763671875, -0.08218765258789062, -0.0776519775390625, -0.07311630249023438, -0.06858062744140625, -0.06404495239257812, -0.05950927734375, -0.054973602294921875, -0.05043792724609375, -0.045902252197265625, -0.0413665771484375, -0.036830902099609375, -0.03229522705078125, -0.027759552001953125, -0.023223876953125, -0.018688201904296875, -0.01415252685546875, -0.009616851806640625, -0.0050811767578125, -0.000545501708984375, 0.00399017333984375, 0.008525848388671875, 0.0130615234375, 0.017597198486328125, 0.02213287353515625, 0.026668548583984375, 0.0312042236328125, 0.035739898681640625, 0.04027557373046875, 0.044811248779296875, 0.049346923828125, 0.053882598876953125, 0.05841827392578125, 0.06295394897460938, 0.0674896240234375, 0.07202529907226562, 0.07656097412109375, 0.08109664916992188, 0.08563232421875, 0.09016799926757812, 0.09470367431640625, 0.09923934936523438, 0.1037750244140625, 0.10831069946289062, 0.11284637451171875, 0.11738204956054688, 0.121917724609375, 0.12645339965820312, 0.13098907470703125, 0.13552474975585938, 0.1400604248046875, 0.14459609985351562, 0.14913177490234375, 0.15366744995117188, 0.158203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 3.0, 2.0, 7.0, 4.0, 4.0, 3.0, 10.0, 10.0, 10.0, 12.0, 15.0, 19.0, 21.0, 39.0, 48.0, 42.0, 78.0, 139.0, 242.0, 451.0, 1039.0, 3402.0, 28652.0, 833350.0, 169347.0, 8281.0, 1733.0, 653.0, 330.0, 172.0, 123.0, 55.0, 58.0, 42.0, 30.0, 22.0, 16.0, 15.0, 10.0, 14.0, 9.0, 13.0, 8.0, 3.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1806640625, -0.174591064453125, -0.16851806640625, -0.162445068359375, -0.1563720703125, -0.150299072265625, -0.14422607421875, -0.138153076171875, -0.132080078125, -0.126007080078125, -0.11993408203125, -0.113861083984375, -0.1077880859375, -0.101715087890625, -0.09564208984375, -0.089569091796875, -0.08349609375, -0.077423095703125, -0.07135009765625, -0.065277099609375, -0.0592041015625, -0.053131103515625, -0.04705810546875, -0.040985107421875, -0.034912109375, -0.028839111328125, -0.02276611328125, -0.016693115234375, -0.0106201171875, -0.004547119140625, 0.00152587890625, 0.007598876953125, 0.013671875, 0.019744873046875, 0.02581787109375, 0.031890869140625, 0.0379638671875, 0.044036865234375, 0.05010986328125, 0.056182861328125, 0.062255859375, 0.068328857421875, 0.07440185546875, 0.080474853515625, 0.0865478515625, 0.092620849609375, 0.09869384765625, 0.104766845703125, 0.11083984375, 0.116912841796875, 0.12298583984375, 0.129058837890625, 0.1351318359375, 0.141204833984375, 0.14727783203125, 0.153350830078125, 0.159423828125, 0.165496826171875, 0.17156982421875, 0.177642822265625, 0.1837158203125, 0.189788818359375, 0.19586181640625, 0.201934814453125, 0.2080078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 11.0, 11.0, 14.0, 10.0, 26.0, 26.0, 20.0, 20.0, 39.0, 35.0, 41.0, 44.0, 55.0, 57.0, 50.0, 42.0, 61.0, 48.0, 42.0, 52.0, 46.0, 35.0, 41.0, 28.0, 31.0, 23.0, 23.0, 12.0, 12.0, 10.0, 8.0, 8.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.224853515625, -0.2179241180419922, -0.21099472045898438, -0.20406532287597656, -0.19713592529296875, -0.19020652770996094, -0.18327713012695312, -0.1763477325439453, -0.1694183349609375, -0.1624889373779297, -0.15555953979492188, -0.14863014221191406, -0.14170074462890625, -0.13477134704589844, -0.12784194946289062, -0.12091255187988281, -0.113983154296875, -0.10705375671386719, -0.10012435913085938, -0.09319496154785156, -0.08626556396484375, -0.07933616638183594, -0.07240676879882812, -0.06547737121582031, -0.0585479736328125, -0.05161857604980469, -0.044689178466796875, -0.03775978088378906, -0.03083038330078125, -0.023900985717773438, -0.016971588134765625, -0.010042190551757812, -0.00311279296875, 0.0038166046142578125, 0.010746002197265625, 0.017675399780273438, 0.02460479736328125, 0.03153419494628906, 0.038463592529296875, 0.04539299011230469, 0.0523223876953125, 0.05925178527832031, 0.06618118286132812, 0.07311058044433594, 0.08003997802734375, 0.08696937561035156, 0.09389877319335938, 0.10082817077636719, 0.107757568359375, 0.11468696594238281, 0.12161636352539062, 0.12854576110839844, 0.13547515869140625, 0.14240455627441406, 0.14933395385742188, 0.1562633514404297, 0.1631927490234375, 0.1701221466064453, 0.17705154418945312, 0.18398094177246094, 0.19091033935546875, 0.19783973693847656, 0.20476913452148438, 0.2116985321044922, 0.2186279296875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 7.0, 16.0, 11.0, 17.0, 37.0, 40.0, 66.0, 112.0, 230.0, 583.0, 2005.0, 11169.0, 599948.0, 421391.0, 10014.0, 1722.0, 623.0, 243.0, 118.0, 69.0, 35.0, 28.0, 18.0, 14.0, 8.0, 5.0, 9.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08013916015625, -0.0767965316772461, -0.07345390319824219, -0.07011127471923828, -0.06676864624023438, -0.06342601776123047, -0.06008338928222656, -0.056740760803222656, -0.05339813232421875, -0.050055503845214844, -0.04671287536621094, -0.04337024688720703, -0.040027618408203125, -0.03668498992919922, -0.03334236145019531, -0.029999732971191406, -0.0266571044921875, -0.023314476013183594, -0.019971847534179688, -0.01662921905517578, -0.013286590576171875, -0.009943962097167969, -0.0066013336181640625, -0.0032587051391601562, 8.392333984375e-05, 0.0034265518188476562, 0.0067691802978515625, 0.010111808776855469, 0.013454437255859375, 0.01679706573486328, 0.020139694213867188, 0.023482322692871094, 0.026824951171875, 0.030167579650878906, 0.03351020812988281, 0.03685283660888672, 0.040195465087890625, 0.04353809356689453, 0.04688072204589844, 0.050223350524902344, 0.05356597900390625, 0.056908607482910156, 0.06025123596191406, 0.06359386444091797, 0.06693649291992188, 0.07027912139892578, 0.07362174987792969, 0.0769643783569336, 0.0803070068359375, 0.0836496353149414, 0.08699226379394531, 0.09033489227294922, 0.09367752075195312, 0.09702014923095703, 0.10036277770996094, 0.10370540618896484, 0.10704803466796875, 0.11039066314697266, 0.11373329162597656, 0.11707592010498047, 0.12041854858398438, 0.12376117706298828, 0.1271038055419922, 0.1304464340209961, 0.1337890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 14.0, 15.0, 29.0, 82.0, 140.0, 224.0, 209.0, 126.0, 69.0, 41.0, 15.0, 15.0, 9.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1682510375976562e-05, -1.1033378541469574e-05, -1.0384246706962585e-05, -9.735114872455597e-06, -9.085983037948608e-06, -8.43685120344162e-06, -7.787719368934631e-06, -7.138587534427643e-06, -6.489455699920654e-06, -5.840323865413666e-06, -5.191192030906677e-06, -4.542060196399689e-06, -3.8929283618927e-06, -3.2437965273857117e-06, -2.594664692878723e-06, -1.9455328583717346e-06, -1.296401023864746e-06, -6.472691893577576e-07, 1.862645149230957e-09, 6.509944796562195e-07, 1.300126314163208e-06, 1.9492581486701965e-06, 2.598389983177185e-06, 3.2475218176841736e-06, 3.896653652191162e-06, 4.545785486698151e-06, 5.194917321205139e-06, 5.844049155712128e-06, 6.493180990219116e-06, 7.142312824726105e-06, 7.791444659233093e-06, 8.440576493740082e-06, 9.08970832824707e-06, 9.738840162754059e-06, 1.0387971997261047e-05, 1.1037103831768036e-05, 1.1686235666275024e-05, 1.2335367500782013e-05, 1.2984499335289001e-05, 1.363363116979599e-05, 1.4282763004302979e-05, 1.4931894838809967e-05, 1.5581026673316956e-05, 1.6230158507823944e-05, 1.6879290342330933e-05, 1.752842217683792e-05, 1.817755401134491e-05, 1.8826685845851898e-05, 1.9475817680358887e-05, 2.0124949514865875e-05, 2.0774081349372864e-05, 2.1423213183879852e-05, 2.207234501838684e-05, 2.272147685289383e-05, 2.3370608687400818e-05, 2.4019740521907806e-05, 2.4668872356414795e-05, 2.5318004190921783e-05, 2.5967136025428772e-05, 2.661626785993576e-05, 2.726539969444275e-05, 2.7914531528949738e-05, 2.8563663363456726e-05, 2.9212795197963715e-05, 2.9861927032470703e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 7.0, 19.0, 24.0, 30.0, 43.0, 93.0, 149.0, 292.0, 618.0, 1708.0, 6254.0, 48960.0, 887898.0, 89849.0, 8850.0, 2184.0, 734.0, 340.0, 177.0, 101.0, 63.0, 52.0, 35.0, 18.0, 15.0, 8.0, 3.0, 2.0, 7.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12188720703125, -0.11864566802978516, -0.11540412902832031, -0.11216259002685547, -0.10892105102539062, -0.10567951202392578, -0.10243797302246094, -0.0991964340209961, -0.09595489501953125, -0.0927133560180664, -0.08947181701660156, -0.08623027801513672, -0.08298873901367188, -0.07974720001220703, -0.07650566101074219, -0.07326412200927734, -0.0700225830078125, -0.06678104400634766, -0.06353950500488281, -0.06029796600341797, -0.057056427001953125, -0.05381488800048828, -0.05057334899902344, -0.047331809997558594, -0.04409027099609375, -0.040848731994628906, -0.03760719299316406, -0.03436565399169922, -0.031124114990234375, -0.02788257598876953, -0.024641036987304688, -0.021399497985839844, -0.018157958984375, -0.014916419982910156, -0.011674880981445312, -0.008433341979980469, -0.005191802978515625, -0.0019502639770507812, 0.0012912750244140625, 0.004532814025878906, 0.00777435302734375, 0.011015892028808594, 0.014257431030273438, 0.01749897003173828, 0.020740509033203125, 0.02398204803466797, 0.027223587036132812, 0.030465126037597656, 0.0337066650390625, 0.036948204040527344, 0.04018974304199219, 0.04343128204345703, 0.046672821044921875, 0.04991436004638672, 0.05315589904785156, 0.056397438049316406, 0.05963897705078125, 0.0628805160522461, 0.06612205505371094, 0.06936359405517578, 0.07260513305664062, 0.07584667205810547, 0.07908821105957031, 0.08232975006103516, 0.0855712890625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 8.0, 7.0, 2.0, 6.0, 13.0, 29.0, 45.0, 63.0, 78.0, 145.0, 154.0, 109.0, 119.0, 57.0, 44.0, 28.0, 29.0, 27.0, 11.0, 5.0, 5.0, 0.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.10894775390625, -0.10612106323242188, -0.10329437255859375, -0.10046768188476562, -0.0976409912109375, -0.09481430053710938, -0.09198760986328125, -0.08916091918945312, -0.086334228515625, -0.08350753784179688, -0.08068084716796875, -0.07785415649414062, -0.0750274658203125, -0.07220077514648438, -0.06937408447265625, -0.06654739379882812, -0.063720703125, -0.060894012451171875, -0.05806732177734375, -0.055240631103515625, -0.0524139404296875, -0.049587249755859375, -0.04676055908203125, -0.043933868408203125, -0.041107177734375, -0.038280487060546875, -0.03545379638671875, -0.032627105712890625, -0.0298004150390625, -0.026973724365234375, -0.02414703369140625, -0.021320343017578125, -0.01849365234375, -0.015666961669921875, -0.01284027099609375, -0.010013580322265625, -0.0071868896484375, -0.004360198974609375, -0.00153350830078125, 0.001293182373046875, 0.004119873046875, 0.006946563720703125, 0.00977325439453125, 0.012599945068359375, 0.0154266357421875, 0.018253326416015625, 0.02108001708984375, 0.023906707763671875, 0.0267333984375, 0.029560089111328125, 0.03238677978515625, 0.035213470458984375, 0.0380401611328125, 0.040866851806640625, 0.04369354248046875, 0.046520233154296875, 0.049346923828125, 0.052173614501953125, 0.05500030517578125, 0.057826995849609375, 0.0606536865234375, 0.06348037719726562, 0.06630706787109375, 0.06913375854492188, 0.07196044921875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 8.0, 92.0, 560.0, 305.0, 32.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8584301471710205, -1.7330029010772705, -1.6075756549835205, -1.4821484088897705, -1.3567211627960205, -1.2312939167022705, -1.1058666706085205, -0.9804394245147705, -0.8550121784210205, -0.7295849323272705, -0.6041576862335205, -0.4787304401397705, -0.3533031940460205, -0.2278759479522705, -0.10244870185852051, 0.022978544235229492, 0.1484057903289795, 0.2738330364227295, 0.3992602825164795, 0.5246875286102295, 0.6501147747039795, 0.7755420207977295, 0.9009692668914795, 1.0263965129852295, 1.1518237590789795, 1.2772510051727295, 1.4026782512664795, 1.5281054973602295, 1.6535327434539795, 1.7789599895477295, 1.9043872356414795, 2.0298144817352295, 2.1552419662475586, 2.2806692123413086, 2.4060964584350586, 2.5315237045288086, 2.6569509506225586, 2.7823781967163086, 2.9078054428100586, 3.0332326889038086, 3.1586599349975586, 3.2840871810913086, 3.4095144271850586, 3.5349416732788086, 3.6603689193725586, 3.7857961654663086, 3.9112234115600586, 4.036650657653809, 4.162077903747559, 4.287505149841309, 4.412932395935059, 4.538359642028809, 4.663786888122559, 4.789214134216309, 4.914641380310059, 5.040068626403809, 5.165495872497559, 5.290923118591309, 5.416350364685059, 5.541777610778809, 5.667204856872559, 5.792632102966309, 5.918059349060059, 6.043486595153809, 6.168913841247559]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 3.0, 5.0, 8.0, 5.0, 3.0, 9.0, 2.0, 4.0, 16.0, 18.0, 5.0, 18.0, 31.0, 22.0, 28.0, 28.0, 42.0, 40.0, 47.0, 47.0, 57.0, 51.0, 45.0, 61.0, 54.0, 47.0, 36.0, 33.0, 33.0, 32.0, 29.0, 20.0, 20.0, 22.0, 17.0, 12.0, 21.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.871202290058136, -0.8424568772315979, -0.8137115240097046, -0.7849661111831665, -0.7562206983566284, -0.7274753451347351, -0.698729932308197, -0.6699845790863037, -0.6412391662597656, -0.6124937534332275, -0.5837484002113342, -0.5550029873847961, -0.5262576341629028, -0.49751222133636475, -0.46876680850982666, -0.44002142548561096, -0.41127604246139526, -0.38253065943717957, -0.35378527641296387, -0.3250398635864258, -0.2962944805622101, -0.2675490975379944, -0.2388036996126175, -0.2100583016872406, -0.1813129186630249, -0.1525675356388092, -0.12382213771343231, -0.09507674723863602, -0.06633135676383972, -0.03758597373962402, -0.008840575814247131, 0.01990482211112976, 0.04865020513534546, 0.07739559561014175, 0.10614098608493805, 0.13488638401031494, 0.16363176703453064, 0.19237715005874634, 0.22112254798412323, 0.24986794590950012, 0.2786133289337158, 0.3073587119579315, 0.3361040949821472, 0.3648495078086853, 0.393594890832901, 0.4223402738571167, 0.4510856866836548, 0.4798310697078705, 0.5085764527320862, 0.5373218655586243, 0.5660672187805176, 0.5948126316070557, 0.6235580444335938, 0.6523033976554871, 0.6810488104820251, 0.7097941637039185, 0.7385395765304565, 0.7672849893569946, 0.7960303425788879, 0.824775755405426, 0.8535211086273193, 0.8822665214538574, 0.9110119342803955, 0.9397573471069336, 0.9685027003288269]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 12.0, 22.0, 22.0, 23.0, 35.0, 44.0, 84.0, 120.0, 170.0, 256.0, 442.0, 825.0, 1741.0, 3977.0, 11626.0, 48075.0, 4022822.0, 79675.0, 14914.0, 4999.0, 2061.0, 949.0, 484.0, 295.0, 169.0, 136.0, 92.0, 66.0, 43.0, 28.0, 19.0, 12.0, 11.0, 10.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1363525390625, -0.132171630859375, -0.12799072265625, -0.123809814453125, -0.11962890625, -0.115447998046875, -0.11126708984375, -0.107086181640625, -0.1029052734375, -0.098724365234375, -0.09454345703125, -0.090362548828125, -0.086181640625, -0.082000732421875, -0.07781982421875, -0.073638916015625, -0.0694580078125, -0.065277099609375, -0.06109619140625, -0.056915283203125, -0.052734375, -0.048553466796875, -0.04437255859375, -0.040191650390625, -0.0360107421875, -0.031829833984375, -0.02764892578125, -0.023468017578125, -0.019287109375, -0.015106201171875, -0.01092529296875, -0.006744384765625, -0.0025634765625, 0.001617431640625, 0.00579833984375, 0.009979248046875, 0.01416015625, 0.018341064453125, 0.02252197265625, 0.026702880859375, 0.0308837890625, 0.035064697265625, 0.03924560546875, 0.043426513671875, 0.047607421875, 0.051788330078125, 0.05596923828125, 0.060150146484375, 0.0643310546875, 0.068511962890625, 0.07269287109375, 0.076873779296875, 0.0810546875, 0.085235595703125, 0.08941650390625, 0.093597412109375, 0.0977783203125, 0.101959228515625, 0.10614013671875, 0.110321044921875, 0.114501953125, 0.118682861328125, 0.12286376953125, 0.127044677734375, 0.1312255859375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 12.0, 9.0, 23.0, 58.0, 91.0, 145.0, 152.0, 178.0, 137.0, 89.0, 45.0, 33.0, 11.0, 5.0, 8.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.132080078125, -0.1275196075439453, -0.12295913696289062, -0.11839866638183594, -0.11383819580078125, -0.10927772521972656, -0.10471725463867188, -0.10015678405761719, -0.0955963134765625, -0.09103584289550781, -0.08647537231445312, -0.08191490173339844, -0.07735443115234375, -0.07279396057128906, -0.06823348999023438, -0.06367301940917969, -0.059112548828125, -0.05455207824707031, -0.049991607666015625, -0.04543113708496094, -0.04087066650390625, -0.03631019592285156, -0.031749725341796875, -0.027189254760742188, -0.0226287841796875, -0.018068313598632812, -0.013507843017578125, -0.008947372436523438, -0.00438690185546875, 0.0001735687255859375, 0.004734039306640625, 0.009294509887695312, 0.01385498046875, 0.018415451049804688, 0.022975921630859375, 0.027536392211914062, 0.03209686279296875, 0.03665733337402344, 0.041217803955078125, 0.04577827453613281, 0.0503387451171875, 0.05489921569824219, 0.059459686279296875, 0.06402015686035156, 0.06858062744140625, 0.07314109802246094, 0.07770156860351562, 0.08226203918457031, 0.086822509765625, 0.09138298034667969, 0.09594345092773438, 0.10050392150878906, 0.10506439208984375, 0.10962486267089844, 0.11418533325195312, 0.11874580383300781, 0.1233062744140625, 0.1278667449951172, 0.13242721557617188, 0.13698768615722656, 0.14154815673828125, 0.14610862731933594, 0.15066909790039062, 0.1552295684814453, 0.1597900390625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 7.0, 10.0, 15.0, 12.0, 25.0, 30.0, 42.0, 67.0, 134.0, 158.0, 234.0, 432.0, 656.0, 1193.0, 2665.0, 6599.0, 21583.0, 139704.0, 3943316.0, 55870.0, 12838.0, 4288.0, 1898.0, 979.0, 506.0, 353.0, 217.0, 133.0, 84.0, 66.0, 44.0, 30.0, 23.0, 13.0, 11.0, 12.0, 10.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.16845703125, -0.1638164520263672, -0.15917587280273438, -0.15453529357910156, -0.14989471435546875, -0.14525413513183594, -0.14061355590820312, -0.1359729766845703, -0.1313323974609375, -0.1266918182373047, -0.12205123901367188, -0.11741065979003906, -0.11277008056640625, -0.10812950134277344, -0.10348892211914062, -0.09884834289550781, -0.094207763671875, -0.08956718444824219, -0.08492660522460938, -0.08028602600097656, -0.07564544677734375, -0.07100486755371094, -0.06636428833007812, -0.06172370910644531, -0.0570831298828125, -0.05244255065917969, -0.047801971435546875, -0.04316139221191406, -0.03852081298828125, -0.03388023376464844, -0.029239654541015625, -0.024599075317382812, -0.01995849609375, -0.015317916870117188, -0.010677337646484375, -0.0060367584228515625, -0.00139617919921875, 0.0032444000244140625, 0.007884979248046875, 0.012525558471679688, 0.0171661376953125, 0.021806716918945312, 0.026447296142578125, 0.031087875366210938, 0.03572845458984375, 0.04036903381347656, 0.045009613037109375, 0.04965019226074219, 0.054290771484375, 0.05893135070800781, 0.06357192993164062, 0.06821250915527344, 0.07285308837890625, 0.07749366760253906, 0.08213424682617188, 0.08677482604980469, 0.0914154052734375, 0.09605598449707031, 0.10069656372070312, 0.10533714294433594, 0.10997772216796875, 0.11461830139160156, 0.11925888061523438, 0.12389945983886719, 0.1285400390625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 9.0, 9.0, 21.0, 15.0, 14.0, 31.0, 39.0, 91.0, 344.0, 3159.0, 144.0, 79.0, 34.0, 19.0, 18.0, 14.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0396728515625, -0.037888526916503906, -0.03610420227050781, -0.03431987762451172, -0.032535552978515625, -0.03075122833251953, -0.028966903686523438, -0.027182579040527344, -0.02539825439453125, -0.023613929748535156, -0.021829605102539062, -0.02004528045654297, -0.018260955810546875, -0.01647663116455078, -0.014692306518554688, -0.012907981872558594, -0.0111236572265625, -0.009339332580566406, -0.0075550079345703125, -0.005770683288574219, -0.003986358642578125, -0.0022020339965820312, -0.0004177093505859375, 0.0013666152954101562, 0.00315093994140625, 0.004935264587402344, 0.0067195892333984375, 0.008503913879394531, 0.010288238525390625, 0.012072563171386719, 0.013856887817382812, 0.015641212463378906, 0.017425537109375, 0.019209861755371094, 0.020994186401367188, 0.02277851104736328, 0.024562835693359375, 0.02634716033935547, 0.028131484985351562, 0.029915809631347656, 0.03170013427734375, 0.033484458923339844, 0.03526878356933594, 0.03705310821533203, 0.038837432861328125, 0.04062175750732422, 0.04240608215332031, 0.044190406799316406, 0.0459747314453125, 0.047759056091308594, 0.04954338073730469, 0.05132770538330078, 0.053112030029296875, 0.05489635467529297, 0.05668067932128906, 0.058465003967285156, 0.06024932861328125, 0.062033653259277344, 0.06381797790527344, 0.06560230255126953, 0.06738662719726562, 0.06917095184326172, 0.07095527648925781, 0.0727396011352539, 0.07452392578125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 5.0, 11.0, 16.0, 39.0, 66.0, 115.0, 170.0, 215.0, 127.0, 103.0, 59.0, 31.0, 14.0, 13.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3768138885498047, -0.3651999831199646, -0.3535860478878021, -0.34197214245796204, -0.33035820722579956, -0.3187443017959595, -0.307130366563797, -0.2955164611339569, -0.28390252590179443, -0.27228862047195435, -0.26067468523979187, -0.2490607649087906, -0.2374468445777893, -0.22583292424678802, -0.21421900391578674, -0.20260509848594666, -0.19099117815494537, -0.1793772578239441, -0.1677633374929428, -0.15614941716194153, -0.14453549683094025, -0.13292157649993896, -0.12130766361951828, -0.109693743288517, -0.09807982295751572, -0.08646590262651443, -0.07485198229551315, -0.06323806941509247, -0.05162414535880089, -0.040010225027799606, -0.028396308422088623, -0.01678238809108734, -0.00516846776008606, 0.0064454516395926476, 0.018059371039271355, 0.029673289507627487, 0.04128720983862877, 0.05290113016963005, 0.06451504677534103, 0.07612896710634232, 0.0877428874373436, 0.09935680776834488, 0.11097072809934616, 0.12258464097976685, 0.13419856131076813, 0.1458124816417694, 0.1574264019727707, 0.16904032230377197, 0.18065424263477325, 0.19226816296577454, 0.20388208329677582, 0.2154960036277771, 0.22710992395877838, 0.23872384428977966, 0.25033774971961975, 0.2619516849517822, 0.2735655903816223, 0.2851794958114624, 0.2967934310436249, 0.30840733647346497, 0.32002127170562744, 0.33163517713546753, 0.34324911236763, 0.3548630177974701, 0.36647695302963257]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 8.0, 6.0, 16.0, 16.0, 21.0, 25.0, 11.0, 21.0, 35.0, 41.0, 22.0, 43.0, 35.0, 35.0, 52.0, 50.0, 50.0, 52.0, 54.0, 42.0, 53.0, 52.0, 37.0, 34.0, 29.0, 27.0, 30.0, 19.0, 19.0, 24.0, 9.0, 5.0, 12.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16601133346557617, -0.1615161895751953, -0.15702106058597565, -0.1525259166955948, -0.14803077280521393, -0.14353564381599426, -0.1390404999256134, -0.13454535603523254, -0.13005021214485168, -0.12555506825447083, -0.12105993181467056, -0.1165647953748703, -0.11206965148448944, -0.10757451504468918, -0.10307937860488892, -0.09858423471450806, -0.09408910572528839, -0.08959396928548813, -0.08509882539510727, -0.080603688955307, -0.07610854506492615, -0.07161340862512589, -0.06711827218532562, -0.06262312829494476, -0.0581279918551445, -0.05363285169005394, -0.04913771152496338, -0.044642575085163116, -0.040147434920072556, -0.035652294754981995, -0.031157156452536583, -0.02666201815009117, -0.02216687798500061, -0.01767173781991005, -0.013176599517464638, -0.008681460283696651, -0.004186321049928665, 0.00030881911516189575, 0.0048039574176073074, 0.009299095720052719, 0.01379423588514328, 0.01828937605023384, 0.022784514352679253, 0.027279652655124664, 0.031774792820215225, 0.036269932985305786, 0.04076506942510605, 0.04526020959019661, 0.04975534975528717, 0.05425048992037773, 0.05874563008546829, 0.06324076652526855, 0.06773591041564941, 0.07223104685544968, 0.07672618329524994, 0.0812213271856308, 0.08571646362543106, 0.09021160006523132, 0.09470674395561218, 0.09920188039541245, 0.10369701683521271, 0.10819216072559357, 0.11268729716539383, 0.11718243360519409, 0.12167757749557495]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 7.0, 5.0, 16.0, 21.0, 38.0, 41.0, 82.0, 179.0, 363.0, 941.0, 3189.0, 20872.0, 447316.0, 544877.0, 25216.0, 3534.0, 1004.0, 409.0, 181.0, 94.0, 56.0, 36.0, 19.0, 22.0, 10.0, 12.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.266845703125, -0.2576560974121094, -0.24846649169921875, -0.23927688598632812, -0.2300872802734375, -0.22089767456054688, -0.21170806884765625, -0.20251846313476562, -0.193328857421875, -0.18413925170898438, -0.17494964599609375, -0.16576004028320312, -0.1565704345703125, -0.14738082885742188, -0.13819122314453125, -0.12900161743164062, -0.11981201171875, -0.11062240600585938, -0.10143280029296875, -0.09224319458007812, -0.0830535888671875, -0.07386398315429688, -0.06467437744140625, -0.055484771728515625, -0.046295166015625, -0.037105560302734375, -0.02791595458984375, -0.018726348876953125, -0.0095367431640625, -0.000347137451171875, 0.00884246826171875, 0.018032073974609375, 0.0272216796875, 0.036411285400390625, 0.04560089111328125, 0.054790496826171875, 0.0639801025390625, 0.07316970825195312, 0.08235931396484375, 0.09154891967773438, 0.100738525390625, 0.10992813110351562, 0.11911773681640625, 0.12830734252929688, 0.1374969482421875, 0.14668655395507812, 0.15587615966796875, 0.16506576538085938, 0.17425537109375, 0.18344497680664062, 0.19263458251953125, 0.20182418823242188, 0.2110137939453125, 0.22020339965820312, 0.22939300537109375, 0.23858261108398438, 0.247772216796875, 0.2569618225097656, 0.26615142822265625, 0.2753410339355469, 0.2845306396484375, 0.2937202453613281, 0.30290985107421875, 0.3120994567871094, 0.3212890625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 1.0, 10.0, 13.0, 17.0, 41.0, 84.0, 132.0, 142.0, 163.0, 149.0, 101.0, 64.0, 43.0, 20.0, 6.0, 9.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1331787109375, -0.128631591796875, -0.12408447265625, -0.119537353515625, -0.114990234375, -0.110443115234375, -0.10589599609375, -0.101348876953125, -0.0968017578125, -0.092254638671875, -0.08770751953125, -0.083160400390625, -0.07861328125, -0.074066162109375, -0.06951904296875, -0.064971923828125, -0.0604248046875, -0.055877685546875, -0.05133056640625, -0.046783447265625, -0.042236328125, -0.037689208984375, -0.03314208984375, -0.028594970703125, -0.0240478515625, -0.019500732421875, -0.01495361328125, -0.010406494140625, -0.005859375, -0.001312255859375, 0.00323486328125, 0.007781982421875, 0.0123291015625, 0.016876220703125, 0.02142333984375, 0.025970458984375, 0.030517578125, 0.035064697265625, 0.03961181640625, 0.044158935546875, 0.0487060546875, 0.053253173828125, 0.05780029296875, 0.062347412109375, 0.06689453125, 0.071441650390625, 0.07598876953125, 0.080535888671875, 0.0850830078125, 0.089630126953125, 0.09417724609375, 0.098724365234375, 0.103271484375, 0.107818603515625, 0.11236572265625, 0.116912841796875, 0.1214599609375, 0.126007080078125, 0.13055419921875, 0.135101318359375, 0.1396484375, 0.144195556640625, 0.14874267578125, 0.153289794921875, 0.1578369140625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 5.0, 4.0, 8.0, 6.0, 12.0, 12.0, 25.0, 21.0, 32.0, 59.0, 86.0, 122.0, 258.0, 605.0, 1651.0, 7577.0, 128499.0, 856895.0, 45967.0, 4489.0, 1146.0, 459.0, 224.0, 121.0, 90.0, 46.0, 32.0, 26.0, 24.0, 12.0, 6.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.265380859375, -0.2569160461425781, -0.24845123291015625, -0.23998641967773438, -0.2315216064453125, -0.22305679321289062, -0.21459197998046875, -0.20612716674804688, -0.197662353515625, -0.18919754028320312, -0.18073272705078125, -0.17226791381835938, -0.1638031005859375, -0.15533828735351562, -0.14687347412109375, -0.13840866088867188, -0.12994384765625, -0.12147903442382812, -0.11301422119140625, -0.10454940795898438, -0.0960845947265625, -0.08761978149414062, -0.07915496826171875, -0.07069015502929688, -0.062225341796875, -0.053760528564453125, -0.04529571533203125, -0.036830902099609375, -0.0283660888671875, -0.019901275634765625, -0.01143646240234375, -0.002971649169921875, 0.0054931640625, 0.013957977294921875, 0.02242279052734375, 0.030887603759765625, 0.0393524169921875, 0.047817230224609375, 0.05628204345703125, 0.06474685668945312, 0.073211669921875, 0.08167648315429688, 0.09014129638671875, 0.09860610961914062, 0.1070709228515625, 0.11553573608398438, 0.12400054931640625, 0.13246536254882812, 0.14093017578125, 0.14939498901367188, 0.15785980224609375, 0.16632461547851562, 0.1747894287109375, 0.18325424194335938, 0.19171905517578125, 0.20018386840820312, 0.208648681640625, 0.21711349487304688, 0.22557830810546875, 0.23404312133789062, 0.2425079345703125, 0.2509727478027344, 0.25943756103515625, 0.2679023742675781, 0.2763671875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 0.0, 2.0, 6.0, 5.0, 10.0, 9.0, 15.0, 23.0, 16.0, 17.0, 24.0, 23.0, 35.0, 37.0, 31.0, 28.0, 38.0, 38.0, 34.0, 47.0, 48.0, 46.0, 42.0, 43.0, 36.0, 55.0, 41.0, 32.0, 33.0, 36.0, 35.0, 25.0, 16.0, 19.0, 10.0, 9.0, 10.0, 7.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15869140625, -0.15230751037597656, -0.14592361450195312, -0.1395397186279297, -0.13315582275390625, -0.1267719268798828, -0.12038803100585938, -0.11400413513183594, -0.1076202392578125, -0.10123634338378906, -0.09485244750976562, -0.08846855163574219, -0.08208465576171875, -0.07570075988769531, -0.06931686401367188, -0.06293296813964844, -0.056549072265625, -0.05016517639160156, -0.043781280517578125, -0.03739738464355469, -0.03101348876953125, -0.024629592895507812, -0.018245697021484375, -0.011861801147460938, -0.0054779052734375, 0.0009059906005859375, 0.007289886474609375, 0.013673782348632812, 0.02005767822265625, 0.026441574096679688, 0.032825469970703125, 0.03920936584472656, 0.04559326171875, 0.05197715759277344, 0.058361053466796875, 0.06474494934082031, 0.07112884521484375, 0.07751274108886719, 0.08389663696289062, 0.09028053283691406, 0.0966644287109375, 0.10304832458496094, 0.10943222045898438, 0.11581611633300781, 0.12220001220703125, 0.1285839080810547, 0.13496780395507812, 0.14135169982910156, 0.147735595703125, 0.15411949157714844, 0.16050338745117188, 0.1668872833251953, 0.17327117919921875, 0.1796550750732422, 0.18603897094726562, 0.19242286682128906, 0.1988067626953125, 0.20519065856933594, 0.21157455444335938, 0.2179584503173828, 0.22434234619140625, 0.2307262420654297, 0.23711013793945312, 0.24349403381347656, 0.2498779296875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 10.0, 17.0, 33.0, 70.0, 111.0, 326.0, 1229.0, 10972.0, 932960.0, 98471.0, 3264.0, 651.0, 219.0, 99.0, 49.0, 15.0, 12.0, 8.0, 9.0, 7.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1729736328125, -0.1679973602294922, -0.16302108764648438, -0.15804481506347656, -0.15306854248046875, -0.14809226989746094, -0.14311599731445312, -0.1381397247314453, -0.1331634521484375, -0.1281871795654297, -0.12321090698242188, -0.11823463439941406, -0.11325836181640625, -0.10828208923339844, -0.10330581665039062, -0.09832954406738281, -0.093353271484375, -0.08837699890136719, -0.08340072631835938, -0.07842445373535156, -0.07344818115234375, -0.06847190856933594, -0.06349563598632812, -0.05851936340332031, -0.0535430908203125, -0.04856681823730469, -0.043590545654296875, -0.03861427307128906, -0.03363800048828125, -0.028661727905273438, -0.023685455322265625, -0.018709182739257812, -0.01373291015625, -0.008756637573242188, -0.003780364990234375, 0.0011959075927734375, 0.00617218017578125, 0.011148452758789062, 0.016124725341796875, 0.021100997924804688, 0.0260772705078125, 0.031053543090820312, 0.036029815673828125, 0.04100608825683594, 0.04598236083984375, 0.05095863342285156, 0.055934906005859375, 0.06091117858886719, 0.065887451171875, 0.07086372375488281, 0.07583999633789062, 0.08081626892089844, 0.08579254150390625, 0.09076881408691406, 0.09574508666992188, 0.10072135925292969, 0.1056976318359375, 0.11067390441894531, 0.11565017700195312, 0.12062644958496094, 0.12560272216796875, 0.13057899475097656, 0.13555526733398438, 0.1405315399169922, 0.1455078125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 9.0, 6.0, 10.0, 9.0, 16.0, 9.0, 18.0, 23.0, 47.0, 27.0, 45.0, 58.0, 84.0, 65.0, 89.0, 74.0, 74.0, 69.0, 38.0, 42.0, 32.0, 26.0, 26.0, 23.0, 11.0, 16.0, 9.0, 6.0, 5.0, 11.0, 5.0, 8.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0192394256591797e-05, -9.862706065177917e-06, -9.533017873764038e-06, -9.203329682350159e-06, -8.87364149093628e-06, -8.5439532995224e-06, -8.21426510810852e-06, -7.884576916694641e-06, -7.554888725280762e-06, -7.225200533866882e-06, -6.895512342453003e-06, -6.5658241510391235e-06, -6.236135959625244e-06, -5.906447768211365e-06, -5.576759576797485e-06, -5.247071385383606e-06, -4.9173831939697266e-06, -4.587695002555847e-06, -4.258006811141968e-06, -3.928318619728088e-06, -3.598630428314209e-06, -3.2689422369003296e-06, -2.93925404548645e-06, -2.609565854072571e-06, -2.2798776626586914e-06, -1.950189471244812e-06, -1.6205012798309326e-06, -1.2908130884170532e-06, -9.611248970031738e-07, -6.314367055892944e-07, -3.0174851417541504e-07, 2.7939677238464355e-08, 3.5762786865234375e-07, 6.873160600662231e-07, 1.0170042514801025e-06, 1.346692442893982e-06, 1.6763806343078613e-06, 2.0060688257217407e-06, 2.33575701713562e-06, 2.6654452085494995e-06, 2.995133399963379e-06, 3.3248215913772583e-06, 3.6545097827911377e-06, 3.984197974205017e-06, 4.3138861656188965e-06, 4.643574357032776e-06, 4.973262548446655e-06, 5.302950739860535e-06, 5.632638931274414e-06, 5.9623271226882935e-06, 6.292015314102173e-06, 6.621703505516052e-06, 6.951391696929932e-06, 7.281079888343811e-06, 7.6107680797576904e-06, 7.94045627117157e-06, 8.27014446258545e-06, 8.599832653999329e-06, 8.929520845413208e-06, 9.259209036827087e-06, 9.588897228240967e-06, 9.918585419654846e-06, 1.0248273611068726e-05, 1.0577961802482605e-05, 1.0907649993896484e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 8.0, 22.0, 27.0, 38.0, 73.0, 114.0, 242.0, 522.0, 1486.0, 5509.0, 52258.0, 912633.0, 66574.0, 6220.0, 1592.0, 618.0, 270.0, 129.0, 67.0, 48.0, 31.0, 14.0, 9.0, 10.0, 6.0, 6.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1319580078125, -0.1280231475830078, -0.12408828735351562, -0.12015342712402344, -0.11621856689453125, -0.11228370666503906, -0.10834884643554688, -0.10441398620605469, -0.1004791259765625, -0.09654426574707031, -0.09260940551757812, -0.08867454528808594, -0.08473968505859375, -0.08080482482910156, -0.07686996459960938, -0.07293510437011719, -0.069000244140625, -0.06506538391113281, -0.061130523681640625, -0.05719566345214844, -0.05326080322265625, -0.04932594299316406, -0.045391082763671875, -0.04145622253417969, -0.0375213623046875, -0.03358650207519531, -0.029651641845703125, -0.025716781616210938, -0.02178192138671875, -0.017847061157226562, -0.013912200927734375, -0.009977340698242188, -0.00604248046875, -0.0021076202392578125, 0.001827239990234375, 0.0057621002197265625, 0.00969696044921875, 0.013631820678710938, 0.017566680908203125, 0.021501541137695312, 0.0254364013671875, 0.029371261596679688, 0.033306121826171875, 0.03724098205566406, 0.04117584228515625, 0.04511070251464844, 0.049045562744140625, 0.05298042297363281, 0.056915283203125, 0.06085014343261719, 0.06478500366210938, 0.06871986389160156, 0.07265472412109375, 0.07658958435058594, 0.08052444458007812, 0.08445930480957031, 0.0883941650390625, 0.09232902526855469, 0.09626388549804688, 0.10019874572753906, 0.10413360595703125, 0.10806846618652344, 0.11200332641601562, 0.11593818664550781, 0.119873046875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 8.0, 3.0, 15.0, 13.0, 11.0, 14.0, 32.0, 37.0, 52.0, 82.0, 117.0, 145.0, 143.0, 104.0, 70.0, 45.0, 40.0, 20.0, 13.0, 12.0, 8.0, 3.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10260009765625, -0.09938812255859375, -0.0961761474609375, -0.09296417236328125, -0.089752197265625, -0.08654022216796875, -0.0833282470703125, -0.08011627197265625, -0.076904296875, -0.07369232177734375, -0.0704803466796875, -0.06726837158203125, -0.064056396484375, -0.06084442138671875, -0.0576324462890625, -0.05442047119140625, -0.05120849609375, -0.04799652099609375, -0.0447845458984375, -0.04157257080078125, -0.038360595703125, -0.03514862060546875, -0.0319366455078125, -0.02872467041015625, -0.0255126953125, -0.02230072021484375, -0.0190887451171875, -0.01587677001953125, -0.012664794921875, -0.00945281982421875, -0.0062408447265625, -0.00302886962890625, 0.00018310546875, 0.00339508056640625, 0.0066070556640625, 0.00981903076171875, 0.013031005859375, 0.01624298095703125, 0.0194549560546875, 0.02266693115234375, 0.02587890625, 0.02909088134765625, 0.0323028564453125, 0.03551483154296875, 0.038726806640625, 0.04193878173828125, 0.0451507568359375, 0.04836273193359375, 0.05157470703125, 0.05478668212890625, 0.0579986572265625, 0.06121063232421875, 0.064422607421875, 0.06763458251953125, 0.0708465576171875, 0.07405853271484375, 0.0772705078125, 0.08048248291015625, 0.0836944580078125, 0.08690643310546875, 0.090118408203125, 0.09333038330078125, 0.0965423583984375, 0.09975433349609375, 0.10296630859375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 19.0, 59.0, 181.0, 322.0, 265.0, 99.0, 34.0, 10.0, 6.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3284640312194824, -3.2503602504730225, -3.1722564697265625, -3.0941529273986816, -3.0160491466522217, -2.9379453659057617, -2.8598415851593018, -2.781737804412842, -2.703634262084961, -2.625530481338501, -2.547426700592041, -2.46932315826416, -2.3912193775177, -2.3131155967712402, -2.2350118160247803, -2.1569080352783203, -2.0788044929504395, -2.0007007122039795, -1.922597050666809, -1.8444932699203491, -1.7663896083831787, -1.6882858276367188, -1.6101820468902588, -1.5320783853530884, -1.4539744853973389, -1.375870704650879, -1.2977670431137085, -1.2196632623672485, -1.1415596008300781, -1.0634558200836182, -0.985352098941803, -0.9072483777999878, -0.8291447162628174, -0.7510409951210022, -0.672937273979187, -0.594833493232727, -0.5167298316955566, -0.43862608075141907, -0.3605223298072815, -0.2824186086654663, -0.20431488752365112, -0.12621116638183594, -0.04810743033885956, 0.02999630570411682, 0.108100026845932, 0.1862037479877472, 0.26430749893188477, 0.34241122007369995, 0.42051494121551514, 0.4986186623573303, 0.5767223834991455, 0.6548261642456055, 0.7329298257827759, 0.8110336065292358, 0.889137327671051, 0.9672410488128662, 1.0453448295593262, 1.1234486103057861, 1.2015522718429565, 1.2796560525894165, 1.357759714126587, 1.4358634948730469, 1.5139672756195068, 1.5920709371566772, 1.6701745986938477]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 6.0, 5.0, 9.0, 11.0, 10.0, 14.0, 22.0, 14.0, 14.0, 20.0, 18.0, 29.0, 23.0, 25.0, 25.0, 31.0, 34.0, 39.0, 33.0, 29.0, 31.0, 40.0, 42.0, 45.0, 42.0, 30.0, 43.0, 33.0, 39.0, 29.0, 28.0, 28.0, 16.0, 22.0, 20.0, 20.0, 14.0, 16.0, 6.0, 7.0, 6.0, 3.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.7534415125846863, -0.7289000153541565, -0.7043585181236267, -0.6798170208930969, -0.6552755832672119, -0.6307340860366821, -0.6061925888061523, -0.5816510915756226, -0.5571095943450928, -0.532568097114563, -0.5080265998840332, -0.4834851324558258, -0.458943635225296, -0.43440213799476624, -0.40986067056655884, -0.38531917333602905, -0.36077767610549927, -0.3362361788749695, -0.3116946816444397, -0.2871532142162323, -0.2626117169857025, -0.23807021975517273, -0.21352873742580414, -0.18898725509643555, -0.16444575786590576, -0.13990426063537598, -0.11536277830600739, -0.0908212885260582, -0.06627979874610901, -0.04173830896615982, -0.017196819186210632, 0.007344663143157959, 0.03188621997833252, 0.05642770975828171, 0.0809691995382309, 0.10551068931818008, 0.13005217909812927, 0.15459367632865906, 0.17913515865802765, 0.20367664098739624, 0.22821813821792603, 0.2527596354484558, 0.2773011326789856, 0.301842600107193, 0.3263840973377228, 0.35092559456825256, 0.37546706199645996, 0.40000855922698975, 0.42455005645751953, 0.4490915536880493, 0.4736330509185791, 0.4981745183467865, 0.5227160453796387, 0.5472574830055237, 0.5717989802360535, 0.5963404774665833, 0.620881974697113, 0.6454234719276428, 0.6699649691581726, 0.6945064663887024, 0.7190479040145874, 0.7435894012451172, 0.768130898475647, 0.7926723957061768, 0.8172138929367065]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 8.0, 12.0, 15.0, 27.0, 37.0, 38.0, 66.0, 98.0, 184.0, 392.0, 2536.0, 4177105.0, 12604.0, 589.0, 228.0, 117.0, 72.0, 47.0, 32.0, 26.0, 12.0, 12.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99609375, -0.9636077880859375, -0.931121826171875, -0.8986358642578125, -0.86614990234375, -0.8336639404296875, -0.801177978515625, -0.7686920166015625, -0.7362060546875, -0.7037200927734375, -0.671234130859375, -0.6387481689453125, -0.60626220703125, -0.5737762451171875, -0.541290283203125, -0.5088043212890625, -0.476318359375, -0.4438323974609375, -0.411346435546875, -0.3788604736328125, -0.34637451171875, -0.3138885498046875, -0.281402587890625, -0.2489166259765625, -0.2164306640625, -0.1839447021484375, -0.151458740234375, -0.1189727783203125, -0.08648681640625, -0.0540008544921875, -0.021514892578125, 0.0109710693359375, 0.04345703125, 0.0759429931640625, 0.108428955078125, 0.1409149169921875, 0.17340087890625, 0.2058868408203125, 0.238372802734375, 0.2708587646484375, 0.3033447265625, 0.3358306884765625, 0.368316650390625, 0.4008026123046875, 0.43328857421875, 0.4657745361328125, 0.498260498046875, 0.5307464599609375, 0.563232421875, 0.5957183837890625, 0.628204345703125, 0.6606903076171875, 0.69317626953125, 0.7256622314453125, 0.758148193359375, 0.7906341552734375, 0.8231201171875, 0.8556060791015625, 0.888092041015625, 0.9205780029296875, 0.95306396484375, 0.9855499267578125, 1.018035888671875, 1.0505218505859375, 1.0830078125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 11.0, 24.0, 36.0, 74.0, 112.0, 151.0, 155.0, 155.0, 132.0, 61.0, 33.0, 29.0, 12.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1331787109375, -0.1286602020263672, -0.12414169311523438, -0.11962318420410156, -0.11510467529296875, -0.11058616638183594, -0.10606765747070312, -0.10154914855957031, -0.0970306396484375, -0.09251213073730469, -0.08799362182617188, -0.08347511291503906, -0.07895660400390625, -0.07443809509277344, -0.06991958618164062, -0.06540107727050781, -0.060882568359375, -0.05636405944824219, -0.051845550537109375, -0.04732704162597656, -0.04280853271484375, -0.03829002380371094, -0.033771514892578125, -0.029253005981445312, -0.0247344970703125, -0.020215988159179688, -0.015697479248046875, -0.011178970336914062, -0.00666046142578125, -0.0021419525146484375, 0.002376556396484375, 0.0068950653076171875, 0.01141357421875, 0.015932083129882812, 0.020450592041015625, 0.024969100952148438, 0.02948760986328125, 0.03400611877441406, 0.038524627685546875, 0.04304313659667969, 0.0475616455078125, 0.05208015441894531, 0.056598663330078125, 0.06111717224121094, 0.06563568115234375, 0.07015419006347656, 0.07467269897460938, 0.07919120788574219, 0.083709716796875, 0.08822822570800781, 0.09274673461914062, 0.09726524353027344, 0.10178375244140625, 0.10630226135253906, 0.11082077026367188, 0.11533927917480469, 0.1198577880859375, 0.12437629699707031, 0.12889480590820312, 0.13341331481933594, 0.13793182373046875, 0.14245033264160156, 0.14696884155273438, 0.1514873504638672, 0.156005859375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 4.0, 2.0, 5.0, 6.0, 7.0, 3.0, 14.0, 12.0, 12.0, 16.0, 26.0, 29.0, 50.0, 86.0, 151.0, 420.0, 1328.0, 6164.0, 65434.0, 3748386.0, 352143.0, 16113.0, 2555.0, 663.0, 283.0, 128.0, 67.0, 43.0, 30.0, 23.0, 19.0, 19.0, 7.0, 7.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2318115234375, -0.2247295379638672, -0.21764755249023438, -0.21056556701660156, -0.20348358154296875, -0.19640159606933594, -0.18931961059570312, -0.1822376251220703, -0.1751556396484375, -0.1680736541748047, -0.16099166870117188, -0.15390968322753906, -0.14682769775390625, -0.13974571228027344, -0.13266372680664062, -0.1255817413330078, -0.118499755859375, -0.11141777038574219, -0.10433578491210938, -0.09725379943847656, -0.09017181396484375, -0.08308982849121094, -0.07600784301757812, -0.06892585754394531, -0.0618438720703125, -0.05476188659667969, -0.047679901123046875, -0.04059791564941406, -0.03351593017578125, -0.026433944702148438, -0.019351959228515625, -0.012269973754882812, -0.00518798828125, 0.0018939971923828125, 0.008975982666015625, 0.016057968139648438, 0.02313995361328125, 0.030221939086914062, 0.037303924560546875, 0.04438591003417969, 0.0514678955078125, 0.05854988098144531, 0.06563186645507812, 0.07271385192871094, 0.07979583740234375, 0.08687782287597656, 0.09395980834960938, 0.10104179382324219, 0.108123779296875, 0.11520576477050781, 0.12228775024414062, 0.12936973571777344, 0.13645172119140625, 0.14353370666503906, 0.15061569213867188, 0.1576976776123047, 0.1647796630859375, 0.1718616485595703, 0.17894363403320312, 0.18602561950683594, 0.19310760498046875, 0.20018959045410156, 0.20727157592773438, 0.2143535614013672, 0.221435546875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 10.0, 3.0, 11.0, 9.0, 13.0, 20.0, 28.0, 36.0, 50.0, 55.0, 89.0, 166.0, 276.0, 510.0, 876.0, 793.0, 471.0, 232.0, 145.0, 75.0, 59.0, 32.0, 30.0, 13.0, 19.0, 7.0, 11.0, 11.0, 3.0, 5.0, 7.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.120849609375, -0.11694145202636719, -0.11303329467773438, -0.10912513732910156, -0.10521697998046875, -0.10130882263183594, -0.09740066528320312, -0.09349250793457031, -0.0895843505859375, -0.08567619323730469, -0.08176803588867188, -0.07785987854003906, -0.07395172119140625, -0.07004356384277344, -0.06613540649414062, -0.06222724914550781, -0.058319091796875, -0.05441093444824219, -0.050502777099609375, -0.04659461975097656, -0.04268646240234375, -0.03877830505371094, -0.034870147705078125, -0.030961990356445312, -0.0270538330078125, -0.023145675659179688, -0.019237518310546875, -0.015329360961914062, -0.01142120361328125, -0.0075130462646484375, -0.003604888916015625, 0.0003032684326171875, 0.00421142578125, 0.008119583129882812, 0.012027740478515625, 0.015935897827148438, 0.01984405517578125, 0.023752212524414062, 0.027660369873046875, 0.03156852722167969, 0.0354766845703125, 0.03938484191894531, 0.043292999267578125, 0.04720115661621094, 0.05110931396484375, 0.05501747131347656, 0.058925628662109375, 0.06283378601074219, 0.066741943359375, 0.07065010070800781, 0.07455825805664062, 0.07846641540527344, 0.08237457275390625, 0.08628273010253906, 0.09019088745117188, 0.09409904479980469, 0.0980072021484375, 0.10191535949707031, 0.10582351684570312, 0.10973167419433594, 0.11363983154296875, 0.11754798889160156, 0.12145614624023438, 0.1253643035888672, 0.1292724609375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 1.0, 7.0, 6.0, 10.0, 34.0, 70.0, 162.0, 212.0, 245.0, 142.0, 59.0, 26.0, 8.0, 5.0, 0.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1750646829605103, -1.1261309385299683, -1.0771971940994263, -1.0282633304595947, -0.9793295860290527, -0.9303958415985107, -0.8814620971679688, -0.8325283527374268, -0.78359454870224, -0.734660804271698, -0.6857270002365112, -0.6367932558059692, -0.5878595113754272, -0.5389257073402405, -0.4899919629096985, -0.4410581886768341, -0.3921244144439697, -0.34319064021110535, -0.29425686597824097, -0.24532312154769897, -0.1963893473148346, -0.14745557308197021, -0.09852182865142822, -0.04958805441856384, -0.0006542801856994629, 0.04827948659658432, 0.0972132533788681, 0.1461470127105713, 0.19508078694343567, 0.24401456117630005, 0.29294830560684204, 0.3418820798397064, 0.39081573486328125, 0.43974950909614563, 0.48868328332901, 0.537617027759552, 0.5865508317947388, 0.6354845762252808, 0.6844183206558228, 0.7333520650863647, 0.7822858691215515, 0.8312196135520935, 0.8801534175872803, 0.9290871620178223, 0.9780209064483643, 1.0269546508789062, 1.0758883953094482, 1.1248222589492798, 1.1737560033798218, 1.2226897478103638, 1.2716234922409058, 1.3205573558807373, 1.3694911003112793, 1.4184248447418213, 1.4673585891723633, 1.5162923336029053, 1.5652260780334473, 1.6141598224639893, 1.6630935668945312, 1.7120273113250732, 1.7609611749649048, 1.8098949193954468, 1.8588286638259888, 1.9077624082565308, 1.9566962718963623]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 7.0, 8.0, 10.0, 8.0, 15.0, 20.0, 20.0, 17.0, 25.0, 25.0, 29.0, 30.0, 25.0, 38.0, 38.0, 44.0, 40.0, 41.0, 55.0, 49.0, 48.0, 53.0, 51.0, 29.0, 42.0, 34.0, 30.0, 20.0, 34.0, 20.0, 14.0, 17.0, 12.0, 12.0, 8.0, 11.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47909897565841675, -0.46196699142456055, -0.44483500719070435, -0.42770302295684814, -0.41057103872299194, -0.39343905448913574, -0.37630707025527954, -0.35917508602142334, -0.34204310178756714, -0.32491111755371094, -0.30777913331985474, -0.29064714908599854, -0.27351516485214233, -0.25638318061828613, -0.23925121128559113, -0.22211922705173492, -0.20498725771903992, -0.18785527348518372, -0.17072328925132751, -0.1535913050174713, -0.1364593207836151, -0.11932734400033951, -0.1021953672170639, -0.0850633829832077, -0.0679313987493515, -0.0507994145154953, -0.0336674340069294, -0.016535453498363495, 0.0005965307354927063, 0.017728514969348907, 0.03486049175262451, 0.05199247598648071, 0.06912446022033691, 0.08625644445419312, 0.10338842868804932, 0.12052040547132492, 0.13765239715576172, 0.15478438138961792, 0.17191635072231293, 0.18904833495616913, 0.20618031919002533, 0.22331230342388153, 0.24044428765773773, 0.25757625699043274, 0.27470824122428894, 0.29184022545814514, 0.30897220969200134, 0.32610419392585754, 0.34323617815971375, 0.36036816239356995, 0.37750014662742615, 0.39463213086128235, 0.41176411509513855, 0.42889609932899475, 0.44602805376052856, 0.46316003799438477, 0.48029202222824097, 0.49742400646209717, 0.5145559906959534, 0.5316879749298096, 0.5488199591636658, 0.565951943397522, 0.5830839276313782, 0.6002159118652344, 0.6173478960990906]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 10.0, 11.0, 12.0, 25.0, 16.0, 36.0, 39.0, 54.0, 91.0, 124.0, 196.0, 271.0, 520.0, 939.0, 1761.0, 3949.0, 15030.0, 225632.0, 748315.0, 39538.0, 6572.0, 2459.0, 1221.0, 668.0, 387.0, 219.0, 129.0, 102.0, 54.0, 41.0, 26.0, 27.0, 16.0, 11.0, 13.0, 10.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.410400390625, -0.3976631164550781, -0.38492584228515625, -0.3721885681152344, -0.3594512939453125, -0.3467140197753906, -0.33397674560546875, -0.3212394714355469, -0.308502197265625, -0.2957649230957031, -0.28302764892578125, -0.2702903747558594, -0.2575531005859375, -0.24481582641601562, -0.23207855224609375, -0.21934127807617188, -0.20660400390625, -0.19386672973632812, -0.18112945556640625, -0.16839218139648438, -0.1556549072265625, -0.14291763305664062, -0.13018035888671875, -0.11744308471679688, -0.104705810546875, -0.09196853637695312, -0.07923126220703125, -0.06649398803710938, -0.0537567138671875, -0.041019439697265625, -0.02828216552734375, -0.015544891357421875, -0.0028076171875, 0.009929656982421875, 0.02266693115234375, 0.035404205322265625, 0.0481414794921875, 0.060878753662109375, 0.07361602783203125, 0.08635330200195312, 0.099090576171875, 0.11182785034179688, 0.12456512451171875, 0.13730239868164062, 0.1500396728515625, 0.16277694702148438, 0.17551422119140625, 0.18825149536132812, 0.20098876953125, 0.21372604370117188, 0.22646331787109375, 0.23920059204101562, 0.2519378662109375, 0.2646751403808594, 0.27741241455078125, 0.2901496887207031, 0.302886962890625, 0.3156242370605469, 0.32836151123046875, 0.3410987854003906, 0.3538360595703125, 0.3665733337402344, 0.37931060791015625, 0.3920478820800781, 0.40478515625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 6.0, 14.0, 17.0, 45.0, 73.0, 96.0, 150.0, 169.0, 163.0, 102.0, 70.0, 44.0, 25.0, 9.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134765625, -0.13019943237304688, -0.12563323974609375, -0.12106704711914062, -0.1165008544921875, -0.11193466186523438, -0.10736846923828125, -0.10280227661132812, -0.098236083984375, -0.09366989135742188, -0.08910369873046875, -0.08453750610351562, -0.0799713134765625, -0.07540512084960938, -0.07083892822265625, -0.06627273559570312, -0.06170654296875, -0.057140350341796875, -0.05257415771484375, -0.048007965087890625, -0.0434417724609375, -0.038875579833984375, -0.03430938720703125, -0.029743194580078125, -0.025177001953125, -0.020610809326171875, -0.01604461669921875, -0.011478424072265625, -0.0069122314453125, -0.002346038818359375, 0.00222015380859375, 0.006786346435546875, 0.0113525390625, 0.015918731689453125, 0.02048492431640625, 0.025051116943359375, 0.0296173095703125, 0.034183502197265625, 0.03874969482421875, 0.043315887451171875, 0.047882080078125, 0.052448272705078125, 0.05701446533203125, 0.061580657958984375, 0.0661468505859375, 0.07071304321289062, 0.07527923583984375, 0.07984542846679688, 0.08441162109375, 0.08897781372070312, 0.09354400634765625, 0.09811019897460938, 0.1026763916015625, 0.10724258422851562, 0.11180877685546875, 0.11637496948242188, 0.120941162109375, 0.12550735473632812, 0.13007354736328125, 0.13463973999023438, 0.1392059326171875, 0.14377212524414062, 0.14833831787109375, 0.15290451049804688, 0.157470703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 11.0, 6.0, 16.0, 22.0, 30.0, 34.0, 48.0, 58.0, 91.0, 103.0, 177.0, 267.0, 481.0, 990.0, 2312.0, 9298.0, 117508.0, 855384.0, 51731.0, 6180.0, 1824.0, 800.0, 391.0, 224.0, 170.0, 88.0, 74.0, 57.0, 43.0, 29.0, 15.0, 17.0, 21.0, 7.0, 6.0, 6.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.325927734375, -0.316162109375, -0.306396484375, -0.296630859375, -0.286865234375, -0.277099609375, -0.267333984375, -0.257568359375, -0.247802734375, -0.238037109375, -0.228271484375, -0.218505859375, -0.208740234375, -0.198974609375, -0.189208984375, -0.179443359375, -0.169677734375, -0.159912109375, -0.150146484375, -0.140380859375, -0.130615234375, -0.120849609375, -0.111083984375, -0.101318359375, -0.091552734375, -0.081787109375, -0.072021484375, -0.062255859375, -0.052490234375, -0.042724609375, -0.032958984375, -0.023193359375, -0.013427734375, -0.003662109375, 0.006103515625, 0.015869140625, 0.025634765625, 0.035400390625, 0.045166015625, 0.054931640625, 0.064697265625, 0.074462890625, 0.084228515625, 0.093994140625, 0.103759765625, 0.113525390625, 0.123291015625, 0.133056640625, 0.142822265625, 0.152587890625, 0.162353515625, 0.172119140625, 0.181884765625, 0.191650390625, 0.201416015625, 0.211181640625, 0.220947265625, 0.230712890625, 0.240478515625, 0.250244140625, 0.260009765625, 0.269775390625, 0.279541015625, 0.289306640625, 0.299072265625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 5.0, 2.0, 4.0, 6.0, 6.0, 11.0, 16.0, 13.0, 14.0, 19.0, 21.0, 32.0, 42.0, 47.0, 50.0, 49.0, 65.0, 60.0, 53.0, 60.0, 55.0, 51.0, 49.0, 41.0, 37.0, 39.0, 37.0, 26.0, 16.0, 16.0, 19.0, 9.0, 8.0, 3.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.313720703125, -0.30498313903808594, -0.2962455749511719, -0.2875080108642578, -0.27877044677734375, -0.2700328826904297, -0.2612953186035156, -0.25255775451660156, -0.2438201904296875, -0.23508262634277344, -0.22634506225585938, -0.2176074981689453, -0.20886993408203125, -0.2001323699951172, -0.19139480590820312, -0.18265724182128906, -0.173919677734375, -0.16518211364746094, -0.15644454956054688, -0.1477069854736328, -0.13896942138671875, -0.1302318572998047, -0.12149429321289062, -0.11275672912597656, -0.1040191650390625, -0.09528160095214844, -0.08654403686523438, -0.07780647277832031, -0.06906890869140625, -0.06033134460449219, -0.051593780517578125, -0.04285621643066406, -0.03411865234375, -0.025381088256835938, -0.016643524169921875, -0.007905960083007812, 0.00083160400390625, 0.009569168090820312, 0.018306732177734375, 0.027044296264648438, 0.0357818603515625, 0.04451942443847656, 0.053256988525390625, 0.06199455261230469, 0.07073211669921875, 0.07946968078613281, 0.08820724487304688, 0.09694480895996094, 0.105682373046875, 0.11441993713378906, 0.12315750122070312, 0.1318950653076172, 0.14063262939453125, 0.1493701934814453, 0.15810775756835938, 0.16684532165527344, 0.1755828857421875, 0.18432044982910156, 0.19305801391601562, 0.2017955780029297, 0.21053314208984375, 0.2192707061767578, 0.22800827026367188, 0.23674583435058594, 0.2454833984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 7.0, 9.0, 13.0, 15.0, 28.0, 46.0, 76.0, 131.0, 238.0, 443.0, 1008.0, 3023.0, 13599.0, 221874.0, 774423.0, 26238.0, 4696.0, 1431.0, 613.0, 246.0, 150.0, 81.0, 48.0, 30.0, 14.0, 17.0, 19.0, 7.0, 9.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1492919921875, -0.14434242248535156, -0.13939285278320312, -0.1344432830810547, -0.12949371337890625, -0.12454414367675781, -0.11959457397460938, -0.11464500427246094, -0.1096954345703125, -0.10474586486816406, -0.09979629516601562, -0.09484672546386719, -0.08989715576171875, -0.08494758605957031, -0.07999801635742188, -0.07504844665527344, -0.070098876953125, -0.06514930725097656, -0.060199737548828125, -0.05525016784667969, -0.05030059814453125, -0.04535102844238281, -0.040401458740234375, -0.03545188903808594, -0.0305023193359375, -0.025552749633789062, -0.020603179931640625, -0.015653610229492188, -0.01070404052734375, -0.0057544708251953125, -0.000804901123046875, 0.0041446685791015625, 0.00909423828125, 0.014043807983398438, 0.018993377685546875, 0.023942947387695312, 0.02889251708984375, 0.03384208679199219, 0.038791656494140625, 0.04374122619628906, 0.0486907958984375, 0.05364036560058594, 0.058589935302734375, 0.06353950500488281, 0.06848907470703125, 0.07343864440917969, 0.07838821411132812, 0.08333778381347656, 0.088287353515625, 0.09323692321777344, 0.09818649291992188, 0.10313606262207031, 0.10808563232421875, 0.11303520202636719, 0.11798477172851562, 0.12293434143066406, 0.1278839111328125, 0.13283348083496094, 0.13778305053710938, 0.1427326202392578, 0.14768218994140625, 0.1526317596435547, 0.15758132934570312, 0.16253089904785156, 0.16748046875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 3.0, 11.0, 13.0, 16.0, 23.0, 38.0, 57.0, 95.0, 133.0, 167.0, 151.0, 92.0, 69.0, 47.0, 23.0, 16.0, 13.0, 9.0, 13.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.045797348022461e-05, -2.9462389647960663e-05, -2.8466805815696716e-05, -2.747122198343277e-05, -2.6475638151168823e-05, -2.5480054318904877e-05, -2.448447048664093e-05, -2.3488886654376984e-05, -2.2493302822113037e-05, -2.149771898984909e-05, -2.0502135157585144e-05, -1.9506551325321198e-05, -1.851096749305725e-05, -1.7515383660793304e-05, -1.6519799828529358e-05, -1.552421599626541e-05, -1.4528632164001465e-05, -1.3533048331737518e-05, -1.2537464499473572e-05, -1.1541880667209625e-05, -1.0546296834945679e-05, -9.550713002681732e-06, -8.555129170417786e-06, -7.559545338153839e-06, -6.563961505889893e-06, -5.568377673625946e-06, -4.5727938413619995e-06, -3.577210009098053e-06, -2.5816261768341064e-06, -1.58604234457016e-06, -5.904585123062134e-07, 4.0512531995773315e-07, 1.4007091522216797e-06, 2.3962929844856262e-06, 3.3918768167495728e-06, 4.387460649013519e-06, 5.383044481277466e-06, 6.378628313541412e-06, 7.374212145805359e-06, 8.369795978069305e-06, 9.365379810333252e-06, 1.0360963642597198e-05, 1.1356547474861145e-05, 1.2352131307125092e-05, 1.3347715139389038e-05, 1.4343298971652985e-05, 1.533888280391693e-05, 1.6334466636180878e-05, 1.7330050468444824e-05, 1.832563430070877e-05, 1.9321218132972717e-05, 2.0316801965236664e-05, 2.131238579750061e-05, 2.2307969629764557e-05, 2.3303553462028503e-05, 2.429913729429245e-05, 2.5294721126556396e-05, 2.6290304958820343e-05, 2.728588879108429e-05, 2.8281472623348236e-05, 2.9277056455612183e-05, 3.027264028787613e-05, 3.1268224120140076e-05, 3.226380795240402e-05, 3.325939178466797e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 6.0, 4.0, 10.0, 18.0, 21.0, 26.0, 48.0, 42.0, 72.0, 106.0, 127.0, 203.0, 363.0, 634.0, 1221.0, 2667.0, 7172.0, 29960.0, 350455.0, 600321.0, 40098.0, 8664.0, 3111.0, 1319.0, 724.0, 385.0, 239.0, 164.0, 98.0, 71.0, 58.0, 39.0, 27.0, 13.0, 15.0, 14.0, 14.0, 2.0, 6.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.140625, -0.13637351989746094, -0.13212203979492188, -0.1278705596923828, -0.12361907958984375, -0.11936759948730469, -0.11511611938476562, -0.11086463928222656, -0.1066131591796875, -0.10236167907714844, -0.09811019897460938, -0.09385871887207031, -0.08960723876953125, -0.08535575866699219, -0.08110427856445312, -0.07685279846191406, -0.072601318359375, -0.06834983825683594, -0.06409835815429688, -0.05984687805175781, -0.05559539794921875, -0.05134391784667969, -0.047092437744140625, -0.04284095764160156, -0.0385894775390625, -0.03433799743652344, -0.030086517333984375, -0.025835037231445312, -0.02158355712890625, -0.017332077026367188, -0.013080596923828125, -0.008829116821289062, -0.00457763671875, -0.0003261566162109375, 0.003925323486328125, 0.008176803588867188, 0.01242828369140625, 0.016679763793945312, 0.020931243896484375, 0.025182723999023438, 0.0294342041015625, 0.03368568420410156, 0.037937164306640625, 0.04218864440917969, 0.04644012451171875, 0.05069160461425781, 0.054943084716796875, 0.05919456481933594, 0.063446044921875, 0.06769752502441406, 0.07194900512695312, 0.07620048522949219, 0.08045196533203125, 0.08470344543457031, 0.08895492553710938, 0.09320640563964844, 0.0974578857421875, 0.10170936584472656, 0.10596084594726562, 0.11021232604980469, 0.11446380615234375, 0.11871528625488281, 0.12296676635742188, 0.12721824645996094, 0.1314697265625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 8.0, 11.0, 18.0, 13.0, 34.0, 37.0, 42.0, 54.0, 88.0, 85.0, 99.0, 95.0, 89.0, 71.0, 51.0, 48.0, 27.0, 29.0, 18.0, 12.0, 15.0, 6.0, 6.0, 7.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11285400390625, -0.10929679870605469, -0.10573959350585938, -0.10218238830566406, -0.09862518310546875, -0.09506797790527344, -0.09151077270507812, -0.08795356750488281, -0.0843963623046875, -0.08083915710449219, -0.07728195190429688, -0.07372474670410156, -0.07016754150390625, -0.06661033630371094, -0.06305313110351562, -0.05949592590332031, -0.055938720703125, -0.05238151550292969, -0.048824310302734375, -0.04526710510253906, -0.04170989990234375, -0.03815269470214844, -0.034595489501953125, -0.031038284301757812, -0.0274810791015625, -0.023923873901367188, -0.020366668701171875, -0.016809463500976562, -0.01325225830078125, -0.009695053100585938, -0.006137847900390625, -0.0025806427001953125, 0.0009765625, 0.0045337677001953125, 0.008090972900390625, 0.011648178100585938, 0.01520538330078125, 0.018762588500976562, 0.022319793701171875, 0.025876998901367188, 0.0294342041015625, 0.03299140930175781, 0.036548614501953125, 0.04010581970214844, 0.04366302490234375, 0.04722023010253906, 0.050777435302734375, 0.05433464050292969, 0.057891845703125, 0.06144905090332031, 0.06500625610351562, 0.06856346130371094, 0.07212066650390625, 0.07567787170410156, 0.07923507690429688, 0.08279228210449219, 0.0863494873046875, 0.08990669250488281, 0.09346389770507812, 0.09702110290527344, 0.10057830810546875, 0.10413551330566406, 0.10769271850585938, 0.11124992370605469, 0.11480712890625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 17.0, 47.0, 126.0, 250.0, 284.0, 154.0, 71.0, 21.0, 5.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9098281860351562, -1.8276026248931885, -1.7453771829605103, -1.6631516218185425, -1.5809261798858643, -1.4987006187438965, -1.4164750576019287, -1.334249496459961, -1.2520240545272827, -1.169798493385315, -1.0875730514526367, -1.005347490310669, -0.923121988773346, -0.840896487236023, -0.7586709260940552, -0.6764454245567322, -0.5942199230194092, -0.5119944214820862, -0.4297688901424408, -0.3475433588027954, -0.2653178572654724, -0.18309235572814941, -0.10086682438850403, -0.018641293048858643, 0.06358420848846436, 0.14580972492694855, 0.22803524136543274, 0.3102607727050781, 0.3924862742424011, 0.4747117757797241, 0.5569373369216919, 0.6391628384590149, 0.7213883399963379, 0.8036138415336609, 0.8858393430709839, 0.9680649042129517, 1.0502903461456299, 1.1325159072875977, 1.2147414684295654, 1.2969670295715332, 1.3791924715042114, 1.4614180326461792, 1.5436434745788574, 1.6258690357208252, 1.708094596862793, 1.7903200387954712, 1.872545599937439, 1.9547710418701172, 2.036996603012085, 2.1192221641540527, 2.2014477252960205, 2.283673048019409, 2.365898609161377, 2.4481241703033447, 2.5303497314453125, 2.6125752925872803, 2.694800853729248, 2.777026414871216, 2.8592519760131836, 2.9414772987365723, 3.02370285987854, 3.105928421020508, 3.1881539821624756, 3.2703795433044434, 3.352604866027832]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 9.0, 13.0, 6.0, 14.0, 6.0, 13.0, 15.0, 12.0, 21.0, 21.0, 26.0, 24.0, 36.0, 36.0, 42.0, 55.0, 52.0, 52.0, 50.0, 48.0, 58.0, 51.0, 47.0, 44.0, 26.0, 31.0, 31.0, 26.0, 24.0, 16.0, 17.0, 10.0, 13.0, 16.0, 10.0, 8.0, 4.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-1.1702250242233276, -1.1381992101669312, -1.1061733961105347, -1.0741477012634277, -1.0421218872070312, -1.0100960731506348, -0.9780702590942383, -0.9460444450378418, -0.9140186905860901, -0.8819928765296936, -0.8499671220779419, -0.8179413080215454, -0.7859154939651489, -0.7538897395133972, -0.7218639254570007, -0.689838171005249, -0.6578123569488525, -0.625786542892456, -0.5937607884407043, -0.5617349743843079, -0.5297092199325562, -0.49768340587615967, -0.4656575918197632, -0.4336318075656891, -0.401606023311615, -0.3695802390575409, -0.3375544548034668, -0.3055286407470703, -0.2735028564929962, -0.24147707223892212, -0.20945127308368683, -0.17742547392845154, -0.14539974927902222, -0.11337395757436752, -0.08134816586971283, -0.049322374165058136, -0.017296582460403442, 0.014729201793670654, 0.046755000948905945, 0.07878080010414124, 0.11080658435821533, 0.14283236861228943, 0.17485816776752472, 0.20688396692276, 0.2389097511768341, 0.2709355354309082, 0.3029613494873047, 0.3349871337413788, 0.3670129179954529, 0.399038702249527, 0.4310644865036011, 0.46309030055999756, 0.49511608481407166, 0.5271418690681458, 0.5591676831245422, 0.591193437576294, 0.6232192516326904, 0.6552450656890869, 0.6872708201408386, 0.7192966341972351, 0.7513223886489868, 0.7833482027053833, 0.8153740167617798, 0.8473998308181763, 0.879425585269928]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 3.0, 11.0, 13.0, 12.0, 14.0, 29.0, 26.0, 49.0, 77.0, 293.0, 4191965.0, 1395.0, 172.0, 64.0, 47.0, 31.0, 23.0, 14.0, 12.0, 8.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.6875, -20.015380859375, -19.34326171875, -18.671142578125, -17.9990234375, -17.326904296875, -16.65478515625, -15.982666015625, -15.310546875, -14.638427734375, -13.96630859375, -13.294189453125, -12.6220703125, -11.949951171875, -11.27783203125, -10.605712890625, -9.93359375, -9.261474609375, -8.58935546875, -7.917236328125, -7.2451171875, -6.572998046875, -5.90087890625, -5.228759765625, -4.556640625, -3.884521484375, -3.21240234375, -2.540283203125, -1.8681640625, -1.196044921875, -0.52392578125, 0.148193359375, 0.8203125, 1.492431640625, 2.16455078125, 2.836669921875, 3.5087890625, 4.180908203125, 4.85302734375, 5.525146484375, 6.197265625, 6.869384765625, 7.54150390625, 8.213623046875, 8.8857421875, 9.557861328125, 10.22998046875, 10.902099609375, 11.57421875, 12.246337890625, 12.91845703125, 13.590576171875, 14.2626953125, 14.934814453125, 15.60693359375, 16.279052734375, 16.951171875, 17.623291015625, 18.29541015625, 18.967529296875, 19.6396484375, 20.311767578125, 20.98388671875, 21.656005859375, 22.328125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 10.0, 22.0, 33.0, 57.0, 93.0, 130.0, 170.0, 149.0, 115.0, 91.0, 61.0, 26.0, 13.0, 14.0, 8.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.135009765625, -0.13048362731933594, -0.12595748901367188, -0.12143135070800781, -0.11690521240234375, -0.11237907409667969, -0.10785293579101562, -0.10332679748535156, -0.0988006591796875, -0.09427452087402344, -0.08974838256835938, -0.08522224426269531, -0.08069610595703125, -0.07616996765136719, -0.07164382934570312, -0.06711769104003906, -0.062591552734375, -0.05806541442871094, -0.053539276123046875, -0.04901313781738281, -0.04448699951171875, -0.03996086120605469, -0.035434722900390625, -0.030908584594726562, -0.0263824462890625, -0.021856307983398438, -0.017330169677734375, -0.012804031372070312, -0.00827789306640625, -0.0037517547607421875, 0.000774383544921875, 0.0053005218505859375, 0.00982666015625, 0.014352798461914062, 0.018878936767578125, 0.023405075073242188, 0.02793121337890625, 0.03245735168457031, 0.036983489990234375, 0.04150962829589844, 0.0460357666015625, 0.05056190490722656, 0.055088043212890625, 0.05961418151855469, 0.06414031982421875, 0.06866645812988281, 0.07319259643554688, 0.07771873474121094, 0.082244873046875, 0.08677101135253906, 0.09129714965820312, 0.09582328796386719, 0.10034942626953125, 0.10487556457519531, 0.10940170288085938, 0.11392784118652344, 0.1184539794921875, 0.12298011779785156, 0.12750625610351562, 0.1320323944091797, 0.13655853271484375, 0.1410846710205078, 0.14561080932617188, 0.15013694763183594, 0.1546630859375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 6.0, 7.0, 14.0, 22.0, 27.0, 44.0, 95.0, 178.0, 384.0, 1193.0, 6044.0, 95798.0, 4018222.0, 64836.0, 5482.0, 1183.0, 359.0, 172.0, 78.0, 54.0, 25.0, 15.0, 7.0, 4.0, 11.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.46875, -0.4565582275390625, -0.444366455078125, -0.4321746826171875, -0.41998291015625, -0.4077911376953125, -0.395599365234375, -0.3834075927734375, -0.3712158203125, -0.3590240478515625, -0.346832275390625, -0.3346405029296875, -0.32244873046875, -0.3102569580078125, -0.298065185546875, -0.2858734130859375, -0.273681640625, -0.2614898681640625, -0.249298095703125, -0.2371063232421875, -0.22491455078125, -0.2127227783203125, -0.200531005859375, -0.1883392333984375, -0.1761474609375, -0.1639556884765625, -0.151763916015625, -0.1395721435546875, -0.12738037109375, -0.1151885986328125, -0.102996826171875, -0.0908050537109375, -0.07861328125, -0.0664215087890625, -0.054229736328125, -0.0420379638671875, -0.02984619140625, -0.0176544189453125, -0.005462646484375, 0.0067291259765625, 0.0189208984375, 0.0311126708984375, 0.043304443359375, 0.0554962158203125, 0.06768798828125, 0.0798797607421875, 0.092071533203125, 0.1042633056640625, 0.116455078125, 0.1286468505859375, 0.140838623046875, 0.1530303955078125, 0.16522216796875, 0.1774139404296875, 0.189605712890625, 0.2017974853515625, 0.2139892578125, 0.2261810302734375, 0.238372802734375, 0.2505645751953125, 0.26275634765625, 0.2749481201171875, 0.287139892578125, 0.2993316650390625, 0.3115234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 8.0, 7.0, 12.0, 14.0, 19.0, 29.0, 31.0, 56.0, 94.0, 151.0, 240.0, 495.0, 1039.0, 884.0, 387.0, 218.0, 125.0, 68.0, 48.0, 41.0, 21.0, 22.0, 14.0, 10.0, 6.0, 2.0, 6.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1234130859375, -0.11942100524902344, -0.11542892456054688, -0.11143684387207031, -0.10744476318359375, -0.10345268249511719, -0.09946060180664062, -0.09546852111816406, -0.0914764404296875, -0.08748435974121094, -0.08349227905273438, -0.07950019836425781, -0.07550811767578125, -0.07151603698730469, -0.06752395629882812, -0.06353187561035156, -0.059539794921875, -0.05554771423339844, -0.051555633544921875, -0.04756355285644531, -0.04357147216796875, -0.03957939147949219, -0.035587310791015625, -0.03159523010253906, -0.0276031494140625, -0.023611068725585938, -0.019618988037109375, -0.015626907348632812, -0.01163482666015625, -0.0076427459716796875, -0.003650665283203125, 0.0003414154052734375, 0.00433349609375, 0.008325576782226562, 0.012317657470703125, 0.016309738159179688, 0.02030181884765625, 0.024293899536132812, 0.028285980224609375, 0.03227806091308594, 0.0362701416015625, 0.04026222229003906, 0.044254302978515625, 0.04824638366699219, 0.05223846435546875, 0.05623054504394531, 0.060222625732421875, 0.06421470642089844, 0.068206787109375, 0.07219886779785156, 0.07619094848632812, 0.08018302917480469, 0.08417510986328125, 0.08816719055175781, 0.09215927124023438, 0.09615135192871094, 0.1001434326171875, 0.10413551330566406, 0.10812759399414062, 0.11211967468261719, 0.11611175537109375, 0.12010383605957031, 0.12409591674804688, 0.12808799743652344, 0.132080078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 18.0, 66.0, 481.0, 264.0, 88.0, 37.0, 22.0, 12.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2628905773162842, -1.1309131383895874, -0.9989356994628906, -0.8669582605361938, -0.7349808216094971, -0.6030033826828003, -0.4710259437561035, -0.33904850482940674, -0.20707106590270996, -0.07509362697601318, 0.056883811950683594, 0.18886125087738037, 0.32083868980407715, 0.4528161287307739, 0.5847935676574707, 0.7167710065841675, 0.8487484455108643, 0.980725884437561, 1.1127033233642578, 1.2446807622909546, 1.3766582012176514, 1.5086356401443481, 1.640613079071045, 1.7725905179977417, 1.9045679569244385, 2.0365452766418457, 2.168522834777832, 2.3005003929138184, 2.4324777126312256, 2.564455032348633, 2.696432590484619, 2.8284101486206055, 2.9603872299194336, 3.09236478805542, 3.224342107772827, 3.3563194274902344, 3.4882969856262207, 3.620274543762207, 3.7522518634796143, 3.8842291831970215, 4.016206741333008, 4.148184299468994, 4.2801618576049805, 4.412138938903809, 4.544116497039795, 4.676094055175781, 4.808071136474609, 4.940048694610596, 5.072026252746582, 5.204003810882568, 5.335981369018555, 5.467958450317383, 5.599936008453369, 5.7319135665893555, 5.863890647888184, 5.99586820602417, 6.127845764160156, 6.259823322296143, 6.391800880432129, 6.523777961730957, 6.655755519866943, 6.78773307800293, 6.919710159301758, 7.051687717437744, 7.1836652755737305]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 9.0, 3.0, 13.0, 10.0, 16.0, 17.0, 27.0, 34.0, 26.0, 39.0, 49.0, 43.0, 63.0, 52.0, 76.0, 61.0, 62.0, 69.0, 62.0, 46.0, 42.0, 39.0, 34.0, 20.0, 24.0, 19.0, 8.0, 11.0, 8.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9663889408111572, -0.9363610148429871, -0.9063330888748169, -0.8763052225112915, -0.8462772965431213, -0.8162493705749512, -0.786221444606781, -0.7561935186386108, -0.7261656522750854, -0.6961377263069153, -0.6661098003387451, -0.6360819339752197, -0.6060540080070496, -0.5760260820388794, -0.5459981560707092, -0.5159702301025391, -0.4859423041343689, -0.45591437816619873, -0.42588648200035095, -0.3958585560321808, -0.365830659866333, -0.33580273389816284, -0.3057748079299927, -0.2757468819618225, -0.24571898579597473, -0.21569107472896576, -0.1856631636619568, -0.15563523769378662, -0.12560732662677765, -0.09557941555976868, -0.06555148959159851, -0.03552357852458954, -0.005495667457580566, 0.024532247334718704, 0.054560162127017975, 0.08458808064460754, 0.11461599171161652, 0.1446439027786255, 0.17467182874679565, 0.20469973981380463, 0.2347276508808136, 0.26475557684898376, 0.29478347301483154, 0.3248113989830017, 0.3548393249511719, 0.38486722111701965, 0.4148951470851898, 0.4449230432510376, 0.47495096921920776, 0.5049788951873779, 0.5350068211555481, 0.5650347471237183, 0.5950626134872437, 0.6250905394554138, 0.655118465423584, 0.6851463913917542, 0.7151743173599243, 0.7452022433280945, 0.7752301692962646, 0.80525803565979, 0.8352859616279602, 0.8653138875961304, 0.8953418135643005, 0.9253697395324707, 0.9553976058959961]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 4.0, 7.0, 10.0, 19.0, 44.0, 103.0, 224.0, 776.0, 4722.0, 118943.0, 902001.0, 18985.0, 1974.0, 474.0, 116.0, 64.0, 31.0, 18.0, 15.0, 11.0, 4.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.736328125, -0.7127838134765625, -0.689239501953125, -0.6656951904296875, -0.64215087890625, -0.6186065673828125, -0.595062255859375, -0.5715179443359375, -0.5479736328125, -0.5244293212890625, -0.500885009765625, -0.4773406982421875, -0.45379638671875, -0.4302520751953125, -0.406707763671875, -0.3831634521484375, -0.359619140625, -0.3360748291015625, -0.312530517578125, -0.2889862060546875, -0.26544189453125, -0.2418975830078125, -0.218353271484375, -0.1948089599609375, -0.1712646484375, -0.1477203369140625, -0.124176025390625, -0.1006317138671875, -0.07708740234375, -0.0535430908203125, -0.029998779296875, -0.0064544677734375, 0.01708984375, 0.0406341552734375, 0.064178466796875, 0.0877227783203125, 0.11126708984375, 0.1348114013671875, 0.158355712890625, 0.1819000244140625, 0.2054443359375, 0.2289886474609375, 0.252532958984375, 0.2760772705078125, 0.29962158203125, 0.3231658935546875, 0.346710205078125, 0.3702545166015625, 0.393798828125, 0.4173431396484375, 0.440887451171875, 0.4644317626953125, 0.48797607421875, 0.5115203857421875, 0.535064697265625, 0.5586090087890625, 0.5821533203125, 0.6056976318359375, 0.629241943359375, 0.6527862548828125, 0.67633056640625, 0.6998748779296875, 0.723419189453125, 0.7469635009765625, 0.7705078125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 8.0, 14.0, 23.0, 42.0, 52.0, 111.0, 127.0, 133.0, 159.0, 124.0, 87.0, 55.0, 24.0, 21.0, 9.0, 9.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1397705078125, -0.13522720336914062, -0.13068389892578125, -0.12614059448242188, -0.1215972900390625, -0.11705398559570312, -0.11251068115234375, -0.10796737670898438, -0.103424072265625, -0.09888076782226562, -0.09433746337890625, -0.08979415893554688, -0.0852508544921875, -0.08070755004882812, -0.07616424560546875, -0.07162094116210938, -0.06707763671875, -0.06253433227539062, -0.05799102783203125, -0.053447723388671875, -0.0489044189453125, -0.044361114501953125, -0.03981781005859375, -0.035274505615234375, -0.030731201171875, -0.026187896728515625, -0.02164459228515625, -0.017101287841796875, -0.0125579833984375, -0.008014678955078125, -0.00347137451171875, 0.001071929931640625, 0.005615234375, 0.010158538818359375, 0.01470184326171875, 0.019245147705078125, 0.0237884521484375, 0.028331756591796875, 0.03287506103515625, 0.037418365478515625, 0.041961669921875, 0.046504974365234375, 0.05104827880859375, 0.055591583251953125, 0.0601348876953125, 0.06467819213867188, 0.06922149658203125, 0.07376480102539062, 0.07830810546875, 0.08285140991210938, 0.08739471435546875, 0.09193801879882812, 0.0964813232421875, 0.10102462768554688, 0.10556793212890625, 0.11011123657226562, 0.114654541015625, 0.11919784545898438, 0.12374114990234375, 0.12828445434570312, 0.1328277587890625, 0.13737106323242188, 0.14191436767578125, 0.14645767211914062, 0.1510009765625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 5.0, 11.0, 12.0, 14.0, 13.0, 19.0, 27.0, 43.0, 52.0, 72.0, 93.0, 198.0, 285.0, 476.0, 819.0, 1532.0, 3243.0, 7933.0, 22174.0, 74432.0, 297214.0, 480535.0, 109742.0, 30838.0, 10336.0, 4065.0, 1894.0, 962.0, 551.0, 325.0, 184.0, 141.0, 85.0, 64.0, 39.0, 31.0, 19.0, 20.0, 8.0, 7.0, 6.0, 11.0, 2.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1536865234375, -0.1482257843017578, -0.14276504516601562, -0.13730430603027344, -0.13184356689453125, -0.12638282775878906, -0.12092208862304688, -0.11546134948730469, -0.1100006103515625, -0.10453987121582031, -0.09907913208007812, -0.09361839294433594, -0.08815765380859375, -0.08269691467285156, -0.07723617553710938, -0.07177543640136719, -0.066314697265625, -0.06085395812988281, -0.055393218994140625, -0.04993247985839844, -0.04447174072265625, -0.03901100158691406, -0.033550262451171875, -0.028089523315429688, -0.0226287841796875, -0.017168045043945312, -0.011707305908203125, -0.0062465667724609375, -0.00078582763671875, 0.0046749114990234375, 0.010135650634765625, 0.015596389770507812, 0.02105712890625, 0.026517868041992188, 0.031978607177734375, 0.03743934631347656, 0.04290008544921875, 0.04836082458496094, 0.053821563720703125, 0.05928230285644531, 0.0647430419921875, 0.07020378112792969, 0.07566452026367188, 0.08112525939941406, 0.08658599853515625, 0.09204673767089844, 0.09750747680664062, 0.10296821594238281, 0.108428955078125, 0.11388969421386719, 0.11935043334960938, 0.12481117248535156, 0.13027191162109375, 0.13573265075683594, 0.14119338989257812, 0.1466541290283203, 0.1521148681640625, 0.1575756072998047, 0.16303634643554688, 0.16849708557128906, 0.17395782470703125, 0.17941856384277344, 0.18487930297851562, 0.1903400421142578, 0.19580078125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 1.0, 5.0, 4.0, 4.0, 9.0, 12.0, 17.0, 7.0, 22.0, 16.0, 17.0, 31.0, 28.0, 42.0, 41.0, 28.0, 42.0, 54.0, 41.0, 45.0, 42.0, 50.0, 57.0, 42.0, 42.0, 41.0, 37.0, 34.0, 30.0, 28.0, 15.0, 18.0, 17.0, 10.0, 15.0, 9.0, 15.0, 3.0, 4.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.2392578125, -0.2323169708251953, -0.22537612915039062, -0.21843528747558594, -0.21149444580078125, -0.20455360412597656, -0.19761276245117188, -0.1906719207763672, -0.1837310791015625, -0.1767902374267578, -0.16984939575195312, -0.16290855407714844, -0.15596771240234375, -0.14902687072753906, -0.14208602905273438, -0.1351451873779297, -0.128204345703125, -0.12126350402832031, -0.11432266235351562, -0.10738182067871094, -0.10044097900390625, -0.09350013732910156, -0.08655929565429688, -0.07961845397949219, -0.0726776123046875, -0.06573677062988281, -0.058795928955078125, -0.05185508728027344, -0.04491424560546875, -0.03797340393066406, -0.031032562255859375, -0.024091720581054688, -0.01715087890625, -0.010210037231445312, -0.003269195556640625, 0.0036716461181640625, 0.01061248779296875, 0.017553329467773438, 0.024494171142578125, 0.03143501281738281, 0.0383758544921875, 0.04531669616699219, 0.052257537841796875, 0.05919837951660156, 0.06613922119140625, 0.07308006286621094, 0.08002090454101562, 0.08696174621582031, 0.093902587890625, 0.10084342956542969, 0.10778427124023438, 0.11472511291503906, 0.12166595458984375, 0.12860679626464844, 0.13554763793945312, 0.1424884796142578, 0.1494293212890625, 0.1563701629638672, 0.16331100463867188, 0.17025184631347656, 0.17719268798828125, 0.18413352966308594, 0.19107437133789062, 0.1980152130126953, 0.2049560546875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 1.0, 9.0, 6.0, 10.0, 11.0, 28.0, 31.0, 36.0, 85.0, 90.0, 154.0, 239.0, 462.0, 879.0, 1877.0, 4664.0, 15705.0, 296334.0, 696523.0, 21362.0, 5476.0, 2230.0, 1032.0, 505.0, 307.0, 150.0, 107.0, 66.0, 42.0, 36.0, 23.0, 12.0, 11.0, 9.0, 6.0, 1.0, 6.0, 3.0, 2.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.310791015625, -0.3004608154296875, -0.290130615234375, -0.2798004150390625, -0.26947021484375, -0.2591400146484375, -0.248809814453125, -0.2384796142578125, -0.2281494140625, -0.2178192138671875, -0.207489013671875, -0.1971588134765625, -0.18682861328125, -0.1764984130859375, -0.166168212890625, -0.1558380126953125, -0.1455078125, -0.1351776123046875, -0.124847412109375, -0.1145172119140625, -0.10418701171875, -0.0938568115234375, -0.083526611328125, -0.0731964111328125, -0.0628662109375, -0.0525360107421875, -0.042205810546875, -0.0318756103515625, -0.02154541015625, -0.0112152099609375, -0.000885009765625, 0.0094451904296875, 0.019775390625, 0.0301055908203125, 0.040435791015625, 0.0507659912109375, 0.06109619140625, 0.0714263916015625, 0.081756591796875, 0.0920867919921875, 0.1024169921875, 0.1127471923828125, 0.123077392578125, 0.1334075927734375, 0.14373779296875, 0.1540679931640625, 0.164398193359375, 0.1747283935546875, 0.18505859375, 0.1953887939453125, 0.205718994140625, 0.2160491943359375, 0.22637939453125, 0.2367095947265625, 0.247039794921875, 0.2573699951171875, 0.2677001953125, 0.2780303955078125, 0.288360595703125, 0.2986907958984375, 0.30902099609375, 0.3193511962890625, 0.329681396484375, 0.3400115966796875, 0.350341796875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 7.0, 3.0, 5.0, 8.0, 22.0, 38.0, 90.0, 176.0, 304.0, 190.0, 83.0, 31.0, 20.0, 9.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00010162591934204102, -9.923335164785385e-05, -9.684078395366669e-05, -9.444821625947952e-05, -9.205564856529236e-05, -8.96630808711052e-05, -8.727051317691803e-05, -8.487794548273087e-05, -8.24853777885437e-05, -8.009281009435654e-05, -7.770024240016937e-05, -7.530767470598221e-05, -7.291510701179504e-05, -7.052253931760788e-05, -6.812997162342072e-05, -6.573740392923355e-05, -6.334483623504639e-05, -6.095226854085922e-05, -5.855970084667206e-05, -5.6167133152484894e-05, -5.377456545829773e-05, -5.1381997764110565e-05, -4.89894300699234e-05, -4.6596862375736237e-05, -4.420429468154907e-05, -4.181172698736191e-05, -3.9419159293174744e-05, -3.702659159898758e-05, -3.4634023904800415e-05, -3.224145621061325e-05, -2.9848888516426086e-05, -2.7456320822238922e-05, -2.5063753128051758e-05, -2.2671185433864594e-05, -2.027861773967743e-05, -1.7886050045490265e-05, -1.54934823513031e-05, -1.3100914657115936e-05, -1.0708346962928772e-05, -8.315779268741608e-06, -5.923211574554443e-06, -3.530643880367279e-06, -1.1380761861801147e-06, 1.2544915080070496e-06, 3.647059202194214e-06, 6.039626896381378e-06, 8.432194590568542e-06, 1.0824762284755707e-05, 1.3217329978942871e-05, 1.5609897673130035e-05, 1.80024653673172e-05, 2.0395033061504364e-05, 2.278760075569153e-05, 2.5180168449878693e-05, 2.7572736144065857e-05, 2.996530383825302e-05, 3.2357871532440186e-05, 3.475043922662735e-05, 3.7143006920814514e-05, 3.953557461500168e-05, 4.192814230918884e-05, 4.432071000337601e-05, 4.671327769756317e-05, 4.9105845391750336e-05, 5.14984130859375e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 7.0, 8.0, 15.0, 16.0, 37.0, 49.0, 98.0, 234.0, 460.0, 1355.0, 4883.0, 39235.0, 960827.0, 34340.0, 4786.0, 1334.0, 449.0, 226.0, 80.0, 53.0, 22.0, 13.0, 9.0, 5.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.406982421875, -0.3916130065917969, -0.37624359130859375, -0.3608741760253906, -0.3455047607421875, -0.3301353454589844, -0.31476593017578125, -0.2993965148925781, -0.284027099609375, -0.2686576843261719, -0.25328826904296875, -0.23791885375976562, -0.2225494384765625, -0.20718002319335938, -0.19181060791015625, -0.17644119262695312, -0.16107177734375, -0.14570236206054688, -0.13033294677734375, -0.11496353149414062, -0.0995941162109375, -0.08422470092773438, -0.06885528564453125, -0.053485870361328125, -0.038116455078125, -0.022747039794921875, -0.00737762451171875, 0.007991790771484375, 0.0233612060546875, 0.038730621337890625, 0.05410003662109375, 0.06946945190429688, 0.0848388671875, 0.10020828247070312, 0.11557769775390625, 0.13094711303710938, 0.1463165283203125, 0.16168594360351562, 0.17705535888671875, 0.19242477416992188, 0.207794189453125, 0.22316360473632812, 0.23853302001953125, 0.2539024353027344, 0.2692718505859375, 0.2846412658691406, 0.30001068115234375, 0.3153800964355469, 0.33074951171875, 0.3461189270019531, 0.36148834228515625, 0.3768577575683594, 0.3922271728515625, 0.4075965881347656, 0.42296600341796875, 0.4383354187011719, 0.453704833984375, 0.4690742492675781, 0.48444366455078125, 0.4998130798339844, 0.5151824951171875, 0.5305519104003906, 0.5459213256835938, 0.5612907409667969, 0.57666015625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 4.0, 7.0, 9.0, 7.0, 33.0, 46.0, 71.0, 126.0, 181.0, 187.0, 128.0, 85.0, 38.0, 31.0, 12.0, 10.0, 12.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310791015625, -0.30242347717285156, -0.2940559387207031, -0.2856884002685547, -0.27732086181640625, -0.2689533233642578, -0.2605857849121094, -0.25221824645996094, -0.2438507080078125, -0.23548316955566406, -0.22711563110351562, -0.2187480926513672, -0.21038055419921875, -0.2020130157470703, -0.19364547729492188, -0.18527793884277344, -0.176910400390625, -0.16854286193847656, -0.16017532348632812, -0.1518077850341797, -0.14344024658203125, -0.1350727081298828, -0.12670516967773438, -0.11833763122558594, -0.1099700927734375, -0.10160255432128906, -0.09323501586914062, -0.08486747741699219, -0.07649993896484375, -0.06813240051269531, -0.059764862060546875, -0.05139732360839844, -0.04302978515625, -0.03466224670410156, -0.026294708251953125, -0.017927169799804688, -0.00955963134765625, -0.0011920928955078125, 0.007175445556640625, 0.015542984008789062, 0.0239105224609375, 0.03227806091308594, 0.040645599365234375, 0.04901313781738281, 0.05738067626953125, 0.06574821472167969, 0.07411575317382812, 0.08248329162597656, 0.090850830078125, 0.09921836853027344, 0.10758590698242188, 0.11595344543457031, 0.12432098388671875, 0.1326885223388672, 0.14105606079101562, 0.14942359924316406, 0.1577911376953125, 0.16615867614746094, 0.17452621459960938, 0.1828937530517578, 0.19126129150390625, 0.1996288299560547, 0.20799636840820312, 0.21636390686035156, 0.2247314453125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 7.0, 11.0, 29.0, 43.0, 109.0, 196.0, 285.0, 163.0, 91.0, 36.0, 12.0, 11.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7721872329711914, -3.652040719985962, -3.5318939685821533, -3.411747455596924, -3.2916007041931152, -3.1714541912078857, -3.0513076782226562, -2.9311609268188477, -2.811014413833618, -2.6908679008483887, -2.57072114944458, -2.4505746364593506, -2.330428123474121, -2.2102813720703125, -2.090134859085083, -1.969988226890564, -1.849841594696045, -1.7296949625015259, -1.6095483303070068, -1.4894018173217773, -1.3692551851272583, -1.2491085529327393, -1.1289620399475098, -1.0088154077529907, -0.8886687755584717, -0.7685221433639526, -0.6483755707740784, -0.5282289981842041, -0.40808236598968506, -0.287935733795166, -0.16778916120529175, -0.04764258861541748, 0.07250428199768066, 0.19265088438987732, 0.312797486782074, 0.43294408917427063, 0.5530906915664673, 0.6732373237609863, 0.7933838963508606, 0.9135304689407349, 1.033677101135254, 1.153823733329773, 1.273970365524292, 1.3941168785095215, 1.5142635107040405, 1.6344101428985596, 1.754556655883789, 1.874703288078308, 1.9948499202728271, 2.1149964332580566, 2.2351431846618652, 2.3552896976470947, 2.475436210632324, 2.595582962036133, 2.7157294750213623, 2.835875988006592, 2.9560227394104004, 3.07616925239563, 3.1963160037994385, 3.316462516784668, 3.4366092681884766, 3.556755781173706, 3.6769022941589355, 3.797049045562744, 3.9171955585479736]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 6.0, 7.0, 10.0, 12.0, 10.0, 4.0, 7.0, 18.0, 15.0, 18.0, 24.0, 32.0, 35.0, 38.0, 40.0, 33.0, 43.0, 49.0, 59.0, 48.0, 53.0, 49.0, 39.0, 33.0, 43.0, 28.0, 41.0, 23.0, 31.0, 20.0, 27.0, 16.0, 18.0, 16.0, 16.0, 5.0, 10.0, 7.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-1.0337803363800049, -1.0030534267425537, -0.972326397895813, -0.941599428653717, -0.9108724594116211, -0.8801455497741699, -0.849418580532074, -0.818691611289978, -0.7879646420478821, -0.7572376728057861, -0.7265107035636902, -0.6957837343215942, -0.6650568246841431, -0.6343297958374023, -0.6036028861999512, -0.5728759169578552, -0.5421489477157593, -0.5114219784736633, -0.4806950092315674, -0.4499680697917938, -0.4192411005496979, -0.38851413130760193, -0.35778719186782837, -0.3270602226257324, -0.2963332533836365, -0.2656062841415405, -0.23487932980060577, -0.20415237545967102, -0.17342540621757507, -0.14269843697547913, -0.11197148263454437, -0.08124452829360962, -0.05051761865615845, -0.019790656864643097, 0.010936304926872253, 0.041663266718387604, 0.07239022850990295, 0.1031171977519989, 0.13384415209293365, 0.1645711064338684, 0.19529807567596436, 0.2260250449180603, 0.25675201416015625, 0.2874789535999298, 0.31820592284202576, 0.3489328920841217, 0.37965983152389526, 0.4103868007659912, 0.44111377000808716, 0.4718407392501831, 0.502567708492279, 0.533294677734375, 0.5640215873718262, 0.5947486162185669, 0.6254755258560181, 0.656202495098114, 0.68692946434021, 0.7176564335823059, 0.7483834028244019, 0.7791103720664978, 0.8098373413085938, 0.8405642509460449, 0.8712912201881409, 0.9020181894302368, 0.9327451586723328]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 11.0, 9.0, 7.0, 14.0, 24.0, 36.0, 101.0, 236.0, 2106.0, 4190800.0, 607.0, 183.0, 54.0, 29.0, 17.0, 12.0, 11.0, 8.0, 6.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.51171875, -2.4315185546875, -2.351318359375, -2.2711181640625, -2.19091796875, -2.1107177734375, -2.030517578125, -1.9503173828125, -1.8701171875, -1.7899169921875, -1.709716796875, -1.6295166015625, -1.54931640625, -1.4691162109375, -1.388916015625, -1.3087158203125, -1.228515625, -1.1483154296875, -1.068115234375, -0.9879150390625, -0.90771484375, -0.8275146484375, -0.747314453125, -0.6671142578125, -0.5869140625, -0.5067138671875, -0.426513671875, -0.3463134765625, -0.26611328125, -0.1859130859375, -0.105712890625, -0.0255126953125, 0.0546875, 0.1348876953125, 0.215087890625, 0.2952880859375, 0.37548828125, 0.4556884765625, 0.535888671875, 0.6160888671875, 0.6962890625, 0.7764892578125, 0.856689453125, 0.9368896484375, 1.01708984375, 1.0972900390625, 1.177490234375, 1.2576904296875, 1.337890625, 1.4180908203125, 1.498291015625, 1.5784912109375, 1.65869140625, 1.7388916015625, 1.819091796875, 1.8992919921875, 1.9794921875, 2.0596923828125, 2.139892578125, 2.2200927734375, 2.30029296875, 2.3804931640625, 2.460693359375, 2.5408935546875, 2.62109375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 13.0, 18.0, 28.0, 51.0, 63.0, 119.0, 128.0, 156.0, 139.0, 102.0, 68.0, 47.0, 36.0, 16.0, 7.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1400146484375, -0.1355571746826172, -0.13109970092773438, -0.12664222717285156, -0.12218475341796875, -0.11772727966308594, -0.11326980590820312, -0.10881233215332031, -0.1043548583984375, -0.09989738464355469, -0.09543991088867188, -0.09098243713378906, -0.08652496337890625, -0.08206748962402344, -0.07761001586914062, -0.07315254211425781, -0.068695068359375, -0.06423759460449219, -0.059780120849609375, -0.05532264709472656, -0.05086517333984375, -0.04640769958496094, -0.041950225830078125, -0.03749275207519531, -0.0330352783203125, -0.028577804565429688, -0.024120330810546875, -0.019662857055664062, -0.01520538330078125, -0.010747909545898438, -0.006290435791015625, -0.0018329620361328125, 0.00262451171875, 0.0070819854736328125, 0.011539459228515625, 0.015996932983398438, 0.02045440673828125, 0.024911880493164062, 0.029369354248046875, 0.03382682800292969, 0.0382843017578125, 0.04274177551269531, 0.047199249267578125, 0.05165672302246094, 0.05611419677734375, 0.06057167053222656, 0.06502914428710938, 0.06948661804199219, 0.073944091796875, 0.07840156555175781, 0.08285903930664062, 0.08731651306152344, 0.09177398681640625, 0.09623146057128906, 0.10068893432617188, 0.10514640808105469, 0.1096038818359375, 0.11406135559082031, 0.11851882934570312, 0.12297630310058594, 0.12743377685546875, 0.13189125061035156, 0.13634872436523438, 0.1408061981201172, 0.145263671875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 10.0, 10.0, 18.0, 33.0, 45.0, 55.0, 112.0, 229.0, 689.0, 4017.0, 108100.0, 4031450.0, 45539.0, 2519.0, 647.0, 257.0, 151.0, 86.0, 85.0, 29.0, 52.0, 29.0, 21.0, 15.0, 19.0, 13.0, 14.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.426025390625, -0.41201019287109375, -0.3979949951171875, -0.38397979736328125, -0.369964599609375, -0.35594940185546875, -0.3419342041015625, -0.32791900634765625, -0.31390380859375, -0.29988861083984375, -0.2858734130859375, -0.27185821533203125, -0.257843017578125, -0.24382781982421875, -0.2298126220703125, -0.21579742431640625, -0.2017822265625, -0.18776702880859375, -0.1737518310546875, -0.15973663330078125, -0.145721435546875, -0.13170623779296875, -0.1176910400390625, -0.10367584228515625, -0.08966064453125, -0.07564544677734375, -0.0616302490234375, -0.04761505126953125, -0.033599853515625, -0.01958465576171875, -0.0055694580078125, 0.00844573974609375, 0.0224609375, 0.03647613525390625, 0.0504913330078125, 0.06450653076171875, 0.078521728515625, 0.09253692626953125, 0.1065521240234375, 0.12056732177734375, 0.13458251953125, 0.14859771728515625, 0.1626129150390625, 0.17662811279296875, 0.190643310546875, 0.20465850830078125, 0.2186737060546875, 0.23268890380859375, 0.2467041015625, 0.26071929931640625, 0.2747344970703125, 0.28874969482421875, 0.302764892578125, 0.31678009033203125, 0.3307952880859375, 0.34481048583984375, 0.35882568359375, 0.37284088134765625, 0.3868560791015625, 0.40087127685546875, 0.414886474609375, 0.42890167236328125, 0.4429168701171875, 0.45693206787109375, 0.470947265625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 1.0, 3.0, 4.0, 6.0, 20.0, 26.0, 71.0, 152.0, 390.0, 1481.0, 1281.0, 362.0, 144.0, 77.0, 28.0, 15.0, 15.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1461181640625, -0.1348094940185547, -0.12350082397460938, -0.11219215393066406, -0.10088348388671875, -0.08957481384277344, -0.07826614379882812, -0.06695747375488281, -0.0556488037109375, -0.04434013366699219, -0.033031463623046875, -0.021722793579101562, -0.01041412353515625, 0.0008945465087890625, 0.012203216552734375, 0.023511886596679688, 0.034820556640625, 0.04612922668457031, 0.057437896728515625, 0.06874656677246094, 0.08005523681640625, 0.09136390686035156, 0.10267257690429688, 0.11398124694824219, 0.1252899169921875, 0.1365985870361328, 0.14790725708007812, 0.15921592712402344, 0.17052459716796875, 0.18183326721191406, 0.19314193725585938, 0.2044506072998047, 0.21575927734375, 0.2270679473876953, 0.23837661743164062, 0.24968528747558594, 0.26099395751953125, 0.27230262756347656, 0.2836112976074219, 0.2949199676513672, 0.3062286376953125, 0.3175373077392578, 0.3288459777832031, 0.34015464782714844, 0.35146331787109375, 0.36277198791503906, 0.3740806579589844, 0.3853893280029297, 0.396697998046875, 0.4080066680908203, 0.4193153381347656, 0.43062400817871094, 0.44193267822265625, 0.45324134826660156, 0.4645500183105469, 0.4758586883544922, 0.4871673583984375, 0.4984760284423828, 0.5097846984863281, 0.5210933685302734, 0.5324020385742188, 0.5437107086181641, 0.5550193786621094, 0.5663280487060547, 0.57763671875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 1.0, 5.0, 15.0, 14.0, 20.0, 45.0, 59.0, 104.0, 141.0, 140.0, 127.0, 89.0, 57.0, 44.0, 33.0, 21.0, 18.0, 10.0, 13.0, 4.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.461466908454895, -1.4091870784759521, -1.3569073677062988, -1.304627537727356, -1.252347707748413, -1.2000679969787598, -1.147788166999817, -1.095508337020874, -1.0432285070419312, -0.9909487366676331, -0.9386689066886902, -0.8863891363143921, -0.8341093063354492, -0.7818295359611511, -0.729549765586853, -0.6772699356079102, -0.6249901652336121, -0.572710394859314, -0.5204305648803711, -0.468150794506073, -0.4158709645271301, -0.36359119415283203, -0.31131139397621155, -0.25903159379959106, -0.20675179362297058, -0.1544719934463501, -0.10219220072031021, -0.049912407994270325, 0.0023673921823501587, 0.05464717745780945, 0.10692697763442993, 0.15920677781105042, 0.2114865779876709, 0.2637663781642914, 0.31604617834091187, 0.36832594871520996, 0.42060577869415283, 0.4728855490684509, 0.525165319442749, 0.5774451494216919, 0.6297249794006348, 0.6820047497749329, 0.7342845797538757, 0.7865643501281738, 0.8388441801071167, 0.8911239504814148, 0.9434037208557129, 0.9956835508346558, 1.0479633808135986, 1.1002432107925415, 1.1525229215621948, 1.2048027515411377, 1.2570825815200806, 1.3093624114990234, 1.3616421222686768, 1.4139219522476196, 1.466201663017273, 1.5184814929962158, 1.5707612037658691, 1.623041033744812, 1.6753208637237549, 1.7276005744934082, 1.779880404472351, 1.832160234451294, 1.8844400644302368]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 4.0, 3.0, 6.0, 7.0, 3.0, 6.0, 14.0, 12.0, 13.0, 20.0, 11.0, 25.0, 28.0, 35.0, 22.0, 28.0, 34.0, 40.0, 42.0, 44.0, 50.0, 52.0, 50.0, 51.0, 35.0, 50.0, 52.0, 29.0, 26.0, 36.0, 27.0, 33.0, 21.0, 12.0, 20.0, 13.0, 4.0, 14.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2019305229187012, -1.1654633283615112, -1.1289961338043213, -1.0925289392471313, -1.0560617446899414, -1.0195945501327515, -0.9831272959709167, -0.9466601014137268, -0.9101929068565369, -0.8737257122993469, -0.837258517742157, -0.800791323184967, -0.7643240690231323, -0.7278568744659424, -0.6913896799087524, -0.6549224853515625, -0.6184552907943726, -0.5819880962371826, -0.5455209016799927, -0.5090537071228027, -0.4725864827632904, -0.43611928820610046, -0.39965206384658813, -0.3631848692893982, -0.32671767473220825, -0.2902504801750183, -0.25378328561782837, -0.21731606125831604, -0.1808488667011261, -0.14438167214393616, -0.10791446268558502, -0.07144725322723389, -0.034980177879333496, 0.0014870241284370422, 0.03795422613620758, 0.07442142814397812, 0.11088863015174866, 0.1473558247089386, 0.18382303416728973, 0.22029024362564087, 0.2567574381828308, 0.29322463274002075, 0.3296918272972107, 0.366159051656723, 0.40262624621391296, 0.4390934407711029, 0.47556066513061523, 0.5120278596878052, 0.5484950542449951, 0.5849622488021851, 0.621429443359375, 0.6578966379165649, 0.6943638324737549, 0.7308310270309448, 0.7672982811927795, 0.8037654757499695, 0.8402326703071594, 0.8766998648643494, 0.9131670594215393, 0.9496342539787292, 0.986101508140564, 1.022568702697754, 1.0590358972549438, 1.0955030918121338, 1.1319702863693237]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 9.0, 10.0, 14.0, 16.0, 28.0, 47.0, 46.0, 70.0, 87.0, 107.0, 204.0, 288.0, 513.0, 811.0, 1432.0, 2682.0, 5218.0, 11152.0, 24931.0, 60498.0, 152645.0, 319301.0, 269521.0, 114945.0, 45828.0, 19387.0, 8851.0, 4419.0, 2283.0, 1261.0, 722.0, 416.0, 257.0, 148.0, 113.0, 76.0, 55.0, 41.0, 29.0, 28.0, 12.0, 17.0, 9.0, 3.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1533203125, -0.14850616455078125, -0.1436920166015625, -0.13887786865234375, -0.134063720703125, -0.12924957275390625, -0.1244354248046875, -0.11962127685546875, -0.11480712890625, -0.10999298095703125, -0.1051788330078125, -0.10036468505859375, -0.095550537109375, -0.09073638916015625, -0.0859222412109375, -0.08110809326171875, -0.0762939453125, -0.07147979736328125, -0.0666656494140625, -0.06185150146484375, -0.057037353515625, -0.05222320556640625, -0.0474090576171875, -0.04259490966796875, -0.03778076171875, -0.03296661376953125, -0.0281524658203125, -0.02333831787109375, -0.018524169921875, -0.01371002197265625, -0.0088958740234375, -0.00408172607421875, 0.000732421875, 0.00554656982421875, 0.0103607177734375, 0.01517486572265625, 0.019989013671875, 0.02480316162109375, 0.0296173095703125, 0.03443145751953125, 0.03924560546875, 0.04405975341796875, 0.0488739013671875, 0.05368804931640625, 0.058502197265625, 0.06331634521484375, 0.0681304931640625, 0.07294464111328125, 0.0777587890625, 0.08257293701171875, 0.0873870849609375, 0.09220123291015625, 0.097015380859375, 0.10182952880859375, 0.1066436767578125, 0.11145782470703125, 0.11627197265625, 0.12108612060546875, 0.1259002685546875, 0.13071441650390625, 0.135528564453125, 0.14034271240234375, 0.1451568603515625, 0.14997100830078125, 0.15478515625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 11.0, 20.0, 35.0, 45.0, 53.0, 76.0, 111.0, 140.0, 112.0, 127.0, 96.0, 56.0, 41.0, 31.0, 20.0, 6.0, 8.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13427734375, -0.1300678253173828, -0.12585830688476562, -0.12164878845214844, -0.11743927001953125, -0.11322975158691406, -0.10902023315429688, -0.10481071472167969, -0.1006011962890625, -0.09639167785644531, -0.09218215942382812, -0.08797264099121094, -0.08376312255859375, -0.07955360412597656, -0.07534408569335938, -0.07113456726074219, -0.066925048828125, -0.06271553039550781, -0.058506011962890625, -0.05429649353027344, -0.05008697509765625, -0.04587745666503906, -0.041667938232421875, -0.03745841979980469, -0.0332489013671875, -0.029039382934570312, -0.024829864501953125, -0.020620346069335938, -0.01641082763671875, -0.012201309204101562, -0.007991790771484375, -0.0037822723388671875, 0.00042724609375, 0.0046367645263671875, 0.008846282958984375, 0.013055801391601562, 0.01726531982421875, 0.021474838256835938, 0.025684356689453125, 0.029893875122070312, 0.0341033935546875, 0.03831291198730469, 0.042522430419921875, 0.04673194885253906, 0.05094146728515625, 0.05515098571777344, 0.059360504150390625, 0.06357002258300781, 0.067779541015625, 0.07198905944824219, 0.07619857788085938, 0.08040809631347656, 0.08461761474609375, 0.08882713317871094, 0.09303665161132812, 0.09724617004394531, 0.1014556884765625, 0.10566520690917969, 0.10987472534179688, 0.11408424377441406, 0.11829376220703125, 0.12250328063964844, 0.12671279907226562, 0.1309223175048828, 0.1351318359375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 1.0, 11.0, 2.0, 6.0, 14.0, 19.0, 23.0, 36.0, 56.0, 94.0, 116.0, 178.0, 319.0, 549.0, 1052.0, 2226.0, 5176.0, 15913.0, 66829.0, 515333.0, 358760.0, 58348.0, 14285.0, 4859.0, 2034.0, 1000.0, 514.0, 283.0, 182.0, 118.0, 70.0, 42.0, 27.0, 24.0, 16.0, 16.0, 9.0, 8.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.289306640625, -0.2793159484863281, -0.26932525634765625, -0.2593345642089844, -0.2493438720703125, -0.23935317993164062, -0.22936248779296875, -0.21937179565429688, -0.209381103515625, -0.19939041137695312, -0.18939971923828125, -0.17940902709960938, -0.1694183349609375, -0.15942764282226562, -0.14943695068359375, -0.13944625854492188, -0.12945556640625, -0.11946487426757812, -0.10947418212890625, -0.09948348999023438, -0.0894927978515625, -0.07950210571289062, -0.06951141357421875, -0.059520721435546875, -0.049530029296875, -0.039539337158203125, -0.02954864501953125, -0.019557952880859375, -0.0095672607421875, 0.000423431396484375, 0.01041412353515625, 0.020404815673828125, 0.0303955078125, 0.040386199951171875, 0.05037689208984375, 0.060367584228515625, 0.0703582763671875, 0.08034896850585938, 0.09033966064453125, 0.10033035278320312, 0.110321044921875, 0.12031173706054688, 0.13030242919921875, 0.14029312133789062, 0.1502838134765625, 0.16027450561523438, 0.17026519775390625, 0.18025588989257812, 0.19024658203125, 0.20023727416992188, 0.21022796630859375, 0.22021865844726562, 0.2302093505859375, 0.24020004272460938, 0.25019073486328125, 0.2601814270019531, 0.270172119140625, 0.2801628112792969, 0.29015350341796875, 0.3001441955566406, 0.3101348876953125, 0.3201255798339844, 0.33011627197265625, 0.3401069641113281, 0.35009765625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 2.0, 4.0, 4.0, 8.0, 7.0, 9.0, 17.0, 9.0, 15.0, 20.0, 25.0, 20.0, 32.0, 52.0, 43.0, 43.0, 44.0, 50.0, 70.0, 60.0, 54.0, 53.0, 55.0, 49.0, 40.0, 29.0, 39.0, 24.0, 21.0, 19.0, 20.0, 12.0, 14.0, 10.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3466796875, -0.33489227294921875, -0.3231048583984375, -0.31131744384765625, -0.299530029296875, -0.28774261474609375, -0.2759552001953125, -0.26416778564453125, -0.25238037109375, -0.24059295654296875, -0.2288055419921875, -0.21701812744140625, -0.205230712890625, -0.19344329833984375, -0.1816558837890625, -0.16986846923828125, -0.1580810546875, -0.14629364013671875, -0.1345062255859375, -0.12271881103515625, -0.110931396484375, -0.09914398193359375, -0.0873565673828125, -0.07556915283203125, -0.06378173828125, -0.05199432373046875, -0.0402069091796875, -0.02841949462890625, -0.016632080078125, -0.00484466552734375, 0.0069427490234375, 0.01873016357421875, 0.030517578125, 0.04230499267578125, 0.0540924072265625, 0.06587982177734375, 0.077667236328125, 0.08945465087890625, 0.1012420654296875, 0.11302947998046875, 0.12481689453125, 0.13660430908203125, 0.1483917236328125, 0.16017913818359375, 0.171966552734375, 0.18375396728515625, 0.1955413818359375, 0.20732879638671875, 0.2191162109375, 0.23090362548828125, 0.2426910400390625, 0.25447845458984375, 0.266265869140625, 0.27805328369140625, 0.2898406982421875, 0.30162811279296875, 0.31341552734375, 0.32520294189453125, 0.3369903564453125, 0.34877777099609375, 0.360565185546875, 0.37235260009765625, 0.3841400146484375, 0.39592742919921875, 0.40771484375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 13.0, 13.0, 19.0, 41.0, 67.0, 103.0, 157.0, 303.0, 644.0, 1207.0, 2473.0, 5985.0, 18014.0, 158104.0, 808167.0, 36990.0, 9192.0, 3596.0, 1722.0, 791.0, 398.0, 234.0, 134.0, 66.0, 34.0, 22.0, 20.0, 12.0, 9.0, 10.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.6455078125, -0.6286201477050781, -0.6117324829101562, -0.5948448181152344, -0.5779571533203125, -0.5610694885253906, -0.5441818237304688, -0.5272941589355469, -0.510406494140625, -0.4935188293457031, -0.47663116455078125, -0.4597434997558594, -0.4428558349609375, -0.4259681701660156, -0.40908050537109375, -0.3921928405761719, -0.37530517578125, -0.3584175109863281, -0.34152984619140625, -0.3246421813964844, -0.3077545166015625, -0.2908668518066406, -0.27397918701171875, -0.2570915222167969, -0.240203857421875, -0.22331619262695312, -0.20642852783203125, -0.18954086303710938, -0.1726531982421875, -0.15576553344726562, -0.13887786865234375, -0.12199020385742188, -0.1051025390625, -0.08821487426757812, -0.07132720947265625, -0.054439544677734375, -0.0375518798828125, -0.020664215087890625, -0.00377655029296875, 0.013111114501953125, 0.029998779296875, 0.046886444091796875, 0.06377410888671875, 0.08066177368164062, 0.0975494384765625, 0.11443710327148438, 0.13132476806640625, 0.14821243286132812, 0.16510009765625, 0.18198776245117188, 0.19887542724609375, 0.21576309204101562, 0.2326507568359375, 0.24953842163085938, 0.26642608642578125, 0.2833137512207031, 0.300201416015625, 0.3170890808105469, 0.33397674560546875, 0.3508644104003906, 0.3677520751953125, 0.3846397399902344, 0.40152740478515625, 0.4184150695800781, 0.435302734375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 12.0, 5.0, 8.0, 15.0, 21.0, 27.0, 42.0, 96.0, 155.0, 231.0, 167.0, 76.0, 45.0, 28.0, 17.0, 10.0, 12.0, 5.0, 7.0, 4.0, 3.0, 6.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0001195669174194336, -0.00011619646102190018, -0.00011282600462436676, -0.00010945554822683334, -0.00010608509182929993, -0.00010271463543176651, -9.93441790342331e-05, -9.597372263669968e-05, -9.260326623916626e-05, -8.923280984163284e-05, -8.586235344409943e-05, -8.249189704656601e-05, -7.912144064903259e-05, -7.575098425149918e-05, -7.238052785396576e-05, -6.901007145643234e-05, -6.563961505889893e-05, -6.226915866136551e-05, -5.889870226383209e-05, -5.5528245866298676e-05, -5.215778946876526e-05, -4.878733307123184e-05, -4.5416876673698425e-05, -4.204642027616501e-05, -3.867596387863159e-05, -3.5305507481098175e-05, -3.193505108356476e-05, -2.856459468603134e-05, -2.5194138288497925e-05, -2.1823681890964508e-05, -1.845322549343109e-05, -1.5082769095897675e-05, -1.1712312698364258e-05, -8.341856300830841e-06, -4.971399903297424e-06, -1.6009435057640076e-06, 1.7695128917694092e-06, 5.139969289302826e-06, 8.510425686836243e-06, 1.188088208436966e-05, 1.5251338481903076e-05, 1.8621794879436493e-05, 2.199225127696991e-05, 2.5362707674503326e-05, 2.8733164072036743e-05, 3.210362046957016e-05, 3.547407686710358e-05, 3.8844533264636993e-05, 4.221498966217041e-05, 4.558544605970383e-05, 4.8955902457237244e-05, 5.232635885477066e-05, 5.569681525230408e-05, 5.9067271649837494e-05, 6.243772804737091e-05, 6.580818444490433e-05, 6.917864084243774e-05, 7.254909723997116e-05, 7.591955363750458e-05, 7.9290010035038e-05, 8.266046643257141e-05, 8.603092283010483e-05, 8.940137922763824e-05, 9.277183562517166e-05, 9.614229202270508e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 6.0, 13.0, 7.0, 11.0, 17.0, 16.0, 40.0, 45.0, 59.0, 96.0, 143.0, 190.0, 302.0, 435.0, 765.0, 1168.0, 2007.0, 3988.0, 8768.0, 25213.0, 188917.0, 739306.0, 51052.0, 13401.0, 5701.0, 2776.0, 1487.0, 901.0, 611.0, 328.0, 248.0, 155.0, 119.0, 81.0, 50.0, 40.0, 16.0, 19.0, 9.0, 12.0, 10.0, 6.0, 12.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.34619140625, -0.33510589599609375, -0.3240203857421875, -0.31293487548828125, -0.301849365234375, -0.29076385498046875, -0.2796783447265625, -0.26859283447265625, -0.25750732421875, -0.24642181396484375, -0.2353363037109375, -0.22425079345703125, -0.213165283203125, -0.20207977294921875, -0.1909942626953125, -0.17990875244140625, -0.1688232421875, -0.15773773193359375, -0.1466522216796875, -0.13556671142578125, -0.124481201171875, -0.11339569091796875, -0.1023101806640625, -0.09122467041015625, -0.08013916015625, -0.06905364990234375, -0.0579681396484375, -0.04688262939453125, -0.035797119140625, -0.02471160888671875, -0.0136260986328125, -0.00254058837890625, 0.008544921875, 0.01963043212890625, 0.0307159423828125, 0.04180145263671875, 0.052886962890625, 0.06397247314453125, 0.0750579833984375, 0.08614349365234375, 0.09722900390625, 0.10831451416015625, 0.1194000244140625, 0.13048553466796875, 0.141571044921875, 0.15265655517578125, 0.1637420654296875, 0.17482757568359375, 0.1859130859375, 0.19699859619140625, 0.2080841064453125, 0.21916961669921875, 0.230255126953125, 0.24134063720703125, 0.2524261474609375, 0.26351165771484375, 0.27459716796875, 0.28568267822265625, 0.2967681884765625, 0.30785369873046875, 0.318939208984375, 0.33002471923828125, 0.3411102294921875, 0.35219573974609375, 0.36328125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 10.0, 11.0, 25.0, 69.0, 85.0, 170.0, 191.0, 182.0, 90.0, 50.0, 29.0, 11.0, 12.0, 7.0, 8.0, 8.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.478271484375, -0.4621162414550781, -0.44596099853515625, -0.4298057556152344, -0.4136505126953125, -0.3974952697753906, -0.38134002685546875, -0.3651847839355469, -0.349029541015625, -0.3328742980957031, -0.31671905517578125, -0.3005638122558594, -0.2844085693359375, -0.2682533264160156, -0.25209808349609375, -0.23594284057617188, -0.21978759765625, -0.20363235473632812, -0.18747711181640625, -0.17132186889648438, -0.1551666259765625, -0.13901138305664062, -0.12285614013671875, -0.10670089721679688, -0.090545654296875, -0.07439041137695312, -0.05823516845703125, -0.042079925537109375, -0.0259246826171875, -0.009769439697265625, 0.00638580322265625, 0.022541046142578125, 0.0386962890625, 0.054851531982421875, 0.07100677490234375, 0.08716201782226562, 0.1033172607421875, 0.11947250366210938, 0.13562774658203125, 0.15178298950195312, 0.167938232421875, 0.18409347534179688, 0.20024871826171875, 0.21640396118164062, 0.2325592041015625, 0.24871444702148438, 0.26486968994140625, 0.2810249328613281, 0.29718017578125, 0.3133354187011719, 0.32949066162109375, 0.3456459045410156, 0.3618011474609375, 0.3779563903808594, 0.39411163330078125, 0.4102668762207031, 0.426422119140625, 0.4425773620605469, 0.45873260498046875, 0.4748878479003906, 0.4910430908203125, 0.5071983337402344, 0.5233535766601562, 0.5395088195800781, 0.5556640625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 10.0, 12.0, 18.0, 29.0, 85.0, 197.0, 359.0, 159.0, 73.0, 30.0, 11.0, 3.0, 6.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.622251033782959, -3.3521265983581543, -3.0820019245147705, -2.811877489089966, -2.541752815246582, -2.2716283798217773, -2.0015039443969727, -1.7313793897628784, -1.4612548351287842, -1.19113028049469, -0.9210057854652405, -0.650881290435791, -0.3807567358016968, -0.11063218116760254, 0.15949225425720215, 0.4296168088912964, 0.6997413635253906, 0.9698659181594849, 1.239990472793579, 1.5101149082183838, 1.780239462852478, 2.0503640174865723, 2.320488452911377, 2.5906128883361816, 2.8607375621795654, 3.13086199760437, 3.400986671447754, 3.6711111068725586, 3.9412355422973633, 4.211359977722168, 4.481484413146973, 4.7516093254089355, 5.021734237670898, 5.291858673095703, 5.561983108520508, 5.8321075439453125, 6.102232456207275, 6.37235689163208, 6.642481327056885, 6.9126057624816895, 7.182730674743652, 7.452855110168457, 7.722979545593262, 7.993103981018066, 8.263228416442871, 8.533353805541992, 8.803478240966797, 9.073602676391602, 9.343727111816406, 9.613851547241211, 9.883975982666016, 10.15410041809082, 10.424224853515625, 10.69434928894043, 10.964473724365234, 11.234599113464355, 11.504722595214844, 11.774847030639648, 12.044971466064453, 12.315095901489258, 12.585220336914062, 12.855344772338867, 13.125469207763672, 13.395594596862793, 13.665719032287598]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 3.0, 4.0, 8.0, 5.0, 5.0, 9.0, 9.0, 14.0, 17.0, 17.0, 17.0, 9.0, 22.0, 25.0, 25.0, 35.0, 26.0, 45.0, 49.0, 62.0, 52.0, 57.0, 51.0, 46.0, 35.0, 38.0, 32.0, 27.0, 35.0, 34.0, 25.0, 17.0, 23.0, 23.0, 14.0, 19.0, 14.0, 10.0, 8.0, 7.0, 9.0, 6.0, 7.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0789895057678223, -2.0096607208251953, -1.940332055091858, -1.8710033893585205, -1.8016746044158936, -1.7323458194732666, -1.6630171537399292, -1.5936884880065918, -1.5243597030639648, -1.455030918121338, -1.3857022523880005, -1.316373586654663, -1.2470448017120361, -1.1777160167694092, -1.1083873510360718, -1.0390586853027344, -0.9697299003601074, -0.9004011750221252, -0.8310724496841431, -0.7617437243461609, -0.6924149990081787, -0.6230862736701965, -0.5537575483322144, -0.4844288229942322, -0.41510009765625, -0.3457713723182678, -0.27644264698028564, -0.20711392164230347, -0.1377851963043213, -0.06845647096633911, 0.0008722543716430664, 0.07020097970962524, 0.13952970504760742, 0.2088584303855896, 0.2781871557235718, 0.34751588106155396, 0.41684460639953613, 0.4861733317375183, 0.5555020570755005, 0.6248307824134827, 0.6941595077514648, 0.763488233089447, 0.8328169584274292, 0.9021456837654114, 0.9714744091033936, 1.0408031940460205, 1.110131859779358, 1.1794605255126953, 1.2487893104553223, 1.3181180953979492, 1.3874467611312866, 1.456775426864624, 1.526104211807251, 1.595432996749878, 1.6647616624832153, 1.7340903282165527, 1.8034191131591797, 1.8727478981018066, 1.942076563835144, 2.0114052295684814, 2.0807340145111084, 2.1500627994537354, 2.219391345977783, 2.28872013092041, 2.358048915863037]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 4.0, 8.0, 7.0, 17.0, 37.0, 55.0, 60.0, 64.0, 98.0, 144.0, 274.0, 560.0, 2193.0, 35202.0, 4103272.0, 48507.0, 2442.0, 566.0, 253.0, 143.0, 104.0, 73.0, 61.0, 40.0, 33.0, 18.0, 18.0, 4.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6826171875, -0.6616363525390625, -0.640655517578125, -0.6196746826171875, -0.59869384765625, -0.5777130126953125, -0.556732177734375, -0.5357513427734375, -0.5147705078125, -0.4937896728515625, -0.472808837890625, -0.4518280029296875, -0.43084716796875, -0.4098663330078125, -0.388885498046875, -0.3679046630859375, -0.346923828125, -0.3259429931640625, -0.304962158203125, -0.2839813232421875, -0.26300048828125, -0.2420196533203125, -0.221038818359375, -0.2000579833984375, -0.1790771484375, -0.1580963134765625, -0.137115478515625, -0.1161346435546875, -0.09515380859375, -0.0741729736328125, -0.053192138671875, -0.0322113037109375, -0.01123046875, 0.0097503662109375, 0.030731201171875, 0.0517120361328125, 0.07269287109375, 0.0936737060546875, 0.114654541015625, 0.1356353759765625, 0.1566162109375, 0.1775970458984375, 0.198577880859375, 0.2195587158203125, 0.24053955078125, 0.2615203857421875, 0.282501220703125, 0.3034820556640625, 0.324462890625, 0.3454437255859375, 0.366424560546875, 0.3874053955078125, 0.40838623046875, 0.4293670654296875, 0.450347900390625, 0.4713287353515625, 0.4923095703125, 0.5132904052734375, 0.534271240234375, 0.5552520751953125, 0.57623291015625, 0.5972137451171875, 0.618194580078125, 0.6391754150390625, 0.66015625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 13.0, 14.0, 29.0, 29.0, 50.0, 51.0, 78.0, 92.0, 100.0, 112.0, 90.0, 89.0, 73.0, 45.0, 52.0, 33.0, 21.0, 4.0, 8.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1373291015625, -0.13319969177246094, -0.12907028198242188, -0.12494087219238281, -0.12081146240234375, -0.11668205261230469, -0.11255264282226562, -0.10842323303222656, -0.1042938232421875, -0.10016441345214844, -0.09603500366210938, -0.09190559387207031, -0.08777618408203125, -0.08364677429199219, -0.07951736450195312, -0.07538795471191406, -0.071258544921875, -0.06712913513183594, -0.06299972534179688, -0.05887031555175781, -0.05474090576171875, -0.05061149597167969, -0.046482086181640625, -0.04235267639160156, -0.0382232666015625, -0.03409385681152344, -0.029964447021484375, -0.025835037231445312, -0.02170562744140625, -0.017576217651367188, -0.013446807861328125, -0.009317398071289062, -0.00518798828125, -0.0010585784912109375, 0.003070831298828125, 0.0072002410888671875, 0.01132965087890625, 0.015459060668945312, 0.019588470458984375, 0.023717880249023438, 0.0278472900390625, 0.03197669982910156, 0.036106109619140625, 0.04023551940917969, 0.04436492919921875, 0.04849433898925781, 0.052623748779296875, 0.05675315856933594, 0.060882568359375, 0.06501197814941406, 0.06914138793945312, 0.07327079772949219, 0.07740020751953125, 0.08152961730957031, 0.08565902709960938, 0.08978843688964844, 0.0939178466796875, 0.09804725646972656, 0.10217666625976562, 0.10630607604980469, 0.11043548583984375, 0.11456489562988281, 0.11869430541992188, 0.12282371520996094, 0.126953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 10.0, 11.0, 9.0, 21.0, 28.0, 44.0, 41.0, 67.0, 69.0, 95.0, 124.0, 205.0, 348.0, 540.0, 960.0, 2665.0, 14976.0, 491157.0, 3637708.0, 37362.0, 4519.0, 1363.0, 642.0, 409.0, 252.0, 187.0, 156.0, 118.0, 55.0, 47.0, 31.0, 23.0, 14.0, 10.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48388671875, -0.4678497314453125, -0.451812744140625, -0.4357757568359375, -0.41973876953125, -0.4037017822265625, -0.387664794921875, -0.3716278076171875, -0.3555908203125, -0.3395538330078125, -0.323516845703125, -0.3074798583984375, -0.29144287109375, -0.2754058837890625, -0.259368896484375, -0.2433319091796875, -0.227294921875, -0.2112579345703125, -0.195220947265625, -0.1791839599609375, -0.16314697265625, -0.1471099853515625, -0.131072998046875, -0.1150360107421875, -0.0989990234375, -0.0829620361328125, -0.066925048828125, -0.0508880615234375, -0.03485107421875, -0.0188140869140625, -0.002777099609375, 0.0132598876953125, 0.029296875, 0.0453338623046875, 0.061370849609375, 0.0774078369140625, 0.09344482421875, 0.1094818115234375, 0.125518798828125, 0.1415557861328125, 0.1575927734375, 0.1736297607421875, 0.189666748046875, 0.2057037353515625, 0.22174072265625, 0.2377777099609375, 0.253814697265625, 0.2698516845703125, 0.285888671875, 0.3019256591796875, 0.317962646484375, 0.3339996337890625, 0.35003662109375, 0.3660736083984375, 0.382110595703125, 0.3981475830078125, 0.4141845703125, 0.4302215576171875, 0.446258544921875, 0.4622955322265625, 0.47833251953125, 0.4943695068359375, 0.510406494140625, 0.5264434814453125, 0.54248046875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 19.0, 29.0, 98.0, 320.0, 1901.0, 1340.0, 227.0, 71.0, 39.0, 15.0, 10.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.98193359375, -0.957916259765625, -0.93389892578125, -0.909881591796875, -0.8858642578125, -0.861846923828125, -0.83782958984375, -0.813812255859375, -0.789794921875, -0.765777587890625, -0.74176025390625, -0.717742919921875, -0.6937255859375, -0.669708251953125, -0.64569091796875, -0.621673583984375, -0.59765625, -0.573638916015625, -0.54962158203125, -0.525604248046875, -0.5015869140625, -0.477569580078125, -0.45355224609375, -0.429534912109375, -0.405517578125, -0.381500244140625, -0.35748291015625, -0.333465576171875, -0.3094482421875, -0.285430908203125, -0.26141357421875, -0.237396240234375, -0.21337890625, -0.189361572265625, -0.16534423828125, -0.141326904296875, -0.1173095703125, -0.093292236328125, -0.06927490234375, -0.045257568359375, -0.021240234375, 0.002777099609375, 0.02679443359375, 0.050811767578125, 0.0748291015625, 0.098846435546875, 0.12286376953125, 0.146881103515625, 0.1708984375, 0.194915771484375, 0.21893310546875, 0.242950439453125, 0.2669677734375, 0.290985107421875, 0.31500244140625, 0.339019775390625, 0.363037109375, 0.387054443359375, 0.41107177734375, 0.435089111328125, 0.4591064453125, 0.483123779296875, 0.50714111328125, 0.531158447265625, 0.55517578125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 3.0, 13.0, 25.0, 36.0, 75.0, 152.0, 229.0, 209.0, 121.0, 59.0, 29.0, 13.0, 16.0, 10.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.38411283493042, -5.266946315765381, -5.149779796600342, -5.032613277435303, -4.915446758270264, -4.798280239105225, -4.6811137199401855, -4.5639472007751465, -4.446780681610107, -4.329614162445068, -4.212447643280029, -4.09528112411499, -3.978114604949951, -3.860948085784912, -3.743781566619873, -3.626615047454834, -3.509448289871216, -3.3922817707061768, -3.2751152515411377, -3.1579487323760986, -3.0407822132110596, -2.9236156940460205, -2.8064489364624023, -2.6892824172973633, -2.572115898132324, -2.454949378967285, -2.337782859802246, -2.220616340637207, -2.103449821472168, -1.986283302307129, -1.8691166639328003, -1.7519501447677612, -1.6347835063934326, -1.5176169872283936, -1.4004504680633545, -1.2832839488983154, -1.1661174297332764, -1.0489509105682373, -0.9317842721939087, -0.8146177530288696, -0.6974512338638306, -0.5802847146987915, -0.46311816573143005, -0.3459516167640686, -0.22878509759902954, -0.11161857843399048, 0.005548000335693359, 0.12271451950073242, 0.23988103866577148, 0.35704755783081055, 0.474214106798172, 0.5913806557655334, 0.7085471749305725, 0.8257136940956116, 0.9428802728652954, 1.0600467920303345, 1.1772133111953735, 1.2943798303604126, 1.4115463495254517, 1.5287129878997803, 1.6458795070648193, 1.7630460262298584, 1.8802125453948975, 1.9973790645599365, 2.1145455837249756]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 7.0, 4.0, 4.0, 11.0, 15.0, 17.0, 11.0, 22.0, 25.0, 40.0, 38.0, 32.0, 41.0, 41.0, 54.0, 67.0, 46.0, 40.0, 61.0, 54.0, 56.0, 40.0, 38.0, 41.0, 38.0, 23.0, 30.0, 24.0, 15.0, 14.0, 8.0, 11.0, 5.0, 7.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3683083057403564, -1.3242965936660767, -1.2802847623825073, -1.2362730503082275, -1.1922612190246582, -1.1482495069503784, -1.1042377948760986, -1.0602259635925293, -1.0162142515182495, -0.972202479839325, -0.9281907081604004, -0.8841789960861206, -0.840167224407196, -0.7961554527282715, -0.7521436810493469, -0.7081319093704224, -0.6641201376914978, -0.6201083660125732, -0.5760965943336487, -0.5320848226547241, -0.48807311058044434, -0.4440613389015198, -0.4000495672225952, -0.35603782534599304, -0.3120260536670685, -0.2680142819881439, -0.22400254011154175, -0.1799907684326172, -0.13597901165485382, -0.09196725487709045, -0.047955483198165894, -0.003943741321563721, 0.04006803035736084, 0.0840797871351242, 0.12809154391288757, 0.17210331559181213, 0.2161150723695755, 0.26012682914733887, 0.3041386008262634, 0.3481503427028656, 0.39216211438179016, 0.4361738860607147, 0.4801856279373169, 0.5241973996162415, 0.568209171295166, 0.6122208833694458, 0.6562327146530151, 0.7002444267272949, 0.7442561984062195, 0.788267970085144, 0.8322797417640686, 0.8762915134429932, 0.920303225517273, 0.9643149971961975, 1.008326768875122, 1.0523384809494019, 1.0963503122329712, 1.140362024307251, 1.1843738555908203, 1.2283855676651, 1.2723973989486694, 1.3164091110229492, 1.3604209423065186, 1.4044326543807983, 1.4484443664550781]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 2.0, 5.0, 12.0, 23.0, 29.0, 45.0, 61.0, 71.0, 140.0, 148.0, 257.0, 347.0, 538.0, 865.0, 1417.0, 2291.0, 3890.0, 6966.0, 13288.0, 26551.0, 57655.0, 135696.0, 293776.0, 276013.0, 122665.0, 52665.0, 24582.0, 12399.0, 6576.0, 3680.0, 2112.0, 1315.0, 858.0, 515.0, 319.0, 234.0, 186.0, 110.0, 77.0, 47.0, 35.0, 23.0, 29.0, 17.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1981201171875, -0.1921062469482422, -0.18609237670898438, -0.18007850646972656, -0.17406463623046875, -0.16805076599121094, -0.16203689575195312, -0.1560230255126953, -0.1500091552734375, -0.1439952850341797, -0.13798141479492188, -0.13196754455566406, -0.12595367431640625, -0.11993980407714844, -0.11392593383789062, -0.10791206359863281, -0.101898193359375, -0.09588432312011719, -0.08987045288085938, -0.08385658264160156, -0.07784271240234375, -0.07182884216308594, -0.06581497192382812, -0.05980110168457031, -0.0537872314453125, -0.04777336120605469, -0.041759490966796875, -0.03574562072753906, -0.02973175048828125, -0.023717880249023438, -0.017704010009765625, -0.011690139770507812, -0.00567626953125, 0.0003376007080078125, 0.006351470947265625, 0.012365341186523438, 0.01837921142578125, 0.024393081665039062, 0.030406951904296875, 0.03642082214355469, 0.0424346923828125, 0.04844856262207031, 0.054462432861328125, 0.06047630310058594, 0.06649017333984375, 0.07250404357910156, 0.07851791381835938, 0.08453178405761719, 0.090545654296875, 0.09655952453613281, 0.10257339477539062, 0.10858726501464844, 0.11460113525390625, 0.12061500549316406, 0.12662887573242188, 0.1326427459716797, 0.1386566162109375, 0.1446704864501953, 0.15068435668945312, 0.15669822692871094, 0.16271209716796875, 0.16872596740722656, 0.17473983764648438, 0.1807537078857422, 0.186767578125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 9.0, 11.0, 21.0, 29.0, 31.0, 39.0, 43.0, 76.0, 90.0, 92.0, 83.0, 98.0, 88.0, 68.0, 61.0, 44.0, 34.0, 30.0, 21.0, 16.0, 3.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1436767578125, -0.13951587677001953, -0.13535499572753906, -0.1311941146850586, -0.12703323364257812, -0.12287235260009766, -0.11871147155761719, -0.11455059051513672, -0.11038970947265625, -0.10622882843017578, -0.10206794738769531, -0.09790706634521484, -0.09374618530273438, -0.0895853042602539, -0.08542442321777344, -0.08126354217529297, -0.0771026611328125, -0.07294178009033203, -0.06878089904785156, -0.0646200180053711, -0.060459136962890625, -0.056298255920410156, -0.05213737487792969, -0.04797649383544922, -0.04381561279296875, -0.03965473175048828, -0.03549385070800781, -0.031332969665527344, -0.027172088623046875, -0.023011207580566406, -0.018850326538085938, -0.014689445495605469, -0.010528564453125, -0.006367683410644531, -0.0022068023681640625, 0.0019540786743164062, 0.006114959716796875, 0.010275840759277344, 0.014436721801757812, 0.01859760284423828, 0.02275848388671875, 0.02691936492919922, 0.031080245971679688, 0.035241127014160156, 0.039402008056640625, 0.043562889099121094, 0.04772377014160156, 0.05188465118408203, 0.0560455322265625, 0.06020641326904297, 0.06436729431152344, 0.0685281753540039, 0.07268905639648438, 0.07684993743896484, 0.08101081848144531, 0.08517169952392578, 0.08933258056640625, 0.09349346160888672, 0.09765434265136719, 0.10181522369384766, 0.10597610473632812, 0.1101369857788086, 0.11429786682128906, 0.11845874786376953, 0.12261962890625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 9.0, 6.0, 12.0, 9.0, 14.0, 28.0, 41.0, 56.0, 91.0, 133.0, 198.0, 389.0, 751.0, 1423.0, 3201.0, 8790.0, 30571.0, 152001.0, 673104.0, 135083.0, 28206.0, 8236.0, 3126.0, 1387.0, 696.0, 379.0, 206.0, 134.0, 83.0, 58.0, 37.0, 18.0, 15.0, 13.0, 13.0, 7.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.42041015625, -0.4066123962402344, -0.39281463623046875, -0.3790168762207031, -0.3652191162109375, -0.3514213562011719, -0.33762359619140625, -0.3238258361816406, -0.310028076171875, -0.2962303161621094, -0.28243255615234375, -0.2686347961425781, -0.2548370361328125, -0.24103927612304688, -0.22724151611328125, -0.21344375610351562, -0.19964599609375, -0.18584823608398438, -0.17205047607421875, -0.15825271606445312, -0.1444549560546875, -0.13065719604492188, -0.11685943603515625, -0.10306167602539062, -0.089263916015625, -0.07546615600585938, -0.06166839599609375, -0.047870635986328125, -0.0340728759765625, -0.020275115966796875, -0.00647735595703125, 0.007320404052734375, 0.0211181640625, 0.034915924072265625, 0.04871368408203125, 0.06251144409179688, 0.0763092041015625, 0.09010696411132812, 0.10390472412109375, 0.11770248413085938, 0.131500244140625, 0.14529800415039062, 0.15909576416015625, 0.17289352416992188, 0.1866912841796875, 0.20048904418945312, 0.21428680419921875, 0.22808456420898438, 0.24188232421875, 0.2556800842285156, 0.26947784423828125, 0.2832756042480469, 0.2970733642578125, 0.3108711242675781, 0.32466888427734375, 0.3384666442871094, 0.352264404296875, 0.3660621643066406, 0.37985992431640625, 0.3936576843261719, 0.4074554443359375, 0.4212532043457031, 0.43505096435546875, 0.4488487243652344, 0.462646484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 7.0, 12.0, 8.0, 12.0, 10.0, 10.0, 17.0, 18.0, 29.0, 24.0, 29.0, 25.0, 35.0, 37.0, 51.0, 57.0, 52.0, 55.0, 62.0, 41.0, 48.0, 37.0, 64.0, 36.0, 33.0, 30.0, 28.0, 28.0, 12.0, 15.0, 12.0, 18.0, 8.0, 8.0, 9.0, 5.0, 6.0, 4.0, 5.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.39404296875, -0.382476806640625, -0.37091064453125, -0.359344482421875, -0.3477783203125, -0.336212158203125, -0.32464599609375, -0.313079833984375, -0.301513671875, -0.289947509765625, -0.27838134765625, -0.266815185546875, -0.2552490234375, -0.243682861328125, -0.23211669921875, -0.220550537109375, -0.208984375, -0.197418212890625, -0.18585205078125, -0.174285888671875, -0.1627197265625, -0.151153564453125, -0.13958740234375, -0.128021240234375, -0.116455078125, -0.104888916015625, -0.09332275390625, -0.081756591796875, -0.0701904296875, -0.058624267578125, -0.04705810546875, -0.035491943359375, -0.02392578125, -0.012359619140625, -0.00079345703125, 0.010772705078125, 0.0223388671875, 0.033905029296875, 0.04547119140625, 0.057037353515625, 0.068603515625, 0.080169677734375, 0.09173583984375, 0.103302001953125, 0.1148681640625, 0.126434326171875, 0.13800048828125, 0.149566650390625, 0.1611328125, 0.172698974609375, 0.18426513671875, 0.195831298828125, 0.2073974609375, 0.218963623046875, 0.23052978515625, 0.242095947265625, 0.253662109375, 0.265228271484375, 0.27679443359375, 0.288360595703125, 0.2999267578125, 0.311492919921875, 0.32305908203125, 0.334625244140625, 0.34619140625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 10.0, 21.0, 23.0, 30.0, 39.0, 54.0, 82.0, 132.0, 207.0, 384.0, 654.0, 1356.0, 2937.0, 7512.0, 25578.0, 161696.0, 744984.0, 76639.0, 16384.0, 5393.0, 2107.0, 982.0, 493.0, 303.0, 190.0, 109.0, 68.0, 47.0, 44.0, 26.0, 15.0, 14.0, 8.0, 11.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.41015625, -0.3982086181640625, -0.386260986328125, -0.3743133544921875, -0.36236572265625, -0.3504180908203125, -0.338470458984375, -0.3265228271484375, -0.3145751953125, -0.3026275634765625, -0.290679931640625, -0.2787322998046875, -0.26678466796875, -0.2548370361328125, -0.242889404296875, -0.2309417724609375, -0.218994140625, -0.2070465087890625, -0.195098876953125, -0.1831512451171875, -0.17120361328125, -0.1592559814453125, -0.147308349609375, -0.1353607177734375, -0.1234130859375, -0.1114654541015625, -0.099517822265625, -0.0875701904296875, -0.07562255859375, -0.0636749267578125, -0.051727294921875, -0.0397796630859375, -0.02783203125, -0.0158843994140625, -0.003936767578125, 0.0080108642578125, 0.01995849609375, 0.0319061279296875, 0.043853759765625, 0.0558013916015625, 0.0677490234375, 0.0796966552734375, 0.091644287109375, 0.1035919189453125, 0.11553955078125, 0.1274871826171875, 0.139434814453125, 0.1513824462890625, 0.163330078125, 0.1752777099609375, 0.187225341796875, 0.1991729736328125, 0.21112060546875, 0.2230682373046875, 0.235015869140625, 0.2469635009765625, 0.2589111328125, 0.2708587646484375, 0.282806396484375, 0.2947540283203125, 0.30670166015625, 0.3186492919921875, 0.330596923828125, 0.3425445556640625, 0.3544921875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 8.0, 10.0, 11.0, 20.0, 27.0, 41.0, 60.0, 124.0, 180.0, 193.0, 113.0, 65.0, 39.0, 39.0, 19.0, 12.0, 12.0, 4.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010693073272705078, -0.00010295771062374115, -9.898468852043152e-05, -9.501166641712189e-05, -9.103864431381226e-05, -8.706562221050262e-05, -8.309260010719299e-05, -7.911957800388336e-05, -7.514655590057373e-05, -7.11735337972641e-05, -6.720051169395447e-05, -6.322748959064484e-05, -5.9254467487335205e-05, -5.5281445384025574e-05, -5.130842328071594e-05, -4.733540117740631e-05, -4.336237907409668e-05, -3.938935697078705e-05, -3.541633486747742e-05, -3.1443312764167786e-05, -2.7470290660858154e-05, -2.3497268557548523e-05, -1.952424645423889e-05, -1.555122435092926e-05, -1.1578202247619629e-05, -7.6051801443099976e-06, -3.632158041000366e-06, 3.4086406230926514e-07, 4.3138861656188965e-06, 8.286908268928528e-06, 1.225993037223816e-05, 1.623295247554779e-05, 2.0205974578857422e-05, 2.4178996682167053e-05, 2.8152018785476685e-05, 3.2125040888786316e-05, 3.609806299209595e-05, 4.007108509540558e-05, 4.404410719871521e-05, 4.801712930202484e-05, 5.199015140533447e-05, 5.5963173508644104e-05, 5.9936195611953735e-05, 6.390921771526337e-05, 6.7882239818573e-05, 7.185526192188263e-05, 7.582828402519226e-05, 7.980130612850189e-05, 8.377432823181152e-05, 8.774735033512115e-05, 9.172037243843079e-05, 9.569339454174042e-05, 9.966641664505005e-05, 0.00010363943874835968, 0.00010761246085166931, 0.00011158548295497894, 0.00011555850505828857, 0.0001195315271615982, 0.00012350454926490784, 0.00012747757136821747, 0.0001314505934715271, 0.00013542361557483673, 0.00013939663767814636, 0.000143369659781456, 0.00014734268188476562]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 5.0, 14.0, 18.0, 29.0, 31.0, 43.0, 64.0, 96.0, 148.0, 251.0, 429.0, 835.0, 1632.0, 4195.0, 14173.0, 101850.0, 826971.0, 78483.0, 12363.0, 3716.0, 1476.0, 727.0, 381.0, 237.0, 123.0, 71.0, 57.0, 47.0, 28.0, 17.0, 15.0, 11.0, 2.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.458740234375, -0.44460296630859375, -0.4304656982421875, -0.41632843017578125, -0.402191162109375, -0.38805389404296875, -0.3739166259765625, -0.35977935791015625, -0.34564208984375, -0.33150482177734375, -0.3173675537109375, -0.30323028564453125, -0.289093017578125, -0.27495574951171875, -0.2608184814453125, -0.24668121337890625, -0.2325439453125, -0.21840667724609375, -0.2042694091796875, -0.19013214111328125, -0.175994873046875, -0.16185760498046875, -0.1477203369140625, -0.13358306884765625, -0.11944580078125, -0.10530853271484375, -0.0911712646484375, -0.07703399658203125, -0.062896728515625, -0.04875946044921875, -0.0346221923828125, -0.02048492431640625, -0.00634765625, 0.00778961181640625, 0.0219268798828125, 0.03606414794921875, 0.050201416015625, 0.06433868408203125, 0.0784759521484375, 0.09261322021484375, 0.10675048828125, 0.12088775634765625, 0.1350250244140625, 0.14916229248046875, 0.163299560546875, 0.17743682861328125, 0.1915740966796875, 0.20571136474609375, 0.2198486328125, 0.23398590087890625, 0.2481231689453125, 0.26226043701171875, 0.276397705078125, 0.29053497314453125, 0.3046722412109375, 0.31880950927734375, 0.33294677734375, 0.34708404541015625, 0.3612213134765625, 0.37535858154296875, 0.389495849609375, 0.40363311767578125, 0.4177703857421875, 0.43190765380859375, 0.446044921875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 14.0, 17.0, 17.0, 20.0, 34.0, 37.0, 49.0, 68.0, 83.0, 112.0, 118.0, 99.0, 60.0, 69.0, 53.0, 18.0, 26.0, 19.0, 11.0, 14.0, 4.0, 17.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2578125, -0.25089073181152344, -0.24396896362304688, -0.2370471954345703, -0.23012542724609375, -0.2232036590576172, -0.21628189086914062, -0.20936012268066406, -0.2024383544921875, -0.19551658630371094, -0.18859481811523438, -0.1816730499267578, -0.17475128173828125, -0.1678295135498047, -0.16090774536132812, -0.15398597717285156, -0.147064208984375, -0.14014244079589844, -0.13322067260742188, -0.1262989044189453, -0.11937713623046875, -0.11245536804199219, -0.10553359985351562, -0.09861183166503906, -0.0916900634765625, -0.08476829528808594, -0.07784652709960938, -0.07092475891113281, -0.06400299072265625, -0.05708122253417969, -0.050159454345703125, -0.04323768615722656, -0.03631591796875, -0.029394149780273438, -0.022472381591796875, -0.015550613403320312, -0.00862884521484375, -0.0017070770263671875, 0.005214691162109375, 0.012136459350585938, 0.0190582275390625, 0.025979995727539062, 0.032901763916015625, 0.03982353210449219, 0.04674530029296875, 0.05366706848144531, 0.060588836669921875, 0.06751060485839844, 0.074432373046875, 0.08135414123535156, 0.08827590942382812, 0.09519767761230469, 0.10211944580078125, 0.10904121398925781, 0.11596298217773438, 0.12288475036621094, 0.1298065185546875, 0.13672828674316406, 0.14365005493164062, 0.1505718231201172, 0.15749359130859375, 0.1644153594970703, 0.17133712768554688, 0.17825889587402344, 0.1851806640625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 15.0, 26.0, 31.0, 63.0, 125.0, 280.0, 246.0, 113.0, 48.0, 20.0, 6.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.87274169921875, -9.648122787475586, -9.423504829406738, -9.198885917663574, -8.97426700592041, -8.749649047851562, -8.525030136108398, -8.300411224365234, -8.07579231262207, -7.8511738777160645, -7.6265549659729, -7.4019365310668945, -7.1773176193237305, -6.952699184417725, -6.728080749511719, -6.503461837768555, -6.278843879699707, -6.054225444793701, -5.829606533050537, -5.604988098144531, -5.380369186401367, -5.155750751495361, -4.9311323165893555, -4.706513404846191, -4.4818949699401855, -4.25727653503418, -4.032657623291016, -3.8080391883850098, -3.583420515060425, -3.35880184173584, -3.134183406829834, -2.909564733505249, -2.684946060180664, -2.460327386856079, -2.235708713531494, -2.0110902786254883, -1.7864716053009033, -1.5618529319763184, -1.337234377861023, -1.1126158237457275, -0.8879971504211426, -0.6633785367012024, -0.4387599229812622, -0.21414130926132202, 0.010477304458618164, 0.23509597778320312, 0.45971453189849854, 0.684333086013794, 0.9089517593383789, 1.1335704326629639, 1.3581889867782593, 1.5828075408935547, 1.8074262142181396, 2.0320448875427246, 2.2566633224487305, 2.4812819957733154, 2.7059006690979004, 2.9305193424224854, 3.1551380157470703, 3.379756450653076, 3.604375123977661, 3.828993797302246, 4.053612232208252, 4.278230667114258, 4.502849578857422]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 6.0, 3.0, 12.0, 6.0, 15.0, 10.0, 21.0, 10.0, 14.0, 27.0, 30.0, 30.0, 35.0, 36.0, 41.0, 44.0, 61.0, 60.0, 77.0, 68.0, 55.0, 41.0, 44.0, 35.0, 32.0, 27.0, 23.0, 23.0, 13.0, 13.0, 15.0, 9.0, 14.0, 11.0, 8.0, 8.0, 5.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7776765823364258, -1.7192513942718506, -1.6608262062072754, -1.6024010181427002, -1.543975830078125, -1.4855506420135498, -1.4271254539489746, -1.3687002658843994, -1.3102750778198242, -1.251849889755249, -1.1934247016906738, -1.1349995136260986, -1.0765743255615234, -1.0181491374969482, -0.9597240090370178, -0.9012988209724426, -0.8428736925125122, -0.784448504447937, -0.7260233163833618, -0.6675981283187866, -0.6091729402542114, -0.5507477521896362, -0.4923226237297058, -0.4338974356651306, -0.3754722476005554, -0.3170470595359802, -0.25862187147140503, -0.20019671320915222, -0.14177152514457703, -0.08334633708000183, -0.024921178817749023, 0.03350400924682617, 0.09192931652069092, 0.1503545045852661, 0.20877967774868011, 0.2672048509120941, 0.3256300389766693, 0.3840552270412445, 0.4424803853034973, 0.5009055733680725, 0.5593307614326477, 0.6177559494972229, 0.6761811375617981, 0.7346062660217285, 0.7930314540863037, 0.8514566421508789, 0.9098818302154541, 0.9683070182800293, 1.0267322063446045, 1.0851573944091797, 1.1435825824737549, 1.20200777053833, 1.2604329586029053, 1.3188581466674805, 1.3772833347320557, 1.4357085227966309, 1.494133710861206, 1.5525588989257812, 1.6109840869903564, 1.6694092750549316, 1.7278344631195068, 1.786259651184082, 1.8446848392486572, 1.9031100273132324, 1.961535096168518]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 4.0, 10.0, 20.0, 28.0, 28.0, 84.0, 119.0, 186.0, 302.0, 598.0, 1568.0, 91850.0, 4094116.0, 3713.0, 715.0, 373.0, 227.0, 116.0, 81.0, 57.0, 24.0, 16.0, 19.0, 12.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4453125, -1.398956298828125, -1.35260009765625, -1.306243896484375, -1.2598876953125, -1.213531494140625, -1.16717529296875, -1.120819091796875, -1.074462890625, -1.028106689453125, -0.98175048828125, -0.935394287109375, -0.8890380859375, -0.842681884765625, -0.79632568359375, -0.749969482421875, -0.70361328125, -0.657257080078125, -0.61090087890625, -0.564544677734375, -0.5181884765625, -0.471832275390625, -0.42547607421875, -0.379119873046875, -0.332763671875, -0.286407470703125, -0.24005126953125, -0.193695068359375, -0.1473388671875, -0.100982666015625, -0.05462646484375, -0.008270263671875, 0.0380859375, 0.084442138671875, 0.13079833984375, 0.177154541015625, 0.2235107421875, 0.269866943359375, 0.31622314453125, 0.362579345703125, 0.408935546875, 0.455291748046875, 0.50164794921875, 0.548004150390625, 0.5943603515625, 0.640716552734375, 0.68707275390625, 0.733428955078125, 0.77978515625, 0.826141357421875, 0.87249755859375, 0.918853759765625, 0.9652099609375, 1.011566162109375, 1.05792236328125, 1.104278564453125, 1.150634765625, 1.196990966796875, 1.24334716796875, 1.289703369140625, 1.3360595703125, 1.382415771484375, 1.42877197265625, 1.475128173828125, 1.521484375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 7.0, 12.0, 19.0, 31.0, 32.0, 42.0, 54.0, 62.0, 86.0, 95.0, 102.0, 107.0, 77.0, 60.0, 67.0, 47.0, 29.0, 26.0, 17.0, 10.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1436767578125, -0.1394968032836914, -0.1353168487548828, -0.13113689422607422, -0.12695693969726562, -0.12277698516845703, -0.11859703063964844, -0.11441707611083984, -0.11023712158203125, -0.10605716705322266, -0.10187721252441406, -0.09769725799560547, -0.09351730346679688, -0.08933734893798828, -0.08515739440917969, -0.0809774398803711, -0.0767974853515625, -0.0726175308227539, -0.06843757629394531, -0.06425762176513672, -0.060077667236328125, -0.05589771270751953, -0.05171775817871094, -0.047537803649902344, -0.04335784912109375, -0.039177894592285156, -0.03499794006347656, -0.03081798553466797, -0.026638031005859375, -0.02245807647705078, -0.018278121948242188, -0.014098167419433594, -0.009918212890625, -0.005738258361816406, -0.0015583038330078125, 0.0026216506958007812, 0.006801605224609375, 0.010981559753417969, 0.015161514282226562, 0.019341468811035156, 0.02352142333984375, 0.027701377868652344, 0.03188133239746094, 0.03606128692626953, 0.040241241455078125, 0.04442119598388672, 0.04860115051269531, 0.052781105041503906, 0.0569610595703125, 0.061141014099121094, 0.06532096862792969, 0.06950092315673828, 0.07368087768554688, 0.07786083221435547, 0.08204078674316406, 0.08622074127197266, 0.09040069580078125, 0.09458065032958984, 0.09876060485839844, 0.10294055938720703, 0.10712051391601562, 0.11130046844482422, 0.11548042297363281, 0.1196603775024414, 0.12384033203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 9.0, 16.0, 18.0, 30.0, 41.0, 47.0, 75.0, 121.0, 182.0, 279.0, 417.0, 760.0, 2925.0, 91421.0, 4081777.0, 13243.0, 1374.0, 553.0, 334.0, 232.0, 154.0, 83.0, 66.0, 40.0, 37.0, 16.0, 7.0, 10.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.21875, -1.1797943115234375, -1.140838623046875, -1.1018829345703125, -1.06292724609375, -1.0239715576171875, -0.985015869140625, -0.9460601806640625, -0.9071044921875, -0.8681488037109375, -0.829193115234375, -0.7902374267578125, -0.75128173828125, -0.7123260498046875, -0.673370361328125, -0.6344146728515625, -0.595458984375, -0.5565032958984375, -0.517547607421875, -0.4785919189453125, -0.43963623046875, -0.4006805419921875, -0.361724853515625, -0.3227691650390625, -0.2838134765625, -0.2448577880859375, -0.205902099609375, -0.1669464111328125, -0.12799072265625, -0.0890350341796875, -0.050079345703125, -0.0111236572265625, 0.02783203125, 0.0667877197265625, 0.105743408203125, 0.1446990966796875, 0.18365478515625, 0.2226104736328125, 0.261566162109375, 0.3005218505859375, 0.3394775390625, 0.3784332275390625, 0.417388916015625, 0.4563446044921875, 0.49530029296875, 0.5342559814453125, 0.573211669921875, 0.6121673583984375, 0.651123046875, 0.6900787353515625, 0.729034423828125, 0.7679901123046875, 0.80694580078125, 0.8459014892578125, 0.884857177734375, 0.9238128662109375, 0.9627685546875, 1.0017242431640625, 1.040679931640625, 1.0796356201171875, 1.11859130859375, 1.1575469970703125, 1.196502685546875, 1.2354583740234375, 1.2744140625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 13.0, 12.0, 42.0, 132.0, 594.0, 2662.0, 436.0, 113.0, 41.0, 17.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1513671875, -1.1198043823242188, -1.0882415771484375, -1.0566787719726562, -1.025115966796875, -0.9935531616210938, -0.9619903564453125, -0.9304275512695312, -0.89886474609375, -0.8673019409179688, -0.8357391357421875, -0.8041763305664062, -0.772613525390625, -0.7410507202148438, -0.7094879150390625, -0.6779251098632812, -0.6463623046875, -0.6147994995117188, -0.5832366943359375, -0.5516738891601562, -0.520111083984375, -0.48854827880859375, -0.4569854736328125, -0.42542266845703125, -0.39385986328125, -0.36229705810546875, -0.3307342529296875, -0.29917144775390625, -0.267608642578125, -0.23604583740234375, -0.2044830322265625, -0.17292022705078125, -0.141357421875, -0.10979461669921875, -0.0782318115234375, -0.04666900634765625, -0.015106201171875, 0.01645660400390625, 0.0480194091796875, 0.07958221435546875, 0.11114501953125, 0.14270782470703125, 0.1742706298828125, 0.20583343505859375, 0.237396240234375, 0.26895904541015625, 0.3005218505859375, 0.33208465576171875, 0.3636474609375, 0.39521026611328125, 0.4267730712890625, 0.45833587646484375, 0.489898681640625, 0.5214614868164062, 0.5530242919921875, 0.5845870971679688, 0.61614990234375, 0.6477127075195312, 0.6792755126953125, 0.7108383178710938, 0.742401123046875, 0.7739639282226562, 0.8055267333984375, 0.8370895385742188, 0.86865234375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 11.0, 31.0, 52.0, 152.0, 289.0, 243.0, 115.0, 49.0, 19.0, 11.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.928096771240234, -6.723127365112305, -6.518158435821533, -6.3131890296936035, -6.108219623565674, -5.903250694274902, -5.698281288146973, -5.493311882019043, -5.288342475891113, -5.083373069763184, -4.878404140472412, -4.673434734344482, -4.468465328216553, -4.263496398925781, -4.058526992797852, -3.853557586669922, -3.6485884189605713, -3.4436192512512207, -3.238649845123291, -3.0336806774139404, -2.8287112712860107, -2.62374210357666, -2.4187726974487305, -2.21380352973938, -2.0088343620300293, -1.8038650751113892, -1.598895788192749, -1.3939266204833984, -1.1889572143554688, -0.9839880466461182, -0.779018759727478, -0.5740494728088379, -0.3690800666809082, -0.16411079466342926, 0.04085847735404968, 0.24582773447036743, 0.45079702138900757, 0.6557662487030029, 0.8607355356216431, 1.0657048225402832, 1.2706741094589233, 1.4756433963775635, 1.6806126832962036, 1.8855819702148438, 2.0905511379241943, 2.295520305633545, 2.5004897117614746, 2.7054591178894043, 2.910428285598755, 3.1153974533081055, 3.320366859436035, 3.5253360271453857, 3.7303054332733154, 3.935274600982666, 4.140244007110596, 4.345212936401367, 4.550182342529297, 4.755151748657227, 4.960120677947998, 5.165090084075928, 5.370059490203857, 5.575028419494629, 5.779997825622559, 5.984967231750488, 6.189936637878418]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 11.0, 11.0, 10.0, 17.0, 23.0, 20.0, 36.0, 34.0, 46.0, 48.0, 64.0, 62.0, 51.0, 52.0, 56.0, 62.0, 56.0, 61.0, 55.0, 53.0, 44.0, 28.0, 26.0, 17.0, 20.0, 8.0, 9.0, 8.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1856422424316406, -2.113992929458618, -2.0423436164855957, -1.9706943035125732, -1.8990449905395508, -1.8273956775665283, -1.7557463645935059, -1.6840970516204834, -1.612447738647461, -1.5407984256744385, -1.469149112701416, -1.3974997997283936, -1.325850486755371, -1.2542011737823486, -1.1825518608093262, -1.1109025478363037, -1.0392531156539917, -0.9676038026809692, -0.8959544897079468, -0.8243051767349243, -0.7526558637619019, -0.6810065507888794, -0.6093571782112122, -0.5377078652381897, -0.46605855226516724, -0.3944092392921448, -0.3227599263191223, -0.25111058354377747, -0.179461270570755, -0.10781195759773254, -0.036162614822387695, 0.035486698150634766, 0.10713601112365723, 0.1787853240966797, 0.25043463706970215, 0.322083979845047, 0.39373329281806946, 0.4653826057910919, 0.5370319485664368, 0.6086812615394592, 0.6803305745124817, 0.7519798874855042, 0.8236292004585266, 0.8952785730361938, 0.9669278860092163, 1.0385771989822388, 1.1102265119552612, 1.1818758249282837, 1.2535251379013062, 1.3251744508743286, 1.396823763847351, 1.4684730768203735, 1.540122389793396, 1.6117717027664185, 1.6834211349487305, 1.755070447921753, 1.8267197608947754, 1.8983690738677979, 1.9700183868408203, 2.0416676998138428, 2.1133170127868652, 2.1849663257598877, 2.25661563873291, 2.3282649517059326, 2.399914264678955]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 5.0, 8.0, 17.0, 9.0, 29.0, 41.0, 77.0, 119.0, 221.0, 414.0, 899.0, 2137.0, 6077.0, 22434.0, 124707.0, 574875.0, 260025.0, 41104.0, 9700.0, 3216.0, 1284.0, 538.0, 250.0, 145.0, 84.0, 47.0, 34.0, 17.0, 10.0, 7.0, 9.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.46728515625, -0.454193115234375, -0.44110107421875, -0.428009033203125, -0.4149169921875, -0.401824951171875, -0.38873291015625, -0.375640869140625, -0.362548828125, -0.349456787109375, -0.33636474609375, -0.323272705078125, -0.3101806640625, -0.297088623046875, -0.28399658203125, -0.270904541015625, -0.2578125, -0.244720458984375, -0.23162841796875, -0.218536376953125, -0.2054443359375, -0.192352294921875, -0.17926025390625, -0.166168212890625, -0.153076171875, -0.139984130859375, -0.12689208984375, -0.113800048828125, -0.1007080078125, -0.087615966796875, -0.07452392578125, -0.061431884765625, -0.04833984375, -0.035247802734375, -0.02215576171875, -0.009063720703125, 0.0040283203125, 0.017120361328125, 0.03021240234375, 0.043304443359375, 0.056396484375, 0.069488525390625, 0.08258056640625, 0.095672607421875, 0.1087646484375, 0.121856689453125, 0.13494873046875, 0.148040771484375, 0.1611328125, 0.174224853515625, 0.18731689453125, 0.200408935546875, 0.2135009765625, 0.226593017578125, 0.23968505859375, 0.252777099609375, 0.265869140625, 0.278961181640625, 0.29205322265625, 0.305145263671875, 0.3182373046875, 0.331329345703125, 0.34442138671875, 0.357513427734375, 0.37060546875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 8.0, 10.0, 17.0, 18.0, 28.0, 30.0, 44.0, 59.0, 58.0, 59.0, 59.0, 76.0, 95.0, 65.0, 67.0, 57.0, 55.0, 37.0, 46.0, 25.0, 22.0, 24.0, 15.0, 12.0, 8.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1351318359375, -0.1310720443725586, -0.1270122528076172, -0.12295246124267578, -0.11889266967773438, -0.11483287811279297, -0.11077308654785156, -0.10671329498291016, -0.10265350341796875, -0.09859371185302734, -0.09453392028808594, -0.09047412872314453, -0.08641433715820312, -0.08235454559326172, -0.07829475402832031, -0.0742349624633789, -0.0701751708984375, -0.0661153793334961, -0.06205558776855469, -0.05799579620361328, -0.053936004638671875, -0.04987621307373047, -0.04581642150878906, -0.041756629943847656, -0.03769683837890625, -0.033637046813964844, -0.029577255249023438, -0.02551746368408203, -0.021457672119140625, -0.01739788055419922, -0.013338088989257812, -0.009278297424316406, -0.005218505859375, -0.0011587142944335938, 0.0029010772705078125, 0.006960868835449219, 0.011020660400390625, 0.015080451965332031, 0.019140243530273438, 0.023200035095214844, 0.02725982666015625, 0.031319618225097656, 0.03537940979003906, 0.03943920135498047, 0.043498992919921875, 0.04755878448486328, 0.05161857604980469, 0.055678367614746094, 0.0597381591796875, 0.0637979507446289, 0.06785774230957031, 0.07191753387451172, 0.07597732543945312, 0.08003711700439453, 0.08409690856933594, 0.08815670013427734, 0.09221649169921875, 0.09627628326416016, 0.10033607482910156, 0.10439586639404297, 0.10845565795898438, 0.11251544952392578, 0.11657524108886719, 0.1206350326538086, 0.12469482421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 3.0, 5.0, 1.0, 3.0, 8.0, 10.0, 11.0, 11.0, 14.0, 33.0, 49.0, 70.0, 76.0, 156.0, 284.0, 508.0, 1126.0, 2792.0, 8057.0, 30727.0, 155011.0, 644496.0, 160154.0, 31320.0, 8327.0, 2874.0, 1156.0, 529.0, 301.0, 160.0, 106.0, 56.0, 37.0, 24.0, 22.0, 13.0, 6.0, 10.0, 1.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.283935546875, -0.27185821533203125, -0.2597808837890625, -0.24770355224609375, -0.235626220703125, -0.22354888916015625, -0.2114715576171875, -0.19939422607421875, -0.18731689453125, -0.17523956298828125, -0.1631622314453125, -0.15108489990234375, -0.139007568359375, -0.12693023681640625, -0.1148529052734375, -0.10277557373046875, -0.0906982421875, -0.07862091064453125, -0.0665435791015625, -0.05446624755859375, -0.042388916015625, -0.03031158447265625, -0.0182342529296875, -0.00615692138671875, 0.00592041015625, 0.01799774169921875, 0.0300750732421875, 0.04215240478515625, 0.054229736328125, 0.06630706787109375, 0.0783843994140625, 0.09046173095703125, 0.1025390625, 0.11461639404296875, 0.1266937255859375, 0.13877105712890625, 0.150848388671875, 0.16292572021484375, 0.1750030517578125, 0.18708038330078125, 0.19915771484375, 0.21123504638671875, 0.2233123779296875, 0.23538970947265625, 0.247467041015625, 0.25954437255859375, 0.2716217041015625, 0.28369903564453125, 0.2957763671875, 0.30785369873046875, 0.3199310302734375, 0.33200836181640625, 0.344085693359375, 0.35616302490234375, 0.3682403564453125, 0.38031768798828125, 0.39239501953125, 0.40447235107421875, 0.4165496826171875, 0.42862701416015625, 0.440704345703125, 0.45278167724609375, 0.4648590087890625, 0.47693634033203125, 0.489013671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 6.0, 8.0, 8.0, 4.0, 10.0, 11.0, 18.0, 9.0, 20.0, 29.0, 35.0, 44.0, 41.0, 44.0, 54.0, 54.0, 60.0, 75.0, 64.0, 64.0, 64.0, 48.0, 52.0, 49.0, 29.0, 23.0, 22.0, 15.0, 8.0, 7.0, 6.0, 10.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.51513671875, -0.5008697509765625, -0.486602783203125, -0.4723358154296875, -0.45806884765625, -0.4438018798828125, -0.429534912109375, -0.4152679443359375, -0.4010009765625, -0.3867340087890625, -0.372467041015625, -0.3582000732421875, -0.34393310546875, -0.3296661376953125, -0.315399169921875, -0.3011322021484375, -0.286865234375, -0.2725982666015625, -0.258331298828125, -0.2440643310546875, -0.22979736328125, -0.2155303955078125, -0.201263427734375, -0.1869964599609375, -0.1727294921875, -0.1584625244140625, -0.144195556640625, -0.1299285888671875, -0.11566162109375, -0.1013946533203125, -0.087127685546875, -0.0728607177734375, -0.05859375, -0.0443267822265625, -0.030059814453125, -0.0157928466796875, -0.00152587890625, 0.0127410888671875, 0.027008056640625, 0.0412750244140625, 0.0555419921875, 0.0698089599609375, 0.084075927734375, 0.0983428955078125, 0.11260986328125, 0.1268768310546875, 0.141143798828125, 0.1554107666015625, 0.169677734375, 0.1839447021484375, 0.198211669921875, 0.2124786376953125, 0.22674560546875, 0.2410125732421875, 0.255279541015625, 0.2695465087890625, 0.2838134765625, 0.2980804443359375, 0.312347412109375, 0.3266143798828125, 0.34088134765625, 0.3551483154296875, 0.369415283203125, 0.3836822509765625, 0.39794921875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 8.0, 5.0, 9.0, 9.0, 17.0, 32.0, 40.0, 47.0, 91.0, 172.0, 290.0, 482.0, 911.0, 1633.0, 3646.0, 9403.0, 29105.0, 125267.0, 654529.0, 167032.0, 36105.0, 11210.0, 4246.0, 1996.0, 983.0, 532.0, 312.0, 169.0, 98.0, 57.0, 41.0, 20.0, 23.0, 13.0, 15.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.19677734375, -0.1910877227783203, -0.18539810180664062, -0.17970848083496094, -0.17401885986328125, -0.16832923889160156, -0.16263961791992188, -0.1569499969482422, -0.1512603759765625, -0.1455707550048828, -0.13988113403320312, -0.13419151306152344, -0.12850189208984375, -0.12281227111816406, -0.11712265014648438, -0.11143302917480469, -0.105743408203125, -0.10005378723144531, -0.09436416625976562, -0.08867454528808594, -0.08298492431640625, -0.07729530334472656, -0.07160568237304688, -0.06591606140136719, -0.0602264404296875, -0.05453681945800781, -0.048847198486328125, -0.04315757751464844, -0.03746795654296875, -0.03177833557128906, -0.026088714599609375, -0.020399093627929688, -0.01470947265625, -0.009019851684570312, -0.003330230712890625, 0.0023593902587890625, 0.00804901123046875, 0.013738632202148438, 0.019428253173828125, 0.025117874145507812, 0.0308074951171875, 0.03649711608886719, 0.042186737060546875, 0.04787635803222656, 0.05356597900390625, 0.05925559997558594, 0.06494522094726562, 0.07063484191894531, 0.076324462890625, 0.08201408386230469, 0.08770370483398438, 0.09339332580566406, 0.09908294677734375, 0.10477256774902344, 0.11046218872070312, 0.11615180969238281, 0.1218414306640625, 0.1275310516357422, 0.13322067260742188, 0.13891029357910156, 0.14459991455078125, 0.15028953552246094, 0.15597915649414062, 0.1616687774658203, 0.1673583984375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 10.0, 18.0, 17.0, 36.0, 46.0, 88.0, 121.0, 168.0, 153.0, 104.0, 83.0, 44.0, 38.0, 17.0, 13.0, 13.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.96453857421875e-05, -8.728262037038803e-05, -8.491985499858856e-05, -8.255708962678909e-05, -8.019432425498962e-05, -7.783155888319016e-05, -7.546879351139069e-05, -7.310602813959122e-05, -7.074326276779175e-05, -6.838049739599228e-05, -6.601773202419281e-05, -6.365496665239334e-05, -6.129220128059387e-05, -5.89294359087944e-05, -5.6566670536994934e-05, -5.4203905165195465e-05, -5.1841139793395996e-05, -4.947837442159653e-05, -4.711560904979706e-05, -4.475284367799759e-05, -4.239007830619812e-05, -4.002731293439865e-05, -3.766454756259918e-05, -3.530178219079971e-05, -3.2939016819000244e-05, -3.0576251447200775e-05, -2.8213486075401306e-05, -2.5850720703601837e-05, -2.3487955331802368e-05, -2.11251899600029e-05, -1.876242458820343e-05, -1.639965921640396e-05, -1.4036893844604492e-05, -1.1674128472805023e-05, -9.311363101005554e-06, -6.948597729206085e-06, -4.585832357406616e-06, -2.2230669856071472e-06, 1.3969838619232178e-07, 2.5024637579917908e-06, 4.86522912979126e-06, 7.227994501590729e-06, 9.590759873390198e-06, 1.1953525245189667e-05, 1.4316290616989136e-05, 1.6679055988788605e-05, 1.9041821360588074e-05, 2.1404586732387543e-05, 2.3767352104187012e-05, 2.613011747598648e-05, 2.849288284778595e-05, 3.085564821958542e-05, 3.321841359138489e-05, 3.558117896318436e-05, 3.7943944334983826e-05, 4.0306709706783295e-05, 4.2669475078582764e-05, 4.503224045038223e-05, 4.73950058221817e-05, 4.975777119398117e-05, 5.212053656578064e-05, 5.448330193758011e-05, 5.684606730937958e-05, 5.920883268117905e-05, 6.157159805297852e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 5.0, 13.0, 12.0, 17.0, 26.0, 58.0, 101.0, 187.0, 375.0, 725.0, 1784.0, 4947.0, 15075.0, 63252.0, 536504.0, 348523.0, 55350.0, 13788.0, 4509.0, 1789.0, 733.0, 363.0, 172.0, 92.0, 60.0, 25.0, 21.0, 15.0, 9.0, 9.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1756591796875, -0.16937637329101562, -0.16309356689453125, -0.15681076049804688, -0.1505279541015625, -0.14424514770507812, -0.13796234130859375, -0.13167953491210938, -0.125396728515625, -0.11911392211914062, -0.11283111572265625, -0.10654830932617188, -0.1002655029296875, -0.09398269653320312, -0.08769989013671875, -0.08141708374023438, -0.07513427734375, -0.06885147094726562, -0.06256866455078125, -0.056285858154296875, -0.0500030517578125, -0.043720245361328125, -0.03743743896484375, -0.031154632568359375, -0.024871826171875, -0.018589019775390625, -0.01230621337890625, -0.006023406982421875, 0.0002593994140625, 0.006542205810546875, 0.01282501220703125, 0.019107818603515625, 0.025390625, 0.031673431396484375, 0.03795623779296875, 0.044239044189453125, 0.0505218505859375, 0.056804656982421875, 0.06308746337890625, 0.06937026977539062, 0.075653076171875, 0.08193588256835938, 0.08821868896484375, 0.09450149536132812, 0.1007843017578125, 0.10706710815429688, 0.11334991455078125, 0.11963272094726562, 0.12591552734375, 0.13219833374023438, 0.13848114013671875, 0.14476394653320312, 0.1510467529296875, 0.15732955932617188, 0.16361236572265625, 0.16989517211914062, 0.176177978515625, 0.18246078491210938, 0.18874359130859375, 0.19502639770507812, 0.2013092041015625, 0.20759201049804688, 0.21387481689453125, 0.22015762329101562, 0.2264404296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 0.0, 4.0, 3.0, 9.0, 7.0, 14.0, 12.0, 19.0, 31.0, 27.0, 60.0, 58.0, 81.0, 82.0, 107.0, 110.0, 108.0, 69.0, 54.0, 37.0, 30.0, 18.0, 12.0, 10.0, 11.0, 5.0, 6.0, 8.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.203125, -0.1975860595703125, -0.192047119140625, -0.1865081787109375, -0.18096923828125, -0.1754302978515625, -0.169891357421875, -0.1643524169921875, -0.1588134765625, -0.1532745361328125, -0.147735595703125, -0.1421966552734375, -0.13665771484375, -0.1311187744140625, -0.125579833984375, -0.1200408935546875, -0.114501953125, -0.1089630126953125, -0.103424072265625, -0.0978851318359375, -0.09234619140625, -0.0868072509765625, -0.081268310546875, -0.0757293701171875, -0.0701904296875, -0.0646514892578125, -0.059112548828125, -0.0535736083984375, -0.04803466796875, -0.0424957275390625, -0.036956787109375, -0.0314178466796875, -0.02587890625, -0.0203399658203125, -0.014801025390625, -0.0092620849609375, -0.00372314453125, 0.0018157958984375, 0.007354736328125, 0.0128936767578125, 0.0184326171875, 0.0239715576171875, 0.029510498046875, 0.0350494384765625, 0.04058837890625, 0.0461273193359375, 0.051666259765625, 0.0572052001953125, 0.062744140625, 0.0682830810546875, 0.073822021484375, 0.0793609619140625, 0.08489990234375, 0.0904388427734375, 0.095977783203125, 0.1015167236328125, 0.1070556640625, 0.1125946044921875, 0.118133544921875, 0.1236724853515625, 0.12921142578125, 0.1347503662109375, 0.140289306640625, 0.1458282470703125, 0.1513671875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 4.0, 10.0, 15.0, 28.0, 49.0, 102.0, 198.0, 280.0, 137.0, 74.0, 56.0, 18.0, 10.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.534957408905029, -5.3976263999938965, -5.260295867919922, -5.122964859008789, -4.985633850097656, -4.848302841186523, -4.710972309112549, -4.573641300201416, -4.436310768127441, -4.298979759216309, -4.161649227142334, -4.024318218231201, -3.8869872093200684, -3.7496564388275146, -3.612325668334961, -3.474994659423828, -3.3376636505126953, -3.2003328800201416, -3.063001871109009, -2.925671100616455, -2.7883400917053223, -2.6510093212127686, -2.513678550720215, -2.376347541809082, -2.2390167713165283, -2.1016860008239746, -1.9643549919128418, -1.827024221420288, -1.6896933317184448, -1.5523624420166016, -1.4150316715240479, -1.2777007818222046, -1.1403703689575195, -1.0030394792556763, -0.8657086491584778, -0.7283778190612793, -0.591046929359436, -0.4537160396575928, -0.3163852095603943, -0.1790543794631958, -0.04172348976135254, 0.09560737013816833, 0.2329382300376892, 0.3702690899372101, 0.507599949836731, 0.6449308395385742, 0.7822616696357727, 0.9195924997329712, 1.0569233894348145, 1.1942542791366577, 1.331585168838501, 1.4689159393310547, 1.606246829032898, 1.7435777187347412, 1.880908489227295, 2.0182394981384277, 2.1555702686309814, 2.292901039123535, 2.430232048034668, 2.5675628185272217, 2.7048935890197754, 2.842224597930908, 2.979555368423462, 3.1168861389160156, 3.2542171478271484]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 2.0, 5.0, 4.0, 7.0, 8.0, 7.0, 9.0, 12.0, 13.0, 15.0, 22.0, 19.0, 12.0, 13.0, 23.0, 19.0, 24.0, 35.0, 27.0, 27.0, 30.0, 46.0, 56.0, 47.0, 51.0, 57.0, 47.0, 42.0, 34.0, 34.0, 28.0, 29.0, 29.0, 19.0, 27.0, 20.0, 15.0, 18.0, 11.0, 6.0, 10.0, 12.0, 6.0, 7.0, 5.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5275356769561768, -1.4823319911956787, -1.4371283054351807, -1.3919246196746826, -1.346720814704895, -1.301517128944397, -1.256313443183899, -1.2111097574234009, -1.1659060716629028, -1.1207023859024048, -1.0754987001419067, -1.0302948951721191, -0.9850912690162659, -0.939887523651123, -0.894683837890625, -0.849480152130127, -0.8042764067649841, -0.7590727210044861, -0.7138689756393433, -0.6686652898788452, -0.6234616041183472, -0.5782579183578491, -0.5330541729927063, -0.48785048723220825, -0.4426467716693878, -0.3974430561065674, -0.35223937034606934, -0.3070356547832489, -0.26183193922042847, -0.21662825345993042, -0.17142453789710999, -0.12622085213661194, -0.0810171365737915, -0.035813432186841965, 0.009390272200107574, 0.05459398031234741, 0.09979768097400665, 0.1450013816356659, 0.19020509719848633, 0.23540878295898438, 0.2806124985218048, 0.32581621408462524, 0.3710198998451233, 0.4162236154079437, 0.46142733097076416, 0.5066310167312622, 0.5518347024917603, 0.5970383882522583, 0.6422421336174011, 0.6874458193778992, 0.732649564743042, 0.77785325050354, 0.8230569362640381, 0.8682606220245361, 0.913464367389679, 0.958668053150177, 1.0038717985153198, 1.0490754842758179, 1.094279170036316, 1.1394829750061035, 1.1846866607666016, 1.2298903465270996, 1.2750940322875977, 1.3202977180480957, 1.3655014038085938]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 12.0, 17.0, 21.0, 32.0, 57.0, 84.0, 101.0, 166.0, 446.0, 2981.0, 217765.0, 3963469.0, 7893.0, 676.0, 197.0, 107.0, 62.0, 41.0, 45.0, 28.0, 23.0, 13.0, 14.0, 9.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90576171875, -0.8711318969726562, -0.8365020751953125, -0.8018722534179688, -0.767242431640625, -0.7326126098632812, -0.6979827880859375, -0.6633529663085938, -0.62872314453125, -0.5940933227539062, -0.5594635009765625, -0.5248336791992188, -0.490203857421875, -0.45557403564453125, -0.4209442138671875, -0.38631439208984375, -0.3516845703125, -0.31705474853515625, -0.2824249267578125, -0.24779510498046875, -0.213165283203125, -0.17853546142578125, -0.1439056396484375, -0.10927581787109375, -0.07464599609375, -0.04001617431640625, -0.0053863525390625, 0.02924346923828125, 0.063873291015625, 0.09850311279296875, 0.1331329345703125, 0.16776275634765625, 0.202392578125, 0.23702239990234375, 0.2716522216796875, 0.30628204345703125, 0.340911865234375, 0.37554168701171875, 0.4101715087890625, 0.44480133056640625, 0.47943115234375, 0.5140609741210938, 0.5486907958984375, 0.5833206176757812, 0.617950439453125, 0.6525802612304688, 0.6872100830078125, 0.7218399047851562, 0.7564697265625, 0.7910995483398438, 0.8257293701171875, 0.8603591918945312, 0.894989013671875, 0.9296188354492188, 0.9642486572265625, 0.9988784790039062, 1.03350830078125, 1.0681381225585938, 1.1027679443359375, 1.1373977661132812, 1.172027587890625, 1.2066574096679688, 1.2412872314453125, 1.2759170532226562, 1.310546875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 7.0, 8.0, 10.0, 12.0, 14.0, 27.0, 31.0, 36.0, 63.0, 70.0, 74.0, 58.0, 98.0, 68.0, 79.0, 74.0, 46.0, 53.0, 43.0, 39.0, 26.0, 25.0, 12.0, 18.0, 5.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.135986328125, -0.13185882568359375, -0.1277313232421875, -0.12360382080078125, -0.119476318359375, -0.11534881591796875, -0.1112213134765625, -0.10709381103515625, -0.10296630859375, -0.09883880615234375, -0.0947113037109375, -0.09058380126953125, -0.086456298828125, -0.08232879638671875, -0.0782012939453125, -0.07407379150390625, -0.0699462890625, -0.06581878662109375, -0.0616912841796875, -0.05756378173828125, -0.053436279296875, -0.04930877685546875, -0.0451812744140625, -0.04105377197265625, -0.03692626953125, -0.03279876708984375, -0.0286712646484375, -0.02454376220703125, -0.020416259765625, -0.01628875732421875, -0.0121612548828125, -0.00803375244140625, -0.00390625, 0.00022125244140625, 0.0043487548828125, 0.00847625732421875, 0.012603759765625, 0.01673126220703125, 0.0208587646484375, 0.02498626708984375, 0.02911376953125, 0.03324127197265625, 0.0373687744140625, 0.04149627685546875, 0.045623779296875, 0.04975128173828125, 0.0538787841796875, 0.05800628662109375, 0.0621337890625, 0.06626129150390625, 0.0703887939453125, 0.07451629638671875, 0.078643798828125, 0.08277130126953125, 0.0868988037109375, 0.09102630615234375, 0.09515380859375, 0.09928131103515625, 0.1034088134765625, 0.10753631591796875, 0.111663818359375, 0.11579132080078125, 0.1199188232421875, 0.12404632568359375, 0.128173828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 10.0, 17.0, 18.0, 25.0, 44.0, 63.0, 150.0, 265.0, 653.0, 1794.0, 6242.0, 36591.0, 2873162.0, 1238624.0, 28697.0, 5267.0, 1592.0, 509.0, 226.0, 132.0, 57.0, 44.0, 18.0, 21.0, 11.0, 13.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.60302734375, -0.5847244262695312, -0.5664215087890625, -0.5481185913085938, -0.529815673828125, -0.5115127563476562, -0.4932098388671875, -0.47490692138671875, -0.45660400390625, -0.43830108642578125, -0.4199981689453125, -0.40169525146484375, -0.383392333984375, -0.36508941650390625, -0.3467864990234375, -0.32848358154296875, -0.3101806640625, -0.29187774658203125, -0.2735748291015625, -0.25527191162109375, -0.236968994140625, -0.21866607666015625, -0.2003631591796875, -0.18206024169921875, -0.16375732421875, -0.14545440673828125, -0.1271514892578125, -0.10884857177734375, -0.090545654296875, -0.07224273681640625, -0.0539398193359375, -0.03563690185546875, -0.017333984375, 0.00096893310546875, 0.0192718505859375, 0.03757476806640625, 0.055877685546875, 0.07418060302734375, 0.0924835205078125, 0.11078643798828125, 0.12908935546875, 0.14739227294921875, 0.1656951904296875, 0.18399810791015625, 0.202301025390625, 0.22060394287109375, 0.2389068603515625, 0.25720977783203125, 0.2755126953125, 0.29381561279296875, 0.3121185302734375, 0.33042144775390625, 0.348724365234375, 0.36702728271484375, 0.3853302001953125, 0.40363311767578125, 0.42193603515625, 0.44023895263671875, 0.4585418701171875, 0.47684478759765625, 0.495147705078125, 0.5134506225585938, 0.5317535400390625, 0.5500564575195312, 0.568359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 6.0, 5.0, 2.0, 9.0, 14.0, 14.0, 18.0, 22.0, 35.0, 68.0, 95.0, 149.0, 401.0, 1052.0, 1288.0, 430.0, 206.0, 97.0, 45.0, 40.0, 20.0, 20.0, 12.0, 4.0, 5.0, 4.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.461669921875, -0.4488868713378906, -0.43610382080078125, -0.4233207702636719, -0.4105377197265625, -0.3977546691894531, -0.38497161865234375, -0.3721885681152344, -0.359405517578125, -0.3466224670410156, -0.33383941650390625, -0.3210563659667969, -0.3082733154296875, -0.2954902648925781, -0.28270721435546875, -0.2699241638183594, -0.25714111328125, -0.24435806274414062, -0.23157501220703125, -0.21879196166992188, -0.2060089111328125, -0.19322586059570312, -0.18044281005859375, -0.16765975952148438, -0.154876708984375, -0.14209365844726562, -0.12931060791015625, -0.11652755737304688, -0.1037445068359375, -0.09096145629882812, -0.07817840576171875, -0.06539535522460938, -0.0526123046875, -0.039829254150390625, -0.02704620361328125, -0.014263153076171875, -0.0014801025390625, 0.011302947998046875, 0.02408599853515625, 0.036869049072265625, 0.049652099609375, 0.062435150146484375, 0.07521820068359375, 0.08800125122070312, 0.1007843017578125, 0.11356735229492188, 0.12635040283203125, 0.13913345336914062, 0.15191650390625, 0.16469955444335938, 0.17748260498046875, 0.19026565551757812, 0.2030487060546875, 0.21583175659179688, 0.22861480712890625, 0.24139785766601562, 0.254180908203125, 0.2669639587402344, 0.27974700927734375, 0.2925300598144531, 0.3053131103515625, 0.3180961608886719, 0.33087921142578125, 0.3436622619628906, 0.3564453125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 19.0, 33.0, 64.0, 142.0, 256.0, 266.0, 123.0, 51.0, 23.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.30051326751709, -6.150554656982422, -6.000596523284912, -5.850637912750244, -5.700679779052734, -5.550721168518066, -5.400762557983398, -5.250804424285889, -5.100845813751221, -4.950887203216553, -4.800929069519043, -4.650970458984375, -4.501012325286865, -4.351053714752197, -4.2010955810546875, -4.0511369705200195, -3.9011785984039307, -3.751220226287842, -3.601261854171753, -3.451303482055664, -3.301344871520996, -3.1513864994049072, -3.0014281272888184, -2.8514695167541504, -2.7015113830566406, -2.5515530109405518, -2.401594638824463, -2.251636028289795, -2.101677656173706, -1.9517192840576172, -1.8017609119415283, -1.65180242061615, -1.5018439292907715, -1.3518855571746826, -1.2019270658493042, -1.0519686937332153, -0.9020102620124817, -0.752051830291748, -0.6020934581756592, -0.45213496685028076, -0.3021765947341919, -0.15221817791461945, -0.002259761095046997, 0.14769864082336426, 0.2976570725440979, 0.44761550426483154, 0.5975738763809204, 0.7475323677062988, 0.8974907398223877, 1.0474491119384766, 1.197407603263855, 1.3473659753799438, 1.4973244667053223, 1.6472828388214111, 1.7972412109375, 1.9471997022628784, 2.0971579551696777, 2.2471163272857666, 2.3970746994018555, 2.5470333099365234, 2.6969916820526123, 2.846950054168701, 2.99690842628479, 3.146866798400879, 3.296825408935547]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 4.0, 7.0, 9.0, 9.0, 19.0, 9.0, 26.0, 20.0, 29.0, 26.0, 26.0, 46.0, 45.0, 46.0, 52.0, 45.0, 55.0, 44.0, 48.0, 46.0, 48.0, 50.0, 52.0, 40.0, 36.0, 27.0, 29.0, 21.0, 18.0, 20.0, 8.0, 12.0, 8.0, 4.0, 5.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2660889625549316, -1.2179960012435913, -1.1699029207229614, -1.121809959411621, -1.0737169981002808, -1.0256239175796509, -0.9775309562683105, -0.9294379353523254, -0.8813449144363403, -0.8332518935203552, -0.7851589322090149, -0.7370659112930298, -0.6889728903770447, -0.6408798694610596, -0.5927869081497192, -0.5446938872337341, -0.4966009259223938, -0.4485079348087311, -0.40041491389274597, -0.35232192277908325, -0.30422890186309814, -0.2561359107494354, -0.2080429196357727, -0.1599498987197876, -0.11185690760612488, -0.06376390159130096, -0.015670903027057648, 0.03242209553718567, 0.08051510155200958, 0.1286081075668335, 0.17670109868049622, 0.22479411959648132, 0.27288711071014404, 0.32098010182380676, 0.36907312273979187, 0.4171661138534546, 0.4652591347694397, 0.5133521556854248, 0.5614451169967651, 0.6095381379127502, 0.6576311588287354, 0.7057241797447205, 0.7538171410560608, 0.8019101619720459, 0.850003182888031, 0.8980962038040161, 0.9461891651153564, 0.9942821860313416, 1.042375087738037, 1.0904680490493774, 1.1385611295700073, 1.1866540908813477, 1.234747052192688, 1.2828401327133179, 1.3309330940246582, 1.379026174545288, 1.4271191358566284, 1.4752120971679688, 1.5233051776885986, 1.571398138999939, 1.6194911003112793, 1.6675841808319092, 1.7156771421432495, 1.7637701034545898, 1.8118631839752197]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 24.0, 33.0, 42.0, 86.0, 155.0, 295.0, 500.0, 1122.0, 2892.0, 8076.0, 26420.0, 109310.0, 425304.0, 357406.0, 84147.0, 21561.0, 6562.0, 2477.0, 1041.0, 527.0, 233.0, 136.0, 81.0, 46.0, 24.0, 19.0, 7.0, 4.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.360595703125, -0.350555419921875, -0.34051513671875, -0.330474853515625, -0.3204345703125, -0.310394287109375, -0.30035400390625, -0.290313720703125, -0.2802734375, -0.270233154296875, -0.26019287109375, -0.250152587890625, -0.2401123046875, -0.230072021484375, -0.22003173828125, -0.209991455078125, -0.199951171875, -0.189910888671875, -0.17987060546875, -0.169830322265625, -0.1597900390625, -0.149749755859375, -0.13970947265625, -0.129669189453125, -0.11962890625, -0.109588623046875, -0.09954833984375, -0.089508056640625, -0.0794677734375, -0.069427490234375, -0.05938720703125, -0.049346923828125, -0.039306640625, -0.029266357421875, -0.01922607421875, -0.009185791015625, 0.0008544921875, 0.010894775390625, 0.02093505859375, 0.030975341796875, 0.041015625, 0.051055908203125, 0.06109619140625, 0.071136474609375, 0.0811767578125, 0.091217041015625, 0.10125732421875, 0.111297607421875, 0.121337890625, 0.131378173828125, 0.14141845703125, 0.151458740234375, 0.1614990234375, 0.171539306640625, 0.18157958984375, 0.191619873046875, 0.20166015625, 0.211700439453125, 0.22174072265625, 0.231781005859375, 0.2418212890625, 0.251861572265625, 0.26190185546875, 0.271942138671875, 0.281982421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 9.0, 11.0, 23.0, 31.0, 28.0, 35.0, 47.0, 58.0, 68.0, 63.0, 62.0, 70.0, 51.0, 74.0, 73.0, 53.0, 59.0, 43.0, 33.0, 18.0, 29.0, 12.0, 16.0, 8.0, 8.0, 3.0, 4.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1427001953125, -0.13846397399902344, -0.13422775268554688, -0.1299915313720703, -0.12575531005859375, -0.12151908874511719, -0.11728286743164062, -0.11304664611816406, -0.1088104248046875, -0.10457420349121094, -0.10033798217773438, -0.09610176086425781, -0.09186553955078125, -0.08762931823730469, -0.08339309692382812, -0.07915687561035156, -0.074920654296875, -0.07068443298339844, -0.06644821166992188, -0.06221199035644531, -0.05797576904296875, -0.05373954772949219, -0.049503326416015625, -0.04526710510253906, -0.0410308837890625, -0.03679466247558594, -0.032558441162109375, -0.028322219848632812, -0.02408599853515625, -0.019849777221679688, -0.015613555908203125, -0.011377334594726562, -0.00714111328125, -0.0029048919677734375, 0.001331329345703125, 0.0055675506591796875, 0.00980377197265625, 0.014039993286132812, 0.018276214599609375, 0.022512435913085938, 0.0267486572265625, 0.030984878540039062, 0.035221099853515625, 0.03945732116699219, 0.04369354248046875, 0.04792976379394531, 0.052165985107421875, 0.05640220642089844, 0.060638427734375, 0.06487464904785156, 0.06911087036132812, 0.07334709167480469, 0.07758331298828125, 0.08181953430175781, 0.08605575561523438, 0.09029197692871094, 0.0945281982421875, 0.09876441955566406, 0.10300064086914062, 0.10723686218261719, 0.11147308349609375, 0.11570930480957031, 0.11994552612304688, 0.12418174743652344, 0.12841796875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 9.0, 21.0, 11.0, 23.0, 42.0, 62.0, 77.0, 108.0, 163.0, 277.0, 454.0, 780.0, 1577.0, 3703.0, 10071.0, 34432.0, 151426.0, 651223.0, 144324.0, 32702.0, 9793.0, 3578.0, 1599.0, 799.0, 447.0, 290.0, 192.0, 117.0, 67.0, 57.0, 31.0, 24.0, 19.0, 10.0, 9.0, 8.0, 2.0, 6.0, 1.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3642578125, -0.3536949157714844, -0.34313201904296875, -0.3325691223144531, -0.3220062255859375, -0.3114433288574219, -0.30088043212890625, -0.2903175354003906, -0.279754638671875, -0.2691917419433594, -0.25862884521484375, -0.24806594848632812, -0.2375030517578125, -0.22694015502929688, -0.21637725830078125, -0.20581436157226562, -0.19525146484375, -0.18468856811523438, -0.17412567138671875, -0.16356277465820312, -0.1529998779296875, -0.14243698120117188, -0.13187408447265625, -0.12131118774414062, -0.110748291015625, -0.10018539428710938, -0.08962249755859375, -0.07905960083007812, -0.0684967041015625, -0.057933807373046875, -0.04737091064453125, -0.036808013916015625, -0.0262451171875, -0.015682220458984375, -0.00511932373046875, 0.005443572998046875, 0.0160064697265625, 0.026569366455078125, 0.03713226318359375, 0.047695159912109375, 0.058258056640625, 0.06882095336914062, 0.07938385009765625, 0.08994674682617188, 0.1005096435546875, 0.11107254028320312, 0.12163543701171875, 0.13219833374023438, 0.14276123046875, 0.15332412719726562, 0.16388702392578125, 0.17444992065429688, 0.1850128173828125, 0.19557571411132812, 0.20613861083984375, 0.21670150756835938, 0.227264404296875, 0.23782730102539062, 0.24839019775390625, 0.2589530944824219, 0.2695159912109375, 0.2800788879394531, 0.29064178466796875, 0.3012046813964844, 0.311767578125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 8.0, 13.0, 10.0, 3.0, 16.0, 21.0, 27.0, 27.0, 35.0, 47.0, 57.0, 65.0, 62.0, 75.0, 82.0, 73.0, 72.0, 56.0, 49.0, 44.0, 40.0, 25.0, 26.0, 16.0, 15.0, 12.0, 6.0, 2.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5625, -0.5445785522460938, -0.5266571044921875, -0.5087356567382812, -0.490814208984375, -0.47289276123046875, -0.4549713134765625, -0.43704986572265625, -0.41912841796875, -0.40120697021484375, -0.3832855224609375, -0.36536407470703125, -0.347442626953125, -0.32952117919921875, -0.3115997314453125, -0.29367828369140625, -0.2757568359375, -0.25783538818359375, -0.2399139404296875, -0.22199249267578125, -0.204071044921875, -0.18614959716796875, -0.1682281494140625, -0.15030670166015625, -0.13238525390625, -0.11446380615234375, -0.0965423583984375, -0.07862091064453125, -0.060699462890625, -0.04277801513671875, -0.0248565673828125, -0.00693511962890625, 0.010986328125, 0.02890777587890625, 0.0468292236328125, 0.06475067138671875, 0.082672119140625, 0.10059356689453125, 0.1185150146484375, 0.13643646240234375, 0.15435791015625, 0.17227935791015625, 0.1902008056640625, 0.20812225341796875, 0.226043701171875, 0.24396514892578125, 0.2618865966796875, 0.27980804443359375, 0.2977294921875, 0.31565093994140625, 0.3335723876953125, 0.35149383544921875, 0.369415283203125, 0.38733673095703125, 0.4052581787109375, 0.42317962646484375, 0.44110107421875, 0.45902252197265625, 0.4769439697265625, 0.49486541748046875, 0.512786865234375, 0.5307083129882812, 0.5486297607421875, 0.5665512084960938, 0.58447265625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 10.0, 2.0, 2.0, 3.0, 10.0, 13.0, 20.0, 25.0, 47.0, 63.0, 85.0, 136.0, 216.0, 391.0, 670.0, 1350.0, 2664.0, 6204.0, 16216.0, 48742.0, 207956.0, 631815.0, 88175.0, 26234.0, 9577.0, 3962.0, 1810.0, 871.0, 477.0, 296.0, 175.0, 122.0, 63.0, 48.0, 29.0, 30.0, 18.0, 12.0, 8.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.114013671875, -0.11011314392089844, -0.10621261596679688, -0.10231208801269531, -0.09841156005859375, -0.09451103210449219, -0.09061050415039062, -0.08670997619628906, -0.0828094482421875, -0.07890892028808594, -0.07500839233398438, -0.07110786437988281, -0.06720733642578125, -0.06330680847167969, -0.059406280517578125, -0.05550575256347656, -0.051605224609375, -0.04770469665527344, -0.043804168701171875, -0.03990364074707031, -0.03600311279296875, -0.03210258483886719, -0.028202056884765625, -0.024301528930664062, -0.0204010009765625, -0.016500473022460938, -0.012599945068359375, -0.008699417114257812, -0.00479888916015625, -0.0008983612060546875, 0.003002166748046875, 0.0069026947021484375, 0.01080322265625, 0.014703750610351562, 0.018604278564453125, 0.022504806518554688, 0.02640533447265625, 0.030305862426757812, 0.034206390380859375, 0.03810691833496094, 0.0420074462890625, 0.04590797424316406, 0.049808502197265625, 0.05370903015136719, 0.05760955810546875, 0.06151008605957031, 0.06541061401367188, 0.06931114196777344, 0.073211669921875, 0.07711219787597656, 0.08101272583007812, 0.08491325378417969, 0.08881378173828125, 0.09271430969238281, 0.09661483764648438, 0.10051536560058594, 0.1044158935546875, 0.10831642150878906, 0.11221694946289062, 0.11611747741699219, 0.12001800537109375, 0.12391853332519531, 0.12781906127929688, 0.13171958923339844, 0.1356201171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 5.0, 3.0, 5.0, 9.0, 8.0, 8.0, 22.0, 16.0, 30.0, 35.0, 65.0, 74.0, 84.0, 130.0, 146.0, 110.0, 61.0, 33.0, 47.0, 23.0, 20.0, 15.0, 20.0, 7.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5239925384521484e-05, -4.3684616684913635e-05, -4.2129307985305786e-05, -4.057399928569794e-05, -3.901869058609009e-05, -3.746338188648224e-05, -3.590807318687439e-05, -3.435276448726654e-05, -3.279745578765869e-05, -3.124214708805084e-05, -2.9686838388442993e-05, -2.8131529688835144e-05, -2.6576220989227295e-05, -2.5020912289619446e-05, -2.3465603590011597e-05, -2.1910294890403748e-05, -2.03549861907959e-05, -1.879967749118805e-05, -1.72443687915802e-05, -1.568906009197235e-05, -1.4133751392364502e-05, -1.2578442692756653e-05, -1.1023133993148804e-05, -9.467825293540955e-06, -7.912516593933105e-06, -6.357207894325256e-06, -4.801899194717407e-06, -3.246590495109558e-06, -1.691281795501709e-06, -1.3597309589385986e-07, 1.4193356037139893e-06, 2.9746443033218384e-06, 4.5299530029296875e-06, 6.085261702537537e-06, 7.640570402145386e-06, 9.195879101753235e-06, 1.0751187801361084e-05, 1.2306496500968933e-05, 1.3861805200576782e-05, 1.541711390018463e-05, 1.697242259979248e-05, 1.852773129940033e-05, 2.008303999900818e-05, 2.1638348698616028e-05, 2.3193657398223877e-05, 2.4748966097831726e-05, 2.6304274797439575e-05, 2.7859583497047424e-05, 2.9414892196655273e-05, 3.097020089626312e-05, 3.252550959587097e-05, 3.408081829547882e-05, 3.563612699508667e-05, 3.719143569469452e-05, 3.874674439430237e-05, 4.030205309391022e-05, 4.1857361793518066e-05, 4.3412670493125916e-05, 4.4967979192733765e-05, 4.6523287892341614e-05, 4.807859659194946e-05, 4.963390529155731e-05, 5.118921399116516e-05, 5.274452269077301e-05, 5.429983139038086e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 5.0, 8.0, 10.0, 10.0, 8.0, 17.0, 17.0, 33.0, 55.0, 70.0, 107.0, 152.0, 238.0, 379.0, 629.0, 1054.0, 1975.0, 3905.0, 8366.0, 20293.0, 59538.0, 259834.0, 566791.0, 78895.0, 25862.0, 10285.0, 4619.0, 2270.0, 1278.0, 680.0, 392.0, 264.0, 154.0, 124.0, 64.0, 54.0, 35.0, 20.0, 24.0, 17.0, 7.0, 5.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.12164306640625, -0.11773395538330078, -0.11382484436035156, -0.10991573333740234, -0.10600662231445312, -0.1020975112915039, -0.09818840026855469, -0.09427928924560547, -0.09037017822265625, -0.08646106719970703, -0.08255195617675781, -0.0786428451538086, -0.07473373413085938, -0.07082462310791016, -0.06691551208496094, -0.06300640106201172, -0.0590972900390625, -0.05518817901611328, -0.05127906799316406, -0.047369956970214844, -0.043460845947265625, -0.039551734924316406, -0.03564262390136719, -0.03173351287841797, -0.02782440185546875, -0.02391529083251953, -0.020006179809570312, -0.016097068786621094, -0.012187957763671875, -0.008278846740722656, -0.0043697357177734375, -0.00046062469482421875, 0.003448486328125, 0.007357597351074219, 0.011266708374023438, 0.015175819396972656, 0.019084930419921875, 0.022994041442871094, 0.026903152465820312, 0.03081226348876953, 0.03472137451171875, 0.03863048553466797, 0.04253959655761719, 0.046448707580566406, 0.050357818603515625, 0.054266929626464844, 0.05817604064941406, 0.06208515167236328, 0.0659942626953125, 0.06990337371826172, 0.07381248474121094, 0.07772159576416016, 0.08163070678710938, 0.0855398178100586, 0.08944892883300781, 0.09335803985595703, 0.09726715087890625, 0.10117626190185547, 0.10508537292480469, 0.1089944839477539, 0.11290359497070312, 0.11681270599365234, 0.12072181701660156, 0.12463092803955078, 0.1285400390625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 8.0, 7.0, 8.0, 14.0, 8.0, 22.0, 20.0, 27.0, 46.0, 56.0, 97.0, 117.0, 190.0, 107.0, 79.0, 56.0, 29.0, 30.0, 14.0, 14.0, 12.0, 12.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.231201171875, -0.22546768188476562, -0.21973419189453125, -0.21400070190429688, -0.2082672119140625, -0.20253372192382812, -0.19680023193359375, -0.19106674194335938, -0.185333251953125, -0.17959976196289062, -0.17386627197265625, -0.16813278198242188, -0.1623992919921875, -0.15666580200195312, -0.15093231201171875, -0.14519882202148438, -0.13946533203125, -0.13373184204101562, -0.12799835205078125, -0.12226486206054688, -0.1165313720703125, -0.11079788208007812, -0.10506439208984375, -0.09933090209960938, -0.093597412109375, -0.08786392211914062, -0.08213043212890625, -0.07639694213867188, -0.0706634521484375, -0.06492996215820312, -0.05919647216796875, -0.053462982177734375, -0.0477294921875, -0.041996002197265625, -0.03626251220703125, -0.030529022216796875, -0.0247955322265625, -0.019062042236328125, -0.01332855224609375, -0.007595062255859375, -0.001861572265625, 0.003871917724609375, 0.00960540771484375, 0.015338897705078125, 0.0210723876953125, 0.026805877685546875, 0.03253936767578125, 0.038272857666015625, 0.04400634765625, 0.049739837646484375, 0.05547332763671875, 0.061206817626953125, 0.0669403076171875, 0.07267379760742188, 0.07840728759765625, 0.08414077758789062, 0.089874267578125, 0.09560775756835938, 0.10134124755859375, 0.10707473754882812, 0.1128082275390625, 0.11854171752929688, 0.12427520751953125, 0.13000869750976562, 0.1357421875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 6.0, 13.0, 8.0, 29.0, 38.0, 77.0, 137.0, 218.0, 177.0, 127.0, 62.0, 38.0, 27.0, 21.0, 6.0, 3.0, 2.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8909107446670532, -1.7903063297271729, -1.6897019147872925, -1.589097499847412, -1.4884930849075317, -1.3878886699676514, -1.2872843742370605, -1.1866798400878906, -1.0860755443572998, -0.9854711294174194, -0.8848667144775391, -0.7842622995376587, -0.6836578845977783, -0.5830535292625427, -0.48244911432266235, -0.381844699382782, -0.28124022483825684, -0.18063580989837646, -0.08003140985965729, 0.02057299017906189, 0.12117740511894226, 0.22178179025650024, 0.3223862051963806, 0.422990620136261, 0.5235950350761414, 0.6241994500160217, 0.7248038649559021, 0.8254082202911377, 0.9260126352310181, 1.0266170501708984, 1.1272214651107788, 1.2278258800506592, 1.328430414199829, 1.4290348291397095, 1.5296392440795898, 1.6302436590194702, 1.7308480739593506, 1.8314523696899414, 1.9320569038391113, 2.032661199569702, 2.133265733718872, 2.233870029449463, 2.334474563598633, 2.4350788593292236, 2.5356833934783936, 2.6362876892089844, 2.7368922233581543, 2.837496519088745, 2.938100814819336, 3.0387051105499268, 3.1393096446990967, 3.2399139404296875, 3.3405184745788574, 3.4411227703094482, 3.541727304458618, 3.642331600189209, 3.742936134338379, 3.8435404300689697, 3.9441449642181396, 4.0447492599487305, 4.1453537940979, 4.24595832824707, 4.346562385559082, 4.447166919708252, 4.547771453857422]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 3.0, 2.0, 7.0, 8.0, 6.0, 3.0, 6.0, 12.0, 14.0, 13.0, 20.0, 14.0, 30.0, 17.0, 31.0, 26.0, 34.0, 40.0, 40.0, 55.0, 64.0, 72.0, 71.0, 47.0, 47.0, 33.0, 23.0, 25.0, 32.0, 20.0, 19.0, 30.0, 20.0, 20.0, 14.0, 13.0, 13.0, 8.0, 9.0, 9.0, 7.0, 8.0, 7.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.7454392910003662, -1.6966986656188965, -1.6479579210281372, -1.5992172956466675, -1.5504765510559082, -1.5017359256744385, -1.4529953002929688, -1.4042545557022095, -1.3555139303207397, -1.30677330493927, -1.2580325603485107, -1.209291934967041, -1.1605511903762817, -1.111810564994812, -1.0630698204040527, -1.014329195022583, -0.9655885100364685, -0.916847825050354, -0.8681071400642395, -0.819366455078125, -0.7706258296966553, -0.7218851447105408, -0.6731444597244263, -0.6244038343429565, -0.5756630897521973, -0.5269224047660828, -0.47818174958229065, -0.42944106459617615, -0.38070040941238403, -0.33195972442626953, -0.28321903944015503, -0.23447838425636292, -0.1857377290725708, -0.1369970589876175, -0.08825638145208359, -0.03951570391654968, 0.009224966168403625, 0.057965636253356934, 0.10670632123947144, 0.15544697642326355, 0.20418766140937805, 0.25292834639549255, 0.30166900157928467, 0.35040968656539917, 0.39915037155151367, 0.4478910267353058, 0.4966317117214203, 0.5453723669052124, 0.5941130518913269, 0.6428537368774414, 0.6915944218635559, 0.7403351068496704, 0.7890757322311401, 0.8378164172172546, 0.8865571022033691, 0.9352977275848389, 0.9840384721755981, 1.0327790975570679, 1.0815198421478271, 1.1302604675292969, 1.1790012121200562, 1.2277418375015259, 1.2764825820922852, 1.3252232074737549, 1.3739638328552246]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 13.0, 13.0, 22.0, 38.0, 61.0, 108.0, 177.0, 310.0, 628.0, 1551.0, 4382.0, 16977.0, 129775.0, 3754935.0, 252899.0, 23202.0, 5719.0, 1835.0, 763.0, 363.0, 195.0, 110.0, 62.0, 46.0, 27.0, 22.0, 13.0, 10.0, 9.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.351806640625, -0.3385810852050781, -0.32535552978515625, -0.3121299743652344, -0.2989044189453125, -0.2856788635253906, -0.27245330810546875, -0.2592277526855469, -0.246002197265625, -0.23277664184570312, -0.21955108642578125, -0.20632553100585938, -0.1930999755859375, -0.17987442016601562, -0.16664886474609375, -0.15342330932617188, -0.14019775390625, -0.12697219848632812, -0.11374664306640625, -0.10052108764648438, -0.0872955322265625, -0.07406997680664062, -0.06084442138671875, -0.047618865966796875, -0.034393310546875, -0.021167755126953125, -0.00794219970703125, 0.005283355712890625, 0.0185089111328125, 0.031734466552734375, 0.04496002197265625, 0.058185577392578125, 0.0714111328125, 0.08463668823242188, 0.09786224365234375, 0.11108779907226562, 0.1243133544921875, 0.13753890991210938, 0.15076446533203125, 0.16399002075195312, 0.177215576171875, 0.19044113159179688, 0.20366668701171875, 0.21689224243164062, 0.2301177978515625, 0.24334335327148438, 0.25656890869140625, 0.2697944641113281, 0.28302001953125, 0.2962455749511719, 0.30947113037109375, 0.3226966857910156, 0.3359222412109375, 0.3491477966308594, 0.36237335205078125, 0.3755989074707031, 0.388824462890625, 0.4020500183105469, 0.41527557373046875, 0.4285011291503906, 0.4417266845703125, 0.4549522399902344, 0.46817779541015625, 0.4814033508300781, 0.49462890625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 6.0, 4.0, 2.0, 6.0, 13.0, 13.0, 22.0, 25.0, 33.0, 37.0, 51.0, 67.0, 65.0, 64.0, 68.0, 60.0, 71.0, 77.0, 61.0, 52.0, 65.0, 36.0, 31.0, 21.0, 20.0, 9.0, 7.0, 11.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1429443359375, -0.1386566162109375, -0.134368896484375, -0.1300811767578125, -0.12579345703125, -0.1215057373046875, -0.117218017578125, -0.1129302978515625, -0.108642578125, -0.1043548583984375, -0.100067138671875, -0.0957794189453125, -0.09149169921875, -0.0872039794921875, -0.082916259765625, -0.0786285400390625, -0.0743408203125, -0.0700531005859375, -0.065765380859375, -0.0614776611328125, -0.05718994140625, -0.0529022216796875, -0.048614501953125, -0.0443267822265625, -0.0400390625, -0.0357513427734375, -0.031463623046875, -0.0271759033203125, -0.02288818359375, -0.0186004638671875, -0.014312744140625, -0.0100250244140625, -0.0057373046875, -0.0014495849609375, 0.002838134765625, 0.0071258544921875, 0.01141357421875, 0.0157012939453125, 0.019989013671875, 0.0242767333984375, 0.028564453125, 0.0328521728515625, 0.037139892578125, 0.0414276123046875, 0.04571533203125, 0.0500030517578125, 0.054290771484375, 0.0585784912109375, 0.0628662109375, 0.0671539306640625, 0.071441650390625, 0.0757293701171875, 0.08001708984375, 0.0843048095703125, 0.088592529296875, 0.0928802490234375, 0.09716796875, 0.1014556884765625, 0.105743408203125, 0.1100311279296875, 0.11431884765625, 0.1186065673828125, 0.122894287109375, 0.1271820068359375, 0.1314697265625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 11.0, 12.0, 11.0, 21.0, 34.0, 51.0, 79.0, 178.0, 416.0, 1043.0, 3638.0, 17990.0, 295150.0, 3799945.0, 64187.0, 8076.0, 2098.0, 719.0, 288.0, 139.0, 72.0, 42.0, 17.0, 19.0, 8.0, 8.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6181640625, -0.597747802734375, -0.57733154296875, -0.556915283203125, -0.5364990234375, -0.516082763671875, -0.49566650390625, -0.475250244140625, -0.454833984375, -0.434417724609375, -0.41400146484375, -0.393585205078125, -0.3731689453125, -0.352752685546875, -0.33233642578125, -0.311920166015625, -0.29150390625, -0.271087646484375, -0.25067138671875, -0.230255126953125, -0.2098388671875, -0.189422607421875, -0.16900634765625, -0.148590087890625, -0.128173828125, -0.107757568359375, -0.08734130859375, -0.066925048828125, -0.0465087890625, -0.026092529296875, -0.00567626953125, 0.014739990234375, 0.03515625, 0.055572509765625, 0.07598876953125, 0.096405029296875, 0.1168212890625, 0.137237548828125, 0.15765380859375, 0.178070068359375, 0.198486328125, 0.218902587890625, 0.23931884765625, 0.259735107421875, 0.2801513671875, 0.300567626953125, 0.32098388671875, 0.341400146484375, 0.36181640625, 0.382232666015625, 0.40264892578125, 0.423065185546875, 0.4434814453125, 0.463897705078125, 0.48431396484375, 0.504730224609375, 0.525146484375, 0.545562744140625, 0.56597900390625, 0.586395263671875, 0.6068115234375, 0.627227783203125, 0.64764404296875, 0.668060302734375, 0.6884765625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 3.0, 2.0, 6.0, 1.0, 9.0, 8.0, 17.0, 24.0, 33.0, 34.0, 73.0, 89.0, 182.0, 408.0, 1162.0, 1114.0, 432.0, 198.0, 101.0, 42.0, 37.0, 28.0, 26.0, 9.0, 8.0, 7.0, 12.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.424072265625, -0.4094505310058594, -0.39482879638671875, -0.3802070617675781, -0.3655853271484375, -0.3509635925292969, -0.33634185791015625, -0.3217201232910156, -0.307098388671875, -0.2924766540527344, -0.27785491943359375, -0.2632331848144531, -0.2486114501953125, -0.23398971557617188, -0.21936798095703125, -0.20474624633789062, -0.19012451171875, -0.17550277709960938, -0.16088104248046875, -0.14625930786132812, -0.1316375732421875, -0.11701583862304688, -0.10239410400390625, -0.08777236938476562, -0.073150634765625, -0.058528900146484375, -0.04390716552734375, -0.029285430908203125, -0.0146636962890625, -4.1961669921875e-05, 0.01457977294921875, 0.029201507568359375, 0.0438232421875, 0.058444976806640625, 0.07306671142578125, 0.08768844604492188, 0.1023101806640625, 0.11693191528320312, 0.13155364990234375, 0.14617538452148438, 0.160797119140625, 0.17541885375976562, 0.19004058837890625, 0.20466232299804688, 0.2192840576171875, 0.23390579223632812, 0.24852752685546875, 0.2631492614746094, 0.27777099609375, 0.2923927307128906, 0.30701446533203125, 0.3216361999511719, 0.3362579345703125, 0.3508796691894531, 0.36550140380859375, 0.3801231384277344, 0.394744873046875, 0.4093666076660156, 0.42398834228515625, 0.4386100769042969, 0.4532318115234375, 0.4678535461425781, 0.48247528076171875, 0.4970970153808594, 0.51171875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 6.0, 7.0, 8.0, 18.0, 44.0, 73.0, 143.0, 235.0, 207.0, 130.0, 74.0, 27.0, 11.0, 7.0, 6.0, 7.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.619357585906982, -6.483953952789307, -6.348550796508789, -6.213147163391113, -6.0777435302734375, -5.94234037399292, -5.806936740875244, -5.671533107757568, -5.536129951477051, -5.400726318359375, -5.265323162078857, -5.129919528961182, -4.994515895843506, -4.859112739562988, -4.7237091064453125, -4.588305473327637, -4.452901840209961, -4.317498207092285, -4.182095050811768, -4.046691417694092, -3.911288022994995, -3.7758846282958984, -3.6404809951782227, -3.505077600479126, -3.3696742057800293, -3.2342708110809326, -3.098867177963257, -2.96346378326416, -2.8280603885650635, -2.692656993865967, -2.557253360748291, -2.4218499660491943, -2.2864463329315186, -2.151042938232422, -2.015639305114746, -1.8802359104156494, -1.7448325157165527, -1.6094290018081665, -1.4740254878997803, -1.3386220932006836, -1.2032185792922974, -1.0678150653839111, -0.9324116706848145, -0.7970081567764282, -0.6616047024726868, -0.5262012481689453, -0.3907977342605591, -0.2553942799568176, -0.11999082565307617, 0.015412643551826477, 0.15081611275672913, 0.28621959686279297, 0.4216230511665344, 0.5570265054702759, 0.6924300193786621, 0.8278334736824036, 0.963236927986145, 1.0986404418945312, 1.234043836593628, 1.3694473505020142, 1.5048508644104004, 1.640254259109497, 1.7756577730178833, 1.9110612869262695, 2.046464681625366]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 14.0, 14.0, 8.0, 11.0, 22.0, 18.0, 28.0, 21.0, 23.0, 35.0, 43.0, 42.0, 51.0, 58.0, 59.0, 48.0, 52.0, 45.0, 53.0, 43.0, 36.0, 36.0, 40.0, 27.0, 25.0, 26.0, 24.0, 14.0, 17.0, 10.0, 14.0, 11.0, 10.0, 3.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.8770756721496582, -1.8248622417449951, -1.7726486921310425, -1.7204352617263794, -1.6682217121124268, -1.6160082817077637, -1.5637948513031006, -1.5115814208984375, -1.4593678712844849, -1.4071544408798218, -1.3549408912658691, -1.302727460861206, -1.250514030456543, -1.1983004808425903, -1.1460870504379272, -1.0938735008239746, -1.0416600704193115, -0.9894465804100037, -0.9372330904006958, -0.8850196599960327, -0.8328061699867249, -0.780592679977417, -0.7283792495727539, -0.676165759563446, -0.6239522695541382, -0.5717387795448303, -0.5195252895355225, -0.4673118591308594, -0.4150983691215515, -0.36288487911224365, -0.3106714189052582, -0.2584579586982727, -0.20624446868896484, -0.15403099358081818, -0.10181751847267151, -0.04960404336452484, 0.002609431743621826, 0.05482292175292969, 0.10703638195991516, 0.15924984216690063, 0.2114633321762085, 0.26367682218551636, 0.31589028239250183, 0.3681037425994873, 0.42031723260879517, 0.472530722618103, 0.5247441530227661, 0.576957643032074, 0.6291711330413818, 0.6813846230506897, 0.7335981130599976, 0.7858115434646606, 0.8380250334739685, 0.8902385234832764, 0.9424519538879395, 0.9946654438972473, 1.0468789339065552, 1.0990923643112183, 1.151305913925171, 1.203519344329834, 1.255732774734497, 1.3079463243484497, 1.3601597547531128, 1.4123733043670654, 1.4645867347717285]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 5.0, 6.0, 19.0, 42.0, 34.0, 57.0, 101.0, 164.0, 279.0, 518.0, 1051.0, 2106.0, 4512.0, 10808.0, 28629.0, 86034.0, 278871.0, 408688.0, 149433.0, 47516.0, 16696.0, 6870.0, 3066.0, 1434.0, 681.0, 362.0, 238.0, 119.0, 89.0, 38.0, 34.0, 14.0, 13.0, 9.0, 7.0, 3.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.254638671875, -0.24528884887695312, -0.23593902587890625, -0.22658920288085938, -0.2172393798828125, -0.20788955688476562, -0.19853973388671875, -0.18918991088867188, -0.179840087890625, -0.17049026489257812, -0.16114044189453125, -0.15179061889648438, -0.1424407958984375, -0.13309097290039062, -0.12374114990234375, -0.11439132690429688, -0.10504150390625, -0.09569168090820312, -0.08634185791015625, -0.07699203491210938, -0.0676422119140625, -0.058292388916015625, -0.04894256591796875, -0.039592742919921875, -0.030242919921875, -0.020893096923828125, -0.01154327392578125, -0.002193450927734375, 0.0071563720703125, 0.016506195068359375, 0.02585601806640625, 0.035205841064453125, 0.0445556640625, 0.053905487060546875, 0.06325531005859375, 0.07260513305664062, 0.0819549560546875, 0.09130477905273438, 0.10065460205078125, 0.11000442504882812, 0.119354248046875, 0.12870407104492188, 0.13805389404296875, 0.14740371704101562, 0.1567535400390625, 0.16610336303710938, 0.17545318603515625, 0.18480300903320312, 0.19415283203125, 0.20350265502929688, 0.21285247802734375, 0.22220230102539062, 0.2315521240234375, 0.24090194702148438, 0.25025177001953125, 0.2596015930175781, 0.268951416015625, 0.2783012390136719, 0.28765106201171875, 0.2970008850097656, 0.3063507080078125, 0.3157005310058594, 0.32505035400390625, 0.3344001770019531, 0.34375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 7.0, 6.0, 11.0, 19.0, 22.0, 27.0, 30.0, 45.0, 48.0, 57.0, 70.0, 71.0, 65.0, 71.0, 69.0, 65.0, 49.0, 53.0, 48.0, 40.0, 34.0, 24.0, 30.0, 15.0, 9.0, 8.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1832275390625, -0.1783123016357422, -0.17339706420898438, -0.16848182678222656, -0.16356658935546875, -0.15865135192871094, -0.15373611450195312, -0.1488208770751953, -0.1439056396484375, -0.1389904022216797, -0.13407516479492188, -0.12915992736816406, -0.12424468994140625, -0.11932945251464844, -0.11441421508789062, -0.10949897766113281, -0.104583740234375, -0.09966850280761719, -0.09475326538085938, -0.08983802795410156, -0.08492279052734375, -0.08000755310058594, -0.07509231567382812, -0.07017707824707031, -0.0652618408203125, -0.06034660339355469, -0.055431365966796875, -0.05051612854003906, -0.04560089111328125, -0.04068565368652344, -0.035770416259765625, -0.030855178833007812, -0.02593994140625, -0.021024703979492188, -0.016109466552734375, -0.011194229125976562, -0.00627899169921875, -0.0013637542724609375, 0.003551483154296875, 0.008466720581054688, 0.0133819580078125, 0.018297195434570312, 0.023212432861328125, 0.028127670288085938, 0.03304290771484375, 0.03795814514160156, 0.042873382568359375, 0.04778861999511719, 0.052703857421875, 0.05761909484863281, 0.06253433227539062, 0.06744956970214844, 0.07236480712890625, 0.07728004455566406, 0.08219528198242188, 0.08711051940917969, 0.0920257568359375, 0.09694099426269531, 0.10185623168945312, 0.10677146911621094, 0.11168670654296875, 0.11660194396972656, 0.12151718139648438, 0.1264324188232422, 0.13134765625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 10.0, 10.0, 14.0, 19.0, 25.0, 35.0, 37.0, 56.0, 93.0, 127.0, 218.0, 314.0, 584.0, 1048.0, 2094.0, 4697.0, 14074.0, 58791.0, 597610.0, 300985.0, 47324.0, 11991.0, 4221.0, 1788.0, 939.0, 530.0, 322.0, 203.0, 121.0, 73.0, 61.0, 40.0, 24.0, 26.0, 9.0, 9.0, 13.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.483642578125, -0.4705467224121094, -0.45745086669921875, -0.4443550109863281, -0.4312591552734375, -0.4181632995605469, -0.40506744384765625, -0.3919715881347656, -0.378875732421875, -0.3657798767089844, -0.35268402099609375, -0.3395881652832031, -0.3264923095703125, -0.3133964538574219, -0.30030059814453125, -0.2872047424316406, -0.27410888671875, -0.2610130310058594, -0.24791717529296875, -0.23482131958007812, -0.2217254638671875, -0.20862960815429688, -0.19553375244140625, -0.18243789672851562, -0.169342041015625, -0.15624618530273438, -0.14315032958984375, -0.13005447387695312, -0.1169586181640625, -0.10386276245117188, -0.09076690673828125, -0.07767105102539062, -0.0645751953125, -0.051479339599609375, -0.03838348388671875, -0.025287628173828125, -0.0121917724609375, 0.000904083251953125, 0.01399993896484375, 0.027095794677734375, 0.040191650390625, 0.053287506103515625, 0.06638336181640625, 0.07947921752929688, 0.0925750732421875, 0.10567092895507812, 0.11876678466796875, 0.13186264038085938, 0.14495849609375, 0.15805435180664062, 0.17115020751953125, 0.18424606323242188, 0.1973419189453125, 0.21043777465820312, 0.22353363037109375, 0.23662948608398438, 0.249725341796875, 0.2628211975097656, 0.27591705322265625, 0.2890129089355469, 0.3021087646484375, 0.3152046203613281, 0.32830047607421875, 0.3413963317871094, 0.3544921875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 2.0, 7.0, 14.0, 13.0, 13.0, 19.0, 23.0, 33.0, 35.0, 34.0, 55.0, 61.0, 66.0, 82.0, 85.0, 73.0, 78.0, 54.0, 54.0, 44.0, 25.0, 34.0, 23.0, 9.0, 10.0, 7.0, 4.0, 6.0, 6.0, 7.0, 4.0, 2.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.72998046875, -0.7104415893554688, -0.6909027099609375, -0.6713638305664062, -0.651824951171875, -0.6322860717773438, -0.6127471923828125, -0.5932083129882812, -0.57366943359375, -0.5541305541992188, -0.5345916748046875, -0.5150527954101562, -0.495513916015625, -0.47597503662109375, -0.4564361572265625, -0.43689727783203125, -0.4173583984375, -0.39781951904296875, -0.3782806396484375, -0.35874176025390625, -0.339202880859375, -0.31966400146484375, -0.3001251220703125, -0.28058624267578125, -0.26104736328125, -0.24150848388671875, -0.2219696044921875, -0.20243072509765625, -0.182891845703125, -0.16335296630859375, -0.1438140869140625, -0.12427520751953125, -0.104736328125, -0.08519744873046875, -0.0656585693359375, -0.04611968994140625, -0.026580810546875, -0.00704193115234375, 0.0124969482421875, 0.03203582763671875, 0.05157470703125, 0.07111358642578125, 0.0906524658203125, 0.11019134521484375, 0.129730224609375, 0.14926910400390625, 0.1688079833984375, 0.18834686279296875, 0.2078857421875, 0.22742462158203125, 0.2469635009765625, 0.26650238037109375, 0.286041259765625, 0.30558013916015625, 0.3251190185546875, 0.34465789794921875, 0.36419677734375, 0.38373565673828125, 0.4032745361328125, 0.42281341552734375, 0.442352294921875, 0.46189117431640625, 0.4814300537109375, 0.5009689331054688, 0.5205078125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 3.0, 11.0, 8.0, 9.0, 15.0, 20.0, 33.0, 61.0, 75.0, 121.0, 204.0, 389.0, 955.0, 2742.0, 8920.0, 44488.0, 768922.0, 190086.0, 22854.0, 5514.0, 1692.0, 652.0, 311.0, 158.0, 86.0, 57.0, 43.0, 32.0, 34.0, 22.0, 9.0, 5.0, 5.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.253173828125, -0.24568557739257812, -0.23819732666015625, -0.23070907592773438, -0.2232208251953125, -0.21573257446289062, -0.20824432373046875, -0.20075607299804688, -0.193267822265625, -0.18577957153320312, -0.17829132080078125, -0.17080307006835938, -0.1633148193359375, -0.15582656860351562, -0.14833831787109375, -0.14085006713867188, -0.13336181640625, -0.12587356567382812, -0.11838531494140625, -0.11089706420898438, -0.1034088134765625, -0.09592056274414062, -0.08843231201171875, -0.08094406127929688, -0.073455810546875, -0.06596755981445312, -0.05847930908203125, -0.050991058349609375, -0.0435028076171875, -0.036014556884765625, -0.02852630615234375, -0.021038055419921875, -0.0135498046875, -0.006061553955078125, 0.00142669677734375, 0.008914947509765625, 0.0164031982421875, 0.023891448974609375, 0.03137969970703125, 0.038867950439453125, 0.046356201171875, 0.053844451904296875, 0.06133270263671875, 0.06882095336914062, 0.0763092041015625, 0.08379745483398438, 0.09128570556640625, 0.09877395629882812, 0.10626220703125, 0.11375045776367188, 0.12123870849609375, 0.12872695922851562, 0.1362152099609375, 0.14370346069335938, 0.15119171142578125, 0.15867996215820312, 0.166168212890625, 0.17365646362304688, 0.18114471435546875, 0.18863296508789062, 0.1961212158203125, 0.20360946655273438, 0.21109771728515625, 0.21858596801757812, 0.22607421875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 5.0, 6.0, 14.0, 11.0, 18.0, 18.0, 15.0, 43.0, 39.0, 59.0, 77.0, 124.0, 123.0, 109.0, 73.0, 64.0, 45.0, 31.0, 20.0, 20.0, 15.0, 11.0, 9.0, 8.0, 5.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8770179748535156e-05, -5.7009048759937286e-05, -5.5247917771339417e-05, -5.348678678274155e-05, -5.172565579414368e-05, -4.996452480554581e-05, -4.820339381694794e-05, -4.644226282835007e-05, -4.46811318397522e-05, -4.292000085115433e-05, -4.115886986255646e-05, -3.939773887395859e-05, -3.763660788536072e-05, -3.587547689676285e-05, -3.411434590816498e-05, -3.235321491956711e-05, -3.059208393096924e-05, -2.883095294237137e-05, -2.70698219537735e-05, -2.530869096517563e-05, -2.354755997657776e-05, -2.178642898797989e-05, -2.002529799938202e-05, -1.826416701078415e-05, -1.650303602218628e-05, -1.474190503358841e-05, -1.298077404499054e-05, -1.121964305639267e-05, -9.4585120677948e-06, -7.69738107919693e-06, -5.93625009059906e-06, -4.17511910200119e-06, -2.4139881134033203e-06, -6.528571248054504e-07, 1.1082738637924194e-06, 2.8694048523902893e-06, 4.630535840988159e-06, 6.391666829586029e-06, 8.152797818183899e-06, 9.913928806781769e-06, 1.1675059795379639e-05, 1.3436190783977509e-05, 1.5197321772575378e-05, 1.6958452761173248e-05, 1.8719583749771118e-05, 2.0480714738368988e-05, 2.2241845726966858e-05, 2.4002976715564728e-05, 2.5764107704162598e-05, 2.7525238692760468e-05, 2.9286369681358337e-05, 3.104750066995621e-05, 3.280863165855408e-05, 3.456976264715195e-05, 3.633089363574982e-05, 3.809202462434769e-05, 3.985315561294556e-05, 4.1614286601543427e-05, 4.3375417590141296e-05, 4.5136548578739166e-05, 4.6897679567337036e-05, 4.8658810555934906e-05, 5.0419941544532776e-05, 5.2181072533130646e-05, 5.3942203521728516e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 3.0, 7.0, 10.0, 7.0, 21.0, 28.0, 30.0, 49.0, 71.0, 130.0, 183.0, 315.0, 507.0, 903.0, 1731.0, 3951.0, 10032.0, 33946.0, 358694.0, 582779.0, 36477.0, 10381.0, 4092.0, 1949.0, 973.0, 486.0, 293.0, 176.0, 118.0, 53.0, 50.0, 32.0, 21.0, 16.0, 13.0, 8.0, 5.0, 8.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.28271484375, -0.27486610412597656, -0.2670173645019531, -0.2591686248779297, -0.25131988525390625, -0.2434711456298828, -0.23562240600585938, -0.22777366638183594, -0.2199249267578125, -0.21207618713378906, -0.20422744750976562, -0.1963787078857422, -0.18852996826171875, -0.1806812286376953, -0.17283248901367188, -0.16498374938964844, -0.157135009765625, -0.14928627014160156, -0.14143753051757812, -0.1335887908935547, -0.12574005126953125, -0.11789131164550781, -0.11004257202148438, -0.10219383239746094, -0.0943450927734375, -0.08649635314941406, -0.07864761352539062, -0.07079887390136719, -0.06295013427734375, -0.05510139465332031, -0.047252655029296875, -0.03940391540527344, -0.03155517578125, -0.023706436157226562, -0.015857696533203125, -0.008008956909179688, -0.00016021728515625, 0.0076885223388671875, 0.015537261962890625, 0.023386001586914062, 0.0312347412109375, 0.03908348083496094, 0.046932220458984375, 0.05478096008300781, 0.06262969970703125, 0.07047843933105469, 0.07832717895507812, 0.08617591857910156, 0.094024658203125, 0.10187339782714844, 0.10972213745117188, 0.11757087707519531, 0.12541961669921875, 0.1332683563232422, 0.14111709594726562, 0.14896583557128906, 0.1568145751953125, 0.16466331481933594, 0.17251205444335938, 0.1803607940673828, 0.18820953369140625, 0.1960582733154297, 0.20390701293945312, 0.21175575256347656, 0.2196044921875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 2.0, 7.0, 7.0, 5.0, 8.0, 8.0, 12.0, 20.0, 35.0, 37.0, 40.0, 71.0, 109.0, 134.0, 124.0, 107.0, 86.0, 45.0, 48.0, 24.0, 15.0, 14.0, 13.0, 10.0, 3.0, 7.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.27001953125, -0.2618598937988281, -0.25370025634765625, -0.24554061889648438, -0.2373809814453125, -0.22922134399414062, -0.22106170654296875, -0.21290206909179688, -0.204742431640625, -0.19658279418945312, -0.18842315673828125, -0.18026351928710938, -0.1721038818359375, -0.16394424438476562, -0.15578460693359375, -0.14762496948242188, -0.13946533203125, -0.13130569458007812, -0.12314605712890625, -0.11498641967773438, -0.1068267822265625, -0.09866714477539062, -0.09050750732421875, -0.08234786987304688, -0.074188232421875, -0.06602859497070312, -0.05786895751953125, -0.049709320068359375, -0.0415496826171875, -0.033390045166015625, -0.02523040771484375, -0.017070770263671875, -0.0089111328125, -0.000751495361328125, 0.00740814208984375, 0.015567779541015625, 0.0237274169921875, 0.031887054443359375, 0.04004669189453125, 0.048206329345703125, 0.056365966796875, 0.06452560424804688, 0.07268524169921875, 0.08084487915039062, 0.0890045166015625, 0.09716415405273438, 0.10532379150390625, 0.11348342895507812, 0.12164306640625, 0.12980270385742188, 0.13796234130859375, 0.14612197875976562, 0.1542816162109375, 0.16244125366210938, 0.17060089111328125, 0.17876052856445312, 0.186920166015625, 0.19507980346679688, 0.20323944091796875, 0.21139907836914062, 0.2195587158203125, 0.22771835327148438, 0.23587799072265625, 0.24403762817382812, 0.252197265625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 15.0, 31.0, 42.0, 107.0, 196.0, 309.0, 140.0, 67.0, 38.0, 21.0, 7.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.654610633850098, -5.490706443786621, -5.326802730560303, -5.162898540496826, -4.998994827270508, -4.835090637207031, -4.671186447143555, -4.507282257080078, -4.34337854385376, -4.179474353790283, -4.015570640563965, -3.8516664505004883, -3.687762498855591, -3.5238585472106934, -3.359954357147217, -3.1960504055023193, -3.032146453857422, -2.8682425022125244, -2.704338550567627, -2.5404343605041504, -2.376530408859253, -2.2126264572143555, -2.048722267150879, -1.8848183155059814, -1.720914363861084, -1.5570104122161865, -1.3931063413619995, -1.2292022705078125, -1.065298318862915, -0.9013943076133728, -0.7374902963638306, -0.5735862255096436, -0.4096822738647461, -0.24577826261520386, -0.08187425136566162, 0.08202975988388062, 0.24593377113342285, 0.4098377823829651, 0.5737417936325073, 0.7376458644866943, 0.9015498161315918, 1.0654537677764893, 1.2293578386306763, 1.3932619094848633, 1.5571658611297607, 1.7210698127746582, 1.8849738836288452, 2.0488779544830322, 2.2127819061279297, 2.376685857772827, 2.5405898094177246, 2.704493999481201, 2.8683979511260986, 3.032301902770996, 3.1962060928344727, 3.36011004447937, 3.5240139961242676, 3.687917947769165, 3.8518218994140625, 4.015726089477539, 4.179630279541016, 4.343533992767334, 4.5074381828308105, 4.671341896057129, 4.8352460861206055]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 7.0, 3.0, 5.0, 5.0, 13.0, 15.0, 14.0, 23.0, 15.0, 22.0, 28.0, 31.0, 41.0, 53.0, 52.0, 57.0, 62.0, 90.0, 71.0, 85.0, 55.0, 45.0, 35.0, 23.0, 20.0, 25.0, 16.0, 19.0, 20.0, 14.0, 6.0, 6.0, 7.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7739622592926025, -1.7097135782241821, -1.6454648971557617, -1.5812163352966309, -1.5169676542282104, -1.45271897315979, -1.3884704113006592, -1.3242217302322388, -1.2599730491638184, -1.195724368095398, -1.1314756870269775, -1.0672271251678467, -1.0029784440994263, -0.9387297630310059, -0.8744811415672302, -0.8102325201034546, -0.7459838390350342, -0.6817351579666138, -0.6174865365028381, -0.5532379150390625, -0.4889892339706421, -0.42474058270454407, -0.36049193143844604, -0.296243280172348, -0.23199462890625, -0.16774597764015198, -0.10349732637405396, -0.03924867510795593, 0.02499997615814209, 0.08924862742424011, 0.15349727869033813, 0.21774592995643616, 0.2819948196411133, 0.3462434709072113, 0.4104921221733093, 0.47474077343940735, 0.5389894247055054, 0.6032381057739258, 0.6674867272377014, 0.731735348701477, 0.7959840297698975, 0.8602327108383179, 0.9244813323020935, 0.9887299537658691, 1.0529786348342896, 1.11722731590271, 1.1814758777618408, 1.2457245588302612, 1.3099732398986816, 1.374221920967102, 1.4384706020355225, 1.5027191638946533, 1.5669678449630737, 1.6312165260314941, 1.695465087890625, 1.7597137689590454, 1.8239624500274658, 1.8882111310958862, 1.9524598121643066, 2.0167083740234375, 2.0809569358825684, 2.1452057361602783, 2.209454298019409, 2.273703098297119, 2.33795166015625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 2.0, 3.0, 5.0, 3.0, 12.0, 17.0, 17.0, 24.0, 39.0, 57.0, 88.0, 115.0, 179.0, 325.0, 598.0, 1152.0, 2166.0, 5073.0, 13826.0, 48317.0, 267252.0, 2733127.0, 973616.0, 108212.0, 25137.0, 8251.0, 3326.0, 1528.0, 773.0, 435.0, 212.0, 142.0, 69.0, 52.0, 42.0, 35.0, 24.0, 11.0, 7.0, 3.0, 5.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3984375, -0.38458251953125, -0.3707275390625, -0.35687255859375, -0.343017578125, -0.32916259765625, -0.3153076171875, -0.30145263671875, -0.28759765625, -0.27374267578125, -0.2598876953125, -0.24603271484375, -0.232177734375, -0.21832275390625, -0.2044677734375, -0.19061279296875, -0.1767578125, -0.16290283203125, -0.1490478515625, -0.13519287109375, -0.121337890625, -0.10748291015625, -0.0936279296875, -0.07977294921875, -0.06591796875, -0.05206298828125, -0.0382080078125, -0.02435302734375, -0.010498046875, 0.00335693359375, 0.0172119140625, 0.03106689453125, 0.044921875, 0.05877685546875, 0.0726318359375, 0.08648681640625, 0.100341796875, 0.11419677734375, 0.1280517578125, 0.14190673828125, 0.15576171875, 0.16961669921875, 0.1834716796875, 0.19732666015625, 0.211181640625, 0.22503662109375, 0.2388916015625, 0.25274658203125, 0.2666015625, 0.28045654296875, 0.2943115234375, 0.30816650390625, 0.322021484375, 0.33587646484375, 0.3497314453125, 0.36358642578125, 0.37744140625, 0.39129638671875, 0.4051513671875, 0.41900634765625, 0.432861328125, 0.44671630859375, 0.4605712890625, 0.47442626953125, 0.48828125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 5.0, 20.0, 20.0, 33.0, 53.0, 57.0, 60.0, 72.0, 62.0, 81.0, 72.0, 80.0, 73.0, 69.0, 49.0, 58.0, 34.0, 25.0, 25.0, 13.0, 12.0, 10.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1837158203125, -0.17835235595703125, -0.1729888916015625, -0.16762542724609375, -0.162261962890625, -0.15689849853515625, -0.1515350341796875, -0.14617156982421875, -0.14080810546875, -0.13544464111328125, -0.1300811767578125, -0.12471771240234375, -0.119354248046875, -0.11399078369140625, -0.1086273193359375, -0.10326385498046875, -0.097900390625, -0.09253692626953125, -0.0871734619140625, -0.08180999755859375, -0.076446533203125, -0.07108306884765625, -0.0657196044921875, -0.06035614013671875, -0.05499267578125, -0.04962921142578125, -0.0442657470703125, -0.03890228271484375, -0.033538818359375, -0.02817535400390625, -0.0228118896484375, -0.01744842529296875, -0.0120849609375, -0.00672149658203125, -0.0013580322265625, 0.00400543212890625, 0.009368896484375, 0.01473236083984375, 0.0200958251953125, 0.02545928955078125, 0.03082275390625, 0.03618621826171875, 0.0415496826171875, 0.04691314697265625, 0.052276611328125, 0.05764007568359375, 0.0630035400390625, 0.06836700439453125, 0.07373046875, 0.07909393310546875, 0.0844573974609375, 0.08982086181640625, 0.095184326171875, 0.10054779052734375, 0.1059112548828125, 0.11127471923828125, 0.11663818359375, 0.12200164794921875, 0.1273651123046875, 0.13272857666015625, 0.138092041015625, 0.14345550537109375, 0.1488189697265625, 0.15418243408203125, 0.1595458984375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 10.0, 19.0, 26.0, 40.0, 50.0, 80.0, 110.0, 177.0, 286.0, 574.0, 1170.0, 2822.0, 9073.0, 51527.0, 2193937.0, 1872098.0, 48485.0, 8489.0, 2631.0, 1186.0, 603.0, 338.0, 189.0, 119.0, 76.0, 54.0, 30.0, 20.0, 17.0, 10.0, 9.0, 7.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.025390625, -0.9960861206054688, -0.9667816162109375, -0.9374771118164062, -0.908172607421875, -0.8788681030273438, -0.8495635986328125, -0.8202590942382812, -0.79095458984375, -0.7616500854492188, -0.7323455810546875, -0.7030410766601562, -0.673736572265625, -0.6444320678710938, -0.6151275634765625, -0.5858230590820312, -0.5565185546875, -0.5272140502929688, -0.4979095458984375, -0.46860504150390625, -0.439300537109375, -0.40999603271484375, -0.3806915283203125, -0.35138702392578125, -0.32208251953125, -0.29277801513671875, -0.2634735107421875, -0.23416900634765625, -0.204864501953125, -0.17555999755859375, -0.1462554931640625, -0.11695098876953125, -0.087646484375, -0.05834197998046875, -0.0290374755859375, 0.00026702880859375, 0.029571533203125, 0.05887603759765625, 0.0881805419921875, 0.11748504638671875, 0.14678955078125, 0.17609405517578125, 0.2053985595703125, 0.23470306396484375, 0.264007568359375, 0.29331207275390625, 0.3226165771484375, 0.35192108154296875, 0.3812255859375, 0.41053009033203125, 0.4398345947265625, 0.46913909912109375, 0.498443603515625, 0.5277481079101562, 0.5570526123046875, 0.5863571166992188, 0.61566162109375, 0.6449661254882812, 0.6742706298828125, 0.7035751342773438, 0.732879638671875, 0.7621841430664062, 0.7914886474609375, 0.8207931518554688, 0.85009765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 3.0, 6.0, 7.0, 10.0, 14.0, 28.0, 36.0, 49.0, 67.0, 107.0, 140.0, 225.0, 290.0, 491.0, 771.0, 618.0, 410.0, 250.0, 182.0, 111.0, 74.0, 49.0, 32.0, 32.0, 13.0, 8.0, 10.0, 8.0, 8.0, 7.0, 2.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.75341796875, -0.7317657470703125, -0.710113525390625, -0.6884613037109375, -0.66680908203125, -0.6451568603515625, -0.623504638671875, -0.6018524169921875, -0.5802001953125, -0.5585479736328125, -0.536895751953125, -0.5152435302734375, -0.49359130859375, -0.4719390869140625, -0.450286865234375, -0.4286346435546875, -0.406982421875, -0.3853302001953125, -0.363677978515625, -0.3420257568359375, -0.32037353515625, -0.2987213134765625, -0.277069091796875, -0.2554168701171875, -0.2337646484375, -0.2121124267578125, -0.190460205078125, -0.1688079833984375, -0.14715576171875, -0.1255035400390625, -0.103851318359375, -0.0821990966796875, -0.060546875, -0.0388946533203125, -0.017242431640625, 0.0044097900390625, 0.02606201171875, 0.0477142333984375, 0.069366455078125, 0.0910186767578125, 0.1126708984375, 0.1343231201171875, 0.155975341796875, 0.1776275634765625, 0.19927978515625, 0.2209320068359375, 0.242584228515625, 0.2642364501953125, 0.285888671875, 0.3075408935546875, 0.329193115234375, 0.3508453369140625, 0.37249755859375, 0.3941497802734375, 0.415802001953125, 0.4374542236328125, 0.4591064453125, 0.4807586669921875, 0.502410888671875, 0.5240631103515625, 0.54571533203125, 0.5673675537109375, 0.589019775390625, 0.6106719970703125, 0.63232421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 13.0, 5.0, 15.0, 26.0, 52.0, 62.0, 143.0, 190.0, 196.0, 124.0, 70.0, 37.0, 17.0, 12.0, 4.0, 8.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.430160522460938, -8.1155366897583, -7.8009138107299805, -7.486290454864502, -7.171667098999023, -6.857043266296387, -6.542419910430908, -6.22779655456543, -5.913173198699951, -5.598549842834473, -5.283926486968994, -4.969303131103516, -4.654679298400879, -4.340056419372559, -4.025432586669922, -3.7108092308044434, -3.396185874938965, -3.0815625190734863, -2.766939163208008, -2.45231556892395, -2.1376922130584717, -1.8230688571929932, -1.508445382118225, -1.193821907043457, -0.8791985511779785, -0.5645751357078552, -0.24995172023773193, 0.06467169523239136, 0.37929511070251465, 0.6939184665679932, 1.0085419416427612, 1.3231654167175293, 1.6377887725830078, 1.9524121284484863, 2.267035484313965, 2.5816590785980225, 2.896282434463501, 3.2109057903289795, 3.525529384613037, 3.8401527404785156, 4.154776096343994, 4.469399452209473, 4.784022808074951, 5.09864616394043, 5.413269996643066, 5.727892875671387, 6.042516708374023, 6.357140064239502, 6.6717634201049805, 6.986386775970459, 7.3010101318359375, 7.615633487701416, 7.9302568435668945, 8.244880676269531, 8.559503555297852, 8.874127388000488, 9.188751220703125, 9.503375053405762, 9.817997932434082, 10.132621765136719, 10.447244644165039, 10.761868476867676, 11.076491355895996, 11.391115188598633, 11.705738067626953]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 10.0, 6.0, 12.0, 23.0, 25.0, 18.0, 27.0, 50.0, 37.0, 56.0, 53.0, 68.0, 67.0, 76.0, 83.0, 62.0, 54.0, 47.0, 42.0, 33.0, 26.0, 28.0, 20.0, 19.0, 18.0, 10.0, 16.0, 0.0, 3.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.484915733337402, -5.342550277709961, -5.200184345245361, -5.057818412780762, -4.91545295715332, -4.773087501525879, -4.630721569061279, -4.48835563659668, -4.345990180969238, -4.203624725341797, -4.061258792877197, -3.9188930988311768, -3.7765274047851562, -3.6341617107391357, -3.4917960166931152, -3.3494303226470947, -3.207064628601074, -3.0646989345550537, -2.922333240509033, -2.7799675464630127, -2.637601852416992, -2.4952361583709717, -2.352870464324951, -2.2105047702789307, -2.06813907623291, -1.9257733821868896, -1.7834076881408691, -1.6410419940948486, -1.4986763000488281, -1.3563106060028076, -1.213944911956787, -1.0715792179107666, -0.9292135238647461, -0.7868478298187256, -0.6444821357727051, -0.5021164417266846, -0.35975074768066406, -0.21738505363464355, -0.07501935958862305, 0.06734633445739746, 0.20971202850341797, 0.3520777225494385, 0.494443416595459, 0.6368091106414795, 0.7791748046875, 0.9215404987335205, 1.063906192779541, 1.2062718868255615, 1.348637580871582, 1.4910032749176025, 1.633368968963623, 1.7757346630096436, 1.918100357055664, 2.0604660511016846, 2.202831745147705, 2.3451974391937256, 2.487563133239746, 2.6299288272857666, 2.772294521331787, 2.9146602153778076, 3.057025909423828, 3.1993916034698486, 3.341757297515869, 3.4841229915618896, 3.62648868560791]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 5.0, 9.0, 15.0, 15.0, 24.0, 46.0, 65.0, 126.0, 176.0, 300.0, 573.0, 1111.0, 2337.0, 5476.0, 15703.0, 53462.0, 238637.0, 559859.0, 122011.0, 31153.0, 9942.0, 3893.0, 1719.0, 805.0, 433.0, 252.0, 143.0, 79.0, 59.0, 45.0, 23.0, 17.0, 11.0, 8.0, 4.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.4501953125, -0.43843841552734375, -0.4266815185546875, -0.41492462158203125, -0.403167724609375, -0.39141082763671875, -0.3796539306640625, -0.36789703369140625, -0.35614013671875, -0.34438323974609375, -0.3326263427734375, -0.32086944580078125, -0.309112548828125, -0.29735565185546875, -0.2855987548828125, -0.27384185791015625, -0.2620849609375, -0.25032806396484375, -0.2385711669921875, -0.22681427001953125, -0.215057373046875, -0.20330047607421875, -0.1915435791015625, -0.17978668212890625, -0.16802978515625, -0.15627288818359375, -0.1445159912109375, -0.13275909423828125, -0.121002197265625, -0.10924530029296875, -0.0974884033203125, -0.08573150634765625, -0.073974609375, -0.06221771240234375, -0.0504608154296875, -0.03870391845703125, -0.026947021484375, -0.01519012451171875, -0.0034332275390625, 0.00832366943359375, 0.02008056640625, 0.03183746337890625, 0.0435943603515625, 0.05535125732421875, 0.067108154296875, 0.07886505126953125, 0.0906219482421875, 0.10237884521484375, 0.1141357421875, 0.12589263916015625, 0.1376495361328125, 0.14940643310546875, 0.161163330078125, 0.17292022705078125, 0.1846771240234375, 0.19643402099609375, 0.20819091796875, 0.21994781494140625, 0.2317047119140625, 0.24346160888671875, 0.255218505859375, 0.26697540283203125, 0.2787322998046875, 0.29048919677734375, 0.30224609375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 9.0, 7.0, 16.0, 24.0, 31.0, 35.0, 43.0, 54.0, 72.0, 81.0, 67.0, 92.0, 82.0, 79.0, 57.0, 57.0, 40.0, 42.0, 33.0, 21.0, 15.0, 19.0, 9.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26513671875, -0.256195068359375, -0.24725341796875, -0.238311767578125, -0.2293701171875, -0.220428466796875, -0.21148681640625, -0.202545166015625, -0.193603515625, -0.184661865234375, -0.17572021484375, -0.166778564453125, -0.1578369140625, -0.148895263671875, -0.13995361328125, -0.131011962890625, -0.1220703125, -0.113128662109375, -0.10418701171875, -0.095245361328125, -0.0863037109375, -0.077362060546875, -0.06842041015625, -0.059478759765625, -0.050537109375, -0.041595458984375, -0.03265380859375, -0.023712158203125, -0.0147705078125, -0.005828857421875, 0.00311279296875, 0.012054443359375, 0.02099609375, 0.029937744140625, 0.03887939453125, 0.047821044921875, 0.0567626953125, 0.065704345703125, 0.07464599609375, 0.083587646484375, 0.092529296875, 0.101470947265625, 0.11041259765625, 0.119354248046875, 0.1282958984375, 0.137237548828125, 0.14617919921875, 0.155120849609375, 0.1640625, 0.173004150390625, 0.18194580078125, 0.190887451171875, 0.1998291015625, 0.208770751953125, 0.21771240234375, 0.226654052734375, 0.235595703125, 0.244537353515625, 0.25347900390625, 0.262420654296875, 0.2713623046875, 0.280303955078125, 0.28924560546875, 0.298187255859375, 0.30712890625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 9.0, 13.0, 11.0, 15.0, 57.0, 65.0, 84.0, 144.0, 213.0, 332.0, 684.0, 1521.0, 4759.0, 21110.0, 198469.0, 776765.0, 33427.0, 6738.0, 2039.0, 888.0, 437.0, 273.0, 166.0, 102.0, 59.0, 50.0, 30.0, 29.0, 17.0, 14.0, 9.0, 6.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5478515625, -0.53179931640625, -0.5157470703125, -0.49969482421875, -0.483642578125, -0.46759033203125, -0.4515380859375, -0.43548583984375, -0.41943359375, -0.40338134765625, -0.3873291015625, -0.37127685546875, -0.355224609375, -0.33917236328125, -0.3231201171875, -0.30706787109375, -0.291015625, -0.27496337890625, -0.2589111328125, -0.24285888671875, -0.226806640625, -0.21075439453125, -0.1947021484375, -0.17864990234375, -0.16259765625, -0.14654541015625, -0.1304931640625, -0.11444091796875, -0.098388671875, -0.08233642578125, -0.0662841796875, -0.05023193359375, -0.0341796875, -0.01812744140625, -0.0020751953125, 0.01397705078125, 0.030029296875, 0.04608154296875, 0.0621337890625, 0.07818603515625, 0.09423828125, 0.11029052734375, 0.1263427734375, 0.14239501953125, 0.158447265625, 0.17449951171875, 0.1905517578125, 0.20660400390625, 0.22265625, 0.23870849609375, 0.2547607421875, 0.27081298828125, 0.286865234375, 0.30291748046875, 0.3189697265625, 0.33502197265625, 0.35107421875, 0.36712646484375, 0.3831787109375, 0.39923095703125, 0.415283203125, 0.43133544921875, 0.4473876953125, 0.46343994140625, 0.4794921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 4.0, 3.0, 3.0, 6.0, 4.0, 6.0, 8.0, 11.0, 12.0, 7.0, 20.0, 28.0, 29.0, 43.0, 40.0, 70.0, 70.0, 91.0, 104.0, 97.0, 63.0, 50.0, 43.0, 30.0, 31.0, 20.0, 27.0, 16.0, 16.0, 7.0, 7.0, 8.0, 9.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0068359375, -0.975341796875, -0.94384765625, -0.912353515625, -0.880859375, -0.849365234375, -0.81787109375, -0.786376953125, -0.7548828125, -0.723388671875, -0.69189453125, -0.660400390625, -0.62890625, -0.597412109375, -0.56591796875, -0.534423828125, -0.5029296875, -0.471435546875, -0.43994140625, -0.408447265625, -0.376953125, -0.345458984375, -0.31396484375, -0.282470703125, -0.2509765625, -0.219482421875, -0.18798828125, -0.156494140625, -0.125, -0.093505859375, -0.06201171875, -0.030517578125, 0.0009765625, 0.032470703125, 0.06396484375, 0.095458984375, 0.126953125, 0.158447265625, 0.18994140625, 0.221435546875, 0.2529296875, 0.284423828125, 0.31591796875, 0.347412109375, 0.37890625, 0.410400390625, 0.44189453125, 0.473388671875, 0.5048828125, 0.536376953125, 0.56787109375, 0.599365234375, 0.630859375, 0.662353515625, 0.69384765625, 0.725341796875, 0.7568359375, 0.788330078125, 0.81982421875, 0.851318359375, 0.8828125, 0.914306640625, 0.94580078125, 0.977294921875, 1.0087890625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 6.0, 5.0, 9.0, 18.0, 15.0, 22.0, 20.0, 50.0, 69.0, 95.0, 174.0, 278.0, 539.0, 1117.0, 2709.0, 8319.0, 37317.0, 816774.0, 151818.0, 20165.0, 5211.0, 1924.0, 861.0, 392.0, 231.0, 146.0, 72.0, 52.0, 36.0, 25.0, 24.0, 22.0, 14.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.100341796875, -0.09685897827148438, -0.09337615966796875, -0.08989334106445312, -0.0864105224609375, -0.08292770385742188, -0.07944488525390625, -0.07596206665039062, -0.072479248046875, -0.06899642944335938, -0.06551361083984375, -0.062030792236328125, -0.0585479736328125, -0.055065155029296875, -0.05158233642578125, -0.048099517822265625, -0.04461669921875, -0.041133880615234375, -0.03765106201171875, -0.034168243408203125, -0.0306854248046875, -0.027202606201171875, -0.02371978759765625, -0.020236968994140625, -0.016754150390625, -0.013271331787109375, -0.00978851318359375, -0.006305694580078125, -0.0028228759765625, 0.000659942626953125, 0.00414276123046875, 0.007625579833984375, 0.0111083984375, 0.014591217041015625, 0.01807403564453125, 0.021556854248046875, 0.0250396728515625, 0.028522491455078125, 0.03200531005859375, 0.035488128662109375, 0.038970947265625, 0.042453765869140625, 0.04593658447265625, 0.049419403076171875, 0.0529022216796875, 0.056385040283203125, 0.05986785888671875, 0.06335067749023438, 0.06683349609375, 0.07031631469726562, 0.07379913330078125, 0.07728195190429688, 0.0807647705078125, 0.08424758911132812, 0.08773040771484375, 0.09121322631835938, 0.094696044921875, 0.09817886352539062, 0.10166168212890625, 0.10514450073242188, 0.1086273193359375, 0.11211013793945312, 0.11559295654296875, 0.11907577514648438, 0.12255859375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 11.0, 10.0, 10.0, 15.0, 22.0, 27.0, 41.0, 61.0, 105.0, 127.0, 127.0, 115.0, 89.0, 66.0, 45.0, 38.0, 25.0, 13.0, 8.0, 15.0, 7.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.93986701965332e-05, -3.8144178688526154e-05, -3.6889687180519104e-05, -3.5635195672512054e-05, -3.4380704164505005e-05, -3.3126212656497955e-05, -3.1871721148490906e-05, -3.0617229640483856e-05, -2.9362738132476807e-05, -2.8108246624469757e-05, -2.6853755116462708e-05, -2.5599263608455658e-05, -2.434477210044861e-05, -2.309028059244156e-05, -2.183578908443451e-05, -2.058129757642746e-05, -1.932680606842041e-05, -1.807231456041336e-05, -1.681782305240631e-05, -1.556333154439926e-05, -1.4308840036392212e-05, -1.3054348528385162e-05, -1.1799857020378113e-05, -1.0545365512371063e-05, -9.290874004364014e-06, -8.036382496356964e-06, -6.7818909883499146e-06, -5.527399480342865e-06, -4.2729079723358154e-06, -3.018416464328766e-06, -1.7639249563217163e-06, -5.094334483146667e-07, 7.450580596923828e-07, 1.9995495676994324e-06, 3.254041075706482e-06, 4.5085325837135315e-06, 5.763024091720581e-06, 7.017515599727631e-06, 8.27200710773468e-06, 9.52649861574173e-06, 1.078099012374878e-05, 1.2035481631755829e-05, 1.3289973139762878e-05, 1.4544464647769928e-05, 1.5798956155776978e-05, 1.7053447663784027e-05, 1.8307939171791077e-05, 1.9562430679798126e-05, 2.0816922187805176e-05, 2.2071413695812225e-05, 2.3325905203819275e-05, 2.4580396711826324e-05, 2.5834888219833374e-05, 2.7089379727840424e-05, 2.8343871235847473e-05, 2.9598362743854523e-05, 3.085285425186157e-05, 3.210734575986862e-05, 3.336183726787567e-05, 3.461632877588272e-05, 3.587082028388977e-05, 3.712531179189682e-05, 3.837980329990387e-05, 3.963429480791092e-05, 4.088878631591797e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 7.0, 6.0, 6.0, 5.0, 12.0, 13.0, 20.0, 23.0, 42.0, 36.0, 54.0, 79.0, 113.0, 217.0, 256.0, 402.0, 720.0, 1253.0, 2024.0, 3918.0, 7694.0, 17140.0, 44826.0, 198080.0, 672239.0, 58899.0, 20797.0, 9144.0, 4401.0, 2407.0, 1389.0, 814.0, 500.0, 303.0, 224.0, 150.0, 94.0, 74.0, 43.0, 36.0, 26.0, 22.0, 14.0, 2.0, 6.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.061614990234375, -0.05956888198852539, -0.05752277374267578, -0.05547666549682617, -0.05343055725097656, -0.05138444900512695, -0.049338340759277344, -0.047292232513427734, -0.045246124267578125, -0.043200016021728516, -0.041153907775878906, -0.0391077995300293, -0.03706169128417969, -0.03501558303833008, -0.03296947479248047, -0.03092336654663086, -0.02887725830078125, -0.02683115005493164, -0.02478504180908203, -0.022738933563232422, -0.020692825317382812, -0.018646717071533203, -0.016600608825683594, -0.014554500579833984, -0.012508392333984375, -0.010462284088134766, -0.008416175842285156, -0.006370067596435547, -0.0043239593505859375, -0.002277851104736328, -0.00023174285888671875, 0.0018143653869628906, 0.0038604736328125, 0.005906581878662109, 0.007952690124511719, 0.009998798370361328, 0.012044906616210938, 0.014091014862060547, 0.016137123107910156, 0.018183231353759766, 0.020229339599609375, 0.022275447845458984, 0.024321556091308594, 0.026367664337158203, 0.028413772583007812, 0.030459880828857422, 0.03250598907470703, 0.03455209732055664, 0.03659820556640625, 0.03864431381225586, 0.04069042205810547, 0.04273653030395508, 0.04478263854980469, 0.0468287467956543, 0.048874855041503906, 0.050920963287353516, 0.052967071533203125, 0.055013179779052734, 0.057059288024902344, 0.05910539627075195, 0.06115150451660156, 0.06319761276245117, 0.06524372100830078, 0.06728982925415039, 0.0693359375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 4.0, 6.0, 11.0, 12.0, 11.0, 17.0, 15.0, 34.0, 23.0, 19.0, 39.0, 59.0, 70.0, 103.0, 112.0, 103.0, 92.0, 60.0, 48.0, 24.0, 21.0, 23.0, 20.0, 12.0, 13.0, 13.0, 4.0, 8.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08319091796875, -0.08018112182617188, -0.07717132568359375, -0.07416152954101562, -0.0711517333984375, -0.06814193725585938, -0.06513214111328125, -0.062122344970703125, -0.059112548828125, -0.056102752685546875, -0.05309295654296875, -0.050083160400390625, -0.0470733642578125, -0.044063568115234375, -0.04105377197265625, -0.038043975830078125, -0.0350341796875, -0.032024383544921875, -0.02901458740234375, -0.026004791259765625, -0.0229949951171875, -0.019985198974609375, -0.01697540283203125, -0.013965606689453125, -0.010955810546875, -0.007946014404296875, -0.00493621826171875, -0.001926422119140625, 0.0010833740234375, 0.004093170166015625, 0.00710296630859375, 0.010112762451171875, 0.01312255859375, 0.016132354736328125, 0.01914215087890625, 0.022151947021484375, 0.0251617431640625, 0.028171539306640625, 0.03118133544921875, 0.034191131591796875, 0.037200927734375, 0.040210723876953125, 0.04322052001953125, 0.046230316162109375, 0.0492401123046875, 0.052249908447265625, 0.05525970458984375, 0.058269500732421875, 0.061279296875, 0.06428909301757812, 0.06729888916015625, 0.07030868530273438, 0.0733184814453125, 0.07632827758789062, 0.07933807373046875, 0.08234786987304688, 0.085357666015625, 0.08836746215820312, 0.09137725830078125, 0.09438705444335938, 0.0973968505859375, 0.10040664672851562, 0.10341644287109375, 0.10642623901367188, 0.10943603515625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 2.0, 7.0, 7.0, 14.0, 27.0, 28.0, 70.0, 200.0, 300.0, 182.0, 67.0, 30.0, 25.0, 16.0, 15.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4611735343933105, -3.3397510051727295, -3.2183284759521484, -3.0969057083129883, -2.9754831790924072, -2.854060649871826, -2.732638120651245, -2.611215591430664, -2.489792823791504, -2.368370294570923, -2.246947765350342, -2.1255249977111816, -2.0041024684906006, -1.8826799392700195, -1.7612574100494385, -1.6398347616195679, -1.5184122323989868, -1.3969897031784058, -1.2755670547485352, -1.154144525527954, -1.0327218770980835, -0.9112993478775024, -0.7898767590522766, -0.6684541702270508, -0.547031581401825, -0.4256089925765991, -0.3041864037513733, -0.18276384472846985, -0.06134125590324402, 0.060081303119659424, 0.18150389194488525, 0.3029264807701111, 0.4243490695953369, 0.5457716584205627, 0.6671942472457886, 0.7886167764663696, 0.9100394248962402, 1.0314619541168213, 1.1528844833374023, 1.274307131767273, 1.3957297801971436, 1.5171523094177246, 1.6385749578475952, 1.7599974870681763, 1.8814201354980469, 2.002842664718628, 2.124265193939209, 2.245687961578369, 2.367110252380371, 2.488532781600952, 2.609955310821533, 2.7313780784606934, 2.8528006076812744, 2.9742231369018555, 3.0956456661224365, 3.2170681953430176, 3.3384909629821777, 3.459913492202759, 3.58133602142334, 3.7027587890625, 3.824181318283081, 3.945603847503662, 4.067026615142822, 4.188448905944824, 4.309871673583984]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 3.0, 8.0, 13.0, 19.0, 18.0, 20.0, 25.0, 34.0, 57.0, 134.0, 124.0, 96.0, 129.0, 105.0, 46.0, 31.0, 29.0, 26.0, 20.0, 14.0, 11.0, 13.0, 8.0, 7.0, 4.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.718404769897461, -4.604491710662842, -4.490578651428223, -4.3766655921936035, -4.262752532958984, -4.148839473724365, -4.034926414489746, -3.921013355255127, -3.807100296020508, -3.6931872367858887, -3.5792741775512695, -3.4653611183166504, -3.3514480590820312, -3.237534999847412, -3.123621940612793, -3.009708881378174, -2.8957958221435547, -2.7818827629089355, -2.6679697036743164, -2.5540566444396973, -2.440143585205078, -2.326230525970459, -2.21231746673584, -2.0984044075012207, -1.9844913482666016, -1.8705782890319824, -1.7566652297973633, -1.6427521705627441, -1.528839111328125, -1.4149260520935059, -1.3010129928588867, -1.1870999336242676, -1.0731868743896484, -0.9592738151550293, -0.8453607559204102, -0.731447696685791, -0.6175346374511719, -0.5036215782165527, -0.3897085189819336, -0.27579545974731445, -0.1618824005126953, -0.04796934127807617, 0.06594371795654297, 0.1798567771911621, 0.29376983642578125, 0.4076828956604004, 0.5215959548950195, 0.6355090141296387, 0.7494220733642578, 0.863335132598877, 0.9772481918334961, 1.0911612510681152, 1.2050743103027344, 1.3189873695373535, 1.4329004287719727, 1.5468134880065918, 1.660726547241211, 1.77463960647583, 1.8885526657104492, 2.0024657249450684, 2.1163787841796875, 2.2302918434143066, 2.344204902648926, 2.458117961883545, 2.572031021118164]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 10.0, 10.0, 7.0, 7.0, 13.0, 13.0, 6.0, 16.0, 18.0, 19.0, 19.0, 23.0, 29.0, 34.0, 48.0, 27.0, 98.0, 238.0, 72.0, 41.0, 26.0, 24.0, 23.0, 24.0, 24.0, 16.0, 12.0, 17.0, 13.0, 14.0, 7.0, 8.0, 7.0, 6.0, 8.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.173828125, -0.16828155517578125, -0.1627349853515625, -0.15718841552734375, -0.151641845703125, -0.14609527587890625, -0.1405487060546875, -0.13500213623046875, -0.12945556640625, -0.12390899658203125, -0.1183624267578125, -0.11281585693359375, -0.107269287109375, -0.10172271728515625, -0.0961761474609375, -0.09062957763671875, -0.0850830078125, -0.07953643798828125, -0.0739898681640625, -0.06844329833984375, -0.062896728515625, -0.05735015869140625, -0.0518035888671875, -0.04625701904296875, -0.04071044921875, -0.03516387939453125, -0.0296173095703125, -0.02407073974609375, -0.018524169921875, -0.01297760009765625, -0.0074310302734375, -0.00188446044921875, 0.003662109375, 0.00920867919921875, 0.0147552490234375, 0.02030181884765625, 0.025848388671875, 0.03139495849609375, 0.0369415283203125, 0.04248809814453125, 0.04803466796875, 0.05358123779296875, 0.0591278076171875, 0.06467437744140625, 0.070220947265625, 0.07576751708984375, 0.0813140869140625, 0.08686065673828125, 0.0924072265625, 0.09795379638671875, 0.1035003662109375, 0.10904693603515625, 0.114593505859375, 0.12014007568359375, 0.1256866455078125, 0.13123321533203125, 0.13677978515625, 0.14232635498046875, 0.1478729248046875, 0.15341949462890625, 0.158966064453125, 0.16451263427734375, 0.1700592041015625, 0.17560577392578125, 0.18115234375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 6.0, 7.0, 14.0, 14.0, 10.0, 26.0, 41.0, 73.0, 210.0, 751.0, 3586.0, 277741.0, 8100601.0, 4185.0, 842.0, 255.0, 113.0, 28.0, 34.0, 22.0, 10.0, 3.0, 4.0, 11.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9718711376190186, -3.855161666870117, -3.738452196121216, -3.6217427253723145, -3.505033493041992, -3.3883237838745117, -3.2716145515441895, -3.154905080795288, -3.0381956100463867, -2.9214861392974854, -2.804776668548584, -2.6880671977996826, -2.5713577270507812, -2.454648494720459, -2.3379390239715576, -2.2212295532226562, -2.104520082473755, -1.9878106117248535, -1.8711011409759521, -1.7543917894363403, -1.637682318687439, -1.5209728479385376, -1.4042634963989258, -1.2875540256500244, -1.170844554901123, -1.0541350841522217, -0.9374256730079651, -0.8207162618637085, -0.7040067911148071, -0.5872973203659058, -0.47058790922164917, -0.3538784980773926, -0.2371690273284912, -0.12045958638191223, -0.003750145435333252, 0.11295929551124573, 0.2296687364578247, 0.3463782072067261, 0.46308761835098267, 0.5797970294952393, 0.6965065002441406, 0.813215970993042, 0.9299253821372986, 1.0466347932815552, 1.1633442640304565, 1.280053734779358, 1.3967630863189697, 1.513472557067871, 1.6301820278167725, 1.7468914985656738, 1.8636009693145752, 1.980310320854187, 2.097019672393799, 2.2137293815612793, 2.3304386138916016, 2.447148084640503, 2.5638575553894043, 2.6805670261383057, 2.797276496887207, 2.9139859676361084, 3.0306954383850098, 3.147404670715332, 3.2641141414642334, 3.3808236122131348, 3.497533082962036]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 6.0, 5.0, 4.0, 10.0, 6.0, 4.0, 5.0, 6.0, 1.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-5.073133945465088, -4.937679767608643, -4.802225589752197, -4.666771411895752, -4.531317234039307, -4.395863056182861, -4.260408878326416, -4.1249542236328125, -3.9895002841949463, -3.854046106338501, -3.7185919284820557, -3.5831377506256104, -3.447683334350586, -3.3122291564941406, -3.1767749786376953, -3.04132080078125, -2.9058666229248047, -2.7704124450683594, -2.634958267211914, -2.4995040893554688, -2.3640499114990234, -2.228595733642578, -2.0931413173675537, -1.9576871395111084, -1.822232961654663, -1.6867787837982178, -1.5513246059417725, -1.4158703088760376, -1.2804161310195923, -1.144961953163147, -1.009507656097412, -0.8740534782409668, -0.7385990619659424, -0.6031448841094971, -0.467690646648407, -0.3322364389896393, -0.19678223133087158, -0.06132805347442627, 0.07412618398666382, 0.2095804214477539, 0.3450345993041992, 0.4804888069629669, 0.6159430146217346, 0.7513972520828247, 0.88685142993927, 1.0223056077957153, 1.1577599048614502, 1.2932140827178955, 1.4286682605743408, 1.5641224384307861, 1.6995766162872314, 1.8350309133529663, 1.9704850912094116, 2.1059393882751465, 2.241393566131592, 2.376847743988037, 2.5123019218444824, 2.6477560997009277, 2.783210277557373, 2.9186644554138184, 3.0541186332702637, 3.189572811126709, 3.3250272274017334, 3.4604814052581787, 3.595935583114624]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 6.0, 8.0, 13.0, 19.0, 29.0, 44.0, 64.0, 125.0, 282.0, 668.0, 1922.0, 6328.0, 26925.0, 148481.0, 264678.0, 57681.0, 11917.0, 3134.0, 1025.0, 410.0, 202.0, 112.0, 65.0, 41.0, 29.0, 18.0, 13.0, 7.0, 10.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.212890625, -3.1190185546875, -3.025146484375, -2.9312744140625, -2.83740234375, -2.7435302734375, -2.649658203125, -2.5557861328125, -2.4619140625, -2.3680419921875, -2.274169921875, -2.1802978515625, -2.08642578125, -1.9925537109375, -1.898681640625, -1.8048095703125, -1.7109375, -1.6170654296875, -1.523193359375, -1.4293212890625, -1.33544921875, -1.2415771484375, -1.147705078125, -1.0538330078125, -0.9599609375, -0.8660888671875, -0.772216796875, -0.6783447265625, -0.58447265625, -0.4906005859375, -0.396728515625, -0.3028564453125, -0.208984375, -0.1151123046875, -0.021240234375, 0.0726318359375, 0.16650390625, 0.2603759765625, 0.354248046875, 0.4481201171875, 0.5419921875, 0.6358642578125, 0.729736328125, 0.8236083984375, 0.91748046875, 1.0113525390625, 1.105224609375, 1.1990966796875, 1.29296875, 1.3868408203125, 1.480712890625, 1.5745849609375, 1.66845703125, 1.7623291015625, 1.856201171875, 1.9500732421875, 2.0439453125, 2.1378173828125, 2.231689453125, 2.3255615234375, 2.41943359375, 2.5133056640625, 2.607177734375, 2.7010498046875, 2.794921875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 5.0, 4.0, 6.0, 8.0, 10.0, 8.0, 10.0, 11.0, 19.0, 25.0, 33.0, 34.0, 27.0, 44.0, 42.0, 56.0, 64.0, 62.0, 72.0, 68.0, 62.0, 63.0, 46.0, 47.0, 36.0, 36.0, 22.0, 17.0, 18.0, 14.0, 8.0, 6.0, 6.0, 5.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.28515625, -0.2776813507080078, -0.2702064514160156, -0.26273155212402344, -0.25525665283203125, -0.24778175354003906, -0.24030685424804688, -0.2328319549560547, -0.2253570556640625, -0.2178821563720703, -0.21040725708007812, -0.20293235778808594, -0.19545745849609375, -0.18798255920410156, -0.18050765991210938, -0.1730327606201172, -0.165557861328125, -0.1580829620361328, -0.15060806274414062, -0.14313316345214844, -0.13565826416015625, -0.12818336486816406, -0.12070846557617188, -0.11323356628417969, -0.1057586669921875, -0.09828376770019531, -0.09080886840820312, -0.08333396911621094, -0.07585906982421875, -0.06838417053222656, -0.060909271240234375, -0.05343437194824219, -0.04595947265625, -0.03848457336425781, -0.031009674072265625, -0.023534774780273438, -0.01605987548828125, -0.008584976196289062, -0.001110076904296875, 0.0063648223876953125, 0.0138397216796875, 0.021314620971679688, 0.028789520263671875, 0.03626441955566406, 0.04373931884765625, 0.05121421813964844, 0.058689117431640625, 0.06616401672363281, 0.073638916015625, 0.08111381530761719, 0.08858871459960938, 0.09606361389160156, 0.10353851318359375, 0.11101341247558594, 0.11848831176757812, 0.1259632110595703, 0.1334381103515625, 0.1409130096435547, 0.14838790893554688, 0.15586280822753906, 0.16333770751953125, 0.17081260681152344, 0.17828750610351562, 0.1857624053955078, 0.1932373046875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 4.0, 4.0, 3.0, 12.0, 42.0, 118.0, 185.0, 77.0, 31.0, 10.0, 4.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.390362739562988, -11.176735877990723, -10.963109016418457, -10.749483108520508, -10.535856246948242, -10.322229385375977, -10.108602523803711, -9.894975662231445, -9.68134880065918, -9.467721939086914, -9.254095077514648, -9.0404691696167, -8.826842308044434, -8.613215446472168, -8.399588584899902, -8.185961723327637, -7.9723358154296875, -7.758708953857422, -7.5450825691223145, -7.331455707550049, -7.117829322814941, -6.904202461242676, -6.69057559967041, -6.4769487380981445, -6.263322353363037, -6.0496954917907715, -5.836069107055664, -5.622442245483398, -5.408815383911133, -5.195188999176025, -4.98156213760376, -4.767935752868652, -4.554309368133545, -4.340682506561279, -4.127056121826172, -3.9134292602539062, -3.6998026371002197, -3.486176013946533, -3.2725491523742676, -3.058922529220581, -2.8452959060668945, -2.631669282913208, -2.4180426597595215, -2.204415798187256, -1.9907891750335693, -1.7771625518798828, -1.5635358095169067, -1.3499090671539307, -1.1362824440002441, -0.9226557612419128, -0.7090290784835815, -0.49540239572525024, -0.28177571296691895, -0.06814908981323242, 0.14547765254974365, 0.3591043949127197, 0.5727310180664062, 0.7863577008247375, 0.9999843835830688, 1.213611125946045, 1.4272377490997314, 1.640864372253418, 1.854491114616394, 2.06811785697937, 2.2817444801330566]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 2.0, 7.0, 2.0, 4.0, 4.0, 4.0, 8.0, 19.0, 36.0, 56.0, 68.0, 64.0, 70.0, 45.0, 34.0, 11.0, 10.0, 3.0, 4.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0], "bins": [-2.398483991622925, -2.340806722640991, -2.2831294536590576, -2.225451946258545, -2.1677746772766113, -2.1100974082946777, -2.052420139312744, -1.9947428703308105, -1.937065601348877, -1.8793883323669434, -1.8217109441757202, -1.7640336751937866, -1.706356406211853, -1.6486790180206299, -1.5910017490386963, -1.5333244800567627, -1.4756470918655396, -1.417969822883606, -1.3602924346923828, -1.3026151657104492, -1.2449378967285156, -1.187260627746582, -1.1295832395553589, -1.0719059705734253, -1.0142285823822021, -0.9565512537956238, -0.8988739848136902, -0.8411966562271118, -0.7835193872451782, -0.7258420586585999, -0.6681647300720215, -0.6104874610900879, -0.5528103113174438, -0.49513301253318787, -0.4374557137489319, -0.3797783851623535, -0.32210108637809753, -0.26442378759384155, -0.20674645900726318, -0.1490691602230072, -0.09139186143875122, -0.03371455520391464, 0.023962751030921936, 0.08164006471633911, 0.1393173635005951, 0.19699466228485107, 0.25467199087142944, 0.3123492896556854, 0.3700265884399414, 0.4277038872241974, 0.48538118600845337, 0.5430585145950317, 0.6007357835769653, 0.6584131121635437, 0.7160904407501221, 0.7737677097320557, 0.831445038318634, 0.8891223669052124, 0.946799635887146, 1.0044770240783691, 1.0621542930603027, 1.1198315620422363, 1.17750883102417, 1.235186219215393, 1.2928634881973267]}, "eval/loss": 5.553798675537109, "eval/wer": 2.01330821102737, "eval/runtime": 947.3214, "eval/samples_per_second": 2.789, "eval/steps_per_second": 0.349} \ No newline at end of file