diff --git "a/wandb/run-20220323_161519-3jzxl68o/files/wandb-summary.json" "b/wandb/run-20220323_161519-3jzxl68o/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220323_161519-3jzxl68o/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 7.098, "train/learning_rate": 1.305e-05, "train/epoch": 0.49, "train/global_step": 435, "_runtime": 2388, "_timestamp": 1648054507, "_step": 434, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 7.0, 4.0, 4.0, 3.0, 6.0, 4.0, 8.0, 9.0, 7.0, 8.0, 13.0, 13.0, 17.0, 23.0, 23.0, 23.0, 23.0, 23.0, 37.0, 45.0, 41.0, 41.0, 56.0, 50.0, 50.0, 56.0, 59.0, 71.0, 58.0, 40.0, 42.0, 36.0, 19.0, 24.0, 16.0, 11.0, 12.0, 4.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-104.813232421875, -102.5434799194336, -100.27372741699219, -98.00398254394531, -95.7342300415039, -93.4644775390625, -91.1947250366211, -88.92497253417969, -86.65522003173828, -84.38546752929688, -82.11571502685547, -79.84596252441406, -77.57621765136719, -75.30646514892578, -73.03671264648438, -70.76696014404297, -68.49720764160156, -66.22745513916016, -63.957706451416016, -61.68795394897461, -59.4182014465332, -57.14845275878906, -54.878700256347656, -52.60894775390625, -50.339202880859375, -48.06945037841797, -45.79970169067383, -43.52994918823242, -41.260196685791016, -38.990447998046875, -36.72069549560547, -34.45094299316406, -32.18119430541992, -29.91144371032715, -27.641691207885742, -25.37194061279297, -23.102188110351562, -20.83243751525879, -18.562686920166016, -16.29293441772461, -14.023183822631836, -11.753432273864746, -9.483680725097656, -7.213930130004883, -4.944178581237793, -2.674427032470703, -0.4046764373779297, 1.8650751113891602, 4.13482666015625, 6.40457820892334, 8.67432975769043, 10.944080352783203, 13.213831901550293, 15.483583450317383, 17.753334045410156, 20.023086547851562, 22.292837142944336, 24.56258773803711, 26.832340240478516, 29.10209083557129, 31.371841430664062, 33.64159393310547, 35.911346435546875, 38.181095123291016, 40.45084762573242]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 9.0, 4.0, 15.0, 9.0, 13.0, 13.0, 10.0, 21.0, 13.0, 28.0, 26.0, 24.0, 37.0, 25.0, 29.0, 18.0, 44.0, 49.0, 38.0, 40.0, 40.0, 45.0, 38.0, 36.0, 40.0, 29.0, 35.0, 31.0, 37.0, 19.0, 31.0, 18.0, 18.0, 16.0, 11.0, 11.0, 14.0, 13.0, 9.0, 10.0, 7.0, 3.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.41203308105469, -63.31178283691406, -61.21152877807617, -59.11127853393555, -57.011024475097656, -54.91077423095703, -52.810523986816406, -50.71027374267578, -48.61001968383789, -46.509769439697266, -44.409515380859375, -42.30926513671875, -40.209014892578125, -38.108760833740234, -36.00851058959961, -33.90825653076172, -31.808006286621094, -29.707754135131836, -27.607501983642578, -25.507251739501953, -23.406999588012695, -21.306747436523438, -19.206497192382812, -17.106245040893555, -15.005992889404297, -12.905740737915039, -10.805489540100098, -8.705238342285156, -6.604986190795898, -4.504734039306641, -2.404482841491699, -0.3042316436767578, 1.7960281372070312, 3.896279811859131, 5.9965314865112305, 8.096782684326172, 10.19703483581543, 12.297286987304688, 14.397538185119629, 16.49778938293457, 18.598041534423828, 20.698293685913086, 22.798545837402344, 24.89879608154297, 26.999048233032227, 29.099300384521484, 31.19955062866211, 33.2998046875, 35.400054931640625, 37.50030517578125, 39.60055923461914, 41.700809478759766, 43.801063537597656, 45.90131378173828, 48.001564025878906, 50.10181427001953, 52.20206832885742, 54.30231857299805, 56.40257263183594, 58.50282287597656, 60.60307312011719, 62.70332717895508, 64.80358123779297, 66.9038314819336, 69.00408172607422]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 12.0, 15.0, 23.0, 32.0, 49.0, 64.0, 105.0, 151.0, 226.0, 308.0, 422.0, 636.0, 892.0, 1279.0, 1779.0, 2492.0, 3679.0, 5357.0, 7838.0, 11738.0, 17663.0, 27398.0, 45141.0, 81802.0, 203771.0, 686652.0, 1550811.0, 1000163.0, 298539.0, 103822.0, 51698.0, 30536.0, 19726.0, 12821.0, 8385.0, 5800.0, 3961.0, 2642.0, 1883.0, 1195.0, 863.0, 643.0, 422.0, 263.0, 205.0, 137.0, 91.0, 59.0, 40.0, 22.0, 16.0, 9.0, 7.0, 3.0, 2.0, 0.0, 1.0], "bins": [-69.875, -67.79931640625, -65.7236328125, -63.64794921875, -61.572265625, -59.49658203125, -57.4208984375, -55.34521484375, -53.26953125, -51.19384765625, -49.1181640625, -47.04248046875, -44.966796875, -42.89111328125, -40.8154296875, -38.73974609375, -36.6640625, -34.58837890625, -32.5126953125, -30.43701171875, -28.361328125, -26.28564453125, -24.2099609375, -22.13427734375, -20.05859375, -17.98291015625, -15.9072265625, -13.83154296875, -11.755859375, -9.68017578125, -7.6044921875, -5.52880859375, -3.453125, -1.37744140625, 0.6982421875, 2.77392578125, 4.849609375, 6.92529296875, 9.0009765625, 11.07666015625, 13.15234375, 15.22802734375, 17.3037109375, 19.37939453125, 21.455078125, 23.53076171875, 25.6064453125, 27.68212890625, 29.7578125, 31.83349609375, 33.9091796875, 35.98486328125, 38.060546875, 40.13623046875, 42.2119140625, 44.28759765625, 46.36328125, 48.43896484375, 50.5146484375, 52.59033203125, 54.666015625, 56.74169921875, 58.8173828125, 60.89306640625, 62.96875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 6.0, 4.0, 7.0, 11.0, 7.0, 6.0, 10.0, 14.0, 24.0, 21.0, 24.0, 13.0, 22.0, 30.0, 32.0, 36.0, 29.0, 36.0, 32.0, 45.0, 41.0, 35.0, 43.0, 34.0, 39.0, 35.0, 36.0, 35.0, 25.0, 31.0, 23.0, 36.0, 27.0, 20.0, 17.0, 9.0, 24.0, 13.0, 13.0, 7.0, 15.0, 2.0, 7.0, 6.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-39.75, -38.55615234375, -37.3623046875, -36.16845703125, -34.974609375, -33.78076171875, -32.5869140625, -31.39306640625, -30.19921875, -29.00537109375, -27.8115234375, -26.61767578125, -25.423828125, -24.22998046875, -23.0361328125, -21.84228515625, -20.6484375, -19.45458984375, -18.2607421875, -17.06689453125, -15.873046875, -14.67919921875, -13.4853515625, -12.29150390625, -11.09765625, -9.90380859375, -8.7099609375, -7.51611328125, -6.322265625, -5.12841796875, -3.9345703125, -2.74072265625, -1.546875, -0.35302734375, 0.8408203125, 2.03466796875, 3.228515625, 4.42236328125, 5.6162109375, 6.81005859375, 8.00390625, 9.19775390625, 10.3916015625, 11.58544921875, 12.779296875, 13.97314453125, 15.1669921875, 16.36083984375, 17.5546875, 18.74853515625, 19.9423828125, 21.13623046875, 22.330078125, 23.52392578125, 24.7177734375, 25.91162109375, 27.10546875, 28.29931640625, 29.4931640625, 30.68701171875, 31.880859375, 33.07470703125, 34.2685546875, 35.46240234375, 36.65625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 5.0, 10.0, 8.0, 16.0, 27.0, 49.0, 90.0, 119.0, 189.0, 287.0, 426.0, 675.0, 1046.0, 1531.0, 2333.0, 3536.0, 5214.0, 7616.0, 11134.0, 16317.0, 23357.0, 34938.0, 52367.0, 80743.0, 128363.0, 212063.0, 389567.0, 1034058.0, 1156869.0, 419814.0, 223815.0, 134938.0, 84887.0, 54545.0, 36316.0, 24494.0, 16800.0, 11559.0, 8076.0, 5374.0, 3575.0, 2425.0, 1654.0, 1066.0, 693.0, 475.0, 305.0, 192.0, 121.0, 74.0, 43.0, 38.0, 25.0, 10.0, 10.0, 9.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-56.21875, -54.408203125, -52.59765625, -50.787109375, -48.9765625, -47.166015625, -45.35546875, -43.544921875, -41.734375, -39.923828125, -38.11328125, -36.302734375, -34.4921875, -32.681640625, -30.87109375, -29.060546875, -27.25, -25.439453125, -23.62890625, -21.818359375, -20.0078125, -18.197265625, -16.38671875, -14.576171875, -12.765625, -10.955078125, -9.14453125, -7.333984375, -5.5234375, -3.712890625, -1.90234375, -0.091796875, 1.71875, 3.529296875, 5.33984375, 7.150390625, 8.9609375, 10.771484375, 12.58203125, 14.392578125, 16.203125, 18.013671875, 19.82421875, 21.634765625, 23.4453125, 25.255859375, 27.06640625, 28.876953125, 30.6875, 32.498046875, 34.30859375, 36.119140625, 37.9296875, 39.740234375, 41.55078125, 43.361328125, 45.171875, 46.982421875, 48.79296875, 50.603515625, 52.4140625, 54.224609375, 56.03515625, 57.845703125, 59.65625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 8.0, 5.0, 8.0, 6.0, 16.0, 11.0, 19.0, 19.0, 20.0, 25.0, 42.0, 47.0, 58.0, 79.0, 91.0, 123.0, 146.0, 162.0, 254.0, 398.0, 589.0, 556.0, 317.0, 233.0, 166.0, 127.0, 101.0, 106.0, 63.0, 53.0, 37.0, 32.0, 36.0, 24.0, 24.0, 21.0, 12.0, 8.0, 9.0, 8.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.234375, -28.37109375, -27.5078125, -26.64453125, -25.78125, -24.91796875, -24.0546875, -23.19140625, -22.328125, -21.46484375, -20.6015625, -19.73828125, -18.875, -18.01171875, -17.1484375, -16.28515625, -15.421875, -14.55859375, -13.6953125, -12.83203125, -11.96875, -11.10546875, -10.2421875, -9.37890625, -8.515625, -7.65234375, -6.7890625, -5.92578125, -5.0625, -4.19921875, -3.3359375, -2.47265625, -1.609375, -0.74609375, 0.1171875, 0.98046875, 1.84375, 2.70703125, 3.5703125, 4.43359375, 5.296875, 6.16015625, 7.0234375, 7.88671875, 8.75, 9.61328125, 10.4765625, 11.33984375, 12.203125, 13.06640625, 13.9296875, 14.79296875, 15.65625, 16.51953125, 17.3828125, 18.24609375, 19.109375, 19.97265625, 20.8359375, 21.69921875, 22.5625, 23.42578125, 24.2890625, 25.15234375, 26.015625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 7.0, 2.0, 4.0, 4.0, 9.0, 12.0, 11.0, 15.0, 26.0, 14.0, 18.0, 25.0, 45.0, 35.0, 59.0, 54.0, 67.0, 58.0, 51.0, 67.0, 70.0, 43.0, 41.0, 37.0, 34.0, 30.0, 20.0, 23.0, 18.0, 15.0, 10.0, 14.0, 7.0, 7.0, 0.0, 8.0, 12.0, 4.0, 7.0, 4.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-53.91518020629883, -52.30253982543945, -50.689903259277344, -49.07726287841797, -47.464622497558594, -45.851985931396484, -44.23934555053711, -42.626708984375, -41.014068603515625, -39.40142822265625, -37.78879165649414, -36.176151275634766, -34.56351089477539, -32.95087432861328, -31.338233947753906, -29.725595474243164, -28.11295509338379, -26.500316619873047, -24.887676239013672, -23.27503776550293, -21.662399291992188, -20.049758911132812, -18.43712043762207, -16.824481964111328, -15.21184253692627, -13.599203109741211, -11.986564636230469, -10.37392520904541, -8.761285781860352, -7.148647308349609, -5.536007881164551, -3.9233694076538086, -2.31072998046875, -0.6980909109115601, 0.9145481586456299, 2.5271873474121094, 4.13982629776001, 5.75246524810791, 7.365104675292969, 8.977743148803711, 10.59038257598877, 12.203022003173828, 13.81566047668457, 15.428299903869629, 17.040939331054688, 18.65357780456543, 20.266216278076172, 21.878856658935547, 23.49149513244629, 25.10413360595703, 26.716773986816406, 28.32941246032715, 29.94205093383789, 31.554691314697266, 33.167327880859375, 34.77996826171875, 36.392608642578125, 38.0052490234375, 39.61788558959961, 41.230525970458984, 42.84316635131836, 44.45580291748047, 46.068443298339844, 47.68108367919922, 49.29372024536133]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 0.0, 8.0, 3.0, 5.0, 4.0, 7.0, 7.0, 5.0, 3.0, 9.0, 13.0, 7.0, 9.0, 21.0, 18.0, 18.0, 29.0, 15.0, 13.0, 28.0, 24.0, 29.0, 31.0, 31.0, 31.0, 41.0, 34.0, 32.0, 47.0, 35.0, 29.0, 37.0, 31.0, 53.0, 29.0, 32.0, 26.0, 26.0, 27.0, 13.0, 18.0, 12.0, 17.0, 14.0, 13.0, 12.0, 16.0, 11.0, 9.0, 7.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-40.18162536621094, -38.9515380859375, -37.7214469909668, -36.49135971069336, -35.261268615722656, -34.03118133544922, -32.80109405517578, -31.57100486755371, -30.34091567993164, -29.11082649230957, -27.8807373046875, -26.650650024414062, -25.420560836791992, -24.190471649169922, -22.960384368896484, -21.730295181274414, -20.500205993652344, -19.270116806030273, -18.040027618408203, -16.809940338134766, -15.579851150512695, -14.349761962890625, -13.119673728942871, -11.889585494995117, -10.659496307373047, -9.429407119750977, -8.199318885803223, -6.9692301750183105, -5.739141464233398, -4.509052753448486, -3.278964042663574, -2.0488758087158203, -0.8187828063964844, 0.41130590438842773, 1.6413946151733398, 2.871483325958252, 4.101572036743164, 5.331660747528076, 6.561749458312988, 7.791837692260742, 9.021926879882812, 10.252016067504883, 11.482104301452637, 12.71219253540039, 13.942281723022461, 15.172370910644531, 16.40245819091797, 17.63254737854004, 18.86263656616211, 20.09272575378418, 21.32281494140625, 22.552902221679688, 23.782991409301758, 25.013080596923828, 26.243167877197266, 27.473257064819336, 28.703346252441406, 29.933435440063477, 31.163524627685547, 32.393611907958984, 33.62370300292969, 34.853790283203125, 36.08387756347656, 37.31396484375, 38.5440559387207]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 5.0, 5.0, 3.0, 11.0, 11.0, 22.0, 43.0, 63.0, 97.0, 155.0, 211.0, 308.0, 459.0, 657.0, 917.0, 1258.0, 1843.0, 2557.0, 3674.0, 5141.0, 7535.0, 10453.0, 14451.0, 21587.0, 31162.0, 46514.0, 70297.0, 115298.0, 266829.0, 170461.0, 91510.0, 58444.0, 38812.0, 26547.0, 18617.0, 12620.0, 8729.0, 6111.0, 4400.0, 3194.0, 2418.0, 1644.0, 1154.0, 742.0, 501.0, 354.0, 234.0, 146.0, 116.0, 94.0, 55.0, 36.0, 24.0, 14.0, 12.0, 4.0, 3.0, 7.0, 1.0, 1.0, 1.0], "bins": [-25.078125, -24.2890625, -23.5, -22.7109375, -21.921875, -21.1328125, -20.34375, -19.5546875, -18.765625, -17.9765625, -17.1875, -16.3984375, -15.609375, -14.8203125, -14.03125, -13.2421875, -12.453125, -11.6640625, -10.875, -10.0859375, -9.296875, -8.5078125, -7.71875, -6.9296875, -6.140625, -5.3515625, -4.5625, -3.7734375, -2.984375, -2.1953125, -1.40625, -0.6171875, 0.171875, 0.9609375, 1.75, 2.5390625, 3.328125, 4.1171875, 4.90625, 5.6953125, 6.484375, 7.2734375, 8.0625, 8.8515625, 9.640625, 10.4296875, 11.21875, 12.0078125, 12.796875, 13.5859375, 14.375, 15.1640625, 15.953125, 16.7421875, 17.53125, 18.3203125, 19.109375, 19.8984375, 20.6875, 21.4765625, 22.265625, 23.0546875, 23.84375, 24.6328125, 25.421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 3.0, 6.0, 5.0, 7.0, 8.0, 5.0, 6.0, 5.0, 7.0, 9.0, 14.0, 15.0, 16.0, 21.0, 11.0, 33.0, 31.0, 17.0, 31.0, 22.0, 26.0, 39.0, 39.0, 42.0, 32.0, 42.0, 35.0, 36.0, 34.0, 27.0, 34.0, 31.0, 27.0, 40.0, 32.0, 28.0, 26.0, 28.0, 19.0, 11.0, 14.0, 12.0, 7.0, 14.0, 15.0, 7.0, 10.0, 5.0, 6.0, 7.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-36.28125, -35.16259765625, -34.0439453125, -32.92529296875, -31.806640625, -30.68798828125, -29.5693359375, -28.45068359375, -27.33203125, -26.21337890625, -25.0947265625, -23.97607421875, -22.857421875, -21.73876953125, -20.6201171875, -19.50146484375, -18.3828125, -17.26416015625, -16.1455078125, -15.02685546875, -13.908203125, -12.78955078125, -11.6708984375, -10.55224609375, -9.43359375, -8.31494140625, -7.1962890625, -6.07763671875, -4.958984375, -3.84033203125, -2.7216796875, -1.60302734375, -0.484375, 0.63427734375, 1.7529296875, 2.87158203125, 3.990234375, 5.10888671875, 6.2275390625, 7.34619140625, 8.46484375, 9.58349609375, 10.7021484375, 11.82080078125, 12.939453125, 14.05810546875, 15.1767578125, 16.29541015625, 17.4140625, 18.53271484375, 19.6513671875, 20.77001953125, 21.888671875, 23.00732421875, 24.1259765625, 25.24462890625, 26.36328125, 27.48193359375, 28.6005859375, 29.71923828125, 30.837890625, 31.95654296875, 33.0751953125, 34.19384765625, 35.3125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 8.0, 12.0, 10.0, 18.0, 26.0, 24.0, 52.0, 74.0, 102.0, 159.0, 250.0, 343.0, 503.0, 820.0, 1300.0, 1976.0, 2887.0, 4558.0, 7154.0, 11757.0, 18660.0, 30145.0, 49916.0, 84649.0, 171776.0, 342924.0, 133517.0, 71829.0, 42556.0, 26396.0, 16384.0, 10075.0, 6295.0, 3911.0, 2596.0, 1641.0, 1147.0, 697.0, 455.0, 305.0, 200.0, 145.0, 97.0, 72.0, 43.0, 39.0, 18.0, 13.0, 11.0, 5.0, 2.0, 6.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.53125, -18.84228515625, -18.1533203125, -17.46435546875, -16.775390625, -16.08642578125, -15.3974609375, -14.70849609375, -14.01953125, -13.33056640625, -12.6416015625, -11.95263671875, -11.263671875, -10.57470703125, -9.8857421875, -9.19677734375, -8.5078125, -7.81884765625, -7.1298828125, -6.44091796875, -5.751953125, -5.06298828125, -4.3740234375, -3.68505859375, -2.99609375, -2.30712890625, -1.6181640625, -0.92919921875, -0.240234375, 0.44873046875, 1.1376953125, 1.82666015625, 2.515625, 3.20458984375, 3.8935546875, 4.58251953125, 5.271484375, 5.96044921875, 6.6494140625, 7.33837890625, 8.02734375, 8.71630859375, 9.4052734375, 10.09423828125, 10.783203125, 11.47216796875, 12.1611328125, 12.85009765625, 13.5390625, 14.22802734375, 14.9169921875, 15.60595703125, 16.294921875, 16.98388671875, 17.6728515625, 18.36181640625, 19.05078125, 19.73974609375, 20.4287109375, 21.11767578125, 21.806640625, 22.49560546875, 23.1845703125, 23.87353515625, 24.5625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 19.0, 17.0, 10.0, 21.0, 13.0, 25.0, 24.0, 34.0, 35.0, 43.0, 46.0, 31.0, 35.0, 48.0, 48.0, 35.0, 30.0, 40.0, 41.0, 31.0, 42.0, 26.0, 39.0, 35.0, 29.0, 27.0, 24.0, 27.0, 16.0, 16.0, 20.0, 15.0, 10.0, 11.0, 4.0, 6.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.46875, -23.605712890625, -22.74267578125, -21.879638671875, -21.0166015625, -20.153564453125, -19.29052734375, -18.427490234375, -17.564453125, -16.701416015625, -15.83837890625, -14.975341796875, -14.1123046875, -13.249267578125, -12.38623046875, -11.523193359375, -10.66015625, -9.797119140625, -8.93408203125, -8.071044921875, -7.2080078125, -6.344970703125, -5.48193359375, -4.618896484375, -3.755859375, -2.892822265625, -2.02978515625, -1.166748046875, -0.3037109375, 0.559326171875, 1.42236328125, 2.285400390625, 3.1484375, 4.011474609375, 4.87451171875, 5.737548828125, 6.6005859375, 7.463623046875, 8.32666015625, 9.189697265625, 10.052734375, 10.915771484375, 11.77880859375, 12.641845703125, 13.5048828125, 14.367919921875, 15.23095703125, 16.093994140625, 16.95703125, 17.820068359375, 18.68310546875, 19.546142578125, 20.4091796875, 21.272216796875, 22.13525390625, 22.998291015625, 23.861328125, 24.724365234375, 25.58740234375, 26.450439453125, 27.3134765625, 28.176513671875, 29.03955078125, 29.902587890625, 30.765625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 7.0, 9.0, 8.0, 14.0, 21.0, 34.0, 68.0, 80.0, 107.0, 173.0, 229.0, 327.0, 466.0, 607.0, 872.0, 1255.0, 1728.0, 2628.0, 3835.0, 6043.0, 9272.0, 14634.0, 23900.0, 40460.0, 72990.0, 148295.0, 320208.0, 189774.0, 87332.0, 47767.0, 27635.0, 16597.0, 10428.0, 6728.0, 4354.0, 2946.0, 2047.0, 1332.0, 905.0, 714.0, 500.0, 397.0, 240.0, 192.0, 129.0, 75.0, 62.0, 52.0, 31.0, 19.0, 17.0, 8.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.080078125, -0.07769775390625, -0.0753173828125, -0.07293701171875, -0.070556640625, -0.06817626953125, -0.0657958984375, -0.06341552734375, -0.06103515625, -0.05865478515625, -0.0562744140625, -0.05389404296875, -0.051513671875, -0.04913330078125, -0.0467529296875, -0.04437255859375, -0.0419921875, -0.03961181640625, -0.0372314453125, -0.03485107421875, -0.032470703125, -0.03009033203125, -0.0277099609375, -0.02532958984375, -0.02294921875, -0.02056884765625, -0.0181884765625, -0.01580810546875, -0.013427734375, -0.01104736328125, -0.0086669921875, -0.00628662109375, -0.00390625, -0.00152587890625, 0.0008544921875, 0.00323486328125, 0.005615234375, 0.00799560546875, 0.0103759765625, 0.01275634765625, 0.01513671875, 0.01751708984375, 0.0198974609375, 0.02227783203125, 0.024658203125, 0.02703857421875, 0.0294189453125, 0.03179931640625, 0.0341796875, 0.03656005859375, 0.0389404296875, 0.04132080078125, 0.043701171875, 0.04608154296875, 0.0484619140625, 0.05084228515625, 0.05322265625, 0.05560302734375, 0.0579833984375, 0.06036376953125, 0.062744140625, 0.06512451171875, 0.0675048828125, 0.06988525390625, 0.072265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 5.0, 6.0, 4.0, 5.0, 9.0, 8.0, 5.0, 7.0, 11.0, 22.0, 17.0, 16.0, 25.0, 41.0, 28.0, 45.0, 56.0, 62.0, 82.0, 79.0, 81.0, 70.0, 41.0, 54.0, 28.0, 30.0, 33.0, 26.0, 16.0, 14.0, 19.0, 4.0, 9.0, 10.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.920099258422852e-05, -6.685778498649597e-05, -6.451457738876343e-05, -6.217136979103088e-05, -5.982816219329834e-05, -5.7484954595565796e-05, -5.514174699783325e-05, -5.279853940010071e-05, -5.0455331802368164e-05, -4.811212420463562e-05, -4.5768916606903076e-05, -4.342570900917053e-05, -4.108250141143799e-05, -3.8739293813705444e-05, -3.63960862159729e-05, -3.4052878618240356e-05, -3.170967102050781e-05, -2.936646342277527e-05, -2.7023255825042725e-05, -2.468004822731018e-05, -2.2336840629577637e-05, -1.9993633031845093e-05, -1.765042543411255e-05, -1.5307217836380005e-05, -1.2964010238647461e-05, -1.0620802640914917e-05, -8.277595043182373e-06, -5.934387445449829e-06, -3.591179847717285e-06, -1.2479722499847412e-06, 1.0952353477478027e-06, 3.4384429454803467e-06, 5.781650543212891e-06, 8.124858140945435e-06, 1.0468065738677979e-05, 1.2811273336410522e-05, 1.5154480934143066e-05, 1.749768853187561e-05, 1.9840896129608154e-05, 2.2184103727340698e-05, 2.4527311325073242e-05, 2.6870518922805786e-05, 2.921372652053833e-05, 3.1556934118270874e-05, 3.390014171600342e-05, 3.624334931373596e-05, 3.8586556911468506e-05, 4.092976450920105e-05, 4.3272972106933594e-05, 4.561617970466614e-05, 4.795938730239868e-05, 5.0302594900131226e-05, 5.264580249786377e-05, 5.4989010095596313e-05, 5.733221769332886e-05, 5.96754252910614e-05, 6.201863288879395e-05, 6.436184048652649e-05, 6.670504808425903e-05, 6.904825568199158e-05, 7.139146327972412e-05, 7.373467087745667e-05, 7.607787847518921e-05, 7.842108607292175e-05, 8.07642936706543e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 10.0, 12.0, 16.0, 22.0, 33.0, 37.0, 51.0, 78.0, 116.0, 186.0, 265.0, 399.0, 609.0, 992.0, 1610.0, 2618.0, 4321.0, 6820.0, 10657.0, 16319.0, 25078.0, 38421.0, 60731.0, 96539.0, 150385.0, 206974.0, 153305.0, 98797.0, 62159.0, 39136.0, 25570.0, 16599.0, 10914.0, 6986.0, 4380.0, 2859.0, 1651.0, 1032.0, 592.0, 403.0, 250.0, 162.0, 130.0, 94.0, 70.0, 45.0, 35.0, 27.0, 17.0, 12.0, 10.0, 11.0, 2.0, 4.0, 2.0, 0.0, 3.0], "bins": [-0.0633544921875, -0.061406612396240234, -0.05945873260498047, -0.0575108528137207, -0.05556297302246094, -0.05361509323120117, -0.051667213439941406, -0.04971933364868164, -0.047771453857421875, -0.04582357406616211, -0.043875694274902344, -0.04192781448364258, -0.03997993469238281, -0.03803205490112305, -0.03608417510986328, -0.034136295318603516, -0.03218841552734375, -0.030240535736083984, -0.02829265594482422, -0.026344776153564453, -0.024396896362304688, -0.022449016571044922, -0.020501136779785156, -0.01855325698852539, -0.016605377197265625, -0.01465749740600586, -0.012709617614746094, -0.010761737823486328, -0.008813858032226562, -0.006865978240966797, -0.004918098449707031, -0.0029702186584472656, -0.0010223388671875, 0.0009255409240722656, 0.0028734207153320312, 0.004821300506591797, 0.0067691802978515625, 0.008717060089111328, 0.010664939880371094, 0.01261281967163086, 0.014560699462890625, 0.01650857925415039, 0.018456459045410156, 0.020404338836669922, 0.022352218627929688, 0.024300098419189453, 0.02624797821044922, 0.028195858001708984, 0.03014373779296875, 0.032091617584228516, 0.03403949737548828, 0.03598737716674805, 0.03793525695800781, 0.03988313674926758, 0.041831016540527344, 0.04377889633178711, 0.045726776123046875, 0.04767465591430664, 0.049622535705566406, 0.05157041549682617, 0.05351829528808594, 0.0554661750793457, 0.05741405487060547, 0.059361934661865234, 0.061309814453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 5.0, 3.0, 8.0, 8.0, 7.0, 5.0, 11.0, 9.0, 18.0, 18.0, 23.0, 17.0, 27.0, 20.0, 27.0, 26.0, 44.0, 41.0, 47.0, 32.0, 43.0, 49.0, 43.0, 41.0, 39.0, 34.0, 34.0, 40.0, 43.0, 37.0, 35.0, 20.0, 11.0, 19.0, 22.0, 11.0, 21.0, 5.0, 14.0, 13.0, 5.0, 2.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0215606689453125, -0.020953655242919922, -0.020346641540527344, -0.019739627838134766, -0.019132614135742188, -0.01852560043334961, -0.01791858673095703, -0.017311573028564453, -0.016704559326171875, -0.016097545623779297, -0.015490531921386719, -0.01488351821899414, -0.014276504516601562, -0.013669490814208984, -0.013062477111816406, -0.012455463409423828, -0.01184844970703125, -0.011241436004638672, -0.010634422302246094, -0.010027408599853516, -0.009420394897460938, -0.00881338119506836, -0.008206367492675781, -0.007599353790283203, -0.006992340087890625, -0.006385326385498047, -0.005778312683105469, -0.005171298980712891, -0.0045642852783203125, -0.003957271575927734, -0.0033502578735351562, -0.002743244171142578, -0.00213623046875, -0.0015292167663574219, -0.0009222030639648438, -0.0003151893615722656, 0.0002918243408203125, 0.0008988380432128906, 0.0015058517456054688, 0.002112865447998047, 0.002719879150390625, 0.003326892852783203, 0.003933906555175781, 0.004540920257568359, 0.0051479339599609375, 0.005754947662353516, 0.006361961364746094, 0.006968975067138672, 0.00757598876953125, 0.008183002471923828, 0.008790016174316406, 0.009397029876708984, 0.010004043579101562, 0.01061105728149414, 0.011218070983886719, 0.011825084686279297, 0.012432098388671875, 0.013039112091064453, 0.013646125793457031, 0.01425313949584961, 0.014860153198242188, 0.015467166900634766, 0.016074180603027344, 0.016681194305419922, 0.0172882080078125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 4.0, 7.0, 5.0, 5.0, 5.0, 2.0, 14.0, 6.0, 19.0, 22.0, 13.0, 14.0, 23.0, 37.0, 34.0, 48.0, 64.0, 62.0, 60.0, 44.0, 61.0, 67.0, 73.0, 35.0, 35.0, 37.0, 32.0, 24.0, 22.0, 20.0, 20.0, 13.0, 5.0, 14.0, 7.0, 7.0, 7.0, 6.0, 8.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-49.26988983154297, -47.9041748046875, -46.5384635925293, -45.17274856567383, -43.807037353515625, -42.441322326660156, -41.07560729980469, -39.709896087646484, -38.34418487548828, -36.97846984863281, -35.61275863647461, -34.24704360961914, -32.88133239746094, -31.51561737060547, -30.149904251098633, -28.784191131591797, -27.418476104736328, -26.052762985229492, -24.687049865722656, -23.321334838867188, -21.955623626708984, -20.589908599853516, -19.22419548034668, -17.858482360839844, -16.492769241333008, -15.127056121826172, -13.761343002319336, -12.395628929138184, -11.029915809631348, -9.664202690124512, -8.29848861694336, -6.932775497436523, -5.5670623779296875, -4.201349258422852, -2.8356356620788574, -1.4699220657348633, -0.10420894622802734, 1.2615041732788086, 2.627218246459961, 3.992931365966797, 5.358644485473633, 6.724357604980469, 8.090070724487305, 9.455784797668457, 10.821497917175293, 12.187211036682129, 13.552925109863281, 14.918638229370117, 16.284351348876953, 17.65006446838379, 19.015777587890625, 20.381492614746094, 21.747203826904297, 23.112918853759766, 24.4786319732666, 25.844345092773438, 27.210058212280273, 28.57577133178711, 29.941484451293945, 31.30719757080078, 32.67291259765625, 34.03862380981445, 35.40433883666992, 36.770050048828125, 38.135765075683594]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 4.0, 7.0, 7.0, 5.0, 5.0, 7.0, 11.0, 8.0, 11.0, 21.0, 18.0, 16.0, 29.0, 15.0, 14.0, 24.0, 24.0, 33.0, 26.0, 35.0, 34.0, 39.0, 36.0, 31.0, 41.0, 37.0, 31.0, 38.0, 30.0, 49.0, 35.0, 27.0, 29.0, 27.0, 25.0, 15.0, 17.0, 12.0, 16.0, 16.0, 13.0, 13.0, 15.0, 13.0, 6.0, 8.0, 6.0, 7.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-34.36526107788086, -33.30716323852539, -32.24906539916992, -31.19096565246582, -30.13286781311035, -29.074769973754883, -28.01667022705078, -26.958572387695312, -25.900474548339844, -24.842376708984375, -23.784278869628906, -22.726179122924805, -21.668081283569336, -20.609983444213867, -19.551883697509766, -18.493785858154297, -17.435688018798828, -16.37759017944336, -15.319491386413574, -14.261392593383789, -13.20329475402832, -12.145196914672852, -11.087098121643066, -10.028999328613281, -8.970901489257812, -7.9128031730651855, -6.854704856872559, -5.796606540679932, -4.738508224487305, -3.6804099082946777, -2.622311592102051, -1.5642132759094238, -0.5061187744140625, 0.5519795417785645, 1.6100778579711914, 2.6681761741638184, 3.7262744903564453, 4.784372806549072, 5.842471122741699, 6.900569438934326, 7.958667755126953, 9.016765594482422, 10.074864387512207, 11.132963180541992, 12.191061019897461, 13.24915885925293, 14.307257652282715, 15.3653564453125, 16.42345428466797, 17.481552124023438, 18.539649963378906, 19.597749710083008, 20.655847549438477, 21.713945388793945, 22.772045135498047, 23.830142974853516, 24.888240814208984, 25.946338653564453, 27.004436492919922, 28.062536239624023, 29.120634078979492, 30.17873191833496, 31.236831665039062, 32.29492950439453, 33.35302734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 13.0, 19.0, 26.0, 45.0, 54.0, 106.0, 137.0, 205.0, 384.0, 600.0, 863.0, 1288.0, 1924.0, 3063.0, 4646.0, 7053.0, 10925.0, 17230.0, 27527.0, 45048.0, 77165.0, 143014.0, 243478.0, 200688.0, 106118.0, 59690.0, 35358.0, 22340.0, 13826.0, 8952.0, 5881.0, 3778.0, 2464.0, 1627.0, 1064.0, 697.0, 448.0, 289.0, 200.0, 109.0, 79.0, 50.0, 35.0, 16.0, 21.0, 9.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.125, -66.0458984375, -63.966796875, -61.8876953125, -59.80859375, -57.7294921875, -55.650390625, -53.5712890625, -51.4921875, -49.4130859375, -47.333984375, -45.2548828125, -43.17578125, -41.0966796875, -39.017578125, -36.9384765625, -34.859375, -32.7802734375, -30.701171875, -28.6220703125, -26.54296875, -24.4638671875, -22.384765625, -20.3056640625, -18.2265625, -16.1474609375, -14.068359375, -11.9892578125, -9.91015625, -7.8310546875, -5.751953125, -3.6728515625, -1.59375, 0.4853515625, 2.564453125, 4.6435546875, 6.72265625, 8.8017578125, 10.880859375, 12.9599609375, 15.0390625, 17.1181640625, 19.197265625, 21.2763671875, 23.35546875, 25.4345703125, 27.513671875, 29.5927734375, 31.671875, 33.7509765625, 35.830078125, 37.9091796875, 39.98828125, 42.0673828125, 44.146484375, 46.2255859375, 48.3046875, 50.3837890625, 52.462890625, 54.5419921875, 56.62109375, 58.7001953125, 60.779296875, 62.8583984375, 64.9375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 9.0, 10.0, 6.0, 13.0, 6.0, 6.0, 13.0, 23.0, 15.0, 18.0, 22.0, 26.0, 26.0, 22.0, 31.0, 34.0, 34.0, 27.0, 33.0, 38.0, 42.0, 50.0, 43.0, 42.0, 36.0, 31.0, 31.0, 36.0, 35.0, 33.0, 35.0, 22.0, 24.0, 22.0, 16.0, 8.0, 13.0, 14.0, 12.0, 8.0, 12.0, 3.0, 4.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.078125, -29.155029296875, -28.23193359375, -27.308837890625, -26.3857421875, -25.462646484375, -24.53955078125, -23.616455078125, -22.693359375, -21.770263671875, -20.84716796875, -19.924072265625, -19.0009765625, -18.077880859375, -17.15478515625, -16.231689453125, -15.30859375, -14.385498046875, -13.46240234375, -12.539306640625, -11.6162109375, -10.693115234375, -9.77001953125, -8.846923828125, -7.923828125, -7.000732421875, -6.07763671875, -5.154541015625, -4.2314453125, -3.308349609375, -2.38525390625, -1.462158203125, -0.5390625, 0.384033203125, 1.30712890625, 2.230224609375, 3.1533203125, 4.076416015625, 4.99951171875, 5.922607421875, 6.845703125, 7.768798828125, 8.69189453125, 9.614990234375, 10.5380859375, 11.461181640625, 12.38427734375, 13.307373046875, 14.23046875, 15.153564453125, 16.07666015625, 16.999755859375, 17.9228515625, 18.845947265625, 19.76904296875, 20.692138671875, 21.615234375, 22.538330078125, 23.46142578125, 24.384521484375, 25.3076171875, 26.230712890625, 27.15380859375, 28.076904296875, 29.0]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 7.0, 6.0, 8.0, 12.0, 17.0, 41.0, 37.0, 73.0, 110.0, 179.0, 259.0, 381.0, 628.0, 880.0, 1408.0, 2260.0, 3521.0, 5575.0, 8510.0, 12945.0, 18906.0, 28029.0, 40725.0, 58134.0, 82700.0, 116758.0, 147506.0, 145816.0, 113922.0, 80639.0, 57114.0, 39737.0, 27325.0, 18666.0, 12446.0, 8291.0, 5408.0, 3381.0, 2257.0, 1385.0, 906.0, 575.0, 382.0, 249.0, 161.0, 122.0, 65.0, 43.0, 24.0, 11.0, 12.0, 10.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.0, -42.53173828125, -41.0634765625, -39.59521484375, -38.126953125, -36.65869140625, -35.1904296875, -33.72216796875, -32.25390625, -30.78564453125, -29.3173828125, -27.84912109375, -26.380859375, -24.91259765625, -23.4443359375, -21.97607421875, -20.5078125, -19.03955078125, -17.5712890625, -16.10302734375, -14.634765625, -13.16650390625, -11.6982421875, -10.22998046875, -8.76171875, -7.29345703125, -5.8251953125, -4.35693359375, -2.888671875, -1.42041015625, 0.0478515625, 1.51611328125, 2.984375, 4.45263671875, 5.9208984375, 7.38916015625, 8.857421875, 10.32568359375, 11.7939453125, 13.26220703125, 14.73046875, 16.19873046875, 17.6669921875, 19.13525390625, 20.603515625, 22.07177734375, 23.5400390625, 25.00830078125, 26.4765625, 27.94482421875, 29.4130859375, 30.88134765625, 32.349609375, 33.81787109375, 35.2861328125, 36.75439453125, 38.22265625, 39.69091796875, 41.1591796875, 42.62744140625, 44.095703125, 45.56396484375, 47.0322265625, 48.50048828125, 49.96875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 8.0, 6.0, 10.0, 15.0, 14.0, 16.0, 19.0, 26.0, 23.0, 33.0, 23.0, 37.0, 32.0, 31.0, 38.0, 31.0, 34.0, 40.0, 38.0, 36.0, 34.0, 46.0, 45.0, 41.0, 36.0, 36.0, 26.0, 29.0, 34.0, 23.0, 23.0, 15.0, 22.0, 23.0, 15.0, 5.0, 8.0, 8.0, 3.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.109375, -16.50830078125, -15.9072265625, -15.30615234375, -14.705078125, -14.10400390625, -13.5029296875, -12.90185546875, -12.30078125, -11.69970703125, -11.0986328125, -10.49755859375, -9.896484375, -9.29541015625, -8.6943359375, -8.09326171875, -7.4921875, -6.89111328125, -6.2900390625, -5.68896484375, -5.087890625, -4.48681640625, -3.8857421875, -3.28466796875, -2.68359375, -2.08251953125, -1.4814453125, -0.88037109375, -0.279296875, 0.32177734375, 0.9228515625, 1.52392578125, 2.125, 2.72607421875, 3.3271484375, 3.92822265625, 4.529296875, 5.13037109375, 5.7314453125, 6.33251953125, 6.93359375, 7.53466796875, 8.1357421875, 8.73681640625, 9.337890625, 9.93896484375, 10.5400390625, 11.14111328125, 11.7421875, 12.34326171875, 12.9443359375, 13.54541015625, 14.146484375, 14.74755859375, 15.3486328125, 15.94970703125, 16.55078125, 17.15185546875, 17.7529296875, 18.35400390625, 18.955078125, 19.55615234375, 20.1572265625, 20.75830078125, 21.359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 11.0, 13.0, 20.0, 24.0, 48.0, 74.0, 71.0, 118.0, 179.0, 212.0, 305.0, 410.0, 604.0, 835.0, 1140.0, 1709.0, 2540.0, 3960.0, 6227.0, 10394.0, 18196.0, 34227.0, 72576.0, 206676.0, 413867.0, 146770.0, 58052.0, 28394.0, 15433.0, 8889.0, 5532.0, 3481.0, 2227.0, 1573.0, 1141.0, 776.0, 504.0, 399.0, 256.0, 206.0, 151.0, 110.0, 66.0, 45.0, 36.0, 22.0, 20.0, 17.0, 6.0, 8.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0234375, -3.8951416015625, -3.766845703125, -3.6385498046875, -3.51025390625, -3.3819580078125, -3.253662109375, -3.1253662109375, -2.9970703125, -2.8687744140625, -2.740478515625, -2.6121826171875, -2.48388671875, -2.3555908203125, -2.227294921875, -2.0989990234375, -1.970703125, -1.8424072265625, -1.714111328125, -1.5858154296875, -1.45751953125, -1.3292236328125, -1.200927734375, -1.0726318359375, -0.9443359375, -0.8160400390625, -0.687744140625, -0.5594482421875, -0.43115234375, -0.3028564453125, -0.174560546875, -0.0462646484375, 0.08203125, 0.2103271484375, 0.338623046875, 0.4669189453125, 0.59521484375, 0.7235107421875, 0.851806640625, 0.9801025390625, 1.1083984375, 1.2366943359375, 1.364990234375, 1.4932861328125, 1.62158203125, 1.7498779296875, 1.878173828125, 2.0064697265625, 2.134765625, 2.2630615234375, 2.391357421875, 2.5196533203125, 2.64794921875, 2.7762451171875, 2.904541015625, 3.0328369140625, 3.1611328125, 3.2894287109375, 3.417724609375, 3.5460205078125, 3.67431640625, 3.8026123046875, 3.930908203125, 4.0592041015625, 4.1875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 8.0, 9.0, 5.0, 9.0, 13.0, 19.0, 20.0, 21.0, 35.0, 44.0, 58.0, 85.0, 117.0, 98.0, 117.0, 98.0, 61.0, 34.0, 38.0, 15.0, 28.0, 10.0, 17.0, 12.0, 7.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0005679130554199219, -0.0005479753017425537, -0.0005280375480651855, -0.0005080997943878174, -0.0004881620407104492, -0.00046822428703308105, -0.0004482865333557129, -0.0004283487796783447, -0.00040841102600097656, -0.0003884732723236084, -0.00036853551864624023, -0.00034859776496887207, -0.0003286600112915039, -0.00030872225761413574, -0.0002887845039367676, -0.0002688467502593994, -0.00024890899658203125, -0.00022897124290466309, -0.00020903348922729492, -0.00018909573554992676, -0.0001691579818725586, -0.00014922022819519043, -0.00012928247451782227, -0.0001093447208404541, -8.940696716308594e-05, -6.946921348571777e-05, -4.953145980834961e-05, -2.9593706130981445e-05, -9.655952453613281e-06, 1.0281801223754883e-05, 3.0219554901123047e-05, 5.015730857849121e-05, 7.009506225585938e-05, 9.003281593322754e-05, 0.0001099705696105957, 0.00012990832328796387, 0.00014984607696533203, 0.0001697838306427002, 0.00018972158432006836, 0.00020965933799743652, 0.0002295970916748047, 0.00024953484535217285, 0.000269472599029541, 0.0002894103527069092, 0.00030934810638427734, 0.0003292858600616455, 0.00034922361373901367, 0.00036916136741638184, 0.00038909912109375, 0.00040903687477111816, 0.00042897462844848633, 0.0004489123821258545, 0.00046885013580322266, 0.0004887878894805908, 0.000508725643157959, 0.0005286633968353271, 0.0005486011505126953, 0.0005685389041900635, 0.0005884766578674316, 0.0006084144115447998, 0.000628352165222168, 0.0006482899188995361, 0.0006682276725769043, 0.0006881654262542725, 0.0007081031799316406]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 0.0, 5.0, 4.0, 10.0, 10.0, 16.0, 36.0, 50.0, 49.0, 88.0, 124.0, 185.0, 267.0, 423.0, 590.0, 852.0, 1297.0, 1949.0, 2761.0, 4070.0, 6210.0, 9577.0, 15811.0, 28818.0, 54198.0, 111862.0, 255540.0, 284934.0, 127892.0, 61193.0, 31843.0, 17531.0, 10069.0, 6545.0, 4324.0, 2955.0, 2086.0, 1439.0, 967.0, 693.0, 431.0, 272.0, 201.0, 115.0, 93.0, 59.0, 37.0, 31.0, 16.0, 11.0, 4.0, 9.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.06640625, -2.9644775390625, -2.862548828125, -2.7606201171875, -2.65869140625, -2.5567626953125, -2.454833984375, -2.3529052734375, -2.2509765625, -2.1490478515625, -2.047119140625, -1.9451904296875, -1.84326171875, -1.7413330078125, -1.639404296875, -1.5374755859375, -1.435546875, -1.3336181640625, -1.231689453125, -1.1297607421875, -1.02783203125, -0.9259033203125, -0.823974609375, -0.7220458984375, -0.6201171875, -0.5181884765625, -0.416259765625, -0.3143310546875, -0.21240234375, -0.1104736328125, -0.008544921875, 0.0933837890625, 0.1953125, 0.2972412109375, 0.399169921875, 0.5010986328125, 0.60302734375, 0.7049560546875, 0.806884765625, 0.9088134765625, 1.0107421875, 1.1126708984375, 1.214599609375, 1.3165283203125, 1.41845703125, 1.5203857421875, 1.622314453125, 1.7242431640625, 1.826171875, 1.9281005859375, 2.030029296875, 2.1319580078125, 2.23388671875, 2.3358154296875, 2.437744140625, 2.5396728515625, 2.6416015625, 2.7435302734375, 2.845458984375, 2.9473876953125, 3.04931640625, 3.1512451171875, 3.253173828125, 3.3551025390625, 3.45703125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 6.0, 3.0, 6.0, 5.0, 6.0, 6.0, 7.0, 8.0, 16.0, 19.0, 36.0, 33.0, 49.0, 53.0, 78.0, 71.0, 71.0, 89.0, 82.0, 78.0, 63.0, 38.0, 31.0, 31.0, 25.0, 22.0, 15.0, 14.0, 9.0, 9.0, 4.0, 4.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0302734375, -0.99224853515625, -0.9542236328125, -0.91619873046875, -0.878173828125, -0.84014892578125, -0.8021240234375, -0.76409912109375, -0.72607421875, -0.68804931640625, -0.6500244140625, -0.61199951171875, -0.573974609375, -0.53594970703125, -0.4979248046875, -0.45989990234375, -0.421875, -0.38385009765625, -0.3458251953125, -0.30780029296875, -0.269775390625, -0.23175048828125, -0.1937255859375, -0.15570068359375, -0.11767578125, -0.07965087890625, -0.0416259765625, -0.00360107421875, 0.034423828125, 0.07244873046875, 0.1104736328125, 0.14849853515625, 0.1865234375, 0.22454833984375, 0.2625732421875, 0.30059814453125, 0.338623046875, 0.37664794921875, 0.4146728515625, 0.45269775390625, 0.49072265625, 0.52874755859375, 0.5667724609375, 0.60479736328125, 0.642822265625, 0.68084716796875, 0.7188720703125, 0.75689697265625, 0.794921875, 0.83294677734375, 0.8709716796875, 0.90899658203125, 0.947021484375, 0.98504638671875, 1.0230712890625, 1.06109619140625, 1.09912109375, 1.13714599609375, 1.1751708984375, 1.21319580078125, 1.251220703125, 1.28924560546875, 1.3272705078125, 1.36529541015625, 1.4033203125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 4.0, 5.0, 2.0, 4.0, 5.0, 8.0, 9.0, 12.0, 11.0, 12.0, 19.0, 16.0, 30.0, 26.0, 33.0, 46.0, 57.0, 64.0, 55.0, 76.0, 64.0, 55.0, 59.0, 59.0, 45.0, 38.0, 35.0, 16.0, 20.0, 21.0, 13.0, 17.0, 12.0, 8.0, 9.0, 7.0, 5.0, 4.0, 10.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-43.960716247558594, -42.77522277832031, -41.58972930908203, -40.404239654541016, -39.218746185302734, -38.03325271606445, -36.84775924682617, -35.66226577758789, -34.476776123046875, -33.291282653808594, -32.10578918457031, -30.920297622680664, -29.734806060791016, -28.549312591552734, -27.363819122314453, -26.178325653076172, -24.99283218383789, -23.80733871459961, -22.62184715270996, -21.43635368347168, -20.25086212158203, -19.06536865234375, -17.87987518310547, -16.694381713867188, -15.508890151977539, -14.323397636413574, -13.13790512084961, -11.952411651611328, -10.766919136047363, -9.581426620483398, -8.395933151245117, -7.210440635681152, -6.024951934814453, -4.839459419250488, -3.6539664268493652, -2.4684736728668213, -1.2829809188842773, -0.0974884033203125, 1.0880045890808105, 2.2734975814819336, 3.4589900970458984, 4.644482612609863, 5.829975605010986, 7.015468597412109, 8.200961112976074, 9.386453628540039, 10.57194709777832, 11.757439613342285, 12.94293212890625, 14.128424644470215, 15.31391716003418, 16.49941062927246, 17.68490219116211, 18.87039566040039, 20.055889129638672, 21.241382598876953, 22.4268741607666, 23.612367630004883, 24.79785919189453, 25.983352661132812, 27.168846130371094, 28.354337692260742, 29.539831161499023, 30.725322723388672, 31.910816192626953]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 4.0, 6.0, 5.0, 0.0, 1.0, 5.0, 3.0, 11.0, 5.0, 9.0, 12.0, 11.0, 13.0, 23.0, 12.0, 13.0, 21.0, 20.0, 26.0, 31.0, 21.0, 20.0, 29.0, 32.0, 39.0, 31.0, 38.0, 30.0, 25.0, 46.0, 32.0, 32.0, 29.0, 39.0, 34.0, 28.0, 29.0, 32.0, 23.0, 32.0, 21.0, 21.0, 12.0, 18.0, 17.0, 10.0, 8.0, 13.0, 8.0, 7.0, 4.0, 6.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-27.42071533203125, -26.5557861328125, -25.69085693359375, -24.825927734375, -23.96099853515625, -23.0960693359375, -22.23114013671875, -21.3662109375, -20.50128173828125, -19.6363525390625, -18.77142333984375, -17.906494140625, -17.04156494140625, -16.1766357421875, -15.311705589294434, -14.446776390075684, -13.581846237182617, -12.716917037963867, -11.851987838745117, -10.987058639526367, -10.122129440307617, -9.257200241088867, -8.3922700881958, -7.527340888977051, -6.662411689758301, -5.797482490539551, -4.932553291320801, -4.067623615264893, -3.2026944160461426, -2.3377652168273926, -1.4728355407714844, -0.6079063415527344, 0.2570209503173828, 1.1219502687454224, 1.986879587173462, 2.851809024810791, 3.716738224029541, 4.581667423248291, 5.446597099304199, 6.311526298522949, 7.176455497741699, 8.04138469696045, 8.9063138961792, 9.771244049072266, 10.636173248291016, 11.501102447509766, 12.366031646728516, 13.230960845947266, 14.095890045166016, 14.960819244384766, 15.825748443603516, 16.690677642822266, 17.555606842041016, 18.420536041259766, 19.285465240478516, 20.150394439697266, 21.015323638916016, 21.880252838134766, 22.745182037353516, 23.610111236572266, 24.475040435791016, 25.339969635009766, 26.204898834228516, 27.069828033447266, 27.93475914001465]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 7.0, 6.0, 13.0, 17.0, 17.0, 40.0, 37.0, 84.0, 107.0, 164.0, 246.0, 329.0, 479.0, 741.0, 1076.0, 1606.0, 2340.0, 3514.0, 5107.0, 7658.0, 11333.0, 17250.0, 27285.0, 44737.0, 77666.0, 156422.0, 465212.0, 1317876.0, 1259101.0, 449943.0, 151777.0, 75176.0, 43240.0, 26118.0, 16147.0, 10538.0, 6941.0, 4530.0, 3054.0, 2076.0, 1359.0, 943.0, 614.0, 444.0, 287.0, 213.0, 135.0, 94.0, 64.0, 41.0, 28.0, 20.0, 19.0, 10.0, 8.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-38.0625, -36.83349609375, -35.6044921875, -34.37548828125, -33.146484375, -31.91748046875, -30.6884765625, -29.45947265625, -28.23046875, -27.00146484375, -25.7724609375, -24.54345703125, -23.314453125, -22.08544921875, -20.8564453125, -19.62744140625, -18.3984375, -17.16943359375, -15.9404296875, -14.71142578125, -13.482421875, -12.25341796875, -11.0244140625, -9.79541015625, -8.56640625, -7.33740234375, -6.1083984375, -4.87939453125, -3.650390625, -2.42138671875, -1.1923828125, 0.03662109375, 1.265625, 2.49462890625, 3.7236328125, 4.95263671875, 6.181640625, 7.41064453125, 8.6396484375, 9.86865234375, 11.09765625, 12.32666015625, 13.5556640625, 14.78466796875, 16.013671875, 17.24267578125, 18.4716796875, 19.70068359375, 20.9296875, 22.15869140625, 23.3876953125, 24.61669921875, 25.845703125, 27.07470703125, 28.3037109375, 29.53271484375, 30.76171875, 31.99072265625, 33.2197265625, 34.44873046875, 35.677734375, 36.90673828125, 38.1357421875, 39.36474609375, 40.59375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 4.0, 7.0, 7.0, 6.0, 2.0, 7.0, 7.0, 7.0, 15.0, 18.0, 10.0, 21.0, 21.0, 13.0, 15.0, 26.0, 29.0, 30.0, 21.0, 34.0, 33.0, 39.0, 24.0, 33.0, 36.0, 38.0, 36.0, 27.0, 27.0, 37.0, 40.0, 27.0, 32.0, 36.0, 37.0, 28.0, 22.0, 19.0, 28.0, 16.0, 22.0, 9.0, 9.0, 11.0, 7.0, 7.0, 8.0, 3.0, 3.0, 7.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.671875, -18.047119140625, -17.42236328125, -16.797607421875, -16.1728515625, -15.548095703125, -14.92333984375, -14.298583984375, -13.673828125, -13.049072265625, -12.42431640625, -11.799560546875, -11.1748046875, -10.550048828125, -9.92529296875, -9.300537109375, -8.67578125, -8.051025390625, -7.42626953125, -6.801513671875, -6.1767578125, -5.552001953125, -4.92724609375, -4.302490234375, -3.677734375, -3.052978515625, -2.42822265625, -1.803466796875, -1.1787109375, -0.553955078125, 0.07080078125, 0.695556640625, 1.3203125, 1.945068359375, 2.56982421875, 3.194580078125, 3.8193359375, 4.444091796875, 5.06884765625, 5.693603515625, 6.318359375, 6.943115234375, 7.56787109375, 8.192626953125, 8.8173828125, 9.442138671875, 10.06689453125, 10.691650390625, 11.31640625, 11.941162109375, 12.56591796875, 13.190673828125, 13.8154296875, 14.440185546875, 15.06494140625, 15.689697265625, 16.314453125, 16.939208984375, 17.56396484375, 18.188720703125, 18.8134765625, 19.438232421875, 20.06298828125, 20.687744140625, 21.3125]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 14.0, 17.0, 15.0, 29.0, 61.0, 80.0, 134.0, 239.0, 366.0, 494.0, 839.0, 1280.0, 1856.0, 2935.0, 4429.0, 6747.0, 10448.0, 16287.0, 25968.0, 44040.0, 78309.0, 145930.0, 304656.0, 732698.0, 1550278.0, 663260.0, 281020.0, 137796.0, 73260.0, 41653.0, 25022.0, 15526.0, 9798.0, 6480.0, 4309.0, 2796.0, 1838.0, 1229.0, 720.0, 524.0, 347.0, 187.0, 139.0, 79.0, 54.0, 32.0, 18.0, 13.0, 9.0, 5.0, 8.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-40.21875, -38.93994140625, -37.6611328125, -36.38232421875, -35.103515625, -33.82470703125, -32.5458984375, -31.26708984375, -29.98828125, -28.70947265625, -27.4306640625, -26.15185546875, -24.873046875, -23.59423828125, -22.3154296875, -21.03662109375, -19.7578125, -18.47900390625, -17.2001953125, -15.92138671875, -14.642578125, -13.36376953125, -12.0849609375, -10.80615234375, -9.52734375, -8.24853515625, -6.9697265625, -5.69091796875, -4.412109375, -3.13330078125, -1.8544921875, -0.57568359375, 0.703125, 1.98193359375, 3.2607421875, 4.53955078125, 5.818359375, 7.09716796875, 8.3759765625, 9.65478515625, 10.93359375, 12.21240234375, 13.4912109375, 14.77001953125, 16.048828125, 17.32763671875, 18.6064453125, 19.88525390625, 21.1640625, 22.44287109375, 23.7216796875, 25.00048828125, 26.279296875, 27.55810546875, 28.8369140625, 30.11572265625, 31.39453125, 32.67333984375, 33.9521484375, 35.23095703125, 36.509765625, 37.78857421875, 39.0673828125, 40.34619140625, 41.625]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 3.0, 4.0, 2.0, 10.0, 8.0, 7.0, 9.0, 15.0, 10.0, 27.0, 28.0, 23.0, 36.0, 40.0, 58.0, 76.0, 94.0, 143.0, 165.0, 225.0, 285.0, 359.0, 502.0, 475.0, 333.0, 241.0, 213.0, 150.0, 93.0, 95.0, 85.0, 64.0, 40.0, 29.0, 24.0, 25.0, 18.0, 15.0, 10.0, 10.0, 10.0, 2.0, 9.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.65625, -12.167236328125, -11.67822265625, -11.189208984375, -10.7001953125, -10.211181640625, -9.72216796875, -9.233154296875, -8.744140625, -8.255126953125, -7.76611328125, -7.277099609375, -6.7880859375, -6.299072265625, -5.81005859375, -5.321044921875, -4.83203125, -4.343017578125, -3.85400390625, -3.364990234375, -2.8759765625, -2.386962890625, -1.89794921875, -1.408935546875, -0.919921875, -0.430908203125, 0.05810546875, 0.547119140625, 1.0361328125, 1.525146484375, 2.01416015625, 2.503173828125, 2.9921875, 3.481201171875, 3.97021484375, 4.459228515625, 4.9482421875, 5.437255859375, 5.92626953125, 6.415283203125, 6.904296875, 7.393310546875, 7.88232421875, 8.371337890625, 8.8603515625, 9.349365234375, 9.83837890625, 10.327392578125, 10.81640625, 11.305419921875, 11.79443359375, 12.283447265625, 12.7724609375, 13.261474609375, 13.75048828125, 14.239501953125, 14.728515625, 15.217529296875, 15.70654296875, 16.195556640625, 16.6845703125, 17.173583984375, 17.66259765625, 18.151611328125, 18.640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 5.0, 5.0, 10.0, 12.0, 7.0, 5.0, 10.0, 11.0, 19.0, 23.0, 32.0, 36.0, 55.0, 60.0, 58.0, 71.0, 74.0, 90.0, 74.0, 67.0, 48.0, 54.0, 30.0, 27.0, 27.0, 9.0, 19.0, 13.0, 15.0, 8.0, 11.0, 3.0, 4.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.906770706176758, -28.844207763671875, -27.78164291381836, -26.719079971313477, -25.656517028808594, -24.59395408630371, -23.531391143798828, -22.468826293945312, -21.40626335144043, -20.343700408935547, -19.28113555908203, -18.21857261657715, -17.156009674072266, -16.093446731567383, -15.030882835388184, -13.968318939208984, -12.905755996704102, -11.843193054199219, -10.78062915802002, -9.71806526184082, -8.655502319335938, -7.5929388999938965, -6.5303754806518555, -5.4678120613098145, -4.405248641967773, -3.3426852226257324, -2.2801218032836914, -1.2175583839416504, -0.15499496459960938, 0.9075684547424316, 1.9701318740844727, 3.0326952934265137, 4.095256805419922, 5.157820224761963, 6.220383644104004, 7.282947063446045, 8.345510482788086, 9.408073425292969, 10.470637321472168, 11.533201217651367, 12.59576416015625, 13.658327102661133, 14.720890998840332, 15.783454895019531, 16.846017837524414, 17.908580780029297, 18.971145629882812, 20.033708572387695, 21.096271514892578, 22.15883445739746, 23.221397399902344, 24.28396224975586, 25.346525192260742, 26.409088134765625, 27.47165298461914, 28.534215927124023, 29.596778869628906, 30.65934181213379, 31.721904754638672, 32.78446960449219, 33.84703063964844, 34.90959548950195, 35.97216033935547, 37.03472137451172, 38.097286224365234]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 10.0, 7.0, 4.0, 13.0, 13.0, 21.0, 17.0, 18.0, 20.0, 22.0, 31.0, 33.0, 30.0, 27.0, 28.0, 25.0, 43.0, 33.0, 40.0, 46.0, 38.0, 50.0, 32.0, 23.0, 36.0, 36.0, 35.0, 47.0, 27.0, 18.0, 17.0, 31.0, 25.0, 18.0, 16.0, 11.0, 14.0, 10.0, 5.0, 3.0, 5.0, 3.0, 2.0, 7.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-25.48984146118164, -24.740720748901367, -23.991600036621094, -23.242477416992188, -22.493356704711914, -21.74423599243164, -20.995115280151367, -20.245994567871094, -19.496871948242188, -18.747751235961914, -17.99863052368164, -17.249507904052734, -16.50038719177246, -15.751266479492188, -15.002145767211914, -14.253024101257324, -13.50390338897705, -12.754782676696777, -12.005661010742188, -11.256540298461914, -10.507418632507324, -9.75829792022705, -9.009176254272461, -8.260055541992188, -7.510934352874756, -6.761813163757324, -6.012691974639893, -5.263570785522461, -4.5144500732421875, -3.7653286457061768, -3.016207695007324, -2.2670865058898926, -1.517965316772461, -0.7688441872596741, -0.019723057746887207, 0.7293980121612549, 1.4785192012786865, 2.227640390396118, 2.9767613410949707, 3.7258825302124023, 4.475003719329834, 5.224124908447266, 5.973246097564697, 6.722367286682129, 7.471487998962402, 8.220609664916992, 8.969730377197266, 9.718851089477539, 10.467972755432129, 11.217093467712402, 11.966215133666992, 12.715335845947266, 13.464457511901855, 14.213578224182129, 14.962699890136719, 15.711820602416992, 16.460941314697266, 17.21006202697754, 17.959182739257812, 18.70830535888672, 19.457426071166992, 20.206546783447266, 20.95566749572754, 21.704788208007812, 22.45391082763672]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 8.0, 4.0, 11.0, 17.0, 22.0, 31.0, 66.0, 100.0, 135.0, 181.0, 274.0, 468.0, 621.0, 890.0, 1413.0, 1885.0, 2808.0, 4167.0, 6014.0, 8689.0, 12664.0, 18837.0, 27555.0, 41315.0, 63974.0, 108087.0, 243680.0, 216171.0, 102821.0, 61828.0, 39746.0, 26435.0, 18071.0, 12383.0, 8557.0, 5935.0, 4051.0, 2712.0, 1963.0, 1286.0, 886.0, 577.0, 422.0, 276.0, 166.0, 129.0, 91.0, 54.0, 30.0, 16.0, 18.0, 9.0, 6.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.953125, -11.5670166015625, -11.180908203125, -10.7947998046875, -10.40869140625, -10.0225830078125, -9.636474609375, -9.2503662109375, -8.8642578125, -8.4781494140625, -8.092041015625, -7.7059326171875, -7.31982421875, -6.9337158203125, -6.547607421875, -6.1614990234375, -5.775390625, -5.3892822265625, -5.003173828125, -4.6170654296875, -4.23095703125, -3.8448486328125, -3.458740234375, -3.0726318359375, -2.6865234375, -2.3004150390625, -1.914306640625, -1.5281982421875, -1.14208984375, -0.7559814453125, -0.369873046875, 0.0162353515625, 0.40234375, 0.7884521484375, 1.174560546875, 1.5606689453125, 1.94677734375, 2.3328857421875, 2.718994140625, 3.1051025390625, 3.4912109375, 3.8773193359375, 4.263427734375, 4.6495361328125, 5.03564453125, 5.4217529296875, 5.807861328125, 6.1939697265625, 6.580078125, 6.9661865234375, 7.352294921875, 7.7384033203125, 8.12451171875, 8.5106201171875, 8.896728515625, 9.2828369140625, 9.6689453125, 10.0550537109375, 10.441162109375, 10.8272705078125, 11.21337890625, 11.5994873046875, 11.985595703125, 12.3717041015625, 12.7578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 10.0, 2.0, 9.0, 6.0, 8.0, 18.0, 7.0, 15.0, 14.0, 14.0, 26.0, 19.0, 20.0, 22.0, 24.0, 25.0, 36.0, 31.0, 38.0, 35.0, 31.0, 33.0, 44.0, 37.0, 39.0, 25.0, 31.0, 36.0, 42.0, 25.0, 35.0, 26.0, 28.0, 30.0, 24.0, 25.0, 14.0, 16.0, 16.0, 14.0, 15.0, 8.0, 5.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.75, -20.07861328125, -19.4072265625, -18.73583984375, -18.064453125, -17.39306640625, -16.7216796875, -16.05029296875, -15.37890625, -14.70751953125, -14.0361328125, -13.36474609375, -12.693359375, -12.02197265625, -11.3505859375, -10.67919921875, -10.0078125, -9.33642578125, -8.6650390625, -7.99365234375, -7.322265625, -6.65087890625, -5.9794921875, -5.30810546875, -4.63671875, -3.96533203125, -3.2939453125, -2.62255859375, -1.951171875, -1.27978515625, -0.6083984375, 0.06298828125, 0.734375, 1.40576171875, 2.0771484375, 2.74853515625, 3.419921875, 4.09130859375, 4.7626953125, 5.43408203125, 6.10546875, 6.77685546875, 7.4482421875, 8.11962890625, 8.791015625, 9.46240234375, 10.1337890625, 10.80517578125, 11.4765625, 12.14794921875, 12.8193359375, 13.49072265625, 14.162109375, 14.83349609375, 15.5048828125, 16.17626953125, 16.84765625, 17.51904296875, 18.1904296875, 18.86181640625, 19.533203125, 20.20458984375, 20.8759765625, 21.54736328125, 22.21875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 3.0, 10.0, 9.0, 17.0, 24.0, 18.0, 43.0, 65.0, 112.0, 160.0, 222.0, 302.0, 421.0, 628.0, 863.0, 1275.0, 1938.0, 2914.0, 4291.0, 6199.0, 9501.0, 14382.0, 21866.0, 33706.0, 52189.0, 85542.0, 170151.0, 327722.0, 120207.0, 68270.0, 42828.0, 28089.0, 18221.0, 11923.0, 7890.0, 5316.0, 3597.0, 2405.0, 1615.0, 1102.0, 777.0, 518.0, 368.0, 296.0, 196.0, 121.0, 85.0, 61.0, 42.0, 24.0, 19.0, 10.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.6875, -10.3345947265625, -9.981689453125, -9.6287841796875, -9.27587890625, -8.9229736328125, -8.570068359375, -8.2171630859375, -7.8642578125, -7.5113525390625, -7.158447265625, -6.8055419921875, -6.45263671875, -6.0997314453125, -5.746826171875, -5.3939208984375, -5.041015625, -4.6881103515625, -4.335205078125, -3.9822998046875, -3.62939453125, -3.2764892578125, -2.923583984375, -2.5706787109375, -2.2177734375, -1.8648681640625, -1.511962890625, -1.1590576171875, -0.80615234375, -0.4532470703125, -0.100341796875, 0.2525634765625, 0.60546875, 0.9583740234375, 1.311279296875, 1.6641845703125, 2.01708984375, 2.3699951171875, 2.722900390625, 3.0758056640625, 3.4287109375, 3.7816162109375, 4.134521484375, 4.4874267578125, 4.84033203125, 5.1932373046875, 5.546142578125, 5.8990478515625, 6.251953125, 6.6048583984375, 6.957763671875, 7.3106689453125, 7.66357421875, 8.0164794921875, 8.369384765625, 8.7222900390625, 9.0751953125, 9.4281005859375, 9.781005859375, 10.1339111328125, 10.48681640625, 10.8397216796875, 11.192626953125, 11.5455322265625, 11.8984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 2.0, 6.0, 6.0, 6.0, 7.0, 10.0, 16.0, 13.0, 22.0, 23.0, 19.0, 25.0, 28.0, 31.0, 23.0, 36.0, 34.0, 24.0, 37.0, 35.0, 37.0, 31.0, 44.0, 42.0, 36.0, 31.0, 35.0, 41.0, 32.0, 30.0, 26.0, 22.0, 32.0, 20.0, 18.0, 23.0, 24.0, 10.0, 14.0, 7.0, 9.0, 5.0, 5.0, 2.0, 2.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.7421875, -13.2889404296875, -12.835693359375, -12.3824462890625, -11.92919921875, -11.4759521484375, -11.022705078125, -10.5694580078125, -10.1162109375, -9.6629638671875, -9.209716796875, -8.7564697265625, -8.30322265625, -7.8499755859375, -7.396728515625, -6.9434814453125, -6.490234375, -6.0369873046875, -5.583740234375, -5.1304931640625, -4.67724609375, -4.2239990234375, -3.770751953125, -3.3175048828125, -2.8642578125, -2.4110107421875, -1.957763671875, -1.5045166015625, -1.05126953125, -0.5980224609375, -0.144775390625, 0.3084716796875, 0.76171875, 1.2149658203125, 1.668212890625, 2.1214599609375, 2.57470703125, 3.0279541015625, 3.481201171875, 3.9344482421875, 4.3876953125, 4.8409423828125, 5.294189453125, 5.7474365234375, 6.20068359375, 6.6539306640625, 7.107177734375, 7.5604248046875, 8.013671875, 8.4669189453125, 8.920166015625, 9.3734130859375, 9.82666015625, 10.2799072265625, 10.733154296875, 11.1864013671875, 11.6396484375, 12.0928955078125, 12.546142578125, 12.9993896484375, 13.45263671875, 13.9058837890625, 14.359130859375, 14.8123779296875, 15.265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 8.0, 10.0, 21.0, 25.0, 47.0, 59.0, 104.0, 109.0, 195.0, 269.0, 438.0, 677.0, 1145.0, 1885.0, 3117.0, 5527.0, 9920.0, 19742.0, 41226.0, 101321.0, 301207.0, 347032.0, 119468.0, 47258.0, 21953.0, 11222.0, 5860.0, 3430.0, 1980.0, 1214.0, 720.0, 449.0, 320.0, 189.0, 137.0, 84.0, 54.0, 40.0, 27.0, 27.0, 12.0, 6.0, 8.0, 3.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.043548583984375, -0.0421910285949707, -0.040833473205566406, -0.03947591781616211, -0.03811836242675781, -0.036760807037353516, -0.03540325164794922, -0.03404569625854492, -0.032688140869140625, -0.03133058547973633, -0.02997303009033203, -0.028615474700927734, -0.027257919311523438, -0.02590036392211914, -0.024542808532714844, -0.023185253143310547, -0.02182769775390625, -0.020470142364501953, -0.019112586975097656, -0.01775503158569336, -0.016397476196289062, -0.015039920806884766, -0.013682365417480469, -0.012324810028076172, -0.010967254638671875, -0.009609699249267578, -0.008252143859863281, -0.006894588470458984, -0.0055370330810546875, -0.004179477691650391, -0.0028219223022460938, -0.0014643669128417969, -0.0001068115234375, 0.0012507438659667969, 0.0026082992553710938, 0.003965854644775391, 0.0053234100341796875, 0.006680965423583984, 0.008038520812988281, 0.009396076202392578, 0.010753631591796875, 0.012111186981201172, 0.013468742370605469, 0.014826297760009766, 0.016183853149414062, 0.01754140853881836, 0.018898963928222656, 0.020256519317626953, 0.02161407470703125, 0.022971630096435547, 0.024329185485839844, 0.02568674087524414, 0.027044296264648438, 0.028401851654052734, 0.02975940704345703, 0.031116962432861328, 0.032474517822265625, 0.03383207321166992, 0.03518962860107422, 0.036547183990478516, 0.03790473937988281, 0.03926229476928711, 0.040619850158691406, 0.0419774055480957, 0.0433349609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 6.0, 9.0, 8.0, 9.0, 18.0, 32.0, 46.0, 64.0, 104.0, 147.0, 135.0, 132.0, 90.0, 64.0, 48.0, 31.0, 20.0, 15.0, 9.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6133995056152344e-05, -4.4442713260650635e-05, -4.2751431465148926e-05, -4.106014966964722e-05, -3.936886787414551e-05, -3.76775860786438e-05, -3.598630428314209e-05, -3.429502248764038e-05, -3.260374069213867e-05, -3.091245889663696e-05, -2.9221177101135254e-05, -2.7529895305633545e-05, -2.5838613510131836e-05, -2.4147331714630127e-05, -2.2456049919128418e-05, -2.076476812362671e-05, -1.9073486328125e-05, -1.738220453262329e-05, -1.5690922737121582e-05, -1.3999640941619873e-05, -1.2308359146118164e-05, -1.0617077350616455e-05, -8.925795555114746e-06, -7.234513759613037e-06, -5.543231964111328e-06, -3.851950168609619e-06, -2.16066837310791e-06, -4.6938657760620117e-07, 1.2218952178955078e-06, 2.913177013397217e-06, 4.604458808898926e-06, 6.295740604400635e-06, 7.987022399902344e-06, 9.678304195404053e-06, 1.1369585990905762e-05, 1.306086778640747e-05, 1.475214958190918e-05, 1.644343137741089e-05, 1.8134713172912598e-05, 1.9825994968414307e-05, 2.1517276763916016e-05, 2.3208558559417725e-05, 2.4899840354919434e-05, 2.6591122150421143e-05, 2.828240394592285e-05, 2.997368574142456e-05, 3.166496753692627e-05, 3.335624933242798e-05, 3.504753112792969e-05, 3.6738812923431396e-05, 3.8430094718933105e-05, 4.0121376514434814e-05, 4.1812658309936523e-05, 4.350394010543823e-05, 4.519522190093994e-05, 4.688650369644165e-05, 4.857778549194336e-05, 5.026906728744507e-05, 5.196034908294678e-05, 5.3651630878448486e-05, 5.5342912673950195e-05, 5.7034194469451904e-05, 5.872547626495361e-05, 6.041675806045532e-05, 6.210803985595703e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 9.0, 13.0, 24.0, 22.0, 38.0, 74.0, 102.0, 152.0, 238.0, 352.0, 534.0, 833.0, 1158.0, 1741.0, 2736.0, 4041.0, 5999.0, 9279.0, 14509.0, 23137.0, 39422.0, 71377.0, 139694.0, 247149.0, 220039.0, 114658.0, 60218.0, 33581.0, 20514.0, 12775.0, 8078.0, 5337.0, 3542.0, 2369.0, 1625.0, 1050.0, 731.0, 461.0, 297.0, 238.0, 164.0, 88.0, 58.0, 30.0, 27.0, 20.0, 12.0, 10.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03167724609375, -0.03074169158935547, -0.029806137084960938, -0.028870582580566406, -0.027935028076171875, -0.026999473571777344, -0.026063919067382812, -0.02512836456298828, -0.02419281005859375, -0.02325725555419922, -0.022321701049804688, -0.021386146545410156, -0.020450592041015625, -0.019515037536621094, -0.018579483032226562, -0.01764392852783203, -0.0167083740234375, -0.01577281951904297, -0.014837265014648438, -0.013901710510253906, -0.012966156005859375, -0.012030601501464844, -0.011095046997070312, -0.010159492492675781, -0.00922393798828125, -0.008288383483886719, -0.0073528289794921875, -0.006417274475097656, -0.005481719970703125, -0.004546165466308594, -0.0036106109619140625, -0.0026750564575195312, -0.001739501953125, -0.0008039474487304688, 0.0001316070556640625, 0.0010671615600585938, 0.002002716064453125, 0.0029382705688476562, 0.0038738250732421875, 0.004809379577636719, 0.00574493408203125, 0.006680488586425781, 0.0076160430908203125, 0.008551597595214844, 0.009487152099609375, 0.010422706604003906, 0.011358261108398438, 0.012293815612792969, 0.0132293701171875, 0.014164924621582031, 0.015100479125976562, 0.016036033630371094, 0.016971588134765625, 0.017907142639160156, 0.018842697143554688, 0.01977825164794922, 0.02071380615234375, 0.02164936065673828, 0.022584915161132812, 0.023520469665527344, 0.024456024169921875, 0.025391578674316406, 0.026327133178710938, 0.02726268768310547, 0.0281982421875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 3.0, 3.0, 5.0, 11.0, 6.0, 5.0, 11.0, 9.0, 16.0, 9.0, 22.0, 27.0, 34.0, 38.0, 49.0, 51.0, 71.0, 91.0, 67.0, 74.0, 59.0, 57.0, 51.0, 46.0, 32.0, 29.0, 18.0, 13.0, 14.0, 8.0, 11.0, 9.0, 13.0, 3.0, 7.0, 3.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00937652587890625, -0.00902402400970459, -0.00867152214050293, -0.00831902027130127, -0.00796651840209961, -0.007614016532897949, -0.007261514663696289, -0.006909012794494629, -0.006556510925292969, -0.006204009056091309, -0.0058515071868896484, -0.005499005317687988, -0.005146503448486328, -0.004794001579284668, -0.004441499710083008, -0.004088997840881348, -0.0037364959716796875, -0.0033839941024780273, -0.003031492233276367, -0.002678990364074707, -0.002326488494873047, -0.0019739866256713867, -0.0016214847564697266, -0.0012689828872680664, -0.0009164810180664062, -0.0005639791488647461, -0.00021147727966308594, 0.00014102458953857422, 0.0004935264587402344, 0.0008460283279418945, 0.0011985301971435547, 0.0015510320663452148, 0.001903533935546875, 0.002256035804748535, 0.0026085376739501953, 0.0029610395431518555, 0.0033135414123535156, 0.0036660432815551758, 0.004018545150756836, 0.004371047019958496, 0.004723548889160156, 0.005076050758361816, 0.0054285526275634766, 0.005781054496765137, 0.006133556365966797, 0.006486058235168457, 0.006838560104370117, 0.007191061973571777, 0.0075435638427734375, 0.007896065711975098, 0.008248567581176758, 0.008601069450378418, 0.008953571319580078, 0.009306073188781738, 0.009658575057983398, 0.010011076927185059, 0.010363578796386719, 0.010716080665588379, 0.011068582534790039, 0.0114210844039917, 0.01177358627319336, 0.01212608814239502, 0.01247859001159668, 0.01283109188079834, 0.01318359375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 6.0, 12.0, 6.0, 8.0, 6.0, 13.0, 12.0, 23.0, 39.0, 29.0, 45.0, 68.0, 67.0, 60.0, 88.0, 81.0, 70.0, 81.0, 48.0, 48.0, 36.0, 29.0, 20.0, 12.0, 18.0, 14.0, 18.0, 12.0, 7.0, 7.0, 2.0, 1.0, 7.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.6807861328125, -26.699974060058594, -25.719161987304688, -24.73834991455078, -23.757537841796875, -22.77672576904297, -21.795913696289062, -20.815101623535156, -19.83428955078125, -18.853477478027344, -17.872665405273438, -16.89185333251953, -15.911041259765625, -14.930229187011719, -13.949418067932129, -12.968605995178223, -11.987794876098633, -11.006982803344727, -10.02617073059082, -9.045358657836914, -8.064546585083008, -7.08373498916626, -6.102923393249512, -5.1221113204956055, -4.141299247741699, -3.160487174987793, -2.179675340652466, -1.1988635063171387, -0.21805143356323242, 0.7627606391906738, 1.7435722351074219, 2.724384307861328, 3.7051963806152344, 4.686008453369141, 5.666820526123047, 6.647632122039795, 7.628444194793701, 8.609256744384766, 9.590067863464355, 10.570879936218262, 11.551692008972168, 12.532504081726074, 13.51331615447998, 14.49412727355957, 15.474939346313477, 16.455751419067383, 17.43656349182129, 18.417375564575195, 19.3981876373291, 20.378999710083008, 21.359811782836914, 22.34062385559082, 23.321435928344727, 24.302248001098633, 25.283058166503906, 26.263870239257812, 27.24468231201172, 28.225494384765625, 29.20630645751953, 30.187118530273438, 31.167930603027344, 32.14874267578125, 33.129554748535156, 34.11036682128906, 35.09117889404297]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 5.0, 5.0, 8.0, 8.0, 6.0, 7.0, 18.0, 17.0, 19.0, 19.0, 18.0, 24.0, 29.0, 33.0, 27.0, 29.0, 31.0, 29.0, 39.0, 35.0, 34.0, 49.0, 40.0, 44.0, 34.0, 23.0, 34.0, 40.0, 35.0, 47.0, 28.0, 16.0, 21.0, 25.0, 30.0, 16.0, 17.0, 13.0, 13.0, 7.0, 9.0, 3.0, 5.0, 3.0, 1.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.423294067382812, -22.736289978027344, -22.049285888671875, -21.362281799316406, -20.675277709960938, -19.988271713256836, -19.301267623901367, -18.6142635345459, -17.92725944519043, -17.24025535583496, -16.553251266479492, -15.866246223449707, -15.179242134094238, -14.49223804473877, -13.805233001708984, -13.118228912353516, -12.431224822998047, -11.744220733642578, -11.05721664428711, -10.370211601257324, -9.683207511901855, -8.996203422546387, -8.309198379516602, -7.622194290161133, -6.935190200805664, -6.248186111450195, -5.561181545257568, -4.874176979064941, -4.187172889709473, -3.500168561935425, -2.813164234161377, -2.12615966796875, -1.4391536712646484, -0.7521493434906006, -0.06514501571655273, 0.6218593120574951, 1.308863639831543, 1.9958679676055908, 2.6828722953796387, 3.3698768615722656, 4.056880950927734, 4.743885040283203, 5.43088960647583, 6.117894172668457, 6.804898262023926, 7.4919023513793945, 8.17890739440918, 8.865911483764648, 9.552915573120117, 10.239919662475586, 10.926923751831055, 11.61392879486084, 12.300932884216309, 12.987936973571777, 13.674942016601562, 14.361946105957031, 15.0489501953125, 15.735954284667969, 16.422958374023438, 17.109962463378906, 17.796966552734375, 18.483972549438477, 19.170976638793945, 19.857980728149414, 20.544984817504883]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [6.0, 0.0, 3.0, 2.0, 10.0, 11.0, 16.0, 25.0, 31.0, 46.0, 57.0, 94.0, 108.0, 162.0, 241.0, 371.0, 484.0, 755.0, 1035.0, 1489.0, 2216.0, 3093.0, 4526.0, 6809.0, 10347.0, 15615.0, 23888.0, 37640.0, 60687.0, 98157.0, 154178.0, 192772.0, 158642.0, 101176.0, 62202.0, 38393.0, 24849.0, 15802.0, 10388.0, 6967.0, 4750.0, 3215.0, 2223.0, 1543.0, 1039.0, 719.0, 529.0, 395.0, 252.0, 182.0, 135.0, 90.0, 72.0, 41.0, 34.0, 20.0, 9.0, 11.0, 8.0, 7.0, 3.0, 1.0, 4.0, 1.0], "bins": [-31.46875, -30.470703125, -29.47265625, -28.474609375, -27.4765625, -26.478515625, -25.48046875, -24.482421875, -23.484375, -22.486328125, -21.48828125, -20.490234375, -19.4921875, -18.494140625, -17.49609375, -16.498046875, -15.5, -14.501953125, -13.50390625, -12.505859375, -11.5078125, -10.509765625, -9.51171875, -8.513671875, -7.515625, -6.517578125, -5.51953125, -4.521484375, -3.5234375, -2.525390625, -1.52734375, -0.529296875, 0.46875, 1.466796875, 2.46484375, 3.462890625, 4.4609375, 5.458984375, 6.45703125, 7.455078125, 8.453125, 9.451171875, 10.44921875, 11.447265625, 12.4453125, 13.443359375, 14.44140625, 15.439453125, 16.4375, 17.435546875, 18.43359375, 19.431640625, 20.4296875, 21.427734375, 22.42578125, 23.423828125, 24.421875, 25.419921875, 26.41796875, 27.416015625, 28.4140625, 29.412109375, 30.41015625, 31.408203125, 32.40625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 3.0, 4.0, 8.0, 10.0, 6.0, 10.0, 13.0, 17.0, 15.0, 26.0, 21.0, 32.0, 25.0, 28.0, 24.0, 29.0, 32.0, 46.0, 48.0, 37.0, 43.0, 35.0, 47.0, 37.0, 38.0, 29.0, 42.0, 32.0, 30.0, 31.0, 37.0, 32.0, 20.0, 23.0, 26.0, 9.0, 17.0, 8.0, 7.0, 7.0, 6.0, 0.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.578125, -19.96728515625, -19.3564453125, -18.74560546875, -18.134765625, -17.52392578125, -16.9130859375, -16.30224609375, -15.69140625, -15.08056640625, -14.4697265625, -13.85888671875, -13.248046875, -12.63720703125, -12.0263671875, -11.41552734375, -10.8046875, -10.19384765625, -9.5830078125, -8.97216796875, -8.361328125, -7.75048828125, -7.1396484375, -6.52880859375, -5.91796875, -5.30712890625, -4.6962890625, -4.08544921875, -3.474609375, -2.86376953125, -2.2529296875, -1.64208984375, -1.03125, -0.42041015625, 0.1904296875, 0.80126953125, 1.412109375, 2.02294921875, 2.6337890625, 3.24462890625, 3.85546875, 4.46630859375, 5.0771484375, 5.68798828125, 6.298828125, 6.90966796875, 7.5205078125, 8.13134765625, 8.7421875, 9.35302734375, 9.9638671875, 10.57470703125, 11.185546875, 11.79638671875, 12.4072265625, 13.01806640625, 13.62890625, 14.23974609375, 14.8505859375, 15.46142578125, 16.072265625, 16.68310546875, 17.2939453125, 17.90478515625, 18.515625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 10.0, 21.0, 20.0, 30.0, 50.0, 88.0, 122.0, 151.0, 258.0, 397.0, 600.0, 832.0, 1296.0, 1958.0, 2853.0, 4242.0, 6325.0, 9335.0, 13667.0, 20140.0, 29983.0, 44684.0, 66543.0, 99147.0, 140878.0, 164842.0, 139958.0, 98404.0, 65965.0, 44119.0, 29783.0, 20091.0, 13394.0, 9183.0, 6232.0, 4256.0, 2878.0, 1938.0, 1305.0, 847.0, 558.0, 384.0, 261.0, 163.0, 121.0, 71.0, 57.0, 36.0, 26.0, 16.0, 9.0, 9.0, 7.0, 4.0, 3.0, 0.0, 0.0, 3.0], "bins": [-28.375, -27.473876953125, -26.57275390625, -25.671630859375, -24.7705078125, -23.869384765625, -22.96826171875, -22.067138671875, -21.166015625, -20.264892578125, -19.36376953125, -18.462646484375, -17.5615234375, -16.660400390625, -15.75927734375, -14.858154296875, -13.95703125, -13.055908203125, -12.15478515625, -11.253662109375, -10.3525390625, -9.451416015625, -8.55029296875, -7.649169921875, -6.748046875, -5.846923828125, -4.94580078125, -4.044677734375, -3.1435546875, -2.242431640625, -1.34130859375, -0.440185546875, 0.4609375, 1.362060546875, 2.26318359375, 3.164306640625, 4.0654296875, 4.966552734375, 5.86767578125, 6.768798828125, 7.669921875, 8.571044921875, 9.47216796875, 10.373291015625, 11.2744140625, 12.175537109375, 13.07666015625, 13.977783203125, 14.87890625, 15.780029296875, 16.68115234375, 17.582275390625, 18.4833984375, 19.384521484375, 20.28564453125, 21.186767578125, 22.087890625, 22.989013671875, 23.89013671875, 24.791259765625, 25.6923828125, 26.593505859375, 27.49462890625, 28.395751953125, 29.296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 5.0, 10.0, 14.0, 10.0, 20.0, 20.0, 13.0, 18.0, 15.0, 25.0, 23.0, 36.0, 38.0, 33.0, 38.0, 57.0, 37.0, 36.0, 37.0, 38.0, 41.0, 41.0, 43.0, 31.0, 35.0, 32.0, 27.0, 35.0, 25.0, 24.0, 23.0, 19.0, 18.0, 14.0, 14.0, 14.0, 10.0, 8.0, 5.0, 4.0, 3.0, 1.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-12.3828125, -11.9949951171875, -11.607177734375, -11.2193603515625, -10.83154296875, -10.4437255859375, -10.055908203125, -9.6680908203125, -9.2802734375, -8.8924560546875, -8.504638671875, -8.1168212890625, -7.72900390625, -7.3411865234375, -6.953369140625, -6.5655517578125, -6.177734375, -5.7899169921875, -5.402099609375, -5.0142822265625, -4.62646484375, -4.2386474609375, -3.850830078125, -3.4630126953125, -3.0751953125, -2.6873779296875, -2.299560546875, -1.9117431640625, -1.52392578125, -1.1361083984375, -0.748291015625, -0.3604736328125, 0.02734375, 0.4151611328125, 0.802978515625, 1.1907958984375, 1.57861328125, 1.9664306640625, 2.354248046875, 2.7420654296875, 3.1298828125, 3.5177001953125, 3.905517578125, 4.2933349609375, 4.68115234375, 5.0689697265625, 5.456787109375, 5.8446044921875, 6.232421875, 6.6202392578125, 7.008056640625, 7.3958740234375, 7.78369140625, 8.1715087890625, 8.559326171875, 8.9471435546875, 9.3349609375, 9.7227783203125, 10.110595703125, 10.4984130859375, 10.88623046875, 11.2740478515625, 11.661865234375, 12.0496826171875, 12.4375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 11.0, 7.0, 17.0, 24.0, 34.0, 72.0, 90.0, 130.0, 199.0, 287.0, 413.0, 661.0, 941.0, 1407.0, 2178.0, 3471.0, 5776.0, 9817.0, 18192.0, 39337.0, 100055.0, 294646.0, 346977.0, 126638.0, 47368.0, 21364.0, 11206.0, 6273.0, 3844.0, 2395.0, 1582.0, 1038.0, 686.0, 437.0, 316.0, 207.0, 146.0, 95.0, 79.0, 48.0, 31.0, 17.0, 13.0, 13.0, 8.0, 4.0, 3.0, 2.0, 1.0, 3.0], "bins": [-3.69921875, -3.596771240234375, -3.49432373046875, -3.391876220703125, -3.2894287109375, -3.186981201171875, -3.08453369140625, -2.982086181640625, -2.879638671875, -2.777191162109375, -2.67474365234375, -2.572296142578125, -2.4698486328125, -2.367401123046875, -2.26495361328125, -2.162506103515625, -2.06005859375, -1.957611083984375, -1.85516357421875, -1.752716064453125, -1.6502685546875, -1.547821044921875, -1.44537353515625, -1.342926025390625, -1.240478515625, -1.138031005859375, -1.03558349609375, -0.933135986328125, -0.8306884765625, -0.728240966796875, -0.62579345703125, -0.523345947265625, -0.4208984375, -0.318450927734375, -0.21600341796875, -0.113555908203125, -0.0111083984375, 0.091339111328125, 0.19378662109375, 0.296234130859375, 0.398681640625, 0.501129150390625, 0.60357666015625, 0.706024169921875, 0.8084716796875, 0.910919189453125, 1.01336669921875, 1.115814208984375, 1.21826171875, 1.320709228515625, 1.42315673828125, 1.525604248046875, 1.6280517578125, 1.730499267578125, 1.83294677734375, 1.935394287109375, 2.037841796875, 2.140289306640625, 2.24273681640625, 2.345184326171875, 2.4476318359375, 2.550079345703125, 2.65252685546875, 2.754974365234375, 2.857421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 6.0, 14.0, 11.0, 11.0, 16.0, 24.0, 21.0, 44.0, 49.0, 85.0, 95.0, 118.0, 116.0, 89.0, 65.0, 55.0, 53.0, 36.0, 22.0, 17.0, 12.0, 13.0, 8.0, 8.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004119873046875, -0.0003994256258010864, -0.00038686394691467285, -0.0003743022680282593, -0.0003617405891418457, -0.00034917891025543213, -0.00033661723136901855, -0.000324055552482605, -0.0003114938735961914, -0.00029893219470977783, -0.00028637051582336426, -0.0002738088369369507, -0.0002612471580505371, -0.00024868547916412354, -0.00023612380027770996, -0.0002235621213912964, -0.0002110004425048828, -0.00019843876361846924, -0.00018587708473205566, -0.0001733154058456421, -0.00016075372695922852, -0.00014819204807281494, -0.00013563036918640137, -0.0001230686902999878, -0.00011050701141357422, -9.794533252716064e-05, -8.538365364074707e-05, -7.28219747543335e-05, -6.026029586791992e-05, -4.769861698150635e-05, -3.5136938095092773e-05, -2.25752592086792e-05, -1.0013580322265625e-05, 2.5480985641479492e-06, 1.5109777450561523e-05, 2.7671456336975098e-05, 4.023313522338867e-05, 5.2794814109802246e-05, 6.535649299621582e-05, 7.79181718826294e-05, 9.047985076904297e-05, 0.00010304152965545654, 0.00011560320854187012, 0.0001281648874282837, 0.00014072656631469727, 0.00015328824520111084, 0.00016584992408752441, 0.000178411602973938, 0.00019097328186035156, 0.00020353496074676514, 0.0002160966396331787, 0.00022865831851959229, 0.00024121999740600586, 0.00025378167629241943, 0.000266343355178833, 0.0002789050340652466, 0.00029146671295166016, 0.00030402839183807373, 0.0003165900707244873, 0.0003291517496109009, 0.00034171342849731445, 0.00035427510738372803, 0.0003668367862701416, 0.0003793984651565552, 0.00039196014404296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 7.0, 5.0, 12.0, 16.0, 15.0, 18.0, 34.0, 38.0, 62.0, 80.0, 119.0, 164.0, 265.0, 445.0, 716.0, 1199.0, 2077.0, 3658.0, 6921.0, 14453.0, 37651.0, 135363.0, 474369.0, 264045.0, 64370.0, 21506.0, 9559.0, 4744.0, 2642.0, 1489.0, 906.0, 556.0, 338.0, 216.0, 149.0, 103.0, 67.0, 46.0, 39.0, 25.0, 16.0, 11.0, 11.0, 11.0, 7.0, 7.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.58203125, -4.4420166015625, -4.302001953125, -4.1619873046875, -4.02197265625, -3.8819580078125, -3.741943359375, -3.6019287109375, -3.4619140625, -3.3218994140625, -3.181884765625, -3.0418701171875, -2.90185546875, -2.7618408203125, -2.621826171875, -2.4818115234375, -2.341796875, -2.2017822265625, -2.061767578125, -1.9217529296875, -1.78173828125, -1.6417236328125, -1.501708984375, -1.3616943359375, -1.2216796875, -1.0816650390625, -0.941650390625, -0.8016357421875, -0.66162109375, -0.5216064453125, -0.381591796875, -0.2415771484375, -0.1015625, 0.0384521484375, 0.178466796875, 0.3184814453125, 0.45849609375, 0.5985107421875, 0.738525390625, 0.8785400390625, 1.0185546875, 1.1585693359375, 1.298583984375, 1.4385986328125, 1.57861328125, 1.7186279296875, 1.858642578125, 1.9986572265625, 2.138671875, 2.2786865234375, 2.418701171875, 2.5587158203125, 2.69873046875, 2.8387451171875, 2.978759765625, 3.1187744140625, 3.2587890625, 3.3988037109375, 3.538818359375, 3.6788330078125, 3.81884765625, 3.9588623046875, 4.098876953125, 4.2388916015625, 4.37890625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 7.0, 1.0, 9.0, 8.0, 4.0, 11.0, 23.0, 18.0, 29.0, 39.0, 79.0, 86.0, 119.0, 121.0, 120.0, 109.0, 82.0, 38.0, 34.0, 20.0, 12.0, 12.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.669921875, -1.6276702880859375, -1.585418701171875, -1.5431671142578125, -1.50091552734375, -1.4586639404296875, -1.416412353515625, -1.3741607666015625, -1.3319091796875, -1.2896575927734375, -1.247406005859375, -1.2051544189453125, -1.16290283203125, -1.1206512451171875, -1.078399658203125, -1.0361480712890625, -0.993896484375, -0.9516448974609375, -0.909393310546875, -0.8671417236328125, -0.82489013671875, -0.7826385498046875, -0.740386962890625, -0.6981353759765625, -0.6558837890625, -0.6136322021484375, -0.571380615234375, -0.5291290283203125, -0.48687744140625, -0.4446258544921875, -0.402374267578125, -0.3601226806640625, -0.31787109375, -0.2756195068359375, -0.233367919921875, -0.1911163330078125, -0.14886474609375, -0.1066131591796875, -0.064361572265625, -0.0221099853515625, 0.0201416015625, 0.0623931884765625, 0.104644775390625, 0.1468963623046875, 0.18914794921875, 0.2313995361328125, 0.273651123046875, 0.3159027099609375, 0.358154296875, 0.4004058837890625, 0.442657470703125, 0.4849090576171875, 0.52716064453125, 0.5694122314453125, 0.611663818359375, 0.6539154052734375, 0.6961669921875, 0.7384185791015625, 0.780670166015625, 0.8229217529296875, 0.86517333984375, 0.9074249267578125, 0.949676513671875, 0.9919281005859375, 1.0341796875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 2.0, 4.0, 3.0, 2.0, 10.0, 11.0, 13.0, 12.0, 10.0, 20.0, 20.0, 25.0, 40.0, 46.0, 67.0, 73.0, 74.0, 66.0, 85.0, 78.0, 62.0, 47.0, 51.0, 40.0, 25.0, 22.0, 20.0, 17.0, 15.0, 11.0, 7.0, 6.0, 2.0, 7.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.850786209106445, -28.997779846191406, -28.144771575927734, -27.291763305664062, -26.438756942749023, -25.585750579833984, -24.732742309570312, -23.87973403930664, -23.0267276763916, -22.173721313476562, -21.32071304321289, -20.46770477294922, -19.61469841003418, -18.76169204711914, -17.90868377685547, -17.055675506591797, -16.202669143676758, -15.349661827087402, -14.496654510498047, -13.643647193908691, -12.790639877319336, -11.93763256072998, -11.084625244140625, -10.23161792755127, -9.378610610961914, -8.525603294372559, -7.672595977783203, -6.819588661193848, -5.966581344604492, -5.113574028015137, -4.260566711425781, -3.407559394836426, -2.5545501708984375, -1.701542854309082, -0.8485355377197266, 0.004471778869628906, 0.8574790954589844, 1.7104864120483398, 2.5634937286376953, 3.416501045227051, 4.269508361816406, 5.122515678405762, 5.975522994995117, 6.828530311584473, 7.681537628173828, 8.534544944763184, 9.387552261352539, 10.240559577941895, 11.09356689453125, 11.946574211120605, 12.799581527709961, 13.652588844299316, 14.505596160888672, 15.358603477478027, 16.211610794067383, 17.064617156982422, 17.917625427246094, 18.770633697509766, 19.623640060424805, 20.476646423339844, 21.329654693603516, 22.182662963867188, 23.035669326782227, 23.888675689697266, 24.741683959960938]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 2.0, 3.0, 5.0, 5.0, 8.0, 7.0, 11.0, 17.0, 20.0, 16.0, 25.0, 22.0, 25.0, 27.0, 35.0, 29.0, 34.0, 32.0, 37.0, 42.0, 31.0, 38.0, 44.0, 48.0, 41.0, 27.0, 39.0, 38.0, 40.0, 34.0, 26.0, 27.0, 28.0, 17.0, 11.0, 17.0, 25.0, 18.0, 15.0, 7.0, 5.0, 8.0, 4.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.489757537841797, -18.868820190429688, -18.247880935668945, -17.626943588256836, -17.006006240844727, -16.385066986083984, -15.764129638671875, -15.143192291259766, -14.52225399017334, -13.901315689086914, -13.280378341674805, -12.659440040588379, -12.038501739501953, -11.417564392089844, -10.796626091003418, -10.175687789916992, -9.554750442504883, -8.933812141418457, -8.312874794006348, -7.691936492919922, -7.070998668670654, -6.450060844421387, -5.829122543334961, -5.208184719085693, -4.587246894836426, -3.966309070587158, -3.3453710079193115, -2.724432945251465, -2.1034951210021973, -1.4825572967529297, -0.861619234085083, -0.24068117141723633, 0.38025474548339844, 1.0011926889419556, 1.6221306324005127, 2.2430686950683594, 2.864006519317627, 3.4849443435668945, 4.10588264465332, 4.726820468902588, 5.3477582931518555, 5.968696117401123, 6.589633941650391, 7.210572242736816, 7.831510066986084, 8.452447891235352, 9.073386192321777, 9.694324493408203, 10.315261840820312, 10.936200141906738, 11.557137489318848, 12.178075790405273, 12.799013137817383, 13.419951438903809, 14.040889739990234, 14.661827087402344, 15.28276538848877, 15.903703689575195, 16.524641036987305, 17.145578384399414, 17.766517639160156, 18.387454986572266, 19.008392333984375, 19.629331588745117, 20.250268936157227]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 14.0, 13.0, 21.0, 30.0, 42.0, 84.0, 107.0, 182.0, 245.0, 352.0, 526.0, 752.0, 1176.0, 1737.0, 2491.0, 3992.0, 6044.0, 9338.0, 14274.0, 22511.0, 36194.0, 59262.0, 102528.0, 208704.0, 564530.0, 1223610.0, 1090247.0, 446319.0, 171062.0, 89155.0, 51427.0, 31203.0, 19210.0, 12531.0, 7906.0, 5329.0, 3605.0, 2360.0, 1607.0, 1070.0, 787.0, 530.0, 356.0, 254.0, 184.0, 135.0, 76.0, 53.0, 40.0, 23.0, 31.0, 15.0, 5.0, 5.0, 2.0, 7.0, 0.0, 1.0, 1.0], "bins": [-23.625, -22.85986328125, -22.0947265625, -21.32958984375, -20.564453125, -19.79931640625, -19.0341796875, -18.26904296875, -17.50390625, -16.73876953125, -15.9736328125, -15.20849609375, -14.443359375, -13.67822265625, -12.9130859375, -12.14794921875, -11.3828125, -10.61767578125, -9.8525390625, -9.08740234375, -8.322265625, -7.55712890625, -6.7919921875, -6.02685546875, -5.26171875, -4.49658203125, -3.7314453125, -2.96630859375, -2.201171875, -1.43603515625, -0.6708984375, 0.09423828125, 0.859375, 1.62451171875, 2.3896484375, 3.15478515625, 3.919921875, 4.68505859375, 5.4501953125, 6.21533203125, 6.98046875, 7.74560546875, 8.5107421875, 9.27587890625, 10.041015625, 10.80615234375, 11.5712890625, 12.33642578125, 13.1015625, 13.86669921875, 14.6318359375, 15.39697265625, 16.162109375, 16.92724609375, 17.6923828125, 18.45751953125, 19.22265625, 19.98779296875, 20.7529296875, 21.51806640625, 22.283203125, 23.04833984375, 23.8134765625, 24.57861328125, 25.34375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 6.0, 3.0, 4.0, 7.0, 5.0, 10.0, 8.0, 13.0, 20.0, 14.0, 26.0, 27.0, 23.0, 15.0, 27.0, 26.0, 40.0, 29.0, 32.0, 29.0, 25.0, 42.0, 36.0, 45.0, 45.0, 48.0, 27.0, 35.0, 26.0, 37.0, 32.0, 29.0, 27.0, 24.0, 24.0, 25.0, 17.0, 16.0, 12.0, 20.0, 8.0, 7.0, 9.0, 13.0, 1.0, 2.0, 3.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.6875, -13.25439453125, -12.8212890625, -12.38818359375, -11.955078125, -11.52197265625, -11.0888671875, -10.65576171875, -10.22265625, -9.78955078125, -9.3564453125, -8.92333984375, -8.490234375, -8.05712890625, -7.6240234375, -7.19091796875, -6.7578125, -6.32470703125, -5.8916015625, -5.45849609375, -5.025390625, -4.59228515625, -4.1591796875, -3.72607421875, -3.29296875, -2.85986328125, -2.4267578125, -1.99365234375, -1.560546875, -1.12744140625, -0.6943359375, -0.26123046875, 0.171875, 0.60498046875, 1.0380859375, 1.47119140625, 1.904296875, 2.33740234375, 2.7705078125, 3.20361328125, 3.63671875, 4.06982421875, 4.5029296875, 4.93603515625, 5.369140625, 5.80224609375, 6.2353515625, 6.66845703125, 7.1015625, 7.53466796875, 7.9677734375, 8.40087890625, 8.833984375, 9.26708984375, 9.7001953125, 10.13330078125, 10.56640625, 10.99951171875, 11.4326171875, 11.86572265625, 12.298828125, 12.73193359375, 13.1650390625, 13.59814453125, 14.03125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 5.0, 4.0, 12.0, 12.0, 27.0, 34.0, 57.0, 91.0, 129.0, 172.0, 322.0, 479.0, 647.0, 1072.0, 1654.0, 2539.0, 3915.0, 6190.0, 9876.0, 15637.0, 25771.0, 42577.0, 73510.0, 134488.0, 257686.0, 528826.0, 1124991.0, 992614.0, 458277.0, 225939.0, 119422.0, 66360.0, 38348.0, 23324.0, 14543.0, 8867.0, 5649.0, 3592.0, 2338.0, 1488.0, 974.0, 620.0, 384.0, 263.0, 183.0, 123.0, 88.0, 59.0, 37.0, 27.0, 18.0, 11.0, 7.0, 5.0, 7.0, 1.0, 0.0, 2.0], "bins": [-24.75, -23.997802734375, -23.24560546875, -22.493408203125, -21.7412109375, -20.989013671875, -20.23681640625, -19.484619140625, -18.732421875, -17.980224609375, -17.22802734375, -16.475830078125, -15.7236328125, -14.971435546875, -14.21923828125, -13.467041015625, -12.71484375, -11.962646484375, -11.21044921875, -10.458251953125, -9.7060546875, -8.953857421875, -8.20166015625, -7.449462890625, -6.697265625, -5.945068359375, -5.19287109375, -4.440673828125, -3.6884765625, -2.936279296875, -2.18408203125, -1.431884765625, -0.6796875, 0.072509765625, 0.82470703125, 1.576904296875, 2.3291015625, 3.081298828125, 3.83349609375, 4.585693359375, 5.337890625, 6.090087890625, 6.84228515625, 7.594482421875, 8.3466796875, 9.098876953125, 9.85107421875, 10.603271484375, 11.35546875, 12.107666015625, 12.85986328125, 13.612060546875, 14.3642578125, 15.116455078125, 15.86865234375, 16.620849609375, 17.373046875, 18.125244140625, 18.87744140625, 19.629638671875, 20.3818359375, 21.134033203125, 21.88623046875, 22.638427734375, 23.390625]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 12.0, 17.0, 12.0, 24.0, 28.0, 33.0, 41.0, 48.0, 49.0, 75.0, 84.0, 103.0, 150.0, 178.0, 191.0, 275.0, 307.0, 336.0, 385.0, 354.0, 279.0, 195.0, 166.0, 133.0, 107.0, 90.0, 75.0, 68.0, 42.0, 50.0, 38.0, 22.0, 25.0, 17.0, 7.0, 15.0, 12.0, 5.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-9.15625, -8.8717041015625, -8.587158203125, -8.3026123046875, -8.01806640625, -7.7335205078125, -7.448974609375, -7.1644287109375, -6.8798828125, -6.5953369140625, -6.310791015625, -6.0262451171875, -5.74169921875, -5.4571533203125, -5.172607421875, -4.8880615234375, -4.603515625, -4.3189697265625, -4.034423828125, -3.7498779296875, -3.46533203125, -3.1807861328125, -2.896240234375, -2.6116943359375, -2.3271484375, -2.0426025390625, -1.758056640625, -1.4735107421875, -1.18896484375, -0.9044189453125, -0.619873046875, -0.3353271484375, -0.05078125, 0.2337646484375, 0.518310546875, 0.8028564453125, 1.08740234375, 1.3719482421875, 1.656494140625, 1.9410400390625, 2.2255859375, 2.5101318359375, 2.794677734375, 3.0792236328125, 3.36376953125, 3.6483154296875, 3.932861328125, 4.2174072265625, 4.501953125, 4.7864990234375, 5.071044921875, 5.3555908203125, 5.64013671875, 5.9246826171875, 6.209228515625, 6.4937744140625, 6.7783203125, 7.0628662109375, 7.347412109375, 7.6319580078125, 7.91650390625, 8.2010498046875, 8.485595703125, 8.7701416015625, 9.0546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 14.0, 10.0, 10.0, 20.0, 27.0, 24.0, 45.0, 48.0, 50.0, 65.0, 63.0, 79.0, 80.0, 74.0, 65.0, 60.0, 39.0, 38.0, 31.0, 29.0, 22.0, 18.0, 20.0, 9.0, 11.0, 10.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.679685592651367, -19.997987747192383, -19.3162899017334, -18.63459014892578, -17.952892303466797, -17.271194458007812, -16.589496612548828, -15.907798767089844, -15.226099967956543, -14.544402122497559, -13.862703323364258, -13.181005477905273, -12.499307632446289, -11.817608833312988, -11.135910987854004, -10.454212188720703, -9.772514343261719, -9.090816497802734, -8.409117698669434, -7.727419853210449, -7.045721530914307, -6.364023208618164, -5.68232536315918, -5.000627040863037, -4.3189287185668945, -3.637230396270752, -2.9555323123931885, -2.273834228515625, -1.5921359062194824, -0.9104375839233398, -0.22873973846435547, 0.4529585838317871, 1.1346549987792969, 1.81635320186615, 2.498051404953003, 3.1797494888305664, 3.861447811126709, 4.543146133422852, 5.224843978881836, 5.9065423011779785, 6.588240623474121, 7.269938945770264, 7.951637268066406, 8.63333511352539, 9.315032958984375, 9.996731758117676, 10.67842960357666, 11.360128402709961, 12.041826248168945, 12.72352409362793, 13.40522289276123, 14.086920738220215, 14.768619537353516, 15.4503173828125, 16.132015228271484, 16.81371307373047, 17.495410919189453, 18.177108764648438, 18.858806610107422, 19.540504455566406, 20.222204208374023, 20.903902053833008, 21.585599899291992, 22.267297744750977, 22.948997497558594]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 8.0, 8.0, 12.0, 9.0, 11.0, 14.0, 15.0, 12.0, 22.0, 19.0, 23.0, 24.0, 32.0, 31.0, 27.0, 32.0, 39.0, 41.0, 36.0, 32.0, 39.0, 37.0, 43.0, 37.0, 39.0, 33.0, 31.0, 29.0, 24.0, 27.0, 37.0, 26.0, 23.0, 24.0, 14.0, 15.0, 10.0, 10.0, 8.0, 16.0, 10.0, 10.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.605203628540039, -14.124284744262695, -13.643365859985352, -13.162446975708008, -12.68152904510498, -12.200610160827637, -11.719691276550293, -11.23877239227295, -10.757854461669922, -10.276935577392578, -9.796016693115234, -9.31509780883789, -8.834179878234863, -8.35326099395752, -7.872342109680176, -7.391423225402832, -6.910504341125488, -6.4295854568481445, -5.948667049407959, -5.467748165130615, -4.98682975769043, -4.505910873413086, -4.024991989135742, -3.5440733432769775, -3.063154697418213, -2.5822360515594482, -2.1013174057006836, -1.6203985214233398, -1.1394798755645752, -0.6585612297058105, -0.1776423454284668, 0.30327630043029785, 0.7841949462890625, 1.2651135921478271, 1.7460323572158813, 2.2269511222839355, 2.7078697681427, 3.188788414001465, 3.6697072982788086, 4.150626182556152, 4.631544589996338, 5.112463474273682, 5.593381881713867, 6.074300765991211, 6.555219650268555, 7.03613805770874, 7.517056941986084, 7.9979753494262695, 8.478894233703613, 8.959813117980957, 9.4407320022583, 9.921649932861328, 10.402568817138672, 10.883487701416016, 11.36440658569336, 11.845325469970703, 12.326244354248047, 12.80716323852539, 13.288082122802734, 13.769001007080078, 14.249918937683105, 14.73083782196045, 15.211756706237793, 15.692675590515137, 16.173593521118164]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 6.0, 0.0, 2.0, 4.0, 11.0, 6.0, 17.0, 12.0, 17.0, 27.0, 43.0, 45.0, 77.0, 98.0, 158.0, 259.0, 372.0, 560.0, 891.0, 1336.0, 2028.0, 3084.0, 4871.0, 7564.0, 11960.0, 19003.0, 30891.0, 49942.0, 85877.0, 171894.0, 340979.0, 131458.0, 71469.0, 42416.0, 25825.0, 16465.0, 10416.0, 6501.0, 4190.0, 2689.0, 1753.0, 1126.0, 710.0, 506.0, 342.0, 190.0, 147.0, 92.0, 52.0, 55.0, 39.0, 36.0, 12.0, 10.0, 10.0, 5.0, 8.0, 10.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.8046875, -8.523681640625, -8.24267578125, -7.961669921875, -7.6806640625, -7.399658203125, -7.11865234375, -6.837646484375, -6.556640625, -6.275634765625, -5.99462890625, -5.713623046875, -5.4326171875, -5.151611328125, -4.87060546875, -4.589599609375, -4.30859375, -4.027587890625, -3.74658203125, -3.465576171875, -3.1845703125, -2.903564453125, -2.62255859375, -2.341552734375, -2.060546875, -1.779541015625, -1.49853515625, -1.217529296875, -0.9365234375, -0.655517578125, -0.37451171875, -0.093505859375, 0.1875, 0.468505859375, 0.74951171875, 1.030517578125, 1.3115234375, 1.592529296875, 1.87353515625, 2.154541015625, 2.435546875, 2.716552734375, 2.99755859375, 3.278564453125, 3.5595703125, 3.840576171875, 4.12158203125, 4.402587890625, 4.68359375, 4.964599609375, 5.24560546875, 5.526611328125, 5.8076171875, 6.088623046875, 6.36962890625, 6.650634765625, 6.931640625, 7.212646484375, 7.49365234375, 7.774658203125, 8.0556640625, 8.336669921875, 8.61767578125, 8.898681640625, 9.1796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 10.0, 8.0, 6.0, 10.0, 15.0, 16.0, 12.0, 28.0, 17.0, 18.0, 16.0, 27.0, 35.0, 26.0, 29.0, 35.0, 42.0, 36.0, 36.0, 38.0, 41.0, 49.0, 40.0, 22.0, 40.0, 26.0, 32.0, 21.0, 34.0, 27.0, 26.0, 25.0, 26.0, 15.0, 23.0, 16.0, 12.0, 8.0, 10.0, 4.0, 9.0, 6.0, 6.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-15.0390625, -14.58154296875, -14.1240234375, -13.66650390625, -13.208984375, -12.75146484375, -12.2939453125, -11.83642578125, -11.37890625, -10.92138671875, -10.4638671875, -10.00634765625, -9.548828125, -9.09130859375, -8.6337890625, -8.17626953125, -7.71875, -7.26123046875, -6.8037109375, -6.34619140625, -5.888671875, -5.43115234375, -4.9736328125, -4.51611328125, -4.05859375, -3.60107421875, -3.1435546875, -2.68603515625, -2.228515625, -1.77099609375, -1.3134765625, -0.85595703125, -0.3984375, 0.05908203125, 0.5166015625, 0.97412109375, 1.431640625, 1.88916015625, 2.3466796875, 2.80419921875, 3.26171875, 3.71923828125, 4.1767578125, 4.63427734375, 5.091796875, 5.54931640625, 6.0068359375, 6.46435546875, 6.921875, 7.37939453125, 7.8369140625, 8.29443359375, 8.751953125, 9.20947265625, 9.6669921875, 10.12451171875, 10.58203125, 11.03955078125, 11.4970703125, 11.95458984375, 12.412109375, 12.86962890625, 13.3271484375, 13.78466796875, 14.2421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 12.0, 16.0, 18.0, 42.0, 50.0, 68.0, 123.0, 155.0, 301.0, 342.0, 596.0, 822.0, 1305.0, 1908.0, 2863.0, 4588.0, 7033.0, 10933.0, 16924.0, 26727.0, 43027.0, 71746.0, 139333.0, 381725.0, 144502.0, 73544.0, 43654.0, 27288.0, 17374.0, 10965.0, 7035.0, 4660.0, 2978.0, 1995.0, 1321.0, 880.0, 548.0, 413.0, 225.0, 186.0, 102.0, 90.0, 47.0, 35.0, 19.0, 11.0, 8.0, 8.0, 8.0, 2.0, 5.0, 2.0, 1.0], "bins": [-8.4296875, -8.18548583984375, -7.9412841796875, -7.69708251953125, -7.452880859375, -7.20867919921875, -6.9644775390625, -6.72027587890625, -6.47607421875, -6.23187255859375, -5.9876708984375, -5.74346923828125, -5.499267578125, -5.25506591796875, -5.0108642578125, -4.76666259765625, -4.5224609375, -4.27825927734375, -4.0340576171875, -3.78985595703125, -3.545654296875, -3.30145263671875, -3.0572509765625, -2.81304931640625, -2.56884765625, -2.32464599609375, -2.0804443359375, -1.83624267578125, -1.592041015625, -1.34783935546875, -1.1036376953125, -0.85943603515625, -0.615234375, -0.37103271484375, -0.1268310546875, 0.11737060546875, 0.361572265625, 0.60577392578125, 0.8499755859375, 1.09417724609375, 1.33837890625, 1.58258056640625, 1.8267822265625, 2.07098388671875, 2.315185546875, 2.55938720703125, 2.8035888671875, 3.04779052734375, 3.2919921875, 3.53619384765625, 3.7803955078125, 4.02459716796875, 4.268798828125, 4.51300048828125, 4.7572021484375, 5.00140380859375, 5.24560546875, 5.48980712890625, 5.7340087890625, 5.97821044921875, 6.222412109375, 6.46661376953125, 6.7108154296875, 6.95501708984375, 7.19921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 8.0, 2.0, 12.0, 7.0, 14.0, 18.0, 7.0, 15.0, 20.0, 22.0, 18.0, 25.0, 32.0, 33.0, 33.0, 34.0, 30.0, 43.0, 34.0, 48.0, 55.0, 57.0, 49.0, 37.0, 29.0, 38.0, 35.0, 27.0, 30.0, 22.0, 34.0, 25.0, 20.0, 15.0, 15.0, 14.0, 10.0, 7.0, 8.0, 6.0, 2.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-10.859375, -10.544189453125, -10.22900390625, -9.913818359375, -9.5986328125, -9.283447265625, -8.96826171875, -8.653076171875, -8.337890625, -8.022705078125, -7.70751953125, -7.392333984375, -7.0771484375, -6.761962890625, -6.44677734375, -6.131591796875, -5.81640625, -5.501220703125, -5.18603515625, -4.870849609375, -4.5556640625, -4.240478515625, -3.92529296875, -3.610107421875, -3.294921875, -2.979736328125, -2.66455078125, -2.349365234375, -2.0341796875, -1.718994140625, -1.40380859375, -1.088623046875, -0.7734375, -0.458251953125, -0.14306640625, 0.172119140625, 0.4873046875, 0.802490234375, 1.11767578125, 1.432861328125, 1.748046875, 2.063232421875, 2.37841796875, 2.693603515625, 3.0087890625, 3.323974609375, 3.63916015625, 3.954345703125, 4.26953125, 4.584716796875, 4.89990234375, 5.215087890625, 5.5302734375, 5.845458984375, 6.16064453125, 6.475830078125, 6.791015625, 7.106201171875, 7.42138671875, 7.736572265625, 8.0517578125, 8.366943359375, 8.68212890625, 8.997314453125, 9.3125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 5.0, 11.0, 12.0, 13.0, 10.0, 34.0, 63.0, 90.0, 132.0, 208.0, 361.0, 594.0, 1135.0, 2049.0, 4229.0, 9277.0, 22551.0, 63411.0, 229916.0, 471241.0, 161692.0, 48618.0, 17866.0, 7395.0, 3554.0, 1750.0, 975.0, 524.0, 307.0, 179.0, 117.0, 87.0, 48.0, 27.0, 16.0, 12.0, 7.0, 5.0, 11.0, 7.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.037109375, -0.036029815673828125, -0.03495025634765625, -0.033870697021484375, -0.0327911376953125, -0.031711578369140625, -0.03063201904296875, -0.029552459716796875, -0.028472900390625, -0.027393341064453125, -0.02631378173828125, -0.025234222412109375, -0.0241546630859375, -0.023075103759765625, -0.02199554443359375, -0.020915985107421875, -0.01983642578125, -0.018756866455078125, -0.01767730712890625, -0.016597747802734375, -0.0155181884765625, -0.014438629150390625, -0.01335906982421875, -0.012279510498046875, -0.011199951171875, -0.010120391845703125, -0.00904083251953125, -0.007961273193359375, -0.0068817138671875, -0.005802154541015625, -0.00472259521484375, -0.003643035888671875, -0.0025634765625, -0.001483917236328125, -0.00040435791015625, 0.000675201416015625, 0.0017547607421875, 0.002834320068359375, 0.00391387939453125, 0.004993438720703125, 0.006072998046875, 0.007152557373046875, 0.00823211669921875, 0.009311676025390625, 0.0103912353515625, 0.011470794677734375, 0.01255035400390625, 0.013629913330078125, 0.01470947265625, 0.015789031982421875, 0.01686859130859375, 0.017948150634765625, 0.0190277099609375, 0.020107269287109375, 0.02118682861328125, 0.022266387939453125, 0.023345947265625, 0.024425506591796875, 0.02550506591796875, 0.026584625244140625, 0.0276641845703125, 0.028743743896484375, 0.02982330322265625, 0.030902862548828125, 0.031982421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 6.0, 4.0, 2.0, 4.0, 3.0, 3.0, 17.0, 11.0, 15.0, 24.0, 35.0, 36.0, 45.0, 46.0, 48.0, 52.0, 68.0, 72.0, 75.0, 63.0, 57.0, 59.0, 41.0, 35.0, 31.0, 32.0, 27.0, 26.0, 14.0, 12.0, 8.0, 8.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7344951629638672e-05, -1.6839243471622467e-05, -1.6333535313606262e-05, -1.5827827155590057e-05, -1.5322118997573853e-05, -1.4816410839557648e-05, -1.4310702681541443e-05, -1.3804994523525238e-05, -1.3299286365509033e-05, -1.2793578207492828e-05, -1.2287870049476624e-05, -1.1782161891460419e-05, -1.1276453733444214e-05, -1.0770745575428009e-05, -1.0265037417411804e-05, -9.7593292593956e-06, -9.253621101379395e-06, -8.74791294336319e-06, -8.242204785346985e-06, -7.73649662733078e-06, -7.230788469314575e-06, -6.72508031129837e-06, -6.2193721532821655e-06, -5.713663995265961e-06, -5.207955837249756e-06, -4.702247679233551e-06, -4.196539521217346e-06, -3.6908313632011414e-06, -3.1851232051849365e-06, -2.6794150471687317e-06, -2.173706889152527e-06, -1.667998731136322e-06, -1.1622905731201172e-06, -6.565824151039124e-07, -1.5087425708770752e-07, 3.548339009284973e-07, 8.605420589447021e-07, 1.366250216960907e-06, 1.8719583749771118e-06, 2.3776665329933167e-06, 2.8833746910095215e-06, 3.3890828490257263e-06, 3.894791007041931e-06, 4.400499165058136e-06, 4.906207323074341e-06, 5.411915481090546e-06, 5.9176236391067505e-06, 6.423331797122955e-06, 6.92903995513916e-06, 7.434748113155365e-06, 7.94045627117157e-06, 8.446164429187775e-06, 8.95187258720398e-06, 9.457580745220184e-06, 9.96328890323639e-06, 1.0468997061252594e-05, 1.0974705219268799e-05, 1.1480413377285004e-05, 1.1986121535301208e-05, 1.2491829693317413e-05, 1.2997537851333618e-05, 1.3503246009349823e-05, 1.4008954167366028e-05, 1.4514662325382233e-05, 1.5020370483398438e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 5.0, 16.0, 18.0, 32.0, 37.0, 61.0, 91.0, 131.0, 205.0, 303.0, 475.0, 709.0, 1083.0, 1569.0, 2547.0, 4184.0, 7068.0, 12830.0, 24401.0, 48456.0, 104553.0, 233240.0, 299533.0, 159536.0, 71361.0, 34359.0, 17283.0, 9694.0, 5609.0, 3298.0, 2080.0, 1301.0, 811.0, 531.0, 385.0, 250.0, 165.0, 104.0, 69.0, 44.0, 37.0, 34.0, 16.0, 9.0, 10.0, 6.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.021453857421875, -0.0207674503326416, -0.020081043243408203, -0.019394636154174805, -0.018708229064941406, -0.018021821975708008, -0.01733541488647461, -0.01664900779724121, -0.015962600708007812, -0.015276193618774414, -0.014589786529541016, -0.013903379440307617, -0.013216972351074219, -0.01253056526184082, -0.011844158172607422, -0.011157751083374023, -0.010471343994140625, -0.009784936904907227, -0.009098529815673828, -0.00841212272644043, -0.007725715637207031, -0.007039308547973633, -0.006352901458740234, -0.005666494369506836, -0.0049800872802734375, -0.004293680191040039, -0.0036072731018066406, -0.002920866012573242, -0.0022344589233398438, -0.0015480518341064453, -0.0008616447448730469, -0.00017523765563964844, 0.00051116943359375, 0.0011975765228271484, 0.0018839836120605469, 0.0025703907012939453, 0.0032567977905273438, 0.003943204879760742, 0.004629611968994141, 0.005316019058227539, 0.0060024261474609375, 0.006688833236694336, 0.007375240325927734, 0.008061647415161133, 0.008748054504394531, 0.00943446159362793, 0.010120868682861328, 0.010807275772094727, 0.011493682861328125, 0.012180089950561523, 0.012866497039794922, 0.01355290412902832, 0.014239311218261719, 0.014925718307495117, 0.015612125396728516, 0.016298532485961914, 0.016984939575195312, 0.01767134666442871, 0.01835775375366211, 0.019044160842895508, 0.019730567932128906, 0.020416975021362305, 0.021103382110595703, 0.0217897891998291, 0.0224761962890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 5.0, 8.0, 12.0, 15.0, 10.0, 20.0, 18.0, 39.0, 29.0, 39.0, 63.0, 61.0, 96.0, 103.0, 67.0, 80.0, 67.0, 54.0, 48.0, 33.0, 27.0, 24.0, 18.0, 7.0, 12.0, 6.0, 5.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.00960540771484375, -0.009357154369354248, -0.009108901023864746, -0.008860647678375244, -0.008612394332885742, -0.00836414098739624, -0.008115887641906738, -0.007867634296417236, -0.007619380950927734, -0.007371127605438232, -0.0071228742599487305, -0.0068746209144592285, -0.0066263675689697266, -0.006378114223480225, -0.006129860877990723, -0.005881607532501221, -0.005633354187011719, -0.005385100841522217, -0.005136847496032715, -0.004888594150543213, -0.004640340805053711, -0.004392087459564209, -0.004143834114074707, -0.003895580768585205, -0.003647327423095703, -0.003399074077606201, -0.0031508207321166992, -0.0029025673866271973, -0.0026543140411376953, -0.0024060606956481934, -0.0021578073501586914, -0.0019095540046691895, -0.0016613006591796875, -0.0014130473136901855, -0.0011647939682006836, -0.0009165406227111816, -0.0006682872772216797, -0.00042003393173217773, -0.00017178058624267578, 7.647275924682617e-05, 0.0003247261047363281, 0.0005729794502258301, 0.000821232795715332, 0.001069486141204834, 0.001317739486694336, 0.0015659928321838379, 0.0018142461776733398, 0.002062499523162842, 0.0023107528686523438, 0.0025590062141418457, 0.0028072595596313477, 0.0030555129051208496, 0.0033037662506103516, 0.0035520195960998535, 0.0038002729415893555, 0.004048526287078857, 0.004296779632568359, 0.004545032978057861, 0.004793286323547363, 0.005041539669036865, 0.005289793014526367, 0.005538046360015869, 0.005786299705505371, 0.006034553050994873, 0.006282806396484375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 10.0, 14.0, 16.0, 14.0, 33.0, 30.0, 36.0, 51.0, 62.0, 59.0, 76.0, 84.0, 82.0, 71.0, 65.0, 52.0, 34.0, 39.0, 29.0, 31.0, 22.0, 21.0, 13.0, 9.0, 10.0, 4.0, 8.0, 5.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.241357803344727, -19.568178176879883, -18.89499855041504, -18.221817016601562, -17.54863739013672, -16.875457763671875, -16.20227813720703, -15.529098510742188, -14.855918884277344, -14.1827392578125, -13.50955867767334, -12.836379051208496, -12.163199424743652, -11.490018844604492, -10.816839218139648, -10.143659591674805, -9.470479011535645, -8.7972993850708, -8.12411880493164, -7.450939178466797, -6.777759552001953, -6.104579448699951, -5.431399345397949, -4.7582197189331055, -4.0850396156311035, -3.4118597507476807, -2.738679885864258, -2.065499782562256, -1.392319917678833, -0.7191400527954102, -0.0459599494934082, 0.6272196769714355, 1.3003997802734375, 1.9735796451568604, 2.646759510040283, 3.319939613342285, 3.993119478225708, 4.666299343109131, 5.339479446411133, 6.012659072875977, 6.6858391761779785, 7.3590192794799805, 8.032198905944824, 8.705379486083984, 9.378559112548828, 10.051738739013672, 10.724918365478516, 11.39809799194336, 12.07127857208252, 12.744458198547363, 13.417638778686523, 14.090818405151367, 14.763998031616211, 15.437177658081055, 16.11035919189453, 16.783538818359375, 17.45671844482422, 18.129898071289062, 18.803077697753906, 19.47625732421875, 20.149438858032227, 20.82261848449707, 21.495798110961914, 22.168977737426758, 22.8421573638916]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 5.0, 9.0, 9.0, 13.0, 12.0, 11.0, 15.0, 12.0, 19.0, 19.0, 25.0, 22.0, 32.0, 32.0, 30.0, 29.0, 37.0, 42.0, 35.0, 31.0, 40.0, 38.0, 46.0, 33.0, 43.0, 31.0, 33.0, 29.0, 26.0, 25.0, 36.0, 29.0, 22.0, 21.0, 16.0, 15.0, 11.0, 11.0, 8.0, 15.0, 8.0, 13.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.959293365478516, -13.50209903717041, -13.044903755187988, -12.587709426879883, -12.130515098571777, -11.673320770263672, -11.21612548828125, -10.758931159973145, -10.301736831665039, -9.844542503356934, -9.387347221374512, -8.930152893066406, -8.4729585647583, -8.015764236450195, -7.558568954467773, -7.101374626159668, -6.644179344177246, -6.186984539031982, -5.729790210723877, -5.272595405578613, -4.815401077270508, -4.358206272125244, -3.9010114669799805, -3.443816900253296, -2.9866223335266113, -2.5294277667999268, -2.072233200073242, -1.6150383949279785, -1.157843828201294, -0.7006492614746094, -0.2434544563293457, 0.21374011039733887, 0.6709356307983398, 1.1281301975250244, 1.5853248834609985, 2.0425195693969727, 2.4997141361236572, 2.956908702850342, 3.4141035079956055, 3.87129807472229, 4.328492641448975, 4.785687446594238, 5.242881774902344, 5.700076580047607, 6.157271385192871, 6.614465713500977, 7.07166051864624, 7.528855323791504, 7.986049652099609, 8.443243980407715, 8.900439262390137, 9.357633590698242, 9.814827919006348, 10.272022247314453, 10.729217529296875, 11.18641185760498, 11.643606185913086, 12.100800514221191, 12.557995796203613, 13.015190124511719, 13.472384452819824, 13.92957878112793, 14.386774063110352, 14.843968391418457, 15.301163673400879]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 10.0, 9.0, 17.0, 36.0, 45.0, 85.0, 117.0, 163.0, 288.0, 359.0, 545.0, 843.0, 1309.0, 1853.0, 2617.0, 4083.0, 5760.0, 8416.0, 12297.0, 18195.0, 26734.0, 39463.0, 58851.0, 86820.0, 122404.0, 149746.0, 146106.0, 114138.0, 80063.0, 54048.0, 36093.0, 24491.0, 16698.0, 11328.0, 7909.0, 5236.0, 3661.0, 2489.0, 1724.0, 1158.0, 796.0, 526.0, 351.0, 248.0, 150.0, 98.0, 65.0, 34.0, 29.0, 21.0, 13.0, 8.0, 9.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-18.359375, -17.78369140625, -17.2080078125, -16.63232421875, -16.056640625, -15.48095703125, -14.9052734375, -14.32958984375, -13.75390625, -13.17822265625, -12.6025390625, -12.02685546875, -11.451171875, -10.87548828125, -10.2998046875, -9.72412109375, -9.1484375, -8.57275390625, -7.9970703125, -7.42138671875, -6.845703125, -6.27001953125, -5.6943359375, -5.11865234375, -4.54296875, -3.96728515625, -3.3916015625, -2.81591796875, -2.240234375, -1.66455078125, -1.0888671875, -0.51318359375, 0.0625, 0.63818359375, 1.2138671875, 1.78955078125, 2.365234375, 2.94091796875, 3.5166015625, 4.09228515625, 4.66796875, 5.24365234375, 5.8193359375, 6.39501953125, 6.970703125, 7.54638671875, 8.1220703125, 8.69775390625, 9.2734375, 9.84912109375, 10.4248046875, 11.00048828125, 11.576171875, 12.15185546875, 12.7275390625, 13.30322265625, 13.87890625, 14.45458984375, 15.0302734375, 15.60595703125, 16.181640625, 16.75732421875, 17.3330078125, 17.90869140625, 18.484375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 3.0, 13.0, 13.0, 13.0, 9.0, 25.0, 18.0, 16.0, 23.0, 25.0, 24.0, 38.0, 30.0, 34.0, 29.0, 39.0, 36.0, 37.0, 27.0, 34.0, 41.0, 48.0, 38.0, 31.0, 48.0, 34.0, 23.0, 30.0, 33.0, 30.0, 18.0, 26.0, 13.0, 12.0, 10.0, 13.0, 17.0, 13.0, 5.0, 8.0, 4.0, 8.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1640625, -11.7535400390625, -11.343017578125, -10.9324951171875, -10.52197265625, -10.1114501953125, -9.700927734375, -9.2904052734375, -8.8798828125, -8.4693603515625, -8.058837890625, -7.6483154296875, -7.23779296875, -6.8272705078125, -6.416748046875, -6.0062255859375, -5.595703125, -5.1851806640625, -4.774658203125, -4.3641357421875, -3.95361328125, -3.5430908203125, -3.132568359375, -2.7220458984375, -2.3115234375, -1.9010009765625, -1.490478515625, -1.0799560546875, -0.66943359375, -0.2589111328125, 0.151611328125, 0.5621337890625, 0.97265625, 1.3831787109375, 1.793701171875, 2.2042236328125, 2.61474609375, 3.0252685546875, 3.435791015625, 3.8463134765625, 4.2568359375, 4.6673583984375, 5.077880859375, 5.4884033203125, 5.89892578125, 6.3094482421875, 6.719970703125, 7.1304931640625, 7.541015625, 7.9515380859375, 8.362060546875, 8.7725830078125, 9.18310546875, 9.5936279296875, 10.004150390625, 10.4146728515625, 10.8251953125, 11.2357177734375, 11.646240234375, 12.0567626953125, 12.46728515625, 12.8778076171875, 13.288330078125, 13.6988525390625, 14.109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 21.0, 25.0, 31.0, 63.0, 99.0, 136.0, 157.0, 232.0, 371.0, 547.0, 759.0, 966.0, 1450.0, 2106.0, 2967.0, 4339.0, 6331.0, 9039.0, 13401.0, 19656.0, 28735.0, 42218.0, 61996.0, 89062.0, 120918.0, 143847.0, 138776.0, 109982.0, 79089.0, 54082.0, 37005.0, 25216.0, 16988.0, 11667.0, 8042.0, 5538.0, 3788.0, 2703.0, 1825.0, 1283.0, 919.0, 670.0, 469.0, 347.0, 229.0, 157.0, 104.0, 73.0, 51.0, 23.0, 25.0, 11.0, 7.0, 10.0, 5.0, 1.0, 0.0, 1.0], "bins": [-17.265625, -16.72314453125, -16.1806640625, -15.63818359375, -15.095703125, -14.55322265625, -14.0107421875, -13.46826171875, -12.92578125, -12.38330078125, -11.8408203125, -11.29833984375, -10.755859375, -10.21337890625, -9.6708984375, -9.12841796875, -8.5859375, -8.04345703125, -7.5009765625, -6.95849609375, -6.416015625, -5.87353515625, -5.3310546875, -4.78857421875, -4.24609375, -3.70361328125, -3.1611328125, -2.61865234375, -2.076171875, -1.53369140625, -0.9912109375, -0.44873046875, 0.09375, 0.63623046875, 1.1787109375, 1.72119140625, 2.263671875, 2.80615234375, 3.3486328125, 3.89111328125, 4.43359375, 4.97607421875, 5.5185546875, 6.06103515625, 6.603515625, 7.14599609375, 7.6884765625, 8.23095703125, 8.7734375, 9.31591796875, 9.8583984375, 10.40087890625, 10.943359375, 11.48583984375, 12.0283203125, 12.57080078125, 13.11328125, 13.65576171875, 14.1982421875, 14.74072265625, 15.283203125, 15.82568359375, 16.3681640625, 16.91064453125, 17.453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 4.0, 3.0, 4.0, 19.0, 7.0, 7.0, 6.0, 12.0, 16.0, 15.0, 17.0, 23.0, 28.0, 25.0, 28.0, 37.0, 25.0, 24.0, 23.0, 46.0, 36.0, 42.0, 41.0, 39.0, 38.0, 32.0, 30.0, 36.0, 31.0, 27.0, 36.0, 26.0, 37.0, 24.0, 24.0, 23.0, 22.0, 12.0, 13.0, 7.0, 10.0, 10.0, 4.0, 3.0, 10.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-7.76171875, -7.51409912109375, -7.2664794921875, -7.01885986328125, -6.771240234375, -6.52362060546875, -6.2760009765625, -6.02838134765625, -5.78076171875, -5.53314208984375, -5.2855224609375, -5.03790283203125, -4.790283203125, -4.54266357421875, -4.2950439453125, -4.04742431640625, -3.7998046875, -3.55218505859375, -3.3045654296875, -3.05694580078125, -2.809326171875, -2.56170654296875, -2.3140869140625, -2.06646728515625, -1.81884765625, -1.57122802734375, -1.3236083984375, -1.07598876953125, -0.828369140625, -0.58074951171875, -0.3331298828125, -0.08551025390625, 0.162109375, 0.40972900390625, 0.6573486328125, 0.90496826171875, 1.152587890625, 1.40020751953125, 1.6478271484375, 1.89544677734375, 2.14306640625, 2.39068603515625, 2.6383056640625, 2.88592529296875, 3.133544921875, 3.38116455078125, 3.6287841796875, 3.87640380859375, 4.1240234375, 4.37164306640625, 4.6192626953125, 4.86688232421875, 5.114501953125, 5.36212158203125, 5.6097412109375, 5.85736083984375, 6.10498046875, 6.35260009765625, 6.6002197265625, 6.84783935546875, 7.095458984375, 7.34307861328125, 7.5906982421875, 7.83831787109375, 8.0859375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 11.0, 13.0, 17.0, 27.0, 28.0, 48.0, 72.0, 110.0, 147.0, 178.0, 245.0, 365.0, 508.0, 683.0, 960.0, 1483.0, 2099.0, 3135.0, 4679.0, 7505.0, 12552.0, 22544.0, 47219.0, 115317.0, 281258.0, 302382.0, 130802.0, 52708.0, 24615.0, 13353.0, 7923.0, 4939.0, 3175.0, 2306.0, 1539.0, 1054.0, 718.0, 561.0, 376.0, 239.0, 190.0, 136.0, 92.0, 77.0, 50.0, 34.0, 26.0, 18.0, 12.0, 15.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.013671875, -2.916656494140625, -2.81964111328125, -2.722625732421875, -2.6256103515625, -2.528594970703125, -2.43157958984375, -2.334564208984375, -2.237548828125, -2.140533447265625, -2.04351806640625, -1.946502685546875, -1.8494873046875, -1.752471923828125, -1.65545654296875, -1.558441162109375, -1.46142578125, -1.364410400390625, -1.26739501953125, -1.170379638671875, -1.0733642578125, -0.976348876953125, -0.87933349609375, -0.782318115234375, -0.685302734375, -0.588287353515625, -0.49127197265625, -0.394256591796875, -0.2972412109375, -0.200225830078125, -0.10321044921875, -0.006195068359375, 0.0908203125, 0.187835693359375, 0.28485107421875, 0.381866455078125, 0.4788818359375, 0.575897216796875, 0.67291259765625, 0.769927978515625, 0.866943359375, 0.963958740234375, 1.06097412109375, 1.157989501953125, 1.2550048828125, 1.352020263671875, 1.44903564453125, 1.546051025390625, 1.64306640625, 1.740081787109375, 1.83709716796875, 1.934112548828125, 2.0311279296875, 2.128143310546875, 2.22515869140625, 2.322174072265625, 2.419189453125, 2.516204833984375, 2.61322021484375, 2.710235595703125, 2.8072509765625, 2.904266357421875, 3.00128173828125, 3.098297119140625, 3.1953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 8.0, 14.0, 24.0, 24.0, 27.0, 49.0, 66.0, 72.0, 91.0, 115.0, 97.0, 80.0, 72.0, 59.0, 66.0, 24.0, 29.0, 23.0, 6.0, 10.0, 7.0, 4.0, 5.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002524852752685547, -0.00024150311946868896, -0.00023052096366882324, -0.00021953880786895752, -0.0002085566520690918, -0.00019757449626922607, -0.00018659234046936035, -0.00017561018466949463, -0.0001646280288696289, -0.00015364587306976318, -0.00014266371726989746, -0.00013168156147003174, -0.00012069940567016602, -0.00010971724987030029, -9.873509407043457e-05, -8.775293827056885e-05, -7.677078247070312e-05, -6.57886266708374e-05, -5.480647087097168e-05, -4.382431507110596e-05, -3.2842159271240234e-05, -2.1860003471374512e-05, -1.0877847671508789e-05, 1.043081283569336e-07, 1.1086463928222656e-05, 2.206861972808838e-05, 3.30507755279541e-05, 4.4032931327819824e-05, 5.501508712768555e-05, 6.599724292755127e-05, 7.697939872741699e-05, 8.796155452728271e-05, 9.894371032714844e-05, 0.00010992586612701416, 0.00012090802192687988, 0.0001318901777267456, 0.00014287233352661133, 0.00015385448932647705, 0.00016483664512634277, 0.0001758188009262085, 0.00018680095672607422, 0.00019778311252593994, 0.00020876526832580566, 0.0002197474241256714, 0.0002307295799255371, 0.00024171173572540283, 0.00025269389152526855, 0.0002636760473251343, 0.000274658203125, 0.0002856403589248657, 0.00029662251472473145, 0.00030760467052459717, 0.0003185868263244629, 0.0003295689821243286, 0.00034055113792419434, 0.00035153329372406006, 0.0003625154495239258, 0.0003734976053237915, 0.0003844797611236572, 0.00039546191692352295, 0.00040644407272338867, 0.0004174262285232544, 0.0004284083843231201, 0.00043939054012298584, 0.00045037269592285156]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 4.0, 11.0, 17.0, 29.0, 25.0, 44.0, 49.0, 79.0, 101.0, 142.0, 205.0, 322.0, 426.0, 656.0, 1011.0, 1607.0, 2364.0, 3911.0, 6134.0, 10717.0, 19815.0, 43933.0, 128161.0, 363131.0, 295568.0, 94430.0, 34753.0, 16484.0, 9343.0, 5408.0, 3375.0, 2144.0, 1326.0, 875.0, 571.0, 414.0, 329.0, 194.0, 112.0, 93.0, 57.0, 45.0, 55.0, 29.0, 18.0, 17.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.669921875, -3.551025390625, -3.43212890625, -3.313232421875, -3.1943359375, -3.075439453125, -2.95654296875, -2.837646484375, -2.71875, -2.599853515625, -2.48095703125, -2.362060546875, -2.2431640625, -2.124267578125, -2.00537109375, -1.886474609375, -1.767578125, -1.648681640625, -1.52978515625, -1.410888671875, -1.2919921875, -1.173095703125, -1.05419921875, -0.935302734375, -0.81640625, -0.697509765625, -0.57861328125, -0.459716796875, -0.3408203125, -0.221923828125, -0.10302734375, 0.015869140625, 0.134765625, 0.253662109375, 0.37255859375, 0.491455078125, 0.6103515625, 0.729248046875, 0.84814453125, 0.967041015625, 1.0859375, 1.204833984375, 1.32373046875, 1.442626953125, 1.5615234375, 1.680419921875, 1.79931640625, 1.918212890625, 2.037109375, 2.156005859375, 2.27490234375, 2.393798828125, 2.5126953125, 2.631591796875, 2.75048828125, 2.869384765625, 2.98828125, 3.107177734375, 3.22607421875, 3.344970703125, 3.4638671875, 3.582763671875, 3.70166015625, 3.820556640625, 3.939453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 7.0, 12.0, 14.0, 17.0, 13.0, 29.0, 24.0, 38.0, 61.0, 100.0, 109.0, 121.0, 125.0, 93.0, 77.0, 46.0, 31.0, 18.0, 15.0, 9.0, 8.0, 5.0, 5.0, 1.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3701171875, -1.325225830078125, -1.28033447265625, -1.235443115234375, -1.1905517578125, -1.145660400390625, -1.10076904296875, -1.055877685546875, -1.010986328125, -0.966094970703125, -0.92120361328125, -0.876312255859375, -0.8314208984375, -0.786529541015625, -0.74163818359375, -0.696746826171875, -0.65185546875, -0.606964111328125, -0.56207275390625, -0.517181396484375, -0.4722900390625, -0.427398681640625, -0.38250732421875, -0.337615966796875, -0.292724609375, -0.247833251953125, -0.20294189453125, -0.158050537109375, -0.1131591796875, -0.068267822265625, -0.02337646484375, 0.021514892578125, 0.06640625, 0.111297607421875, 0.15618896484375, 0.201080322265625, 0.2459716796875, 0.290863037109375, 0.33575439453125, 0.380645751953125, 0.425537109375, 0.470428466796875, 0.51531982421875, 0.560211181640625, 0.6051025390625, 0.649993896484375, 0.69488525390625, 0.739776611328125, 0.78466796875, 0.829559326171875, 0.87445068359375, 0.919342041015625, 0.9642333984375, 1.009124755859375, 1.05401611328125, 1.098907470703125, 1.143798828125, 1.188690185546875, 1.23358154296875, 1.278472900390625, 1.3233642578125, 1.368255615234375, 1.41314697265625, 1.458038330078125, 1.5029296875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 5.0, 7.0, 4.0, 8.0, 18.0, 15.0, 23.0, 24.0, 25.0, 31.0, 44.0, 44.0, 71.0, 89.0, 93.0, 62.0, 52.0, 68.0, 57.0, 41.0, 32.0, 41.0, 33.0, 21.0, 18.0, 23.0, 12.0, 8.0, 11.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-19.892127990722656, -19.311201095581055, -18.730274200439453, -18.149349212646484, -17.568422317504883, -16.98749542236328, -16.406570434570312, -15.825643539428711, -15.24471664428711, -14.663789749145508, -14.082863807678223, -13.501937866210938, -12.921010971069336, -12.340084075927734, -11.75915813446045, -11.178232192993164, -10.597305297851562, -10.016378402709961, -9.435452461242676, -8.85452651977539, -8.273599624633789, -7.692673206329346, -7.111746788024902, -6.530820369720459, -5.949893951416016, -5.368967533111572, -4.788041114807129, -4.2071146965026855, -3.626188278198242, -3.045261859893799, -2.4643354415893555, -1.883409023284912, -1.302480697631836, -0.7215542793273926, -0.14062786102294922, 0.44029855728149414, 1.0212249755859375, 1.6021513938903809, 2.183077812194824, 2.7640042304992676, 3.344930648803711, 3.9258570671081543, 4.506783485412598, 5.087709903717041, 5.668636322021484, 6.249562740325928, 6.830489158630371, 7.4114155769348145, 7.992341995239258, 8.57326889038086, 9.154194831848145, 9.73512077331543, 10.316047668457031, 10.896974563598633, 11.477900505065918, 12.058826446533203, 12.639753341674805, 13.220680236816406, 13.801606178283691, 14.382532119750977, 14.963459014892578, 15.54438591003418, 16.12531280517578, 16.70623779296875, 17.28716468811035]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 5.0, 4.0, 1.0, 6.0, 5.0, 12.0, 8.0, 6.0, 9.0, 18.0, 17.0, 15.0, 17.0, 17.0, 23.0, 31.0, 38.0, 33.0, 39.0, 38.0, 41.0, 43.0, 30.0, 44.0, 41.0, 31.0, 41.0, 39.0, 36.0, 31.0, 31.0, 30.0, 32.0, 23.0, 16.0, 23.0, 25.0, 18.0, 23.0, 8.0, 8.0, 11.0, 6.0, 11.0, 10.0, 3.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.08172607421875, -11.65276050567627, -11.223794937133789, -10.794828414916992, -10.365862846374512, -9.936897277832031, -9.50793170928955, -9.07896614074707, -8.649999618530273, -8.221034049987793, -7.792068004608154, -7.363102436065674, -6.934136390686035, -6.505170822143555, -6.076205253601074, -5.647239685058594, -5.218274116516113, -4.789308547973633, -4.360342502593994, -3.9313769340515137, -3.502411127090454, -3.0734453201293945, -2.644479751586914, -2.2155139446258545, -1.786548137664795, -1.3575823307037354, -0.9286166429519653, -0.4996509552001953, -0.07068514823913574, 0.35828065872192383, 0.7872462272644043, 1.2162120342254639, 1.6451787948608398, 2.0741446018218994, 2.503110408782959, 2.9320759773254395, 3.361041784286499, 3.7900075912475586, 4.218973159790039, 4.6479387283325195, 5.076904773712158, 5.505870342254639, 5.934836387634277, 6.363801956176758, 6.792767524719238, 7.221733570098877, 7.650699138641357, 8.079665184020996, 8.508630752563477, 8.937596321105957, 9.366561889648438, 9.795528411865234, 10.224493980407715, 10.653459548950195, 11.082425117492676, 11.511390686035156, 11.940357208251953, 12.369322776794434, 12.798288345336914, 13.227254867553711, 13.656220436096191, 14.085186004638672, 14.514151573181152, 14.943117141723633, 15.372082710266113]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 9.0, 11.0, 26.0, 47.0, 65.0, 112.0, 155.0, 244.0, 375.0, 543.0, 885.0, 1365.0, 2147.0, 3099.0, 5048.0, 7554.0, 12066.0, 19052.0, 31235.0, 51834.0, 92064.0, 176051.0, 408160.0, 934372.0, 1184870.0, 681782.0, 272068.0, 127933.0, 70562.0, 41336.0, 24928.0, 15516.0, 9916.0, 6379.0, 4235.0, 2792.0, 1807.0, 1203.0, 794.0, 520.0, 366.0, 252.0, 154.0, 97.0, 81.0, 59.0, 36.0, 25.0, 26.0, 20.0, 5.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-16.8125, -16.25732421875, -15.7021484375, -15.14697265625, -14.591796875, -14.03662109375, -13.4814453125, -12.92626953125, -12.37109375, -11.81591796875, -11.2607421875, -10.70556640625, -10.150390625, -9.59521484375, -9.0400390625, -8.48486328125, -7.9296875, -7.37451171875, -6.8193359375, -6.26416015625, -5.708984375, -5.15380859375, -4.5986328125, -4.04345703125, -3.48828125, -2.93310546875, -2.3779296875, -1.82275390625, -1.267578125, -0.71240234375, -0.1572265625, 0.39794921875, 0.953125, 1.50830078125, 2.0634765625, 2.61865234375, 3.173828125, 3.72900390625, 4.2841796875, 4.83935546875, 5.39453125, 5.94970703125, 6.5048828125, 7.06005859375, 7.615234375, 8.17041015625, 8.7255859375, 9.28076171875, 9.8359375, 10.39111328125, 10.9462890625, 11.50146484375, 12.056640625, 12.61181640625, 13.1669921875, 13.72216796875, 14.27734375, 14.83251953125, 15.3876953125, 15.94287109375, 16.498046875, 17.05322265625, 17.6083984375, 18.16357421875, 18.71875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 6.0, 1.0, 6.0, 5.0, 10.0, 8.0, 7.0, 11.0, 10.0, 10.0, 19.0, 15.0, 18.0, 23.0, 21.0, 28.0, 40.0, 29.0, 43.0, 47.0, 55.0, 37.0, 35.0, 50.0, 45.0, 25.0, 38.0, 25.0, 35.0, 31.0, 26.0, 31.0, 32.0, 38.0, 21.0, 23.0, 21.0, 14.0, 14.0, 8.0, 17.0, 7.0, 3.0, 6.0, 2.0, 9.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.515625, -9.1741943359375, -8.832763671875, -8.4913330078125, -8.14990234375, -7.8084716796875, -7.467041015625, -7.1256103515625, -6.7841796875, -6.4427490234375, -6.101318359375, -5.7598876953125, -5.41845703125, -5.0770263671875, -4.735595703125, -4.3941650390625, -4.052734375, -3.7113037109375, -3.369873046875, -3.0284423828125, -2.68701171875, -2.3455810546875, -2.004150390625, -1.6627197265625, -1.3212890625, -0.9798583984375, -0.638427734375, -0.2969970703125, 0.04443359375, 0.3858642578125, 0.727294921875, 1.0687255859375, 1.41015625, 1.7515869140625, 2.093017578125, 2.4344482421875, 2.77587890625, 3.1173095703125, 3.458740234375, 3.8001708984375, 4.1416015625, 4.4830322265625, 4.824462890625, 5.1658935546875, 5.50732421875, 5.8487548828125, 6.190185546875, 6.5316162109375, 6.873046875, 7.2144775390625, 7.555908203125, 7.8973388671875, 8.23876953125, 8.5802001953125, 8.921630859375, 9.2630615234375, 9.6044921875, 9.9459228515625, 10.287353515625, 10.6287841796875, 10.97021484375, 11.3116455078125, 11.653076171875, 11.9945068359375, 12.3359375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 8.0, 8.0, 9.0, 20.0, 16.0, 21.0, 32.0, 66.0, 63.0, 97.0, 167.0, 247.0, 332.0, 558.0, 797.0, 1293.0, 1951.0, 3218.0, 5248.0, 8515.0, 14285.0, 24607.0, 43602.0, 78072.0, 143676.0, 271258.0, 516526.0, 924899.0, 963952.0, 551948.0, 290252.0, 154128.0, 83090.0, 46305.0, 26304.0, 15037.0, 9012.0, 5405.0, 3343.0, 2056.0, 1296.0, 851.0, 587.0, 370.0, 233.0, 161.0, 124.0, 68.0, 59.0, 48.0, 21.0, 20.0, 12.0, 7.0, 4.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0], "bins": [-16.125, -15.605712890625, -15.08642578125, -14.567138671875, -14.0478515625, -13.528564453125, -13.00927734375, -12.489990234375, -11.970703125, -11.451416015625, -10.93212890625, -10.412841796875, -9.8935546875, -9.374267578125, -8.85498046875, -8.335693359375, -7.81640625, -7.297119140625, -6.77783203125, -6.258544921875, -5.7392578125, -5.219970703125, -4.70068359375, -4.181396484375, -3.662109375, -3.142822265625, -2.62353515625, -2.104248046875, -1.5849609375, -1.065673828125, -0.54638671875, -0.027099609375, 0.4921875, 1.011474609375, 1.53076171875, 2.050048828125, 2.5693359375, 3.088623046875, 3.60791015625, 4.127197265625, 4.646484375, 5.165771484375, 5.68505859375, 6.204345703125, 6.7236328125, 7.242919921875, 7.76220703125, 8.281494140625, 8.80078125, 9.320068359375, 9.83935546875, 10.358642578125, 10.8779296875, 11.397216796875, 11.91650390625, 12.435791015625, 12.955078125, 13.474365234375, 13.99365234375, 14.512939453125, 15.0322265625, 15.551513671875, 16.07080078125, 16.590087890625, 17.109375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 1.0, 8.0, 9.0, 11.0, 15.0, 30.0, 25.0, 23.0, 36.0, 39.0, 57.0, 60.0, 86.0, 93.0, 118.0, 162.0, 160.0, 209.0, 248.0, 283.0, 349.0, 337.0, 276.0, 271.0, 220.0, 181.0, 129.0, 136.0, 113.0, 90.0, 59.0, 67.0, 43.0, 25.0, 24.0, 19.0, 17.0, 9.0, 9.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-6.109375, -5.905517578125, -5.70166015625, -5.497802734375, -5.2939453125, -5.090087890625, -4.88623046875, -4.682373046875, -4.478515625, -4.274658203125, -4.07080078125, -3.866943359375, -3.6630859375, -3.459228515625, -3.25537109375, -3.051513671875, -2.84765625, -2.643798828125, -2.43994140625, -2.236083984375, -2.0322265625, -1.828369140625, -1.62451171875, -1.420654296875, -1.216796875, -1.012939453125, -0.80908203125, -0.605224609375, -0.4013671875, -0.197509765625, 0.00634765625, 0.210205078125, 0.4140625, 0.617919921875, 0.82177734375, 1.025634765625, 1.2294921875, 1.433349609375, 1.63720703125, 1.841064453125, 2.044921875, 2.248779296875, 2.45263671875, 2.656494140625, 2.8603515625, 3.064208984375, 3.26806640625, 3.471923828125, 3.67578125, 3.879638671875, 4.08349609375, 4.287353515625, 4.4912109375, 4.695068359375, 4.89892578125, 5.102783203125, 5.306640625, 5.510498046875, 5.71435546875, 5.918212890625, 6.1220703125, 6.325927734375, 6.52978515625, 6.733642578125, 6.9375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 5.0, 13.0, 7.0, 16.0, 12.0, 22.0, 24.0, 38.0, 47.0, 49.0, 70.0, 79.0, 67.0, 94.0, 49.0, 77.0, 68.0, 58.0, 58.0, 34.0, 30.0, 16.0, 19.0, 12.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.69126319885254, -16.157350540161133, -15.62343692779541, -15.089523315429688, -14.555610656738281, -14.021697998046875, -13.487784385681152, -12.95387077331543, -12.419958114624023, -11.886045455932617, -11.352131843566895, -10.818218231201172, -10.284305572509766, -9.75039291381836, -9.216479301452637, -8.682565689086914, -8.148653030395508, -7.614739894866943, -7.080826759338379, -6.5469136238098145, -6.01300048828125, -5.4790873527526855, -4.945174217224121, -4.411261081695557, -3.877347946166992, -3.3434348106384277, -2.8095216751098633, -2.275608539581299, -1.7416954040527344, -1.20778226852417, -0.6738691329956055, -0.13995599746704102, 0.39395904541015625, 0.9278721809387207, 1.4617853164672852, 1.9956984519958496, 2.529611587524414, 3.0635247230529785, 3.597437858581543, 4.131350994110107, 4.665264129638672, 5.199177265167236, 5.733090400695801, 6.267003536224365, 6.80091667175293, 7.334829807281494, 7.868742942810059, 8.402656555175781, 8.936569213867188, 9.470481872558594, 10.004395484924316, 10.538309097290039, 11.072221755981445, 11.606134414672852, 12.140048027038574, 12.673961639404297, 13.207874298095703, 13.74178695678711, 14.275700569152832, 14.809614181518555, 15.343526840209961, 15.877439498901367, 16.411354064941406, 16.945266723632812, 17.47917938232422]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 12.0, 6.0, 9.0, 10.0, 9.0, 14.0, 24.0, 24.0, 17.0, 20.0, 37.0, 31.0, 38.0, 31.0, 34.0, 40.0, 37.0, 43.0, 28.0, 48.0, 42.0, 39.0, 37.0, 39.0, 42.0, 27.0, 33.0, 35.0, 18.0, 24.0, 20.0, 18.0, 12.0, 21.0, 13.0, 17.0, 7.0, 7.0, 6.0, 4.0, 5.0, 5.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.320253372192383, -10.951154708862305, -10.582056999206543, -10.212958335876465, -9.843860626220703, -9.474761962890625, -9.105663299560547, -8.736565589904785, -8.367466926574707, -7.998368740081787, -7.629270553588867, -7.260171890258789, -6.891073703765869, -6.521975517272949, -6.152877330780029, -5.783779144287109, -5.4146809577941895, -5.0455827713012695, -4.67648458480835, -4.30738639831543, -3.9382877349853516, -3.5691895484924316, -3.2000913619995117, -2.8309929370880127, -2.4618947505950928, -2.092796564102173, -1.7236981391906738, -1.354599952697754, -0.9855016469955444, -0.616403341293335, -0.24730515480041504, 0.12179327011108398, 0.4908914566040039, 0.8599897623062134, 1.2290880680084229, 1.5981862545013428, 1.9672845602035522, 2.3363828659057617, 2.7054810523986816, 3.0745794773101807, 3.4436776638031006, 3.8127758502960205, 4.1818742752075195, 4.5509724617004395, 4.920070648193359, 5.2891693115234375, 5.658267021179199, 6.027365684509277, 6.396463871002197, 6.765562057495117, 7.134660243988037, 7.503758430480957, 7.872857093811035, 8.241954803466797, 8.611053466796875, 8.980152130126953, 9.349249839782715, 9.718348503112793, 10.087446212768555, 10.456544876098633, 10.825642585754395, 11.194741249084473, 11.563838958740234, 11.932937622070312, 12.30203628540039]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 5.0, 15.0, 12.0, 28.0, 47.0, 61.0, 88.0, 115.0, 185.0, 278.0, 385.0, 573.0, 742.0, 1143.0, 1644.0, 2278.0, 3346.0, 4837.0, 7019.0, 10530.0, 15793.0, 24356.0, 38616.0, 63514.0, 114483.0, 308700.0, 204289.0, 93788.0, 54148.0, 33494.0, 21062.0, 13678.0, 9126.0, 6192.0, 4183.0, 2954.0, 2099.0, 1426.0, 1015.0, 710.0, 501.0, 340.0, 233.0, 186.0, 108.0, 80.0, 52.0, 37.0, 21.0, 15.0, 12.0, 11.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.84375, -5.66021728515625, -5.4766845703125, -5.29315185546875, -5.109619140625, -4.92608642578125, -4.7425537109375, -4.55902099609375, -4.37548828125, -4.19195556640625, -4.0084228515625, -3.82489013671875, -3.641357421875, -3.45782470703125, -3.2742919921875, -3.09075927734375, -2.9072265625, -2.72369384765625, -2.5401611328125, -2.35662841796875, -2.173095703125, -1.98956298828125, -1.8060302734375, -1.62249755859375, -1.43896484375, -1.25543212890625, -1.0718994140625, -0.88836669921875, -0.704833984375, -0.52130126953125, -0.3377685546875, -0.15423583984375, 0.029296875, 0.21282958984375, 0.3963623046875, 0.57989501953125, 0.763427734375, 0.94696044921875, 1.1304931640625, 1.31402587890625, 1.49755859375, 1.68109130859375, 1.8646240234375, 2.04815673828125, 2.231689453125, 2.41522216796875, 2.5987548828125, 2.78228759765625, 2.9658203125, 3.14935302734375, 3.3328857421875, 3.51641845703125, 3.699951171875, 3.88348388671875, 4.0670166015625, 4.25054931640625, 4.43408203125, 4.61761474609375, 4.8011474609375, 4.98468017578125, 5.168212890625, 5.35174560546875, 5.5352783203125, 5.71881103515625, 5.90234375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 2.0, 3.0, 6.0, 4.0, 5.0, 11.0, 12.0, 15.0, 12.0, 16.0, 25.0, 25.0, 22.0, 32.0, 33.0, 37.0, 35.0, 40.0, 34.0, 36.0, 46.0, 49.0, 37.0, 52.0, 41.0, 43.0, 33.0, 43.0, 21.0, 33.0, 24.0, 27.0, 16.0, 17.0, 16.0, 18.0, 11.0, 11.0, 12.0, 15.0, 9.0, 7.0, 4.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.7109375, -11.323486328125, -10.93603515625, -10.548583984375, -10.1611328125, -9.773681640625, -9.38623046875, -8.998779296875, -8.611328125, -8.223876953125, -7.83642578125, -7.448974609375, -7.0615234375, -6.674072265625, -6.28662109375, -5.899169921875, -5.51171875, -5.124267578125, -4.73681640625, -4.349365234375, -3.9619140625, -3.574462890625, -3.18701171875, -2.799560546875, -2.412109375, -2.024658203125, -1.63720703125, -1.249755859375, -0.8623046875, -0.474853515625, -0.08740234375, 0.300048828125, 0.6875, 1.074951171875, 1.46240234375, 1.849853515625, 2.2373046875, 2.624755859375, 3.01220703125, 3.399658203125, 3.787109375, 4.174560546875, 4.56201171875, 4.949462890625, 5.3369140625, 5.724365234375, 6.11181640625, 6.499267578125, 6.88671875, 7.274169921875, 7.66162109375, 8.049072265625, 8.4365234375, 8.823974609375, 9.21142578125, 9.598876953125, 9.986328125, 10.373779296875, 10.76123046875, 11.148681640625, 11.5361328125, 11.923583984375, 12.31103515625, 12.698486328125, 13.0859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 14.0, 22.0, 26.0, 54.0, 66.0, 112.0, 131.0, 218.0, 329.0, 446.0, 713.0, 1018.0, 1449.0, 2142.0, 3211.0, 5024.0, 7447.0, 11521.0, 17625.0, 27856.0, 45157.0, 76605.0, 146026.0, 352491.0, 146931.0, 76994.0, 45189.0, 27924.0, 17699.0, 11601.0, 7512.0, 4925.0, 3241.0, 2223.0, 1509.0, 976.0, 672.0, 483.0, 325.0, 214.0, 139.0, 81.0, 66.0, 49.0, 22.0, 23.0, 15.0, 15.0, 7.0, 7.0, 7.0, 0.0, 2.0], "bins": [-6.19140625, -6.011962890625, -5.83251953125, -5.653076171875, -5.4736328125, -5.294189453125, -5.11474609375, -4.935302734375, -4.755859375, -4.576416015625, -4.39697265625, -4.217529296875, -4.0380859375, -3.858642578125, -3.67919921875, -3.499755859375, -3.3203125, -3.140869140625, -2.96142578125, -2.781982421875, -2.6025390625, -2.423095703125, -2.24365234375, -2.064208984375, -1.884765625, -1.705322265625, -1.52587890625, -1.346435546875, -1.1669921875, -0.987548828125, -0.80810546875, -0.628662109375, -0.44921875, -0.269775390625, -0.09033203125, 0.089111328125, 0.2685546875, 0.447998046875, 0.62744140625, 0.806884765625, 0.986328125, 1.165771484375, 1.34521484375, 1.524658203125, 1.7041015625, 1.883544921875, 2.06298828125, 2.242431640625, 2.421875, 2.601318359375, 2.78076171875, 2.960205078125, 3.1396484375, 3.319091796875, 3.49853515625, 3.677978515625, 3.857421875, 4.036865234375, 4.21630859375, 4.395751953125, 4.5751953125, 4.754638671875, 4.93408203125, 5.113525390625, 5.29296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 7.0, 7.0, 13.0, 9.0, 13.0, 7.0, 16.0, 16.0, 17.0, 20.0, 32.0, 24.0, 37.0, 28.0, 34.0, 37.0, 36.0, 37.0, 39.0, 50.0, 31.0, 38.0, 44.0, 31.0, 48.0, 40.0, 40.0, 34.0, 28.0, 25.0, 23.0, 25.0, 16.0, 13.0, 13.0, 16.0, 10.0, 6.0, 12.0, 5.0, 5.0, 1.0, 8.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-7.9765625, -7.7445068359375, -7.512451171875, -7.2803955078125, -7.04833984375, -6.8162841796875, -6.584228515625, -6.3521728515625, -6.1201171875, -5.8880615234375, -5.656005859375, -5.4239501953125, -5.19189453125, -4.9598388671875, -4.727783203125, -4.4957275390625, -4.263671875, -4.0316162109375, -3.799560546875, -3.5675048828125, -3.33544921875, -3.1033935546875, -2.871337890625, -2.6392822265625, -2.4072265625, -2.1751708984375, -1.943115234375, -1.7110595703125, -1.47900390625, -1.2469482421875, -1.014892578125, -0.7828369140625, -0.55078125, -0.3187255859375, -0.086669921875, 0.1453857421875, 0.37744140625, 0.6094970703125, 0.841552734375, 1.0736083984375, 1.3056640625, 1.5377197265625, 1.769775390625, 2.0018310546875, 2.23388671875, 2.4659423828125, 2.697998046875, 2.9300537109375, 3.162109375, 3.3941650390625, 3.626220703125, 3.8582763671875, 4.09033203125, 4.3223876953125, 4.554443359375, 4.7864990234375, 5.0185546875, 5.2506103515625, 5.482666015625, 5.7147216796875, 5.94677734375, 6.1788330078125, 6.410888671875, 6.6429443359375, 6.875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 12.0, 7.0, 11.0, 17.0, 31.0, 37.0, 41.0, 77.0, 112.0, 188.0, 240.0, 388.0, 610.0, 956.0, 1537.0, 2573.0, 4489.0, 8270.0, 16559.0, 35541.0, 89433.0, 271458.0, 378476.0, 139481.0, 50784.0, 22273.0, 10935.0, 5660.0, 3219.0, 1892.0, 1162.0, 670.0, 455.0, 324.0, 190.0, 128.0, 89.0, 57.0, 40.0, 31.0, 29.0, 19.0, 16.0, 13.0, 11.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.024627685546875, -0.023928165435791016, -0.02322864532470703, -0.022529125213623047, -0.021829605102539062, -0.021130084991455078, -0.020430564880371094, -0.01973104476928711, -0.019031524658203125, -0.01833200454711914, -0.017632484436035156, -0.016932964324951172, -0.016233444213867188, -0.015533924102783203, -0.014834403991699219, -0.014134883880615234, -0.01343536376953125, -0.012735843658447266, -0.012036323547363281, -0.011336803436279297, -0.010637283325195312, -0.009937763214111328, -0.009238243103027344, -0.00853872299194336, -0.007839202880859375, -0.007139682769775391, -0.006440162658691406, -0.005740642547607422, -0.0050411224365234375, -0.004341602325439453, -0.0036420822143554688, -0.0029425621032714844, -0.0022430419921875, -0.0015435218811035156, -0.0008440017700195312, -0.00014448165893554688, 0.0005550384521484375, 0.0012545585632324219, 0.0019540786743164062, 0.0026535987854003906, 0.003353118896484375, 0.004052639007568359, 0.004752159118652344, 0.005451679229736328, 0.0061511993408203125, 0.006850719451904297, 0.007550239562988281, 0.008249759674072266, 0.00894927978515625, 0.009648799896240234, 0.010348320007324219, 0.011047840118408203, 0.011747360229492188, 0.012446880340576172, 0.013146400451660156, 0.01384592056274414, 0.014545440673828125, 0.01524496078491211, 0.015944480895996094, 0.016644001007080078, 0.017343521118164062, 0.018043041229248047, 0.01874256134033203, 0.019442081451416016, 0.0201416015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 9.0, 8.0, 6.0, 7.0, 12.0, 15.0, 21.0, 25.0, 31.0, 28.0, 35.0, 48.0, 67.0, 64.0, 56.0, 51.0, 56.0, 59.0, 47.0, 56.0, 35.0, 37.0, 34.0, 35.0, 30.0, 24.0, 27.0, 10.0, 5.0, 10.0, 5.0, 7.0, 9.0, 3.0, 2.0, 5.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.1563301086425781e-05, -1.1225230991840363e-05, -1.0887160897254944e-05, -1.0549090802669525e-05, -1.0211020708084106e-05, -9.872950613498688e-06, -9.534880518913269e-06, -9.19681042432785e-06, -8.858740329742432e-06, -8.520670235157013e-06, -8.182600140571594e-06, -7.844530045986176e-06, -7.506459951400757e-06, -7.168389856815338e-06, -6.8303197622299194e-06, -6.492249667644501e-06, -6.154179573059082e-06, -5.816109478473663e-06, -5.478039383888245e-06, -5.139969289302826e-06, -4.801899194717407e-06, -4.4638291001319885e-06, -4.12575900554657e-06, -3.787688910961151e-06, -3.4496188163757324e-06, -3.1115487217903137e-06, -2.773478627204895e-06, -2.4354085326194763e-06, -2.0973384380340576e-06, -1.759268343448639e-06, -1.4211982488632202e-06, -1.0831281542778015e-06, -7.450580596923828e-07, -4.069879651069641e-07, -6.891787052154541e-08, 2.691522240638733e-07, 6.07222318649292e-07, 9.452924132347107e-07, 1.2833625078201294e-06, 1.621432602405548e-06, 1.959502696990967e-06, 2.2975727915763855e-06, 2.635642886161804e-06, 2.973712980747223e-06, 3.3117830753326416e-06, 3.6498531699180603e-06, 3.987923264503479e-06, 4.325993359088898e-06, 4.664063453674316e-06, 5.002133548259735e-06, 5.340203642845154e-06, 5.6782737374305725e-06, 6.016343832015991e-06, 6.35441392660141e-06, 6.692484021186829e-06, 7.030554115772247e-06, 7.368624210357666e-06, 7.706694304943085e-06, 8.044764399528503e-06, 8.382834494113922e-06, 8.72090458869934e-06, 9.05897468328476e-06, 9.397044777870178e-06, 9.735114872455597e-06, 1.0073184967041016e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 7.0, 15.0, 13.0, 29.0, 39.0, 62.0, 73.0, 89.0, 138.0, 237.0, 321.0, 442.0, 664.0, 907.0, 1323.0, 1824.0, 2896.0, 4281.0, 6809.0, 10888.0, 18034.0, 32784.0, 63456.0, 133523.0, 244248.0, 245618.0, 134239.0, 63488.0, 32595.0, 18299.0, 10860.0, 6878.0, 4374.0, 2924.0, 1882.0, 1336.0, 880.0, 646.0, 435.0, 317.0, 222.0, 123.0, 116.0, 73.0, 40.0, 30.0, 31.0, 17.0, 9.0, 9.0, 4.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.01506805419921875, -0.014582037925720215, -0.01409602165222168, -0.013610005378723145, -0.01312398910522461, -0.012637972831726074, -0.012151956558227539, -0.011665940284729004, -0.011179924011230469, -0.010693907737731934, -0.010207891464233398, -0.009721875190734863, -0.009235858917236328, -0.008749842643737793, -0.008263826370239258, -0.007777810096740723, -0.0072917938232421875, -0.006805777549743652, -0.006319761276245117, -0.005833745002746582, -0.005347728729248047, -0.004861712455749512, -0.0043756961822509766, -0.0038896799087524414, -0.0034036636352539062, -0.002917647361755371, -0.002431631088256836, -0.0019456148147583008, -0.0014595985412597656, -0.0009735822677612305, -0.0004875659942626953, -1.5497207641601562e-06, 0.000484466552734375, 0.0009704828262329102, 0.0014564990997314453, 0.0019425153732299805, 0.0024285316467285156, 0.0029145479202270508, 0.003400564193725586, 0.003886580467224121, 0.004372596740722656, 0.004858613014221191, 0.0053446292877197266, 0.005830645561218262, 0.006316661834716797, 0.006802678108215332, 0.007288694381713867, 0.007774710655212402, 0.008260726928710938, 0.008746743202209473, 0.009232759475708008, 0.009718775749206543, 0.010204792022705078, 0.010690808296203613, 0.011176824569702148, 0.011662840843200684, 0.012148857116699219, 0.012634873390197754, 0.013120889663696289, 0.013606905937194824, 0.01409292221069336, 0.014578938484191895, 0.01506495475769043, 0.015550971031188965, 0.0160369873046875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 3.0, 2.0, 8.0, 5.0, 4.0, 4.0, 6.0, 6.0, 12.0, 18.0, 22.0, 29.0, 34.0, 32.0, 46.0, 53.0, 59.0, 57.0, 63.0, 64.0, 61.0, 65.0, 66.0, 52.0, 38.0, 28.0, 30.0, 24.0, 19.0, 20.0, 12.0, 9.0, 9.0, 13.0, 8.0, 5.0, 3.0, 2.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.004970550537109375, -0.004820764064788818, -0.004670977592468262, -0.004521191120147705, -0.0043714046478271484, -0.004221618175506592, -0.004071831703186035, -0.0039220452308654785, -0.003772258758544922, -0.0036224722862243652, -0.0034726858139038086, -0.003322899341583252, -0.0031731128692626953, -0.0030233263969421387, -0.002873539924621582, -0.0027237534523010254, -0.0025739669799804688, -0.002424180507659912, -0.0022743940353393555, -0.002124607563018799, -0.001974821090698242, -0.0018250346183776855, -0.001675248146057129, -0.0015254616737365723, -0.0013756752014160156, -0.001225888729095459, -0.0010761022567749023, -0.0009263157844543457, -0.0007765293121337891, -0.0006267428398132324, -0.0004769563674926758, -0.00032716989517211914, -0.0001773834228515625, -2.759695053100586e-05, 0.00012218952178955078, 0.0002719759941101074, 0.00042176246643066406, 0.0005715489387512207, 0.0007213354110717773, 0.000871121883392334, 0.0010209083557128906, 0.0011706948280334473, 0.001320481300354004, 0.0014702677726745605, 0.0016200542449951172, 0.0017698407173156738, 0.0019196271896362305, 0.002069413661956787, 0.0022192001342773438, 0.0023689866065979004, 0.002518773078918457, 0.0026685595512390137, 0.0028183460235595703, 0.002968132495880127, 0.0031179189682006836, 0.0032677054405212402, 0.003417491912841797, 0.0035672783851623535, 0.00371706485748291, 0.003866851329803467, 0.0040166378021240234, 0.00416642427444458, 0.004316210746765137, 0.004465997219085693, 0.00461578369140625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 4.0, 10.0, 10.0, 9.0, 12.0, 22.0, 19.0, 24.0, 40.0, 46.0, 66.0, 64.0, 75.0, 69.0, 85.0, 59.0, 76.0, 62.0, 57.0, 47.0, 36.0, 25.0, 17.0, 20.0, 9.0, 10.0, 5.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.180983543395996, -14.676055908203125, -14.171127319335938, -13.666199684143066, -13.161271095275879, -12.656343460083008, -12.15141487121582, -11.64648723602295, -11.141559600830078, -10.636631965637207, -10.13170337677002, -9.626775741577148, -9.121847152709961, -8.61691951751709, -8.111991882324219, -7.607063293457031, -7.102134704589844, -6.5972065925598145, -6.092278480529785, -5.587350845336914, -5.082422256469727, -4.5774946212768555, -4.072566509246826, -3.567638397216797, -3.0627102851867676, -2.5577821731567383, -2.052854061126709, -1.5479261875152588, -1.0429980754852295, -0.5380699634552002, -0.03314208984375, 0.4717860221862793, 0.9767131805419922, 1.4816412925720215, 1.9865692853927612, 2.491497278213501, 2.9964253902435303, 3.5013535022735596, 4.00628137588501, 4.511209487915039, 5.016137599945068, 5.521065711975098, 6.025993824005127, 6.530921936035156, 7.035849571228027, 7.540778160095215, 8.045705795288086, 8.550634384155273, 9.055562019348145, 9.560489654541016, 10.065418243408203, 10.570345878601074, 11.075274467468262, 11.580202102661133, 12.08513069152832, 12.590058326721191, 13.094985961914062, 13.599913597106934, 14.104842185974121, 14.609769821166992, 15.11469841003418, 15.61962604522705, 16.124553680419922, 16.62948226928711, 17.134410858154297]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 10.0, 9.0, 9.0, 7.0, 10.0, 17.0, 22.0, 24.0, 16.0, 19.0, 37.0, 31.0, 43.0, 26.0, 36.0, 40.0, 36.0, 42.0, 32.0, 43.0, 42.0, 45.0, 39.0, 35.0, 41.0, 30.0, 31.0, 34.0, 19.0, 22.0, 22.0, 17.0, 14.0, 19.0, 13.0, 17.0, 7.0, 8.0, 5.0, 6.0, 3.0, 5.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.984770774841309, -10.625107765197754, -10.2654447555542, -9.905782699584961, -9.546119689941406, -9.186456680297852, -8.826793670654297, -8.467130661010742, -8.107467651367188, -7.747804641723633, -7.388142108917236, -7.028479099273682, -6.668816566467285, -6.3091535568237305, -5.949490547180176, -5.589827537536621, -5.230165481567383, -4.870502471923828, -4.510839939117432, -4.151176929473877, -3.7915141582489014, -3.431851387023926, -3.072188377380371, -2.7125256061553955, -2.35286283493042, -1.9932000637054443, -1.6335371732711792, -1.273874282836914, -0.9142115116119385, -0.5545487403869629, -0.1948857307434082, 0.16477704048156738, 0.5244407653808594, 0.8841035962104797, 1.2437664270401, 1.6034293174743652, 1.9630920886993408, 2.3227548599243164, 2.682417869567871, 3.0420806407928467, 3.4017434120178223, 3.761406183242798, 4.121068954467773, 4.480731964111328, 4.840394973754883, 5.200057506561279, 5.559720516204834, 5.9193830490112305, 6.279046058654785, 6.63870906829834, 6.998371601104736, 7.358034610748291, 7.7176971435546875, 8.077360153198242, 8.437023162841797, 8.796686172485352, 9.156349182128906, 9.516012191772461, 9.875675201416016, 10.23533821105957, 10.595000267028809, 10.954663276672363, 11.314326286315918, 11.673989295959473, 12.033651351928711]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 13.0, 16.0, 26.0, 37.0, 38.0, 62.0, 102.0, 115.0, 184.0, 254.0, 423.0, 588.0, 844.0, 1225.0, 1947.0, 2928.0, 4165.0, 6471.0, 9998.0, 15110.0, 23156.0, 35817.0, 54759.0, 82822.0, 117703.0, 148225.0, 151645.0, 125879.0, 89940.0, 59797.0, 39337.0, 25884.0, 16914.0, 10864.0, 7060.0, 4830.0, 3134.0, 2020.0, 1360.0, 927.0, 586.0, 408.0, 271.0, 196.0, 149.0, 85.0, 85.0, 59.0, 30.0, 24.0, 9.0, 12.0, 11.0, 3.0, 5.0, 3.0, 0.0, 6.0], "bins": [-14.3984375, -13.9500732421875, -13.501708984375, -13.0533447265625, -12.60498046875, -12.1566162109375, -11.708251953125, -11.2598876953125, -10.8115234375, -10.3631591796875, -9.914794921875, -9.4664306640625, -9.01806640625, -8.5697021484375, -8.121337890625, -7.6729736328125, -7.224609375, -6.7762451171875, -6.327880859375, -5.8795166015625, -5.43115234375, -4.9827880859375, -4.534423828125, -4.0860595703125, -3.6376953125, -3.1893310546875, -2.740966796875, -2.2926025390625, -1.84423828125, -1.3958740234375, -0.947509765625, -0.4991455078125, -0.05078125, 0.3975830078125, 0.845947265625, 1.2943115234375, 1.74267578125, 2.1910400390625, 2.639404296875, 3.0877685546875, 3.5361328125, 3.9844970703125, 4.432861328125, 4.8812255859375, 5.32958984375, 5.7779541015625, 6.226318359375, 6.6746826171875, 7.123046875, 7.5714111328125, 8.019775390625, 8.4681396484375, 8.91650390625, 9.3648681640625, 9.813232421875, 10.2615966796875, 10.7099609375, 11.1583251953125, 11.606689453125, 12.0550537109375, 12.50341796875, 12.9517822265625, 13.400146484375, 13.8485107421875, 14.296875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 5.0, 8.0, 9.0, 9.0, 13.0, 14.0, 16.0, 17.0, 22.0, 31.0, 25.0, 28.0, 32.0, 31.0, 35.0, 35.0, 37.0, 41.0, 40.0, 36.0, 49.0, 46.0, 37.0, 46.0, 27.0, 33.0, 39.0, 27.0, 22.0, 26.0, 17.0, 22.0, 12.0, 21.0, 10.0, 25.0, 9.0, 11.0, 7.0, 6.0, 5.0, 6.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.625, -9.293212890625, -8.96142578125, -8.629638671875, -8.2978515625, -7.966064453125, -7.63427734375, -7.302490234375, -6.970703125, -6.638916015625, -6.30712890625, -5.975341796875, -5.6435546875, -5.311767578125, -4.97998046875, -4.648193359375, -4.31640625, -3.984619140625, -3.65283203125, -3.321044921875, -2.9892578125, -2.657470703125, -2.32568359375, -1.993896484375, -1.662109375, -1.330322265625, -0.99853515625, -0.666748046875, -0.3349609375, -0.003173828125, 0.32861328125, 0.660400390625, 0.9921875, 1.323974609375, 1.65576171875, 1.987548828125, 2.3193359375, 2.651123046875, 2.98291015625, 3.314697265625, 3.646484375, 3.978271484375, 4.31005859375, 4.641845703125, 4.9736328125, 5.305419921875, 5.63720703125, 5.968994140625, 6.30078125, 6.632568359375, 6.96435546875, 7.296142578125, 7.6279296875, 7.959716796875, 8.29150390625, 8.623291015625, 8.955078125, 9.286865234375, 9.61865234375, 9.950439453125, 10.2822265625, 10.614013671875, 10.94580078125, 11.277587890625, 11.609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 7.0, 7.0, 18.0, 16.0, 31.0, 37.0, 88.0, 118.0, 178.0, 268.0, 399.0, 639.0, 973.0, 1580.0, 2355.0, 3678.0, 5613.0, 8534.0, 13200.0, 20717.0, 32029.0, 49764.0, 76333.0, 112498.0, 147934.0, 158724.0, 135171.0, 95699.0, 64157.0, 41691.0, 26968.0, 17337.0, 11251.0, 7231.0, 4704.0, 3046.0, 1968.0, 1236.0, 810.0, 524.0, 358.0, 222.0, 149.0, 97.0, 79.0, 46.0, 30.0, 23.0, 15.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5, -13.0391845703125, -12.578369140625, -12.1175537109375, -11.65673828125, -11.1959228515625, -10.735107421875, -10.2742919921875, -9.8134765625, -9.3526611328125, -8.891845703125, -8.4310302734375, -7.97021484375, -7.5093994140625, -7.048583984375, -6.5877685546875, -6.126953125, -5.6661376953125, -5.205322265625, -4.7445068359375, -4.28369140625, -3.8228759765625, -3.362060546875, -2.9012451171875, -2.4404296875, -1.9796142578125, -1.518798828125, -1.0579833984375, -0.59716796875, -0.1363525390625, 0.324462890625, 0.7852783203125, 1.24609375, 1.7069091796875, 2.167724609375, 2.6285400390625, 3.08935546875, 3.5501708984375, 4.010986328125, 4.4718017578125, 4.9326171875, 5.3934326171875, 5.854248046875, 6.3150634765625, 6.77587890625, 7.2366943359375, 7.697509765625, 8.1583251953125, 8.619140625, 9.0799560546875, 9.540771484375, 10.0015869140625, 10.46240234375, 10.9232177734375, 11.384033203125, 11.8448486328125, 12.3056640625, 12.7664794921875, 13.227294921875, 13.6881103515625, 14.14892578125, 14.6097412109375, 15.070556640625, 15.5313720703125, 15.9921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 2.0, 3.0, 3.0, 7.0, 10.0, 15.0, 6.0, 14.0, 14.0, 27.0, 22.0, 23.0, 22.0, 28.0, 28.0, 26.0, 32.0, 43.0, 50.0, 36.0, 38.0, 50.0, 39.0, 32.0, 47.0, 46.0, 26.0, 46.0, 28.0, 29.0, 24.0, 30.0, 18.0, 23.0, 17.0, 21.0, 13.0, 9.0, 9.0, 4.0, 12.0, 6.0, 12.0, 5.0, 4.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.69140625, -6.476806640625, -6.26220703125, -6.047607421875, -5.8330078125, -5.618408203125, -5.40380859375, -5.189208984375, -4.974609375, -4.760009765625, -4.54541015625, -4.330810546875, -4.1162109375, -3.901611328125, -3.68701171875, -3.472412109375, -3.2578125, -3.043212890625, -2.82861328125, -2.614013671875, -2.3994140625, -2.184814453125, -1.97021484375, -1.755615234375, -1.541015625, -1.326416015625, -1.11181640625, -0.897216796875, -0.6826171875, -0.468017578125, -0.25341796875, -0.038818359375, 0.17578125, 0.390380859375, 0.60498046875, 0.819580078125, 1.0341796875, 1.248779296875, 1.46337890625, 1.677978515625, 1.892578125, 2.107177734375, 2.32177734375, 2.536376953125, 2.7509765625, 2.965576171875, 3.18017578125, 3.394775390625, 3.609375, 3.823974609375, 4.03857421875, 4.253173828125, 4.4677734375, 4.682373046875, 4.89697265625, 5.111572265625, 5.326171875, 5.540771484375, 5.75537109375, 5.969970703125, 6.1845703125, 6.399169921875, 6.61376953125, 6.828369140625, 7.04296875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 6.0, 10.0, 7.0, 15.0, 15.0, 28.0, 29.0, 43.0, 61.0, 101.0, 141.0, 193.0, 329.0, 520.0, 850.0, 1373.0, 2476.0, 4372.0, 8411.0, 17656.0, 39676.0, 95086.0, 207064.0, 288772.0, 208550.0, 95897.0, 40036.0, 17549.0, 8597.0, 4487.0, 2477.0, 1394.0, 812.0, 533.0, 331.0, 212.0, 129.0, 97.0, 62.0, 43.0, 31.0, 22.0, 22.0, 7.0, 9.0, 6.0, 7.0, 3.0, 2.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.41015625, -2.331146240234375, -2.25213623046875, -2.173126220703125, -2.0941162109375, -2.015106201171875, -1.93609619140625, -1.857086181640625, -1.778076171875, -1.699066162109375, -1.62005615234375, -1.541046142578125, -1.4620361328125, -1.383026123046875, -1.30401611328125, -1.225006103515625, -1.14599609375, -1.066986083984375, -0.98797607421875, -0.908966064453125, -0.8299560546875, -0.750946044921875, -0.67193603515625, -0.592926025390625, -0.513916015625, -0.434906005859375, -0.35589599609375, -0.276885986328125, -0.1978759765625, -0.118865966796875, -0.03985595703125, 0.039154052734375, 0.1181640625, 0.197174072265625, 0.27618408203125, 0.355194091796875, 0.4342041015625, 0.513214111328125, 0.59222412109375, 0.671234130859375, 0.750244140625, 0.829254150390625, 0.90826416015625, 0.987274169921875, 1.0662841796875, 1.145294189453125, 1.22430419921875, 1.303314208984375, 1.38232421875, 1.461334228515625, 1.54034423828125, 1.619354248046875, 1.6983642578125, 1.777374267578125, 1.85638427734375, 1.935394287109375, 2.014404296875, 2.093414306640625, 2.17242431640625, 2.251434326171875, 2.3304443359375, 2.409454345703125, 2.48846435546875, 2.567474365234375, 2.646484375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 8.0, 10.0, 10.0, 13.0, 12.0, 24.0, 28.0, 28.0, 59.0, 58.0, 66.0, 91.0, 87.0, 84.0, 74.0, 83.0, 58.0, 44.0, 28.0, 46.0, 27.0, 17.0, 9.0, 17.0, 6.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002620220184326172, -0.00025417283177375793, -0.0002463236451148987, -0.00023847445845603943, -0.00023062527179718018, -0.00022277608513832092, -0.00021492689847946167, -0.00020707771182060242, -0.00019922852516174316, -0.0001913793385028839, -0.00018353015184402466, -0.0001756809651851654, -0.00016783177852630615, -0.0001599825918674469, -0.00015213340520858765, -0.0001442842185497284, -0.00013643503189086914, -0.0001285858452320099, -0.00012073665857315063, -0.00011288747191429138, -0.00010503828525543213, -9.718909859657288e-05, -8.933991193771362e-05, -8.149072527885437e-05, -7.364153861999512e-05, -6.579235196113586e-05, -5.794316530227661e-05, -5.009397864341736e-05, -4.2244791984558105e-05, -3.439560532569885e-05, -2.65464186668396e-05, -1.8697232007980347e-05, -1.0848045349121094e-05, -2.998858690261841e-06, 4.850327968597412e-06, 1.2699514627456665e-05, 2.0548701286315918e-05, 2.839788794517517e-05, 3.6247074604034424e-05, 4.409626126289368e-05, 5.194544792175293e-05, 5.979463458061218e-05, 6.764382123947144e-05, 7.549300789833069e-05, 8.334219455718994e-05, 9.11913812160492e-05, 9.904056787490845e-05, 0.0001068897545337677, 0.00011473894119262695, 0.0001225881278514862, 0.00013043731451034546, 0.0001382865011692047, 0.00014613568782806396, 0.00015398487448692322, 0.00016183406114578247, 0.00016968324780464172, 0.00017753243446350098, 0.00018538162112236023, 0.00019323080778121948, 0.00020107999444007874, 0.000208929181098938, 0.00021677836775779724, 0.0002246275544166565, 0.00023247674107551575, 0.000240325927734375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 13.0, 19.0, 24.0, 28.0, 35.0, 63.0, 88.0, 129.0, 181.0, 266.0, 403.0, 542.0, 831.0, 1264.0, 2017.0, 3399.0, 6131.0, 11714.0, 25225.0, 58340.0, 135349.0, 252266.0, 267621.0, 156143.0, 67138.0, 29062.0, 13365.0, 6866.0, 3711.0, 2162.0, 1344.0, 905.0, 579.0, 430.0, 285.0, 178.0, 119.0, 88.0, 72.0, 44.0, 41.0, 21.0, 10.0, 14.0, 4.0, 4.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.515625, -2.437225341796875, -2.35882568359375, -2.280426025390625, -2.2020263671875, -2.123626708984375, -2.04522705078125, -1.966827392578125, -1.888427734375, -1.810028076171875, -1.73162841796875, -1.653228759765625, -1.5748291015625, -1.496429443359375, -1.41802978515625, -1.339630126953125, -1.26123046875, -1.182830810546875, -1.10443115234375, -1.026031494140625, -0.9476318359375, -0.869232177734375, -0.79083251953125, -0.712432861328125, -0.634033203125, -0.555633544921875, -0.47723388671875, -0.398834228515625, -0.3204345703125, -0.242034912109375, -0.16363525390625, -0.085235595703125, -0.0068359375, 0.071563720703125, 0.14996337890625, 0.228363037109375, 0.3067626953125, 0.385162353515625, 0.46356201171875, 0.541961669921875, 0.620361328125, 0.698760986328125, 0.77716064453125, 0.855560302734375, 0.9339599609375, 1.012359619140625, 1.09075927734375, 1.169158935546875, 1.24755859375, 1.325958251953125, 1.40435791015625, 1.482757568359375, 1.5611572265625, 1.639556884765625, 1.71795654296875, 1.796356201171875, 1.874755859375, 1.953155517578125, 2.03155517578125, 2.109954833984375, 2.1883544921875, 2.266754150390625, 2.34515380859375, 2.423553466796875, 2.501953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 4.0, 7.0, 11.0, 7.0, 14.0, 22.0, 35.0, 32.0, 50.0, 55.0, 64.0, 74.0, 82.0, 83.0, 81.0, 68.0, 64.0, 61.0, 45.0, 32.0, 25.0, 15.0, 13.0, 15.0, 5.0, 13.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9208984375, -0.89276123046875, -0.8646240234375, -0.83648681640625, -0.808349609375, -0.78021240234375, -0.7520751953125, -0.72393798828125, -0.69580078125, -0.66766357421875, -0.6395263671875, -0.61138916015625, -0.583251953125, -0.55511474609375, -0.5269775390625, -0.49884033203125, -0.470703125, -0.44256591796875, -0.4144287109375, -0.38629150390625, -0.358154296875, -0.33001708984375, -0.3018798828125, -0.27374267578125, -0.24560546875, -0.21746826171875, -0.1893310546875, -0.16119384765625, -0.133056640625, -0.10491943359375, -0.0767822265625, -0.04864501953125, -0.0205078125, 0.00762939453125, 0.0357666015625, 0.06390380859375, 0.092041015625, 0.12017822265625, 0.1483154296875, 0.17645263671875, 0.20458984375, 0.23272705078125, 0.2608642578125, 0.28900146484375, 0.317138671875, 0.34527587890625, 0.3734130859375, 0.40155029296875, 0.4296875, 0.45782470703125, 0.4859619140625, 0.51409912109375, 0.542236328125, 0.57037353515625, 0.5985107421875, 0.62664794921875, 0.65478515625, 0.68292236328125, 0.7110595703125, 0.73919677734375, 0.767333984375, 0.79547119140625, 0.8236083984375, 0.85174560546875, 0.8798828125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 9.0, 14.0, 12.0, 23.0, 24.0, 32.0, 38.0, 57.0, 75.0, 91.0, 83.0, 70.0, 83.0, 96.0, 72.0, 52.0, 53.0, 42.0, 18.0, 24.0, 12.0, 7.0, 5.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.64324188232422, -16.077667236328125, -15.512090682983398, -14.946516036987305, -14.380940437316895, -13.815364837646484, -13.24979019165039, -12.68421459197998, -12.11863899230957, -11.55306339263916, -10.98748779296875, -10.421913146972656, -9.856337547302246, -9.290761947631836, -8.725187301635742, -8.159611701965332, -7.594036102294922, -7.028460502624512, -6.46288537979126, -5.897310256958008, -5.331734657287598, -4.7661590576171875, -4.2005839347839355, -3.6350085735321045, -3.0694332122802734, -2.5038578510284424, -1.9382824897766113, -1.3727071285247803, -0.8071317672729492, -0.24155640602111816, 0.3240189552307129, 0.889594316482544, 1.455169677734375, 2.020745038986206, 2.586320400238037, 3.151895761489868, 3.717471122741699, 4.283046722412109, 4.848621845245361, 5.414196968078613, 5.979772567749023, 6.545348167419434, 7.1109232902526855, 7.6764984130859375, 8.242074012756348, 8.807649612426758, 9.373224258422852, 9.938799858093262, 10.504375457763672, 11.069951057434082, 11.635526657104492, 12.201101303100586, 12.766676902770996, 13.332252502441406, 13.8978271484375, 14.46340274810791, 15.02897834777832, 15.59455394744873, 16.16012954711914, 16.725704193115234, 17.291278839111328, 17.856855392456055, 18.42243003845215, 18.988006591796875, 19.55358123779297]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 4.0, 6.0, 3.0, 8.0, 17.0, 16.0, 17.0, 20.0, 20.0, 24.0, 18.0, 27.0, 25.0, 34.0, 35.0, 29.0, 51.0, 39.0, 34.0, 30.0, 45.0, 41.0, 45.0, 42.0, 36.0, 36.0, 39.0, 19.0, 24.0, 35.0, 23.0, 22.0, 18.0, 22.0, 15.0, 16.0, 9.0, 12.0, 10.0, 9.0, 2.0, 5.0, 4.0, 4.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-11.034523010253906, -10.696233749389648, -10.357943534851074, -10.019654273986816, -9.681364059448242, -9.343074798583984, -9.004785537719727, -8.666496276855469, -8.328206062316895, -7.9899163246154785, -7.6516265869140625, -7.313337326049805, -6.975047588348389, -6.636757850646973, -6.298468589782715, -5.960178852081299, -5.621889114379883, -5.283599376678467, -4.945309638977051, -4.607020378112793, -4.268730640411377, -3.930440902709961, -3.592151403427124, -3.253861904144287, -2.915572166442871, -2.577282428741455, -2.238992929458618, -1.9007033109664917, -1.5624136924743652, -1.2241240739822388, -0.8858344554901123, -0.5475449562072754, -0.20925617218017578, 0.12903344631195068, 0.46732306480407715, 0.8056126832962036, 1.14390230178833, 1.4821919202804565, 1.820481538772583, 2.15877103805542, 2.497060775756836, 2.835350513458252, 3.173640012741089, 3.511929512023926, 3.850219249725342, 4.188508987426758, 4.526798248291016, 4.865087985992432, 5.203377723693848, 5.541667461395264, 5.87995719909668, 6.2182464599609375, 6.5565361976623535, 6.8948259353637695, 7.233115196228027, 7.571404933929443, 7.909694671630859, 8.247983932495117, 8.586274147033691, 8.92456340789795, 9.262853622436523, 9.601142883300781, 9.939432144165039, 10.277721405029297, 10.616011619567871]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 10.0, 16.0, 30.0, 27.0, 42.0, 88.0, 107.0, 158.0, 295.0, 379.0, 550.0, 805.0, 1265.0, 1929.0, 3110.0, 4696.0, 7295.0, 11205.0, 18342.0, 29376.0, 48008.0, 80606.0, 141200.0, 262722.0, 520838.0, 869618.0, 920805.0, 593283.0, 297838.0, 154569.0, 87323.0, 51741.0, 31228.0, 19531.0, 12259.0, 7714.0, 5012.0, 3317.0, 2195.0, 1499.0, 1042.0, 694.0, 496.0, 297.0, 220.0, 145.0, 108.0, 69.0, 53.0, 46.0, 30.0, 24.0, 14.0, 5.0, 7.0, 5.0, 2.0, 3.0, 0.0, 3.0], "bins": [-11.6328125, -11.246337890625, -10.85986328125, -10.473388671875, -10.0869140625, -9.700439453125, -9.31396484375, -8.927490234375, -8.541015625, -8.154541015625, -7.76806640625, -7.381591796875, -6.9951171875, -6.608642578125, -6.22216796875, -5.835693359375, -5.44921875, -5.062744140625, -4.67626953125, -4.289794921875, -3.9033203125, -3.516845703125, -3.13037109375, -2.743896484375, -2.357421875, -1.970947265625, -1.58447265625, -1.197998046875, -0.8115234375, -0.425048828125, -0.03857421875, 0.347900390625, 0.734375, 1.120849609375, 1.50732421875, 1.893798828125, 2.2802734375, 2.666748046875, 3.05322265625, 3.439697265625, 3.826171875, 4.212646484375, 4.59912109375, 4.985595703125, 5.3720703125, 5.758544921875, 6.14501953125, 6.531494140625, 6.91796875, 7.304443359375, 7.69091796875, 8.077392578125, 8.4638671875, 8.850341796875, 9.23681640625, 9.623291015625, 10.009765625, 10.396240234375, 10.78271484375, 11.169189453125, 11.5556640625, 11.942138671875, 12.32861328125, 12.715087890625, 13.1015625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 8.0, 6.0, 5.0, 11.0, 16.0, 9.0, 22.0, 15.0, 22.0, 21.0, 29.0, 26.0, 27.0, 28.0, 37.0, 25.0, 30.0, 47.0, 44.0, 38.0, 47.0, 34.0, 35.0, 25.0, 32.0, 36.0, 38.0, 25.0, 39.0, 17.0, 19.0, 25.0, 29.0, 18.0, 13.0, 11.0, 14.0, 12.0, 10.0, 9.0, 10.0, 11.0, 2.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0], "bins": [-8.21875, -7.962890625, -7.70703125, -7.451171875, -7.1953125, -6.939453125, -6.68359375, -6.427734375, -6.171875, -5.916015625, -5.66015625, -5.404296875, -5.1484375, -4.892578125, -4.63671875, -4.380859375, -4.125, -3.869140625, -3.61328125, -3.357421875, -3.1015625, -2.845703125, -2.58984375, -2.333984375, -2.078125, -1.822265625, -1.56640625, -1.310546875, -1.0546875, -0.798828125, -0.54296875, -0.287109375, -0.03125, 0.224609375, 0.48046875, 0.736328125, 0.9921875, 1.248046875, 1.50390625, 1.759765625, 2.015625, 2.271484375, 2.52734375, 2.783203125, 3.0390625, 3.294921875, 3.55078125, 3.806640625, 4.0625, 4.318359375, 4.57421875, 4.830078125, 5.0859375, 5.341796875, 5.59765625, 5.853515625, 6.109375, 6.365234375, 6.62109375, 6.876953125, 7.1328125, 7.388671875, 7.64453125, 7.900390625, 8.15625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 11.0, 8.0, 17.0, 32.0, 30.0, 66.0, 111.0, 197.0, 321.0, 549.0, 912.0, 1644.0, 2977.0, 5166.0, 9226.0, 17268.0, 32067.0, 61859.0, 120480.0, 233193.0, 438914.0, 758910.0, 960970.0, 706222.0, 401051.0, 211703.0, 109372.0, 56262.0, 29441.0, 15617.0, 8591.0, 4797.0, 2664.0, 1543.0, 857.0, 515.0, 270.0, 170.0, 113.0, 58.0, 48.0, 29.0, 17.0, 10.0, 5.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.6875, -13.251953125, -12.81640625, -12.380859375, -11.9453125, -11.509765625, -11.07421875, -10.638671875, -10.203125, -9.767578125, -9.33203125, -8.896484375, -8.4609375, -8.025390625, -7.58984375, -7.154296875, -6.71875, -6.283203125, -5.84765625, -5.412109375, -4.9765625, -4.541015625, -4.10546875, -3.669921875, -3.234375, -2.798828125, -2.36328125, -1.927734375, -1.4921875, -1.056640625, -0.62109375, -0.185546875, 0.25, 0.685546875, 1.12109375, 1.556640625, 1.9921875, 2.427734375, 2.86328125, 3.298828125, 3.734375, 4.169921875, 4.60546875, 5.041015625, 5.4765625, 5.912109375, 6.34765625, 6.783203125, 7.21875, 7.654296875, 8.08984375, 8.525390625, 8.9609375, 9.396484375, 9.83203125, 10.267578125, 10.703125, 11.138671875, 11.57421875, 12.009765625, 12.4453125, 12.880859375, 13.31640625, 13.751953125, 14.1875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 7.0, 1.0, 5.0, 5.0, 15.0, 12.0, 7.0, 16.0, 24.0, 28.0, 42.0, 43.0, 57.0, 60.0, 60.0, 103.0, 117.0, 141.0, 147.0, 173.0, 210.0, 224.0, 238.0, 245.0, 272.0, 297.0, 236.0, 228.0, 175.0, 160.0, 131.0, 112.0, 102.0, 77.0, 67.0, 45.0, 41.0, 35.0, 24.0, 22.0, 27.0, 12.0, 11.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-5.10546875, -4.95556640625, -4.8056640625, -4.65576171875, -4.505859375, -4.35595703125, -4.2060546875, -4.05615234375, -3.90625, -3.75634765625, -3.6064453125, -3.45654296875, -3.306640625, -3.15673828125, -3.0068359375, -2.85693359375, -2.70703125, -2.55712890625, -2.4072265625, -2.25732421875, -2.107421875, -1.95751953125, -1.8076171875, -1.65771484375, -1.5078125, -1.35791015625, -1.2080078125, -1.05810546875, -0.908203125, -0.75830078125, -0.6083984375, -0.45849609375, -0.30859375, -0.15869140625, -0.0087890625, 0.14111328125, 0.291015625, 0.44091796875, 0.5908203125, 0.74072265625, 0.890625, 1.04052734375, 1.1904296875, 1.34033203125, 1.490234375, 1.64013671875, 1.7900390625, 1.93994140625, 2.08984375, 2.23974609375, 2.3896484375, 2.53955078125, 2.689453125, 2.83935546875, 2.9892578125, 3.13916015625, 3.2890625, 3.43896484375, 3.5888671875, 3.73876953125, 3.888671875, 4.03857421875, 4.1884765625, 4.33837890625, 4.48828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 0.0, 4.0, 8.0, 5.0, 8.0, 18.0, 10.0, 12.0, 25.0, 32.0, 27.0, 31.0, 31.0, 45.0, 54.0, 53.0, 44.0, 56.0, 63.0, 49.0, 59.0, 51.0, 55.0, 51.0, 25.0, 36.0, 31.0, 22.0, 27.0, 22.0, 16.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.880816459655762, -10.544637680053711, -10.20845890045166, -9.87228012084961, -9.536101341247559, -9.199922561645508, -8.86374282836914, -8.527565002441406, -8.191385269165039, -7.855206489562988, -7.5190277099609375, -7.182848930358887, -6.846670150756836, -6.510491371154785, -6.174312114715576, -5.838133335113525, -5.501955032348633, -5.165776252746582, -4.829597473144531, -4.4934186935424805, -4.15723991394043, -3.8210608959198, -3.48488187789917, -3.148703098297119, -2.8125243186950684, -2.4763455390930176, -2.140166759490967, -1.803987741470337, -1.4678089618682861, -1.1316301822662354, -0.7954511642456055, -0.4592723846435547, -0.1230936050415039, 0.21308523416519165, 0.5492640733718872, 0.8854429721832275, 1.2216217517852783, 1.557800531387329, 1.893979549407959, 2.2301583290100098, 2.5663371086120605, 2.9025158882141113, 3.238694667816162, 3.574873685836792, 3.9110524654388428, 4.247231483459473, 4.583410263061523, 4.919589042663574, 5.255767822265625, 5.591946601867676, 5.928125381469727, 6.264304161071777, 6.600482940673828, 6.936661720275879, 7.272840976715088, 7.609019756317139, 7.9451985359191895, 8.281377792358398, 8.61755657196045, 8.9537353515625, 9.28991413116455, 9.626092910766602, 9.962271690368652, 10.298450469970703, 10.634629249572754]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 8.0, 10.0, 10.0, 12.0, 10.0, 23.0, 21.0, 19.0, 22.0, 19.0, 22.0, 28.0, 29.0, 26.0, 32.0, 33.0, 43.0, 47.0, 39.0, 37.0, 39.0, 49.0, 34.0, 49.0, 31.0, 31.0, 37.0, 24.0, 28.0, 16.0, 19.0, 17.0, 30.0, 13.0, 16.0, 13.0, 9.0, 8.0, 10.0, 9.0, 11.0, 6.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.259316444396973, -8.971468925476074, -8.683622360229492, -8.395774841308594, -8.107928276062012, -7.8200812339782715, -7.532234191894531, -7.244386672973633, -6.956540107727051, -6.6686930656433105, -6.38084602355957, -6.09299898147583, -5.80515193939209, -5.51730489730835, -5.229457855224609, -4.941610336303711, -4.653763294219971, -4.3659162521362305, -4.07806921005249, -3.79022216796875, -3.5023751258850098, -3.2145280838012695, -2.92668080329895, -2.63883376121521, -2.3509867191314697, -2.0631396770477295, -1.7752926349639893, -1.4874454736709595, -1.1995984315872192, -0.911751389503479, -0.6239042282104492, -0.336057186126709, -0.04821014404296875, 0.23963692784309387, 0.5274839997291565, 0.8153311014175415, 1.1031781435012817, 1.391025185585022, 1.6788723468780518, 1.966719388961792, 2.2545664310455322, 2.5424134731292725, 2.8302605152130127, 3.118107795715332, 3.4059548377990723, 3.6938018798828125, 3.9816489219665527, 4.269495964050293, 4.557343006134033, 4.845190048217773, 5.133037090301514, 5.420884132385254, 5.708731174468994, 5.996578216552734, 6.284425735473633, 6.572272300720215, 6.860119819641113, 7.1479668617248535, 7.435813903808594, 7.723660945892334, 8.011507987976074, 8.299355506896973, 8.587202072143555, 8.875049591064453, 9.162896156311035]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 6.0, 4.0, 18.0, 17.0, 26.0, 29.0, 57.0, 76.0, 105.0, 158.0, 226.0, 306.0, 450.0, 602.0, 850.0, 1185.0, 1574.0, 2260.0, 3160.0, 4516.0, 6327.0, 9031.0, 12688.0, 17938.0, 26266.0, 39273.0, 60227.0, 98505.0, 220184.0, 245404.0, 103391.0, 62340.0, 40597.0, 27462.0, 18864.0, 12909.0, 9063.0, 6411.0, 4534.0, 3306.0, 2369.0, 1708.0, 1206.0, 860.0, 604.0, 438.0, 290.0, 218.0, 155.0, 116.0, 91.0, 49.0, 37.0, 35.0, 22.0, 10.0, 8.0, 4.0, 3.0, 1.0, 2.0], "bins": [-3.912109375, -3.790008544921875, -3.66790771484375, -3.545806884765625, -3.4237060546875, -3.301605224609375, -3.17950439453125, -3.057403564453125, -2.935302734375, -2.813201904296875, -2.69110107421875, -2.569000244140625, -2.4468994140625, -2.324798583984375, -2.20269775390625, -2.080596923828125, -1.95849609375, -1.836395263671875, -1.71429443359375, -1.592193603515625, -1.4700927734375, -1.347991943359375, -1.22589111328125, -1.103790283203125, -0.981689453125, -0.859588623046875, -0.73748779296875, -0.615386962890625, -0.4932861328125, -0.371185302734375, -0.24908447265625, -0.126983642578125, -0.0048828125, 0.117218017578125, 0.23931884765625, 0.361419677734375, 0.4835205078125, 0.605621337890625, 0.72772216796875, 0.849822998046875, 0.971923828125, 1.094024658203125, 1.21612548828125, 1.338226318359375, 1.4603271484375, 1.582427978515625, 1.70452880859375, 1.826629638671875, 1.94873046875, 2.070831298828125, 2.19293212890625, 2.315032958984375, 2.4371337890625, 2.559234619140625, 2.68133544921875, 2.803436279296875, 2.925537109375, 3.047637939453125, 3.16973876953125, 3.291839599609375, 3.4139404296875, 3.536041259765625, 3.65814208984375, 3.780242919921875, 3.90234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 6.0, 12.0, 11.0, 8.0, 17.0, 18.0, 23.0, 17.0, 21.0, 27.0, 23.0, 28.0, 28.0, 24.0, 33.0, 37.0, 39.0, 36.0, 40.0, 33.0, 40.0, 47.0, 46.0, 33.0, 38.0, 32.0, 30.0, 27.0, 26.0, 32.0, 20.0, 18.0, 15.0, 21.0, 15.0, 9.0, 14.0, 7.0, 10.0, 9.0, 5.0, 8.0, 4.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.4609375, -9.16796875, -8.875, -8.58203125, -8.2890625, -7.99609375, -7.703125, -7.41015625, -7.1171875, -6.82421875, -6.53125, -6.23828125, -5.9453125, -5.65234375, -5.359375, -5.06640625, -4.7734375, -4.48046875, -4.1875, -3.89453125, -3.6015625, -3.30859375, -3.015625, -2.72265625, -2.4296875, -2.13671875, -1.84375, -1.55078125, -1.2578125, -0.96484375, -0.671875, -0.37890625, -0.0859375, 0.20703125, 0.5, 0.79296875, 1.0859375, 1.37890625, 1.671875, 1.96484375, 2.2578125, 2.55078125, 2.84375, 3.13671875, 3.4296875, 3.72265625, 4.015625, 4.30859375, 4.6015625, 4.89453125, 5.1875, 5.48046875, 5.7734375, 6.06640625, 6.359375, 6.65234375, 6.9453125, 7.23828125, 7.53125, 7.82421875, 8.1171875, 8.41015625, 8.703125, 8.99609375, 9.2890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 8.0, 8.0, 14.0, 24.0, 34.0, 49.0, 76.0, 114.0, 150.0, 251.0, 395.0, 614.0, 930.0, 1421.0, 2282.0, 3667.0, 5823.0, 9377.0, 15253.0, 24349.0, 40634.0, 69239.0, 135700.0, 368981.0, 168945.0, 80552.0, 46008.0, 28065.0, 17341.0, 10345.0, 6530.0, 4102.0, 2606.0, 1724.0, 1049.0, 695.0, 453.0, 267.0, 153.0, 102.0, 78.0, 51.0, 34.0, 19.0, 14.0, 13.0, 8.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.46484375, -5.29205322265625, -5.1192626953125, -4.94647216796875, -4.773681640625, -4.60089111328125, -4.4281005859375, -4.25531005859375, -4.08251953125, -3.90972900390625, -3.7369384765625, -3.56414794921875, -3.391357421875, -3.21856689453125, -3.0457763671875, -2.87298583984375, -2.7001953125, -2.52740478515625, -2.3546142578125, -2.18182373046875, -2.009033203125, -1.83624267578125, -1.6634521484375, -1.49066162109375, -1.31787109375, -1.14508056640625, -0.9722900390625, -0.79949951171875, -0.626708984375, -0.45391845703125, -0.2811279296875, -0.10833740234375, 0.064453125, 0.23724365234375, 0.4100341796875, 0.58282470703125, 0.755615234375, 0.92840576171875, 1.1011962890625, 1.27398681640625, 1.44677734375, 1.61956787109375, 1.7923583984375, 1.96514892578125, 2.137939453125, 2.31072998046875, 2.4835205078125, 2.65631103515625, 2.8291015625, 3.00189208984375, 3.1746826171875, 3.34747314453125, 3.520263671875, 3.69305419921875, 3.8658447265625, 4.03863525390625, 4.21142578125, 4.38421630859375, 4.5570068359375, 4.72979736328125, 4.902587890625, 5.07537841796875, 5.2481689453125, 5.42095947265625, 5.59375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 9.0, 12.0, 7.0, 16.0, 17.0, 17.0, 21.0, 15.0, 23.0, 16.0, 32.0, 44.0, 42.0, 45.0, 43.0, 43.0, 44.0, 49.0, 39.0, 39.0, 58.0, 51.0, 25.0, 36.0, 27.0, 36.0, 26.0, 23.0, 21.0, 27.0, 27.0, 16.0, 11.0, 14.0, 8.0, 6.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.140625, -6.91595458984375, -6.6912841796875, -6.46661376953125, -6.241943359375, -6.01727294921875, -5.7926025390625, -5.56793212890625, -5.34326171875, -5.11859130859375, -4.8939208984375, -4.66925048828125, -4.444580078125, -4.21990966796875, -3.9952392578125, -3.77056884765625, -3.5458984375, -3.32122802734375, -3.0965576171875, -2.87188720703125, -2.647216796875, -2.42254638671875, -2.1978759765625, -1.97320556640625, -1.74853515625, -1.52386474609375, -1.2991943359375, -1.07452392578125, -0.849853515625, -0.62518310546875, -0.4005126953125, -0.17584228515625, 0.048828125, 0.27349853515625, 0.4981689453125, 0.72283935546875, 0.947509765625, 1.17218017578125, 1.3968505859375, 1.62152099609375, 1.84619140625, 2.07086181640625, 2.2955322265625, 2.52020263671875, 2.744873046875, 2.96954345703125, 3.1942138671875, 3.41888427734375, 3.6435546875, 3.86822509765625, 4.0928955078125, 4.31756591796875, 4.542236328125, 4.76690673828125, 4.9915771484375, 5.21624755859375, 5.44091796875, 5.66558837890625, 5.8902587890625, 6.11492919921875, 6.339599609375, 6.56427001953125, 6.7889404296875, 7.01361083984375, 7.23828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 9.0, 7.0, 11.0, 19.0, 23.0, 26.0, 59.0, 79.0, 115.0, 169.0, 234.0, 344.0, 500.0, 693.0, 1065.0, 1654.0, 2462.0, 3751.0, 6033.0, 9914.0, 16589.0, 28612.0, 52356.0, 104742.0, 203655.0, 260405.0, 167783.0, 83294.0, 42569.0, 23924.0, 14059.0, 8325.0, 5306.0, 3302.0, 2097.0, 1433.0, 872.0, 595.0, 424.0, 331.0, 212.0, 155.0, 113.0, 79.0, 51.0, 40.0, 30.0, 16.0, 6.0, 5.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0106353759765625, -0.010306477546691895, -0.009977579116821289, -0.009648680686950684, -0.009319782257080078, -0.008990883827209473, -0.008661985397338867, -0.008333086967468262, -0.008004188537597656, -0.007675290107727051, -0.007346391677856445, -0.00701749324798584, -0.006688594818115234, -0.006359696388244629, -0.0060307979583740234, -0.005701899528503418, -0.0053730010986328125, -0.005044102668762207, -0.0047152042388916016, -0.004386305809020996, -0.004057407379150391, -0.003728508949279785, -0.0033996105194091797, -0.0030707120895385742, -0.0027418136596679688, -0.0024129152297973633, -0.002084016799926758, -0.0017551183700561523, -0.0014262199401855469, -0.0010973215103149414, -0.0007684230804443359, -0.00043952465057373047, -0.000110626220703125, 0.00021827220916748047, 0.0005471706390380859, 0.0008760690689086914, 0.0012049674987792969, 0.0015338659286499023, 0.0018627643585205078, 0.0021916627883911133, 0.0025205612182617188, 0.0028494596481323242, 0.0031783580780029297, 0.003507256507873535, 0.0038361549377441406, 0.004165053367614746, 0.0044939517974853516, 0.004822850227355957, 0.0051517486572265625, 0.005480647087097168, 0.0058095455169677734, 0.006138443946838379, 0.006467342376708984, 0.00679624080657959, 0.007125139236450195, 0.007454037666320801, 0.007782936096191406, 0.008111834526062012, 0.008440732955932617, 0.008769631385803223, 0.009098529815673828, 0.009427428245544434, 0.009756326675415039, 0.010085225105285645, 0.01041412353515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 8.0, 5.0, 7.0, 11.0, 11.0, 15.0, 20.0, 27.0, 31.0, 24.0, 49.0, 52.0, 63.0, 77.0, 59.0, 45.0, 72.0, 72.0, 54.0, 57.0, 41.0, 44.0, 34.0, 34.0, 20.0, 11.0, 16.0, 20.0, 4.0, 10.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0907649993896484e-05, -1.0620802640914917e-05, -1.033395528793335e-05, -1.0047107934951782e-05, -9.760260581970215e-06, -9.473413228988647e-06, -9.18656587600708e-06, -8.899718523025513e-06, -8.612871170043945e-06, -8.326023817062378e-06, -8.03917646408081e-06, -7.752329111099243e-06, -7.465481758117676e-06, -7.178634405136108e-06, -6.891787052154541e-06, -6.604939699172974e-06, -6.318092346191406e-06, -6.031244993209839e-06, -5.7443976402282715e-06, -5.457550287246704e-06, -5.170702934265137e-06, -4.883855581283569e-06, -4.597008228302002e-06, -4.3101608753204346e-06, -4.023313522338867e-06, -3.7364661693573e-06, -3.4496188163757324e-06, -3.162771463394165e-06, -2.8759241104125977e-06, -2.5890767574310303e-06, -2.302229404449463e-06, -2.0153820514678955e-06, -1.7285346984863281e-06, -1.4416873455047607e-06, -1.1548399925231934e-06, -8.67992639541626e-07, -5.811452865600586e-07, -2.942979335784912e-07, -7.450580596923828e-09, 2.7939677238464355e-07, 5.662441253662109e-07, 8.530914783477783e-07, 1.1399388313293457e-06, 1.426786184310913e-06, 1.7136335372924805e-06, 2.000480890274048e-06, 2.2873282432556152e-06, 2.5741755962371826e-06, 2.86102294921875e-06, 3.1478703022003174e-06, 3.4347176551818848e-06, 3.721565008163452e-06, 4.0084123611450195e-06, 4.295259714126587e-06, 4.582107067108154e-06, 4.868954420089722e-06, 5.155801773071289e-06, 5.4426491260528564e-06, 5.729496479034424e-06, 6.016343832015991e-06, 6.303191184997559e-06, 6.590038537979126e-06, 6.876885890960693e-06, 7.163733243942261e-06, 7.450580596923828e-06]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 10.0, 9.0, 5.0, 15.0, 23.0, 44.0, 37.0, 55.0, 80.0, 100.0, 146.0, 232.0, 345.0, 496.0, 750.0, 1072.0, 1728.0, 2559.0, 3953.0, 6294.0, 9909.0, 16836.0, 28788.0, 52452.0, 96619.0, 166869.0, 219903.0, 185041.0, 110838.0, 60084.0, 33045.0, 18998.0, 11305.0, 6969.0, 4488.0, 2764.0, 1839.0, 1274.0, 804.0, 558.0, 348.0, 301.0, 143.0, 138.0, 87.0, 57.0, 53.0, 39.0, 16.0, 12.0, 9.0, 6.0, 8.0, 4.0, 4.0, 0.0, 3.0], "bins": [-0.00983428955078125, -0.009541749954223633, -0.009249210357666016, -0.008956670761108398, -0.008664131164550781, -0.008371591567993164, -0.008079051971435547, -0.00778651237487793, -0.0074939727783203125, -0.007201433181762695, -0.006908893585205078, -0.006616353988647461, -0.006323814392089844, -0.0060312747955322266, -0.005738735198974609, -0.005446195602416992, -0.005153656005859375, -0.004861116409301758, -0.004568576812744141, -0.0042760372161865234, -0.003983497619628906, -0.003690958023071289, -0.003398418426513672, -0.0031058788299560547, -0.0028133392333984375, -0.0025207996368408203, -0.002228260040283203, -0.001935720443725586, -0.0016431808471679688, -0.0013506412506103516, -0.0010581016540527344, -0.0007655620574951172, -0.0004730224609375, -0.0001804828643798828, 0.00011205673217773438, 0.00040459632873535156, 0.0006971359252929688, 0.000989675521850586, 0.0012822151184082031, 0.0015747547149658203, 0.0018672943115234375, 0.0021598339080810547, 0.002452373504638672, 0.002744913101196289, 0.0030374526977539062, 0.0033299922943115234, 0.0036225318908691406, 0.003915071487426758, 0.004207611083984375, 0.004500150680541992, 0.004792690277099609, 0.0050852298736572266, 0.005377769470214844, 0.005670309066772461, 0.005962848663330078, 0.006255388259887695, 0.0065479278564453125, 0.00684046745300293, 0.007133007049560547, 0.007425546646118164, 0.007718086242675781, 0.008010625839233398, 0.008303165435791016, 0.008595705032348633, 0.00888824462890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 8.0, 3.0, 6.0, 4.0, 4.0, 9.0, 12.0, 12.0, 20.0, 25.0, 36.0, 45.0, 69.0, 70.0, 78.0, 77.0, 78.0, 72.0, 69.0, 66.0, 52.0, 42.0, 25.0, 22.0, 22.0, 17.0, 9.0, 6.0, 9.0, 10.0, 6.0, 4.0, 1.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0030155181884765625, -0.0028961598873138428, -0.002776801586151123, -0.0026574432849884033, -0.0025380849838256836, -0.002418726682662964, -0.002299368381500244, -0.0021800100803375244, -0.0020606517791748047, -0.001941293478012085, -0.0018219351768493652, -0.0017025768756866455, -0.0015832185745239258, -0.001463860273361206, -0.0013445019721984863, -0.0012251436710357666, -0.0011057853698730469, -0.0009864270687103271, -0.0008670687675476074, -0.0007477104663848877, -0.000628352165222168, -0.0005089938640594482, -0.0003896355628967285, -0.0002702772617340088, -0.00015091896057128906, -3.1560659408569336e-05, 8.779764175415039e-05, 0.00020715594291687012, 0.00032651424407958984, 0.00044587254524230957, 0.0005652308464050293, 0.000684589147567749, 0.0008039474487304688, 0.0009233057498931885, 0.0010426640510559082, 0.001162022352218628, 0.0012813806533813477, 0.0014007389545440674, 0.0015200972557067871, 0.0016394555568695068, 0.0017588138580322266, 0.0018781721591949463, 0.001997530460357666, 0.0021168887615203857, 0.0022362470626831055, 0.002355605363845825, 0.002474963665008545, 0.0025943219661712646, 0.0027136802673339844, 0.002833038568496704, 0.002952396869659424, 0.0030717551708221436, 0.0031911134719848633, 0.003310471773147583, 0.0034298300743103027, 0.0035491883754730225, 0.003668546676635742, 0.003787904977798462, 0.003907263278961182, 0.004026621580123901, 0.004145979881286621, 0.004265338182449341, 0.0043846964836120605, 0.00450405478477478, 0.0046234130859375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 6.0, 10.0, 13.0, 19.0, 17.0, 26.0, 29.0, 28.0, 32.0, 41.0, 48.0, 56.0, 40.0, 60.0, 54.0, 45.0, 60.0, 46.0, 60.0, 54.0, 41.0, 30.0, 35.0, 27.0, 28.0, 23.0, 18.0, 13.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.445613861083984, -10.11830997467041, -9.791006088256836, -9.463703155517578, -9.136399269104004, -8.80909538269043, -8.481791496276855, -8.154487609863281, -7.827184200286865, -7.499880313873291, -7.172576904296875, -6.845273017883301, -6.517969131469727, -6.1906657218933105, -5.863361835479736, -5.53605842590332, -5.208754539489746, -4.881450653076172, -4.554147243499756, -4.226843357086182, -3.8995397090911865, -3.5722360610961914, -3.244932174682617, -2.917628526687622, -2.590324878692627, -2.263021230697632, -1.9357174634933472, -1.6084136962890625, -1.2811100482940674, -0.9538064002990723, -0.6265026330947876, -0.29919886589050293, 0.028104782104492188, 0.3554084897041321, 0.682712197303772, 1.0100159645080566, 1.3373196125030518, 1.6646232604980469, 1.9919270277023315, 2.319230794906616, 2.6465344429016113, 2.9738380908966064, 3.3011417388916016, 3.628445625305176, 3.955749273300171, 4.283052921295166, 4.61035680770874, 4.937660217285156, 5.2649641036987305, 5.592267990112305, 5.919571399688721, 6.246875286102295, 6.574178695678711, 6.901482582092285, 7.228786468505859, 7.556090354919434, 7.88339376449585, 8.210697174072266, 8.53800106048584, 8.865304946899414, 9.192608833312988, 9.519912719726562, 9.84721565246582, 10.174519538879395, 10.501823425292969]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 8.0, 10.0, 11.0, 10.0, 11.0, 21.0, 22.0, 21.0, 21.0, 18.0, 24.0, 28.0, 29.0, 26.0, 31.0, 30.0, 46.0, 46.0, 37.0, 38.0, 39.0, 49.0, 33.0, 51.0, 31.0, 31.0, 34.0, 29.0, 26.0, 17.0, 18.0, 16.0, 30.0, 15.0, 13.0, 16.0, 9.0, 7.0, 10.0, 9.0, 11.0, 7.0, 1.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.089089393615723, -8.806999206542969, -8.524909019470215, -8.242818832397461, -7.960728645324707, -7.678638458251953, -7.396548748016357, -7.1144585609436035, -6.83236837387085, -6.550278186798096, -6.268187999725342, -5.986097812652588, -5.704008102416992, -5.421917915344238, -5.139827728271484, -4.8577375411987305, -4.575647354125977, -4.293557167053223, -4.011466979980469, -3.729377031326294, -3.44728684425354, -3.165196657180786, -2.8831067085266113, -2.6010165214538574, -2.3189263343811035, -2.0368361473083496, -1.7547460794448853, -1.472656011581421, -1.190565824508667, -0.9084756374359131, -0.6263855695724487, -0.3442955017089844, -0.062206268310546875, 0.21988385915756226, 0.5019739866256714, 0.7840641140937805, 1.0661542415618896, 1.3482444286346436, 1.630334496498108, 1.9124245643615723, 2.194514751434326, 2.47660493850708, 2.758695125579834, 3.040785074234009, 3.3228752613067627, 3.6049654483795166, 3.8870553970336914, 4.169145584106445, 4.451235771179199, 4.733325958251953, 5.015416145324707, 5.297506332397461, 5.579596519470215, 5.861686706542969, 6.1437764167785645, 6.425866603851318, 6.707956790924072, 6.990046977996826, 7.27213716506958, 7.554227352142334, 7.83631706237793, 8.118407249450684, 8.400497436523438, 8.682587623596191, 8.964677810668945]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 9.0, 9.0, 25.0, 31.0, 61.0, 80.0, 105.0, 180.0, 258.0, 424.0, 660.0, 1009.0, 1558.0, 2350.0, 3797.0, 5867.0, 9411.0, 14385.0, 22525.0, 34655.0, 54589.0, 81816.0, 115485.0, 144125.0, 149831.0, 128896.0, 94721.0, 64368.0, 41838.0, 26979.0, 17522.0, 11039.0, 7166.0, 4567.0, 2972.0, 1845.0, 1209.0, 737.0, 517.0, 309.0, 212.0, 136.0, 88.0, 71.0, 40.0, 27.0, 25.0, 15.0, 4.0, 4.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.03125, -10.666015625, -10.30078125, -9.935546875, -9.5703125, -9.205078125, -8.83984375, -8.474609375, -8.109375, -7.744140625, -7.37890625, -7.013671875, -6.6484375, -6.283203125, -5.91796875, -5.552734375, -5.1875, -4.822265625, -4.45703125, -4.091796875, -3.7265625, -3.361328125, -2.99609375, -2.630859375, -2.265625, -1.900390625, -1.53515625, -1.169921875, -0.8046875, -0.439453125, -0.07421875, 0.291015625, 0.65625, 1.021484375, 1.38671875, 1.751953125, 2.1171875, 2.482421875, 2.84765625, 3.212890625, 3.578125, 3.943359375, 4.30859375, 4.673828125, 5.0390625, 5.404296875, 5.76953125, 6.134765625, 6.5, 6.865234375, 7.23046875, 7.595703125, 7.9609375, 8.326171875, 8.69140625, 9.056640625, 9.421875, 9.787109375, 10.15234375, 10.517578125, 10.8828125, 11.248046875, 11.61328125, 11.978515625, 12.34375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 4.0, 4.0, 6.0, 7.0, 12.0, 19.0, 6.0, 13.0, 15.0, 22.0, 20.0, 24.0, 25.0, 29.0, 27.0, 31.0, 37.0, 30.0, 46.0, 36.0, 58.0, 36.0, 39.0, 38.0, 39.0, 36.0, 34.0, 41.0, 24.0, 28.0, 30.0, 19.0, 24.0, 20.0, 17.0, 13.0, 24.0, 13.0, 8.0, 11.0, 6.0, 8.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.71875, -8.446044921875, -8.17333984375, -7.900634765625, -7.6279296875, -7.355224609375, -7.08251953125, -6.809814453125, -6.537109375, -6.264404296875, -5.99169921875, -5.718994140625, -5.4462890625, -5.173583984375, -4.90087890625, -4.628173828125, -4.35546875, -4.082763671875, -3.81005859375, -3.537353515625, -3.2646484375, -2.991943359375, -2.71923828125, -2.446533203125, -2.173828125, -1.901123046875, -1.62841796875, -1.355712890625, -1.0830078125, -0.810302734375, -0.53759765625, -0.264892578125, 0.0078125, 0.280517578125, 0.55322265625, 0.825927734375, 1.0986328125, 1.371337890625, 1.64404296875, 1.916748046875, 2.189453125, 2.462158203125, 2.73486328125, 3.007568359375, 3.2802734375, 3.552978515625, 3.82568359375, 4.098388671875, 4.37109375, 4.643798828125, 4.91650390625, 5.189208984375, 5.4619140625, 5.734619140625, 6.00732421875, 6.280029296875, 6.552734375, 6.825439453125, 7.09814453125, 7.370849609375, 7.6435546875, 7.916259765625, 8.18896484375, 8.461669921875, 8.734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 8.0, 1.0, 9.0, 7.0, 18.0, 23.0, 37.0, 67.0, 86.0, 128.0, 199.0, 322.0, 489.0, 828.0, 1181.0, 1849.0, 2787.0, 4312.0, 6422.0, 9919.0, 15361.0, 23342.0, 35383.0, 53112.0, 77599.0, 105653.0, 130395.0, 139613.0, 126036.0, 100221.0, 71071.0, 48497.0, 32299.0, 21171.0, 13738.0, 9141.0, 6086.0, 3896.0, 2486.0, 1666.0, 1104.0, 672.0, 497.0, 279.0, 193.0, 128.0, 77.0, 58.0, 34.0, 35.0, 11.0, 11.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-10.640625, -10.3016357421875, -9.962646484375, -9.6236572265625, -9.28466796875, -8.9456787109375, -8.606689453125, -8.2677001953125, -7.9287109375, -7.5897216796875, -7.250732421875, -6.9117431640625, -6.57275390625, -6.2337646484375, -5.894775390625, -5.5557861328125, -5.216796875, -4.8778076171875, -4.538818359375, -4.1998291015625, -3.86083984375, -3.5218505859375, -3.182861328125, -2.8438720703125, -2.5048828125, -2.1658935546875, -1.826904296875, -1.4879150390625, -1.14892578125, -0.8099365234375, -0.470947265625, -0.1319580078125, 0.20703125, 0.5460205078125, 0.885009765625, 1.2239990234375, 1.56298828125, 1.9019775390625, 2.240966796875, 2.5799560546875, 2.9189453125, 3.2579345703125, 3.596923828125, 3.9359130859375, 4.27490234375, 4.6138916015625, 4.952880859375, 5.2918701171875, 5.630859375, 5.9698486328125, 6.308837890625, 6.6478271484375, 6.98681640625, 7.3258056640625, 7.664794921875, 8.0037841796875, 8.3427734375, 8.6817626953125, 9.020751953125, 9.3597412109375, 9.69873046875, 10.0377197265625, 10.376708984375, 10.7156982421875, 11.0546875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 3.0, 9.0, 10.0, 7.0, 7.0, 15.0, 20.0, 18.0, 15.0, 23.0, 31.0, 33.0, 40.0, 35.0, 36.0, 46.0, 46.0, 32.0, 52.0, 38.0, 51.0, 34.0, 32.0, 43.0, 43.0, 43.0, 35.0, 27.0, 32.0, 23.0, 25.0, 16.0, 17.0, 17.0, 12.0, 5.0, 4.0, 5.0, 8.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6875, -5.4935302734375, -5.299560546875, -5.1055908203125, -4.91162109375, -4.7176513671875, -4.523681640625, -4.3297119140625, -4.1357421875, -3.9417724609375, -3.747802734375, -3.5538330078125, -3.35986328125, -3.1658935546875, -2.971923828125, -2.7779541015625, -2.583984375, -2.3900146484375, -2.196044921875, -2.0020751953125, -1.80810546875, -1.6141357421875, -1.420166015625, -1.2261962890625, -1.0322265625, -0.8382568359375, -0.644287109375, -0.4503173828125, -0.25634765625, -0.0623779296875, 0.131591796875, 0.3255615234375, 0.51953125, 0.7135009765625, 0.907470703125, 1.1014404296875, 1.29541015625, 1.4893798828125, 1.683349609375, 1.8773193359375, 2.0712890625, 2.2652587890625, 2.459228515625, 2.6531982421875, 2.84716796875, 3.0411376953125, 3.235107421875, 3.4290771484375, 3.623046875, 3.8170166015625, 4.010986328125, 4.2049560546875, 4.39892578125, 4.5928955078125, 4.786865234375, 4.9808349609375, 5.1748046875, 5.3687744140625, 5.562744140625, 5.7567138671875, 5.95068359375, 6.1446533203125, 6.338623046875, 6.5325927734375, 6.7265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 5.0, 10.0, 11.0, 23.0, 42.0, 55.0, 97.0, 122.0, 157.0, 259.0, 407.0, 653.0, 1034.0, 1614.0, 2752.0, 4840.0, 8831.0, 17123.0, 34042.0, 69381.0, 131643.0, 202483.0, 219931.0, 163904.0, 92699.0, 46391.0, 22936.0, 11732.0, 6266.0, 3579.0, 2078.0, 1175.0, 777.0, 525.0, 355.0, 221.0, 154.0, 68.0, 57.0, 48.0, 27.0, 10.0, 7.0, 6.0, 9.0, 4.0, 5.0, 3.0, 1.0, 3.0, 2.0], "bins": [-2.21875, -2.1557464599609375, -2.092742919921875, -2.0297393798828125, -1.96673583984375, -1.9037322998046875, -1.840728759765625, -1.7777252197265625, -1.7147216796875, -1.6517181396484375, -1.588714599609375, -1.5257110595703125, -1.46270751953125, -1.3997039794921875, -1.336700439453125, -1.2736968994140625, -1.210693359375, -1.1476898193359375, -1.084686279296875, -1.0216827392578125, -0.95867919921875, -0.8956756591796875, -0.832672119140625, -0.7696685791015625, -0.7066650390625, -0.6436614990234375, -0.580657958984375, -0.5176544189453125, -0.45465087890625, -0.3916473388671875, -0.328643798828125, -0.2656402587890625, -0.20263671875, -0.1396331787109375, -0.076629638671875, -0.0136260986328125, 0.04937744140625, 0.1123809814453125, 0.175384521484375, 0.2383880615234375, 0.3013916015625, 0.3643951416015625, 0.427398681640625, 0.4904022216796875, 0.55340576171875, 0.6164093017578125, 0.679412841796875, 0.7424163818359375, 0.805419921875, 0.8684234619140625, 0.931427001953125, 0.9944305419921875, 1.05743408203125, 1.1204376220703125, 1.183441162109375, 1.2464447021484375, 1.3094482421875, 1.3724517822265625, 1.435455322265625, 1.4984588623046875, 1.56146240234375, 1.6244659423828125, 1.687469482421875, 1.7504730224609375, 1.8134765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 10.0, 16.0, 19.0, 25.0, 31.0, 41.0, 65.0, 71.0, 85.0, 98.0, 86.0, 93.0, 90.0, 71.0, 50.0, 50.0, 27.0, 23.0, 11.0, 11.0, 13.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002875328063964844, -0.0002783164381980896, -0.0002691000699996948, -0.00025988370180130005, -0.0002506673336029053, -0.0002414509654045105, -0.00023223459720611572, -0.00022301822900772095, -0.00021380186080932617, -0.0002045854926109314, -0.00019536912441253662, -0.00018615275621414185, -0.00017693638801574707, -0.0001677200198173523, -0.00015850365161895752, -0.00014928728342056274, -0.00014007091522216797, -0.0001308545470237732, -0.00012163817882537842, -0.00011242181062698364, -0.00010320544242858887, -9.398907423019409e-05, -8.477270603179932e-05, -7.555633783340454e-05, -6.633996963500977e-05, -5.712360143661499e-05, -4.7907233238220215e-05, -3.869086503982544e-05, -2.9474496841430664e-05, -2.025812864303589e-05, -1.1041760444641113e-05, -1.8253922462463379e-06, 7.3909759521484375e-06, 1.6607344150543213e-05, 2.5823712348937988e-05, 3.5040080547332764e-05, 4.425644874572754e-05, 5.3472816944122314e-05, 6.268918514251709e-05, 7.190555334091187e-05, 8.112192153930664e-05, 9.033828973770142e-05, 9.955465793609619e-05, 0.00010877102613449097, 0.00011798739433288574, 0.00012720376253128052, 0.0001364201307296753, 0.00014563649892807007, 0.00015485286712646484, 0.00016406923532485962, 0.0001732856035232544, 0.00018250197172164917, 0.00019171833992004395, 0.00020093470811843872, 0.0002101510763168335, 0.00021936744451522827, 0.00022858381271362305, 0.00023780018091201782, 0.0002470165491104126, 0.0002562329173088074, 0.00026544928550720215, 0.0002746656537055969, 0.0002838820219039917, 0.0002930983901023865, 0.00030231475830078125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 9.0, 7.0, 8.0, 15.0, 18.0, 48.0, 66.0, 81.0, 124.0, 178.0, 269.0, 382.0, 526.0, 825.0, 1176.0, 1888.0, 2935.0, 4574.0, 7180.0, 11945.0, 19926.0, 35004.0, 61442.0, 102364.0, 152330.0, 181813.0, 165386.0, 119485.0, 74113.0, 42124.0, 24278.0, 14210.0, 8737.0, 5228.0, 3318.0, 2094.0, 1479.0, 916.0, 659.0, 399.0, 317.0, 215.0, 155.0, 103.0, 57.0, 46.0, 38.0, 17.0, 13.0, 14.0, 7.0, 10.0, 4.0, 3.0, 1.0, 1.0], "bins": [-1.7119140625, -1.66107177734375, -1.6102294921875, -1.55938720703125, -1.508544921875, -1.45770263671875, -1.4068603515625, -1.35601806640625, -1.30517578125, -1.25433349609375, -1.2034912109375, -1.15264892578125, -1.101806640625, -1.05096435546875, -1.0001220703125, -0.94927978515625, -0.8984375, -0.84759521484375, -0.7967529296875, -0.74591064453125, -0.695068359375, -0.64422607421875, -0.5933837890625, -0.54254150390625, -0.49169921875, -0.44085693359375, -0.3900146484375, -0.33917236328125, -0.288330078125, -0.23748779296875, -0.1866455078125, -0.13580322265625, -0.0849609375, -0.03411865234375, 0.0167236328125, 0.06756591796875, 0.118408203125, 0.16925048828125, 0.2200927734375, 0.27093505859375, 0.32177734375, 0.37261962890625, 0.4234619140625, 0.47430419921875, 0.525146484375, 0.57598876953125, 0.6268310546875, 0.67767333984375, 0.728515625, 0.77935791015625, 0.8302001953125, 0.88104248046875, 0.931884765625, 0.98272705078125, 1.0335693359375, 1.08441162109375, 1.13525390625, 1.18609619140625, 1.2369384765625, 1.28778076171875, 1.338623046875, 1.38946533203125, 1.4403076171875, 1.49114990234375, 1.5419921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 2.0, 6.0, 4.0, 7.0, 7.0, 13.0, 13.0, 15.0, 17.0, 15.0, 19.0, 22.0, 29.0, 48.0, 33.0, 51.0, 54.0, 51.0, 56.0, 62.0, 59.0, 58.0, 49.0, 41.0, 54.0, 32.0, 37.0, 26.0, 25.0, 22.0, 16.0, 6.0, 11.0, 5.0, 9.0, 6.0, 7.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.64208984375, -0.6224136352539062, -0.6027374267578125, -0.5830612182617188, -0.563385009765625, -0.5437088012695312, -0.5240325927734375, -0.5043563842773438, -0.48468017578125, -0.46500396728515625, -0.4453277587890625, -0.42565155029296875, -0.405975341796875, -0.38629913330078125, -0.3666229248046875, -0.34694671630859375, -0.3272705078125, -0.30759429931640625, -0.2879180908203125, -0.26824188232421875, -0.248565673828125, -0.22888946533203125, -0.2092132568359375, -0.18953704833984375, -0.16986083984375, -0.15018463134765625, -0.1305084228515625, -0.11083221435546875, -0.091156005859375, -0.07147979736328125, -0.0518035888671875, -0.03212738037109375, -0.012451171875, 0.00722503662109375, 0.0269012451171875, 0.04657745361328125, 0.066253662109375, 0.08592987060546875, 0.1056060791015625, 0.12528228759765625, 0.14495849609375, 0.16463470458984375, 0.1843109130859375, 0.20398712158203125, 0.223663330078125, 0.24333953857421875, 0.2630157470703125, 0.28269195556640625, 0.3023681640625, 0.32204437255859375, 0.3417205810546875, 0.36139678955078125, 0.381072998046875, 0.40074920654296875, 0.4204254150390625, 0.44010162353515625, 0.45977783203125, 0.47945404052734375, 0.4991302490234375, 0.5188064575195312, 0.538482666015625, 0.5581588745117188, 0.5778350830078125, 0.5975112915039062, 0.6171875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 5.0, 7.0, 11.0, 12.0, 5.0, 13.0, 11.0, 25.0, 30.0, 30.0, 29.0, 39.0, 51.0, 49.0, 62.0, 56.0, 65.0, 74.0, 69.0, 43.0, 44.0, 52.0, 40.0, 40.0, 27.0, 28.0, 23.0, 19.0, 16.0, 10.0, 7.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.640881538391113, -12.287972450256348, -11.935062408447266, -11.5821533203125, -11.229244232177734, -10.876335144042969, -10.523426055908203, -10.170516014099121, -9.817606925964355, -9.46469783782959, -9.111787796020508, -8.758878707885742, -8.405969619750977, -8.053060531616211, -7.700150966644287, -7.347241401672363, -6.994332313537598, -6.641423225402832, -6.288513660430908, -5.935604095458984, -5.582695007324219, -5.229785919189453, -4.876876354217529, -4.5239667892456055, -4.17105770111084, -3.818148374557495, -3.4652390480041504, -3.1123297214508057, -2.759420394897461, -2.406511068344116, -2.0536017417907715, -1.7006924152374268, -1.347783088684082, -0.9948737621307373, -0.6419644355773926, -0.28905510902404785, 0.06385421752929688, 0.4167635440826416, 0.7696728706359863, 1.122582197189331, 1.4754915237426758, 1.8284008502960205, 2.1813101768493652, 2.53421950340271, 2.8871288299560547, 3.2400381565093994, 3.592947483062744, 3.945856809616089, 4.298766136169434, 4.651675224304199, 5.004584789276123, 5.357494354248047, 5.7104034423828125, 6.063312530517578, 6.416222095489502, 6.769131660461426, 7.122040748596191, 7.474949836730957, 7.827859401702881, 8.180768966674805, 8.53367805480957, 8.886587142944336, 9.239496231079102, 9.592406272888184, 9.94531536102295]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 6.0, 7.0, 6.0, 9.0, 8.0, 17.0, 14.0, 16.0, 16.0, 31.0, 28.0, 26.0, 52.0, 36.0, 34.0, 30.0, 39.0, 40.0, 50.0, 59.0, 45.0, 30.0, 51.0, 27.0, 33.0, 40.0, 33.0, 23.0, 24.0, 20.0, 25.0, 16.0, 13.0, 23.0, 12.0, 10.0, 9.0, 7.0, 8.0, 5.0, 7.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.428844451904297, -9.131349563598633, -8.833853721618652, -8.536358833312988, -8.238862991333008, -7.941368103027344, -7.64387321472168, -7.346377849578857, -7.048882484436035, -6.751387119293213, -6.453891754150391, -6.156396865844727, -5.858901500701904, -5.561406135559082, -5.263911247253418, -4.966415882110596, -4.668920516967773, -4.371425151824951, -4.073929786682129, -3.776434898376465, -3.4789395332336426, -3.1814441680908203, -2.883949041366577, -2.586453914642334, -2.2889585494995117, -1.991463303565979, -1.6939680576324463, -1.3964728116989136, -1.0989775657653809, -0.8014823198318481, -0.5039870738983154, -0.20649194717407227, 0.0910024642944336, 0.3884977102279663, 0.685992956161499, 0.9834882020950317, 1.2809834480285645, 1.5784786939620972, 1.8759739398956299, 2.173469066619873, 2.4709644317626953, 2.7684597969055176, 3.0659549236297607, 3.363450050354004, 3.660945415496826, 3.9584407806396484, 4.2559356689453125, 4.553431034088135, 4.850926399230957, 5.148421764373779, 5.445917129516602, 5.743412017822266, 6.040907382965088, 6.33840274810791, 6.635897636413574, 6.9333930015563965, 7.230888366699219, 7.528383731842041, 7.825879096984863, 8.123373985290527, 8.420869827270508, 8.718364715576172, 9.015859603881836, 9.3133544921875, 9.61085033416748]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 13.0, 11.0, 15.0, 29.0, 34.0, 60.0, 92.0, 170.0, 247.0, 433.0, 704.0, 1153.0, 1990.0, 3378.0, 5428.0, 9450.0, 16372.0, 29198.0, 52297.0, 96276.0, 182835.0, 361091.0, 681826.0, 968122.0, 823571.0, 463425.0, 230169.0, 118870.0, 63318.0, 35161.0, 20117.0, 11588.0, 6715.0, 3974.0, 2417.0, 1435.0, 904.0, 569.0, 333.0, 178.0, 121.0, 66.0, 50.0, 28.0, 23.0, 13.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-13.015625, -12.6405029296875, -12.265380859375, -11.8902587890625, -11.51513671875, -11.1400146484375, -10.764892578125, -10.3897705078125, -10.0146484375, -9.6395263671875, -9.264404296875, -8.8892822265625, -8.51416015625, -8.1390380859375, -7.763916015625, -7.3887939453125, -7.013671875, -6.6385498046875, -6.263427734375, -5.8883056640625, -5.51318359375, -5.1380615234375, -4.762939453125, -4.3878173828125, -4.0126953125, -3.6375732421875, -3.262451171875, -2.8873291015625, -2.51220703125, -2.1370849609375, -1.761962890625, -1.3868408203125, -1.01171875, -0.6365966796875, -0.261474609375, 0.1136474609375, 0.48876953125, 0.8638916015625, 1.239013671875, 1.6141357421875, 1.9892578125, 2.3643798828125, 2.739501953125, 3.1146240234375, 3.48974609375, 3.8648681640625, 4.239990234375, 4.6151123046875, 4.990234375, 5.3653564453125, 5.740478515625, 6.1156005859375, 6.49072265625, 6.8658447265625, 7.240966796875, 7.6160888671875, 7.9912109375, 8.3663330078125, 8.741455078125, 9.1165771484375, 9.49169921875, 9.8668212890625, 10.241943359375, 10.6170654296875, 10.9921875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 3.0, 4.0, 2.0, 9.0, 8.0, 9.0, 11.0, 19.0, 17.0, 25.0, 21.0, 26.0, 38.0, 36.0, 34.0, 39.0, 46.0, 50.0, 35.0, 63.0, 52.0, 47.0, 39.0, 33.0, 43.0, 30.0, 37.0, 30.0, 44.0, 22.0, 18.0, 13.0, 15.0, 12.0, 13.0, 6.0, 3.0, 12.0, 9.0, 7.0, 8.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.734375, -8.47320556640625, -8.2120361328125, -7.95086669921875, -7.689697265625, -7.42852783203125, -7.1673583984375, -6.90618896484375, -6.64501953125, -6.38385009765625, -6.1226806640625, -5.86151123046875, -5.600341796875, -5.33917236328125, -5.0780029296875, -4.81683349609375, -4.5556640625, -4.29449462890625, -4.0333251953125, -3.77215576171875, -3.510986328125, -3.24981689453125, -2.9886474609375, -2.72747802734375, -2.46630859375, -2.20513916015625, -1.9439697265625, -1.68280029296875, -1.421630859375, -1.16046142578125, -0.8992919921875, -0.63812255859375, -0.376953125, -0.11578369140625, 0.1453857421875, 0.40655517578125, 0.667724609375, 0.92889404296875, 1.1900634765625, 1.45123291015625, 1.71240234375, 1.97357177734375, 2.2347412109375, 2.49591064453125, 2.757080078125, 3.01824951171875, 3.2794189453125, 3.54058837890625, 3.8017578125, 4.06292724609375, 4.3240966796875, 4.58526611328125, 4.846435546875, 5.10760498046875, 5.3687744140625, 5.62994384765625, 5.89111328125, 6.15228271484375, 6.4134521484375, 6.67462158203125, 6.935791015625, 7.19696044921875, 7.4581298828125, 7.71929931640625, 7.98046875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 15.0, 16.0, 31.0, 46.0, 65.0, 115.0, 149.0, 281.0, 441.0, 713.0, 1108.0, 1733.0, 2999.0, 5026.0, 8741.0, 15143.0, 26618.0, 46346.0, 82002.0, 141731.0, 242185.0, 390264.0, 580143.0, 722401.0, 671184.0, 491437.0, 314759.0, 190118.0, 109934.0, 63621.0, 36223.0, 20175.0, 11718.0, 6702.0, 3959.0, 2344.0, 1402.0, 883.0, 552.0, 379.0, 236.0, 120.0, 99.0, 43.0, 35.0, 16.0, 15.0, 9.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.328125, -9.0147705078125, -8.701416015625, -8.3880615234375, -8.07470703125, -7.7613525390625, -7.447998046875, -7.1346435546875, -6.8212890625, -6.5079345703125, -6.194580078125, -5.8812255859375, -5.56787109375, -5.2545166015625, -4.941162109375, -4.6278076171875, -4.314453125, -4.0010986328125, -3.687744140625, -3.3743896484375, -3.06103515625, -2.7476806640625, -2.434326171875, -2.1209716796875, -1.8076171875, -1.4942626953125, -1.180908203125, -0.8675537109375, -0.55419921875, -0.2408447265625, 0.072509765625, 0.3858642578125, 0.69921875, 1.0125732421875, 1.325927734375, 1.6392822265625, 1.95263671875, 2.2659912109375, 2.579345703125, 2.8927001953125, 3.2060546875, 3.5194091796875, 3.832763671875, 4.1461181640625, 4.45947265625, 4.7728271484375, 5.086181640625, 5.3995361328125, 5.712890625, 6.0262451171875, 6.339599609375, 6.6529541015625, 6.96630859375, 7.2796630859375, 7.593017578125, 7.9063720703125, 8.2197265625, 8.5330810546875, 8.846435546875, 9.1597900390625, 9.47314453125, 9.7864990234375, 10.099853515625, 10.4132080078125, 10.7265625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 10.0, 10.0, 6.0, 14.0, 11.0, 13.0, 29.0, 31.0, 39.0, 51.0, 63.0, 76.0, 88.0, 117.0, 156.0, 180.0, 207.0, 250.0, 222.0, 275.0, 272.0, 276.0, 291.0, 243.0, 207.0, 162.0, 157.0, 123.0, 129.0, 96.0, 59.0, 53.0, 28.0, 23.0, 26.0, 23.0, 16.0, 15.0, 13.0, 5.0, 8.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.51171875, -4.36480712890625, -4.2178955078125, -4.07098388671875, -3.924072265625, -3.77716064453125, -3.6302490234375, -3.48333740234375, -3.33642578125, -3.18951416015625, -3.0426025390625, -2.89569091796875, -2.748779296875, -2.60186767578125, -2.4549560546875, -2.30804443359375, -2.1611328125, -2.01422119140625, -1.8673095703125, -1.72039794921875, -1.573486328125, -1.42657470703125, -1.2796630859375, -1.13275146484375, -0.98583984375, -0.83892822265625, -0.6920166015625, -0.54510498046875, -0.398193359375, -0.25128173828125, -0.1043701171875, 0.04254150390625, 0.189453125, 0.33636474609375, 0.4832763671875, 0.63018798828125, 0.777099609375, 0.92401123046875, 1.0709228515625, 1.21783447265625, 1.36474609375, 1.51165771484375, 1.6585693359375, 1.80548095703125, 1.952392578125, 2.09930419921875, 2.2462158203125, 2.39312744140625, 2.5400390625, 2.68695068359375, 2.8338623046875, 2.98077392578125, 3.127685546875, 3.27459716796875, 3.4215087890625, 3.56842041015625, 3.71533203125, 3.86224365234375, 4.0091552734375, 4.15606689453125, 4.302978515625, 4.44989013671875, 4.5968017578125, 4.74371337890625, 4.890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 6.0, 9.0, 13.0, 7.0, 17.0, 15.0, 19.0, 23.0, 17.0, 25.0, 27.0, 41.0, 49.0, 46.0, 50.0, 47.0, 57.0, 52.0, 52.0, 55.0, 43.0, 48.0, 32.0, 39.0, 28.0, 35.0, 23.0, 25.0, 19.0, 16.0, 8.0, 16.0, 5.0, 7.0, 7.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.887330055236816, -9.613859176635742, -9.340387344360352, -9.066916465759277, -8.793445587158203, -8.519974708557129, -8.246503829956055, -7.973031997680664, -7.69956111907959, -7.426090240478516, -7.152618885040283, -6.879147529602051, -6.605676651000977, -6.332205772399902, -6.05873441696167, -5.7852630615234375, -5.511792182922363, -5.238321304321289, -4.964849948883057, -4.691378593444824, -4.41790771484375, -4.144436836242676, -3.8709654808044434, -3.59749436378479, -3.3240232467651367, -3.0505521297454834, -2.77708101272583, -2.5036098957061768, -2.2301387786865234, -1.9566676616668701, -1.6831965446472168, -1.4097254276275635, -1.1362547874450684, -0.862783670425415, -0.5893125534057617, -0.3158414363861084, -0.04237031936645508, 0.23110079765319824, 0.5045719146728516, 0.7780430316925049, 1.0515141487121582, 1.3249852657318115, 1.5984563827514648, 1.8719274997711182, 2.1453986167907715, 2.418869733810425, 2.692340850830078, 2.9658119678497314, 3.2392830848693848, 3.512754201889038, 3.7862253189086914, 4.059696197509766, 4.333167552947998, 4.6066389083862305, 4.880109786987305, 5.153580665588379, 5.427052021026611, 5.700523376464844, 5.973994255065918, 6.247465133666992, 6.520936489105225, 6.794407844543457, 7.067878723144531, 7.3413496017456055, 7.614820957183838]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 7.0, 14.0, 18.0, 10.0, 16.0, 29.0, 17.0, 22.0, 29.0, 31.0, 29.0, 30.0, 46.0, 37.0, 33.0, 55.0, 37.0, 44.0, 34.0, 45.0, 40.0, 40.0, 40.0, 37.0, 31.0, 31.0, 20.0, 22.0, 18.0, 26.0, 18.0, 12.0, 12.0, 8.0, 8.0, 8.0, 10.0, 6.0, 6.0, 4.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-9.298376083374023, -9.030542373657227, -8.762709617614746, -8.49487590789795, -8.227042198181152, -7.959208965301514, -7.691375732421875, -7.423542022705078, -7.1557087898254395, -6.887875556945801, -6.620041847229004, -6.352208614349365, -6.084375381469727, -5.81654167175293, -5.548708438873291, -5.280875205993652, -5.0130414962768555, -4.745208263397217, -4.47737455368042, -4.209541320800781, -3.9417078495025635, -3.6738743782043457, -3.406041145324707, -3.1382076740264893, -2.8703742027282715, -2.6025407314300537, -2.334707260131836, -2.0668740272521973, -1.7990405559539795, -1.5312070846557617, -1.2633737325668335, -0.9955403804779053, -0.7277059555053711, -0.4598725438117981, -0.1920391321182251, 0.0757942795753479, 0.3436276912689209, 0.6114611625671387, 0.8792945146560669, 1.1471278667449951, 1.414961338043213, 1.6827948093414307, 1.9506281614303589, 2.218461513519287, 2.486294984817505, 2.7541284561157227, 3.0219616889953613, 3.289795160293579, 3.557628631591797, 3.8254621028900146, 4.093295574188232, 4.361128807067871, 4.628962516784668, 4.896795749664307, 5.164628982543945, 5.432462692260742, 5.700295925140381, 5.9681291580200195, 6.235962867736816, 6.503796100616455, 6.771629333496094, 7.039463043212891, 7.307296276092529, 7.575129508972168, 7.842963218688965]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 13.0, 17.0, 18.0, 36.0, 43.0, 96.0, 121.0, 181.0, 264.0, 392.0, 621.0, 942.0, 1488.0, 2115.0, 3298.0, 5018.0, 7765.0, 11994.0, 18788.0, 30982.0, 51521.0, 91280.0, 200207.0, 331739.0, 121776.0, 64532.0, 38387.0, 23465.0, 14802.0, 9343.0, 6026.0, 3893.0, 2595.0, 1595.0, 1052.0, 716.0, 472.0, 356.0, 189.0, 144.0, 95.0, 61.0, 41.0, 25.0, 18.0, 10.0, 10.0, 3.0, 6.0, 4.0, 2.0, 4.0], "bins": [-4.796875, -4.66064453125, -4.5244140625, -4.38818359375, -4.251953125, -4.11572265625, -3.9794921875, -3.84326171875, -3.70703125, -3.57080078125, -3.4345703125, -3.29833984375, -3.162109375, -3.02587890625, -2.8896484375, -2.75341796875, -2.6171875, -2.48095703125, -2.3447265625, -2.20849609375, -2.072265625, -1.93603515625, -1.7998046875, -1.66357421875, -1.52734375, -1.39111328125, -1.2548828125, -1.11865234375, -0.982421875, -0.84619140625, -0.7099609375, -0.57373046875, -0.4375, -0.30126953125, -0.1650390625, -0.02880859375, 0.107421875, 0.24365234375, 0.3798828125, 0.51611328125, 0.65234375, 0.78857421875, 0.9248046875, 1.06103515625, 1.197265625, 1.33349609375, 1.4697265625, 1.60595703125, 1.7421875, 1.87841796875, 2.0146484375, 2.15087890625, 2.287109375, 2.42333984375, 2.5595703125, 2.69580078125, 2.83203125, 2.96826171875, 3.1044921875, 3.24072265625, 3.376953125, 3.51318359375, 3.6494140625, 3.78564453125, 3.921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 8.0, 5.0, 10.0, 8.0, 16.0, 11.0, 13.0, 24.0, 19.0, 20.0, 36.0, 19.0, 36.0, 36.0, 32.0, 33.0, 37.0, 44.0, 46.0, 29.0, 45.0, 42.0, 34.0, 33.0, 32.0, 44.0, 34.0, 37.0, 31.0, 16.0, 22.0, 20.0, 16.0, 17.0, 22.0, 7.0, 14.0, 13.0, 8.0, 7.0, 4.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 4.0, 4.0], "bins": [-9.5, -9.232421875, -8.96484375, -8.697265625, -8.4296875, -8.162109375, -7.89453125, -7.626953125, -7.359375, -7.091796875, -6.82421875, -6.556640625, -6.2890625, -6.021484375, -5.75390625, -5.486328125, -5.21875, -4.951171875, -4.68359375, -4.416015625, -4.1484375, -3.880859375, -3.61328125, -3.345703125, -3.078125, -2.810546875, -2.54296875, -2.275390625, -2.0078125, -1.740234375, -1.47265625, -1.205078125, -0.9375, -0.669921875, -0.40234375, -0.134765625, 0.1328125, 0.400390625, 0.66796875, 0.935546875, 1.203125, 1.470703125, 1.73828125, 2.005859375, 2.2734375, 2.541015625, 2.80859375, 3.076171875, 3.34375, 3.611328125, 3.87890625, 4.146484375, 4.4140625, 4.681640625, 4.94921875, 5.216796875, 5.484375, 5.751953125, 6.01953125, 6.287109375, 6.5546875, 6.822265625, 7.08984375, 7.357421875, 7.625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [6.0, 6.0, 9.0, 16.0, 18.0, 28.0, 23.0, 36.0, 76.0, 93.0, 174.0, 206.0, 311.0, 451.0, 607.0, 1014.0, 1416.0, 2044.0, 3083.0, 4452.0, 6582.0, 9875.0, 14375.0, 21864.0, 33168.0, 51830.0, 89610.0, 192734.0, 322271.0, 112674.0, 62999.0, 38686.0, 25407.0, 17272.0, 11375.0, 7578.0, 5246.0, 3461.0, 2328.0, 1595.0, 1133.0, 791.0, 546.0, 360.0, 226.0, 149.0, 108.0, 97.0, 51.0, 43.0, 25.0, 16.0, 10.0, 3.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.46484375, -3.3419189453125, -3.218994140625, -3.0960693359375, -2.97314453125, -2.8502197265625, -2.727294921875, -2.6043701171875, -2.4814453125, -2.3585205078125, -2.235595703125, -2.1126708984375, -1.98974609375, -1.8668212890625, -1.743896484375, -1.6209716796875, -1.498046875, -1.3751220703125, -1.252197265625, -1.1292724609375, -1.00634765625, -0.8834228515625, -0.760498046875, -0.6375732421875, -0.5146484375, -0.3917236328125, -0.268798828125, -0.1458740234375, -0.02294921875, 0.0999755859375, 0.222900390625, 0.3458251953125, 0.46875, 0.5916748046875, 0.714599609375, 0.8375244140625, 0.96044921875, 1.0833740234375, 1.206298828125, 1.3292236328125, 1.4521484375, 1.5750732421875, 1.697998046875, 1.8209228515625, 1.94384765625, 2.0667724609375, 2.189697265625, 2.3126220703125, 2.435546875, 2.5584716796875, 2.681396484375, 2.8043212890625, 2.92724609375, 3.0501708984375, 3.173095703125, 3.2960205078125, 3.4189453125, 3.5418701171875, 3.664794921875, 3.7877197265625, 3.91064453125, 4.0335693359375, 4.156494140625, 4.2794189453125, 4.40234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 6.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 15.0, 10.0, 12.0, 10.0, 10.0, 10.0, 17.0, 19.0, 20.0, 23.0, 24.0, 27.0, 35.0, 34.0, 30.0, 37.0, 41.0, 40.0, 31.0, 44.0, 42.0, 48.0, 32.0, 42.0, 33.0, 34.0, 36.0, 25.0, 23.0, 19.0, 17.0, 14.0, 27.0, 16.0, 18.0, 16.0, 14.0, 9.0, 10.0, 6.0, 8.0, 7.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.5390625, -4.37847900390625, -4.2178955078125, -4.05731201171875, -3.896728515625, -3.73614501953125, -3.5755615234375, -3.41497802734375, -3.25439453125, -3.09381103515625, -2.9332275390625, -2.77264404296875, -2.612060546875, -2.45147705078125, -2.2908935546875, -2.13031005859375, -1.9697265625, -1.80914306640625, -1.6485595703125, -1.48797607421875, -1.327392578125, -1.16680908203125, -1.0062255859375, -0.84564208984375, -0.68505859375, -0.52447509765625, -0.3638916015625, -0.20330810546875, -0.042724609375, 0.11785888671875, 0.2784423828125, 0.43902587890625, 0.599609375, 0.76019287109375, 0.9207763671875, 1.08135986328125, 1.241943359375, 1.40252685546875, 1.5631103515625, 1.72369384765625, 1.88427734375, 2.04486083984375, 2.2054443359375, 2.36602783203125, 2.526611328125, 2.68719482421875, 2.8477783203125, 3.00836181640625, 3.1689453125, 3.32952880859375, 3.4901123046875, 3.65069580078125, 3.811279296875, 3.97186279296875, 4.1324462890625, 4.29302978515625, 4.45361328125, 4.61419677734375, 4.7747802734375, 4.93536376953125, 5.095947265625, 5.25653076171875, 5.4171142578125, 5.57769775390625, 5.73828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 6.0, 14.0, 27.0, 27.0, 37.0, 46.0, 85.0, 137.0, 210.0, 287.0, 410.0, 610.0, 821.0, 1270.0, 1933.0, 3051.0, 4750.0, 7495.0, 12428.0, 21014.0, 36954.0, 70381.0, 147509.0, 258034.0, 229065.0, 117362.0, 57022.0, 30637.0, 17724.0, 10500.0, 6531.0, 4245.0, 2671.0, 1777.0, 1100.0, 752.0, 545.0, 362.0, 234.0, 158.0, 95.0, 65.0, 58.0, 34.0, 31.0, 24.0, 6.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.010986328125, -0.010661721229553223, -0.010337114334106445, -0.010012507438659668, -0.00968790054321289, -0.009363293647766113, -0.009038686752319336, -0.008714079856872559, -0.008389472961425781, -0.008064866065979004, -0.0077402591705322266, -0.007415652275085449, -0.007091045379638672, -0.0067664384841918945, -0.006441831588745117, -0.00611722469329834, -0.0057926177978515625, -0.005468010902404785, -0.005143404006958008, -0.0048187971115112305, -0.004494190216064453, -0.004169583320617676, -0.0038449764251708984, -0.003520369529724121, -0.0031957626342773438, -0.0028711557388305664, -0.002546548843383789, -0.0022219419479370117, -0.0018973350524902344, -0.001572728157043457, -0.0012481212615966797, -0.0009235143661499023, -0.000598907470703125, -0.00027430057525634766, 5.030632019042969e-05, 0.00037491321563720703, 0.0006995201110839844, 0.0010241270065307617, 0.001348733901977539, 0.0016733407974243164, 0.0019979476928710938, 0.002322554588317871, 0.0026471614837646484, 0.0029717683792114258, 0.003296375274658203, 0.0036209821701049805, 0.003945589065551758, 0.004270195960998535, 0.0045948028564453125, 0.00491940975189209, 0.005244016647338867, 0.0055686235427856445, 0.005893230438232422, 0.006217837333679199, 0.0065424442291259766, 0.006867051124572754, 0.007191658020019531, 0.007516264915466309, 0.007840871810913086, 0.008165478706359863, 0.00849008560180664, 0.008814692497253418, 0.009139299392700195, 0.009463906288146973, 0.00978851318359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 10.0, 9.0, 5.0, 8.0, 17.0, 13.0, 13.0, 30.0, 23.0, 27.0, 30.0, 31.0, 33.0, 56.0, 39.0, 38.0, 66.0, 41.0, 43.0, 55.0, 53.0, 34.0, 52.0, 28.0, 37.0, 36.0, 29.0, 33.0, 23.0, 11.0, 12.0, 10.0, 9.0, 14.0, 10.0, 6.0, 6.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.602836608886719e-06, -5.403533577919006e-06, -5.204230546951294e-06, -5.0049275159835815e-06, -4.805624485015869e-06, -4.606321454048157e-06, -4.407018423080444e-06, -4.207715392112732e-06, -4.0084123611450195e-06, -3.809109330177307e-06, -3.6098062992095947e-06, -3.4105032682418823e-06, -3.21120023727417e-06, -3.0118972063064575e-06, -2.812594175338745e-06, -2.6132911443710327e-06, -2.4139881134033203e-06, -2.214685082435608e-06, -2.0153820514678955e-06, -1.816079020500183e-06, -1.6167759895324707e-06, -1.4174729585647583e-06, -1.218169927597046e-06, -1.0188668966293335e-06, -8.195638656616211e-07, -6.202608346939087e-07, -4.209578037261963e-07, -2.2165477275848389e-07, -2.2351741790771484e-08, 1.7695128917694092e-07, 3.762543201446533e-07, 5.755573511123657e-07, 7.748603820800781e-07, 9.741634130477905e-07, 1.173466444015503e-06, 1.3727694749832153e-06, 1.5720725059509277e-06, 1.7713755369186401e-06, 1.9706785678863525e-06, 2.169981598854065e-06, 2.3692846298217773e-06, 2.5685876607894897e-06, 2.767890691757202e-06, 2.9671937227249146e-06, 3.166496753692627e-06, 3.3657997846603394e-06, 3.5651028156280518e-06, 3.764405846595764e-06, 3.9637088775634766e-06, 4.163011908531189e-06, 4.362314939498901e-06, 4.561617970466614e-06, 4.760921001434326e-06, 4.9602240324020386e-06, 5.159527063369751e-06, 5.358830094337463e-06, 5.558133125305176e-06, 5.757436156272888e-06, 5.956739187240601e-06, 6.156042218208313e-06, 6.355345249176025e-06, 6.554648280143738e-06, 6.75395131111145e-06, 6.953254342079163e-06, 7.152557373046875e-06]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 6.0, 9.0, 10.0, 18.0, 26.0, 34.0, 50.0, 50.0, 102.0, 130.0, 188.0, 259.0, 385.0, 624.0, 945.0, 1446.0, 2187.0, 3483.0, 5771.0, 9853.0, 17214.0, 32632.0, 68872.0, 157478.0, 281628.0, 240342.0, 113743.0, 50995.0, 25186.0, 13949.0, 7854.0, 4667.0, 2959.0, 1859.0, 1199.0, 807.0, 516.0, 323.0, 238.0, 154.0, 115.0, 67.0, 61.0, 46.0, 27.0, 22.0, 17.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012420654296875, -0.01203012466430664, -0.011639595031738281, -0.011249065399169922, -0.010858535766601562, -0.010468006134033203, -0.010077476501464844, -0.009686946868896484, -0.009296417236328125, -0.008905887603759766, -0.008515357971191406, -0.008124828338623047, -0.0077342987060546875, -0.007343769073486328, -0.006953239440917969, -0.006562709808349609, -0.00617218017578125, -0.005781650543212891, -0.005391120910644531, -0.005000591278076172, -0.0046100616455078125, -0.004219532012939453, -0.0038290023803710938, -0.0034384727478027344, -0.003047943115234375, -0.0026574134826660156, -0.0022668838500976562, -0.0018763542175292969, -0.0014858245849609375, -0.0010952949523925781, -0.0007047653198242188, -0.0003142356872558594, 7.62939453125e-05, 0.0004668235778808594, 0.0008573532104492188, 0.0012478828430175781, 0.0016384124755859375, 0.002028942108154297, 0.0024194717407226562, 0.0028100013732910156, 0.003200531005859375, 0.0035910606384277344, 0.003981590270996094, 0.004372119903564453, 0.0047626495361328125, 0.005153179168701172, 0.005543708801269531, 0.005934238433837891, 0.00632476806640625, 0.006715297698974609, 0.007105827331542969, 0.007496356964111328, 0.007886886596679688, 0.008277416229248047, 0.008667945861816406, 0.009058475494384766, 0.009449005126953125, 0.009839534759521484, 0.010230064392089844, 0.010620594024658203, 0.011011123657226562, 0.011401653289794922, 0.011792182922363281, 0.01218271255493164, 0.0125732421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 13.0, 10.0, 13.0, 13.0, 7.0, 17.0, 26.0, 38.0, 39.0, 64.0, 91.0, 91.0, 86.0, 75.0, 90.0, 75.0, 56.0, 39.0, 27.0, 23.0, 16.0, 15.0, 11.0, 6.0, 6.0, 7.0, 8.0, 6.0, 4.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.004863739013671875, -0.004719376564025879, -0.004575014114379883, -0.004430651664733887, -0.004286289215087891, -0.0041419267654418945, -0.0039975643157958984, -0.0038532018661499023, -0.0037088394165039062, -0.00356447696685791, -0.003420114517211914, -0.003275752067565918, -0.003131389617919922, -0.0029870271682739258, -0.0028426647186279297, -0.0026983022689819336, -0.0025539398193359375, -0.0024095773696899414, -0.0022652149200439453, -0.0021208524703979492, -0.001976490020751953, -0.001832127571105957, -0.001687765121459961, -0.0015434026718139648, -0.0013990402221679688, -0.0012546777725219727, -0.0011103153228759766, -0.0009659528732299805, -0.0008215904235839844, -0.0006772279739379883, -0.0005328655242919922, -0.0003885030746459961, -0.000244140625, -9.97781753540039e-05, 4.458427429199219e-05, 0.00018894672393798828, 0.0003333091735839844, 0.00047767162322998047, 0.0006220340728759766, 0.0007663965225219727, 0.0009107589721679688, 0.0010551214218139648, 0.001199483871459961, 0.001343846321105957, 0.0014882087707519531, 0.0016325712203979492, 0.0017769336700439453, 0.0019212961196899414, 0.0020656585693359375, 0.0022100210189819336, 0.0023543834686279297, 0.0024987459182739258, 0.002643108367919922, 0.002787470817565918, 0.002931833267211914, 0.00307619571685791, 0.0032205581665039062, 0.0033649206161499023, 0.0035092830657958984, 0.0036536455154418945, 0.0037980079650878906, 0.003942370414733887, 0.004086732864379883, 0.004231095314025879, 0.004375457763671875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 14.0, 6.0, 10.0, 18.0, 21.0, 15.0, 30.0, 18.0, 16.0, 26.0, 39.0, 42.0, 58.0, 45.0, 47.0, 48.0, 57.0, 54.0, 54.0, 38.0, 45.0, 37.0, 38.0, 31.0, 37.0, 30.0, 17.0, 19.0, 19.0, 10.0, 7.0, 10.0, 13.0, 6.0, 3.0, 1.0, 8.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.423727989196777, -9.156665802001953, -8.889602661132812, -8.622539520263672, -8.355477333068848, -8.088415145874023, -7.821352005004883, -7.5542893409729, -7.287226676940918, -7.0201640129089355, -6.753101348876953, -6.486038684844971, -6.218976020812988, -5.951913356781006, -5.684850692749023, -5.417788028717041, -5.150725364685059, -4.883662700653076, -4.616600036621094, -4.349537372589111, -4.082474708557129, -3.8154120445251465, -3.548349380493164, -3.2812867164611816, -3.014224052429199, -2.747161388397217, -2.4800987243652344, -2.213036060333252, -1.9459733963012695, -1.678910732269287, -1.4118480682373047, -1.1447854042053223, -0.8777227401733398, -0.6106600761413574, -0.343597412109375, -0.07653474807739258, 0.19052791595458984, 0.45759057998657227, 0.7246532440185547, 0.9917159080505371, 1.2587785720825195, 1.525841236114502, 1.7929039001464844, 2.059966564178467, 2.327029228210449, 2.5940918922424316, 2.861154556274414, 3.1282172203063965, 3.395279884338379, 3.6623425483703613, 3.9294052124023438, 4.196467876434326, 4.463530540466309, 4.730593204498291, 4.997655868530273, 5.264718532562256, 5.531781196594238, 5.798843860626221, 6.065906524658203, 6.3329691886901855, 6.600031852722168, 6.86709451675415, 7.134157180786133, 7.401219844818115, 7.668282508850098]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 7.0, 14.0, 18.0, 10.0, 17.0, 28.0, 18.0, 22.0, 29.0, 30.0, 31.0, 30.0, 46.0, 36.0, 32.0, 56.0, 37.0, 43.0, 36.0, 44.0, 41.0, 38.0, 41.0, 38.0, 30.0, 33.0, 19.0, 20.0, 20.0, 24.0, 19.0, 12.0, 11.0, 8.0, 8.0, 9.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 4.0, 5.0, 0.0, 1.0, 1.0], "bins": [-9.223718643188477, -8.957849502563477, -8.691981315612793, -8.426112174987793, -8.16024398803711, -7.894374847412109, -7.628506183624268, -7.362637519836426, -7.096768379211426, -6.830899715423584, -6.565031051635742, -6.299161911010742, -6.0332932472229, -5.767424583435059, -5.501555919647217, -5.235687255859375, -4.969818592071533, -4.703949928283691, -4.43808126449585, -4.172212600708008, -3.906343460083008, -3.640474796295166, -3.374606132507324, -3.1087374687194824, -2.8428685665130615, -2.5769999027252197, -2.311131000518799, -2.045262336730957, -1.7793935537338257, -1.5135247707366943, -1.2476561069488525, -0.9817873239517212, -0.715919017791748, -0.4500502645969391, -0.18418151140213013, 0.08168721199035645, 0.3475559949874878, 0.6134247779846191, 0.8792934417724609, 1.1451622247695923, 1.4110310077667236, 1.676899790763855, 1.9427685737609863, 2.208637237548828, 2.47450590133667, 2.740374803543091, 3.0062434673309326, 3.2721123695373535, 3.5379810333251953, 3.803849697113037, 4.069718360900879, 4.335587501525879, 4.601456165313721, 4.8673248291015625, 5.133193492889404, 5.399062156677246, 5.664931297302246, 5.930799961090088, 6.19666862487793, 6.46253776550293, 6.7284064292907715, 6.994275093078613, 7.260143756866455, 7.526012420654297, 7.791881084442139]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 7.0, 7.0, 14.0, 18.0, 25.0, 45.0, 64.0, 94.0, 138.0, 203.0, 316.0, 477.0, 743.0, 1077.0, 1656.0, 2437.0, 3830.0, 5845.0, 8834.0, 13715.0, 21271.0, 31718.0, 47944.0, 70102.0, 95929.0, 120740.0, 135368.0, 128988.0, 107653.0, 80903.0, 56740.0, 38679.0, 25431.0, 16370.0, 10809.0, 6947.0, 4562.0, 3041.0, 2008.0, 1200.0, 879.0, 603.0, 380.0, 269.0, 182.0, 103.0, 74.0, 47.0, 21.0, 20.0, 13.0, 9.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.6484375, -8.357421875, -8.06640625, -7.775390625, -7.484375, -7.193359375, -6.90234375, -6.611328125, -6.3203125, -6.029296875, -5.73828125, -5.447265625, -5.15625, -4.865234375, -4.57421875, -4.283203125, -3.9921875, -3.701171875, -3.41015625, -3.119140625, -2.828125, -2.537109375, -2.24609375, -1.955078125, -1.6640625, -1.373046875, -1.08203125, -0.791015625, -0.5, -0.208984375, 0.08203125, 0.373046875, 0.6640625, 0.955078125, 1.24609375, 1.537109375, 1.828125, 2.119140625, 2.41015625, 2.701171875, 2.9921875, 3.283203125, 3.57421875, 3.865234375, 4.15625, 4.447265625, 4.73828125, 5.029296875, 5.3203125, 5.611328125, 5.90234375, 6.193359375, 6.484375, 6.775390625, 7.06640625, 7.357421875, 7.6484375, 7.939453125, 8.23046875, 8.521484375, 8.8125, 9.103515625, 9.39453125, 9.685546875, 9.9765625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 9.0, 10.0, 4.0, 12.0, 20.0, 23.0, 25.0, 23.0, 34.0, 27.0, 33.0, 30.0, 33.0, 41.0, 42.0, 44.0, 59.0, 43.0, 47.0, 45.0, 49.0, 44.0, 42.0, 32.0, 30.0, 22.0, 27.0, 17.0, 30.0, 21.0, 16.0, 14.0, 8.0, 10.0, 4.0, 3.0, 7.0, 5.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-10.109375, -9.833984375, -9.55859375, -9.283203125, -9.0078125, -8.732421875, -8.45703125, -8.181640625, -7.90625, -7.630859375, -7.35546875, -7.080078125, -6.8046875, -6.529296875, -6.25390625, -5.978515625, -5.703125, -5.427734375, -5.15234375, -4.876953125, -4.6015625, -4.326171875, -4.05078125, -3.775390625, -3.5, -3.224609375, -2.94921875, -2.673828125, -2.3984375, -2.123046875, -1.84765625, -1.572265625, -1.296875, -1.021484375, -0.74609375, -0.470703125, -0.1953125, 0.080078125, 0.35546875, 0.630859375, 0.90625, 1.181640625, 1.45703125, 1.732421875, 2.0078125, 2.283203125, 2.55859375, 2.833984375, 3.109375, 3.384765625, 3.66015625, 3.935546875, 4.2109375, 4.486328125, 4.76171875, 5.037109375, 5.3125, 5.587890625, 5.86328125, 6.138671875, 6.4140625, 6.689453125, 6.96484375, 7.240234375, 7.515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 4.0, 2.0, 6.0, 6.0, 22.0, 17.0, 27.0, 49.0, 72.0, 125.0, 165.0, 270.0, 402.0, 670.0, 1044.0, 1757.0, 2722.0, 4512.0, 7171.0, 11279.0, 17977.0, 29034.0, 45335.0, 69048.0, 98080.0, 128515.0, 146111.0, 138071.0, 113381.0, 82078.0, 54724.0, 35594.0, 22645.0, 14134.0, 8844.0, 5461.0, 3436.0, 2125.0, 1343.0, 869.0, 505.0, 344.0, 192.0, 135.0, 80.0, 64.0, 45.0, 22.0, 20.0, 8.0, 13.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.953125, -8.6519775390625, -8.350830078125, -8.0496826171875, -7.74853515625, -7.4473876953125, -7.146240234375, -6.8450927734375, -6.5439453125, -6.2427978515625, -5.941650390625, -5.6405029296875, -5.33935546875, -5.0382080078125, -4.737060546875, -4.4359130859375, -4.134765625, -3.8336181640625, -3.532470703125, -3.2313232421875, -2.93017578125, -2.6290283203125, -2.327880859375, -2.0267333984375, -1.7255859375, -1.4244384765625, -1.123291015625, -0.8221435546875, -0.52099609375, -0.2198486328125, 0.081298828125, 0.3824462890625, 0.68359375, 0.9847412109375, 1.285888671875, 1.5870361328125, 1.88818359375, 2.1893310546875, 2.490478515625, 2.7916259765625, 3.0927734375, 3.3939208984375, 3.695068359375, 3.9962158203125, 4.29736328125, 4.5985107421875, 4.899658203125, 5.2008056640625, 5.501953125, 5.8031005859375, 6.104248046875, 6.4053955078125, 6.70654296875, 7.0076904296875, 7.308837890625, 7.6099853515625, 7.9111328125, 8.2122802734375, 8.513427734375, 8.8145751953125, 9.11572265625, 9.4168701171875, 9.718017578125, 10.0191650390625, 10.3203125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 12.0, 6.0, 8.0, 17.0, 13.0, 10.0, 22.0, 19.0, 36.0, 44.0, 25.0, 26.0, 38.0, 49.0, 28.0, 34.0, 34.0, 42.0, 40.0, 36.0, 44.0, 50.0, 34.0, 54.0, 35.0, 32.0, 39.0, 23.0, 28.0, 19.0, 18.0, 13.0, 10.0, 11.0, 17.0, 9.0, 7.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.04296875, -4.87933349609375, -4.7156982421875, -4.55206298828125, -4.388427734375, -4.22479248046875, -4.0611572265625, -3.89752197265625, -3.73388671875, -3.57025146484375, -3.4066162109375, -3.24298095703125, -3.079345703125, -2.91571044921875, -2.7520751953125, -2.58843994140625, -2.4248046875, -2.26116943359375, -2.0975341796875, -1.93389892578125, -1.770263671875, -1.60662841796875, -1.4429931640625, -1.27935791015625, -1.11572265625, -0.95208740234375, -0.7884521484375, -0.62481689453125, -0.461181640625, -0.29754638671875, -0.1339111328125, 0.02972412109375, 0.193359375, 0.35699462890625, 0.5206298828125, 0.68426513671875, 0.847900390625, 1.01153564453125, 1.1751708984375, 1.33880615234375, 1.50244140625, 1.66607666015625, 1.8297119140625, 1.99334716796875, 2.156982421875, 2.32061767578125, 2.4842529296875, 2.64788818359375, 2.8115234375, 2.97515869140625, 3.1387939453125, 3.30242919921875, 3.466064453125, 3.62969970703125, 3.7933349609375, 3.95697021484375, 4.12060546875, 4.28424072265625, 4.4478759765625, 4.61151123046875, 4.775146484375, 4.93878173828125, 5.1024169921875, 5.26605224609375, 5.4296875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 15.0, 11.0, 14.0, 18.0, 38.0, 39.0, 77.0, 96.0, 143.0, 236.0, 350.0, 593.0, 957.0, 1520.0, 2612.0, 4294.0, 7484.0, 13350.0, 24373.0, 44572.0, 78007.0, 124066.0, 166686.0, 179965.0, 152197.0, 104158.0, 62612.0, 35325.0, 19124.0, 10709.0, 5986.0, 3401.0, 2067.0, 1286.0, 771.0, 473.0, 313.0, 207.0, 143.0, 81.0, 43.0, 49.0, 23.0, 21.0, 15.0, 9.0, 10.0, 8.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7900390625, -1.734619140625, -1.67919921875, -1.623779296875, -1.568359375, -1.512939453125, -1.45751953125, -1.402099609375, -1.3466796875, -1.291259765625, -1.23583984375, -1.180419921875, -1.125, -1.069580078125, -1.01416015625, -0.958740234375, -0.9033203125, -0.847900390625, -0.79248046875, -0.737060546875, -0.681640625, -0.626220703125, -0.57080078125, -0.515380859375, -0.4599609375, -0.404541015625, -0.34912109375, -0.293701171875, -0.23828125, -0.182861328125, -0.12744140625, -0.072021484375, -0.0166015625, 0.038818359375, 0.09423828125, 0.149658203125, 0.205078125, 0.260498046875, 0.31591796875, 0.371337890625, 0.4267578125, 0.482177734375, 0.53759765625, 0.593017578125, 0.6484375, 0.703857421875, 0.75927734375, 0.814697265625, 0.8701171875, 0.925537109375, 0.98095703125, 1.036376953125, 1.091796875, 1.147216796875, 1.20263671875, 1.258056640625, 1.3134765625, 1.368896484375, 1.42431640625, 1.479736328125, 1.53515625, 1.590576171875, 1.64599609375, 1.701416015625, 1.7568359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 9.0, 7.0, 8.0, 7.0, 11.0, 19.0, 17.0, 27.0, 32.0, 26.0, 40.0, 41.0, 62.0, 49.0, 71.0, 51.0, 51.0, 80.0, 61.0, 37.0, 53.0, 45.0, 37.0, 34.0, 27.0, 24.0, 20.0, 11.0, 13.0, 6.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00022423267364501953, -0.00021826103329658508, -0.00021228939294815063, -0.0002063177525997162, -0.00020034611225128174, -0.0001943744719028473, -0.00018840283155441284, -0.0001824311912059784, -0.00017645955085754395, -0.0001704879105091095, -0.00016451627016067505, -0.0001585446298122406, -0.00015257298946380615, -0.0001466013491153717, -0.00014062970876693726, -0.0001346580684185028, -0.00012868642807006836, -0.0001227147877216339, -0.00011674314737319946, -0.00011077150702476501, -0.00010479986667633057, -9.882822632789612e-05, -9.285658597946167e-05, -8.688494563102722e-05, -8.091330528259277e-05, -7.494166493415833e-05, -6.897002458572388e-05, -6.299838423728943e-05, -5.702674388885498e-05, -5.105510354042053e-05, -4.5083463191986084e-05, -3.9111822843551636e-05, -3.314018249511719e-05, -2.716854214668274e-05, -2.119690179824829e-05, -1.5225261449813843e-05, -9.253621101379395e-06, -3.2819807529449463e-06, 2.689659595489502e-06, 8.66129994392395e-06, 1.4632940292358398e-05, 2.0604580640792847e-05, 2.6576220989227295e-05, 3.254786133766174e-05, 3.851950168609619e-05, 4.449114203453064e-05, 5.046278238296509e-05, 5.6434422731399536e-05, 6.240606307983398e-05, 6.837770342826843e-05, 7.434934377670288e-05, 8.032098412513733e-05, 8.629262447357178e-05, 9.226426482200623e-05, 9.823590517044067e-05, 0.00010420754551887512, 0.00011017918586730957, 0.00011615082621574402, 0.00012212246656417847, 0.00012809410691261292, 0.00013406574726104736, 0.0001400373876094818, 0.00014600902795791626, 0.0001519806683063507, 0.00015795230865478516]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 8.0, 10.0, 21.0, 31.0, 45.0, 51.0, 74.0, 113.0, 185.0, 290.0, 430.0, 675.0, 1105.0, 1664.0, 2790.0, 4893.0, 8230.0, 14993.0, 26623.0, 47016.0, 80324.0, 122973.0, 161770.0, 172100.0, 147379.0, 104382.0, 64159.0, 37048.0, 20976.0, 11586.0, 6532.0, 3928.0, 2252.0, 1403.0, 842.0, 562.0, 388.0, 237.0, 143.0, 103.0, 76.0, 49.0, 25.0, 27.0, 14.0, 11.0, 10.0, 5.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.650390625, -1.5976409912109375, -1.544891357421875, -1.4921417236328125, -1.43939208984375, -1.3866424560546875, -1.333892822265625, -1.2811431884765625, -1.2283935546875, -1.1756439208984375, -1.122894287109375, -1.0701446533203125, -1.01739501953125, -0.9646453857421875, -0.911895751953125, -0.8591461181640625, -0.806396484375, -0.7536468505859375, -0.700897216796875, -0.6481475830078125, -0.59539794921875, -0.5426483154296875, -0.489898681640625, -0.4371490478515625, -0.3843994140625, -0.3316497802734375, -0.278900146484375, -0.2261505126953125, -0.17340087890625, -0.1206512451171875, -0.067901611328125, -0.0151519775390625, 0.03759765625, 0.0903472900390625, 0.143096923828125, 0.1958465576171875, 0.24859619140625, 0.3013458251953125, 0.354095458984375, 0.4068450927734375, 0.4595947265625, 0.5123443603515625, 0.565093994140625, 0.6178436279296875, 0.67059326171875, 0.7233428955078125, 0.776092529296875, 0.8288421630859375, 0.881591796875, 0.9343414306640625, 0.987091064453125, 1.0398406982421875, 1.09259033203125, 1.1453399658203125, 1.198089599609375, 1.2508392333984375, 1.3035888671875, 1.3563385009765625, 1.409088134765625, 1.4618377685546875, 1.51458740234375, 1.5673370361328125, 1.620086669921875, 1.6728363037109375, 1.7255859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 1.0, 3.0, 2.0, 6.0, 8.0, 12.0, 11.0, 15.0, 15.0, 12.0, 19.0, 26.0, 26.0, 33.0, 40.0, 39.0, 39.0, 55.0, 59.0, 43.0, 46.0, 63.0, 57.0, 59.0, 40.0, 48.0, 43.0, 27.0, 28.0, 27.0, 23.0, 19.0, 14.0, 9.0, 6.0, 6.0, 5.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5390625, -0.5205230712890625, -0.501983642578125, -0.4834442138671875, -0.46490478515625, -0.4463653564453125, -0.427825927734375, -0.4092864990234375, -0.3907470703125, -0.3722076416015625, -0.353668212890625, -0.3351287841796875, -0.31658935546875, -0.2980499267578125, -0.279510498046875, -0.2609710693359375, -0.242431640625, -0.2238922119140625, -0.205352783203125, -0.1868133544921875, -0.16827392578125, -0.1497344970703125, -0.131195068359375, -0.1126556396484375, -0.0941162109375, -0.0755767822265625, -0.057037353515625, -0.0384979248046875, -0.01995849609375, -0.0014190673828125, 0.017120361328125, 0.0356597900390625, 0.05419921875, 0.0727386474609375, 0.091278076171875, 0.1098175048828125, 0.12835693359375, 0.1468963623046875, 0.165435791015625, 0.1839752197265625, 0.2025146484375, 0.2210540771484375, 0.239593505859375, 0.2581329345703125, 0.27667236328125, 0.2952117919921875, 0.313751220703125, 0.3322906494140625, 0.350830078125, 0.3693695068359375, 0.387908935546875, 0.4064483642578125, 0.42498779296875, 0.4435272216796875, 0.462066650390625, 0.4806060791015625, 0.4991455078125, 0.5176849365234375, 0.536224365234375, 0.5547637939453125, 0.57330322265625, 0.5918426513671875, 0.610382080078125, 0.6289215087890625, 0.6474609375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 12.0, 5.0, 13.0, 14.0, 18.0, 17.0, 21.0, 26.0, 42.0, 34.0, 45.0, 48.0, 44.0, 56.0, 67.0, 47.0, 55.0, 56.0, 55.0, 50.0, 43.0, 43.0, 30.0, 38.0, 30.0, 13.0, 15.0, 18.0, 10.0, 8.0, 4.0, 7.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.604944229125977, -9.31793212890625, -9.030919075012207, -8.74390697479248, -8.456893920898438, -8.169881820678711, -7.882869243621826, -7.595856666564941, -7.308844089508057, -7.021831512451172, -6.734818935394287, -6.447806358337402, -6.160794258117676, -5.873781204223633, -5.586769104003906, -5.2997565269470215, -5.012743949890137, -4.725731372833252, -4.438718795776367, -4.151706218719482, -3.8646938800811768, -3.577681303024292, -3.2906689643859863, -3.0036563873291016, -2.716643810272217, -2.429631233215332, -2.1426186561584473, -1.8556063175201416, -1.5685937404632568, -1.281581163406372, -0.9945687055587769, -0.7075562477111816, -0.4205446243286133, -0.1335321068763733, 0.1534804105758667, 0.4404929280281067, 0.7275054454803467, 1.0145180225372314, 1.3015304803848267, 1.5885429382324219, 1.8755555152893066, 2.1625680923461914, 2.449580669403076, 2.736593008041382, 3.0236055850982666, 3.3106181621551514, 3.597630500793457, 3.884643077850342, 4.171655654907227, 4.458668231964111, 4.745680809020996, 5.032693386077881, 5.319705963134766, 5.606718063354492, 5.893730640411377, 6.180743217468262, 6.4677557945251465, 6.754768371582031, 7.041780948638916, 7.328793525695801, 7.615805625915527, 7.90281867980957, 8.189830780029297, 8.476842880249023, 8.763855934143066]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 12.0, 10.0, 19.0, 13.0, 17.0, 21.0, 18.0, 19.0, 32.0, 23.0, 33.0, 41.0, 37.0, 29.0, 27.0, 42.0, 40.0, 44.0, 45.0, 41.0, 54.0, 32.0, 44.0, 38.0, 32.0, 26.0, 36.0, 18.0, 24.0, 19.0, 12.0, 19.0, 16.0, 17.0, 9.0, 12.0, 8.0, 4.0, 0.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.209674835205078, -7.939460754394531, -7.669247150421143, -7.399033546447754, -7.128819465637207, -6.85860538482666, -6.5883917808532715, -6.318178176879883, -6.047964096069336, -5.777750015258789, -5.5075364112854, -5.237322807312012, -4.967108726501465, -4.696894645690918, -4.426681041717529, -4.156467437744141, -3.8862533569335938, -3.616039514541626, -3.345825672149658, -3.0756118297576904, -2.8053979873657227, -2.535184144973755, -2.264970302581787, -1.9947564601898193, -1.7245426177978516, -1.4543287754058838, -1.184114933013916, -0.9139010906219482, -0.6436872482299805, -0.3734734058380127, -0.10325956344604492, 0.16695427894592285, 0.43716907501220703, 0.7073829174041748, 0.9775967597961426, 1.2478106021881104, 1.5180244445800781, 1.788238286972046, 2.0584521293640137, 2.3286659717559814, 2.598879814147949, 2.869093656539917, 3.1393074989318848, 3.4095213413238525, 3.6797351837158203, 3.949949026107788, 4.220162868499756, 4.4903764724731445, 4.760590553283691, 5.030804634094238, 5.301018238067627, 5.571231842041016, 5.8414459228515625, 6.111660003662109, 6.381873607635498, 6.652087211608887, 6.922301292419434, 7.1925153732299805, 7.462728977203369, 7.732942581176758, 8.003156661987305, 8.273370742797852, 8.543584823608398, 8.813797950744629, 9.084012031555176]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 8.0, 4.0, 7.0, 14.0, 21.0, 36.0, 73.0, 102.0, 153.0, 280.0, 413.0, 728.0, 1203.0, 2079.0, 3468.0, 5962.0, 10322.0, 17541.0, 30671.0, 53639.0, 95157.0, 170474.0, 307607.0, 530612.0, 768468.0, 801190.0, 593385.0, 353895.0, 196006.0, 108297.0, 60732.0, 34716.0, 19728.0, 11282.0, 6651.0, 3843.0, 2327.0, 1255.0, 771.0, 463.0, 279.0, 149.0, 98.0, 63.0, 41.0, 29.0, 16.0, 16.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.4375, -10.131591796875, -9.82568359375, -9.519775390625, -9.2138671875, -8.907958984375, -8.60205078125, -8.296142578125, -7.990234375, -7.684326171875, -7.37841796875, -7.072509765625, -6.7666015625, -6.460693359375, -6.15478515625, -5.848876953125, -5.54296875, -5.237060546875, -4.93115234375, -4.625244140625, -4.3193359375, -4.013427734375, -3.70751953125, -3.401611328125, -3.095703125, -2.789794921875, -2.48388671875, -2.177978515625, -1.8720703125, -1.566162109375, -1.26025390625, -0.954345703125, -0.6484375, -0.342529296875, -0.03662109375, 0.269287109375, 0.5751953125, 0.881103515625, 1.18701171875, 1.492919921875, 1.798828125, 2.104736328125, 2.41064453125, 2.716552734375, 3.0224609375, 3.328369140625, 3.63427734375, 3.940185546875, 4.24609375, 4.552001953125, 4.85791015625, 5.163818359375, 5.4697265625, 5.775634765625, 6.08154296875, 6.387451171875, 6.693359375, 6.999267578125, 7.30517578125, 7.611083984375, 7.9169921875, 8.222900390625, 8.52880859375, 8.834716796875, 9.140625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 5.0, 5.0, 7.0, 8.0, 11.0, 20.0, 20.0, 14.0, 18.0, 28.0, 21.0, 25.0, 24.0, 33.0, 27.0, 40.0, 29.0, 38.0, 37.0, 52.0, 44.0, 41.0, 36.0, 31.0, 39.0, 40.0, 35.0, 30.0, 29.0, 39.0, 17.0, 17.0, 17.0, 20.0, 19.0, 11.0, 21.0, 4.0, 13.0, 10.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.93359375, -6.71014404296875, -6.4866943359375, -6.26324462890625, -6.039794921875, -5.81634521484375, -5.5928955078125, -5.36944580078125, -5.14599609375, -4.92254638671875, -4.6990966796875, -4.47564697265625, -4.252197265625, -4.02874755859375, -3.8052978515625, -3.58184814453125, -3.3583984375, -3.13494873046875, -2.9114990234375, -2.68804931640625, -2.464599609375, -2.24114990234375, -2.0177001953125, -1.79425048828125, -1.57080078125, -1.34735107421875, -1.1239013671875, -0.90045166015625, -0.677001953125, -0.45355224609375, -0.2301025390625, -0.00665283203125, 0.216796875, 0.44024658203125, 0.6636962890625, 0.88714599609375, 1.110595703125, 1.33404541015625, 1.5574951171875, 1.78094482421875, 2.00439453125, 2.22784423828125, 2.4512939453125, 2.67474365234375, 2.898193359375, 3.12164306640625, 3.3450927734375, 3.56854248046875, 3.7919921875, 4.01544189453125, 4.2388916015625, 4.46234130859375, 4.685791015625, 4.90924072265625, 5.1326904296875, 5.35614013671875, 5.57958984375, 5.80303955078125, 6.0264892578125, 6.24993896484375, 6.473388671875, 6.69683837890625, 6.9202880859375, 7.14373779296875, 7.3671875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [6.0, 2.0, 5.0, 9.0, 12.0, 14.0, 30.0, 57.0, 97.0, 151.0, 244.0, 438.0, 740.0, 1314.0, 2444.0, 4368.0, 8383.0, 15328.0, 29195.0, 54849.0, 101051.0, 179628.0, 306630.0, 478408.0, 650011.0, 711574.0, 609229.0, 430087.0, 268554.0, 155276.0, 86073.0, 46534.0, 24743.0, 13239.0, 7101.0, 3746.0, 2086.0, 1096.0, 651.0, 363.0, 206.0, 132.0, 74.0, 51.0, 22.0, 11.0, 17.0, 8.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.53125, -7.234375, -6.9375, -6.640625, -6.34375, -6.046875, -5.75, -5.453125, -5.15625, -4.859375, -4.5625, -4.265625, -3.96875, -3.671875, -3.375, -3.078125, -2.78125, -2.484375, -2.1875, -1.890625, -1.59375, -1.296875, -1.0, -0.703125, -0.40625, -0.109375, 0.1875, 0.484375, 0.78125, 1.078125, 1.375, 1.671875, 1.96875, 2.265625, 2.5625, 2.859375, 3.15625, 3.453125, 3.75, 4.046875, 4.34375, 4.640625, 4.9375, 5.234375, 5.53125, 5.828125, 6.125, 6.421875, 6.71875, 7.015625, 7.3125, 7.609375, 7.90625, 8.203125, 8.5, 8.796875, 9.09375, 9.390625, 9.6875, 9.984375, 10.28125, 10.578125, 10.875, 11.171875, 11.46875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 7.0, 12.0, 13.0, 20.0, 21.0, 36.0, 56.0, 83.0, 84.0, 102.0, 129.0, 173.0, 194.0, 214.0, 232.0, 269.0, 261.0, 282.0, 307.0, 240.0, 259.0, 189.0, 175.0, 158.0, 127.0, 99.0, 83.0, 66.0, 45.0, 35.0, 29.0, 12.0, 19.0, 10.0, 7.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34375, -4.2008056640625, -4.057861328125, -3.9149169921875, -3.77197265625, -3.6290283203125, -3.486083984375, -3.3431396484375, -3.2001953125, -3.0572509765625, -2.914306640625, -2.7713623046875, -2.62841796875, -2.4854736328125, -2.342529296875, -2.1995849609375, -2.056640625, -1.9136962890625, -1.770751953125, -1.6278076171875, -1.48486328125, -1.3419189453125, -1.198974609375, -1.0560302734375, -0.9130859375, -0.7701416015625, -0.627197265625, -0.4842529296875, -0.34130859375, -0.1983642578125, -0.055419921875, 0.0875244140625, 0.23046875, 0.3734130859375, 0.516357421875, 0.6593017578125, 0.80224609375, 0.9451904296875, 1.088134765625, 1.2310791015625, 1.3740234375, 1.5169677734375, 1.659912109375, 1.8028564453125, 1.94580078125, 2.0887451171875, 2.231689453125, 2.3746337890625, 2.517578125, 2.6605224609375, 2.803466796875, 2.9464111328125, 3.08935546875, 3.2322998046875, 3.375244140625, 3.5181884765625, 3.6611328125, 3.8040771484375, 3.947021484375, 4.0899658203125, 4.23291015625, 4.3758544921875, 4.518798828125, 4.6617431640625, 4.8046875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 2.0, 3.0, 12.0, 9.0, 12.0, 20.0, 16.0, 26.0, 14.0, 24.0, 35.0, 35.0, 38.0, 49.0, 60.0, 41.0, 63.0, 61.0, 59.0, 49.0, 60.0, 37.0, 49.0, 49.0, 32.0, 29.0, 26.0, 21.0, 18.0, 18.0, 6.0, 3.0, 6.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.973538398742676, -7.693498134613037, -7.413457870483398, -7.133418083190918, -6.853377819061279, -6.573337554931641, -6.29329776763916, -6.0132575035095215, -5.733217239379883, -5.453176975250244, -5.1731367111206055, -4.893096923828125, -4.613056659698486, -4.333016395568848, -4.052976608276367, -3.7729363441467285, -3.49289608001709, -3.212855815887451, -2.9328157901763916, -2.652775764465332, -2.3727355003356934, -2.0926952362060547, -1.8126552104949951, -1.532615065574646, -1.2525749206542969, -0.9725347757339478, -0.6924946308135986, -0.4124544858932495, -0.1324143409729004, 0.14762580394744873, 0.42766594886779785, 0.707706093788147, 0.9877462387084961, 1.2677863836288452, 1.5478265285491943, 1.8278666734695435, 2.1079068183898926, 2.3879470825195312, 2.667987108230591, 2.9480271339416504, 3.228067398071289, 3.5081076622009277, 3.7881476879119873, 4.068187713623047, 4.3482279777526855, 4.628268241882324, 4.908308029174805, 5.188348293304443, 5.468388557434082, 5.748428821563721, 6.028469085693359, 6.30850887298584, 6.5885491371154785, 6.868589401245117, 7.148629188537598, 7.428669452667236, 7.708709716796875, 7.988749980926514, 8.268790245056152, 8.548830032348633, 8.82887077331543, 9.10891056060791, 9.38895034790039, 9.668991088867188, 9.949030876159668]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 9.0, 7.0, 7.0, 10.0, 6.0, 15.0, 19.0, 26.0, 24.0, 27.0, 43.0, 36.0, 30.0, 25.0, 34.0, 47.0, 39.0, 39.0, 51.0, 45.0, 44.0, 38.0, 38.0, 49.0, 41.0, 38.0, 33.0, 29.0, 25.0, 19.0, 18.0, 16.0, 15.0, 7.0, 10.0, 11.0, 9.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.834255218505859, -7.563576698303223, -7.292898654937744, -7.022220134735107, -6.751541614532471, -6.480863571166992, -6.2101850509643555, -5.939506530761719, -5.668828010559082, -5.398149490356445, -5.127471446990967, -4.85679292678833, -4.586114406585693, -4.315436363220215, -4.044757843017578, -3.7740793228149414, -3.503401279449463, -3.2327229976654053, -2.9620444774627686, -2.691366195678711, -2.420687675476074, -2.1500093936920166, -1.879331111907959, -1.6086527109146118, -1.3379743099212646, -1.0672959089279175, -0.7966175675392151, -0.5259392261505127, -0.2552608251571655, 0.01541757583618164, 0.28609585762023926, 0.5567742586135864, 0.8274526596069336, 1.0981310606002808, 1.368809461593628, 1.6394877433776855, 1.9101661443710327, 2.18084454536438, 2.4515228271484375, 2.722201347351074, 2.992879629135132, 3.2635579109191895, 3.534236431121826, 3.804914712905884, 4.075592994689941, 4.346271514892578, 4.616950035095215, 4.887628078460693, 5.15830659866333, 5.428985118865967, 5.699663162231445, 5.970341682434082, 6.241020202636719, 6.5116987228393555, 6.782376766204834, 7.053055286407471, 7.323733329772949, 7.594411849975586, 7.8650898933410645, 8.13576889038086, 8.40644645690918, 8.677124977111816, 8.947803497314453, 9.21848201751709, 9.489160537719727]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 7.0, 17.0, 12.0, 25.0, 34.0, 55.0, 64.0, 101.0, 160.0, 245.0, 407.0, 634.0, 942.0, 1543.0, 2629.0, 4380.0, 7704.0, 13590.0, 25194.0, 47558.0, 95161.0, 238963.0, 366988.0, 117669.0, 56837.0, 29582.0, 15992.0, 8954.0, 5213.0, 3017.0, 1831.0, 1121.0, 670.0, 461.0, 278.0, 188.0, 111.0, 72.0, 49.0, 34.0, 20.0, 12.0, 10.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.41796875, -5.25445556640625, -5.0909423828125, -4.92742919921875, -4.763916015625, -4.60040283203125, -4.4368896484375, -4.27337646484375, -4.10986328125, -3.94635009765625, -3.7828369140625, -3.61932373046875, -3.455810546875, -3.29229736328125, -3.1287841796875, -2.96527099609375, -2.8017578125, -2.63824462890625, -2.4747314453125, -2.31121826171875, -2.147705078125, -1.98419189453125, -1.8206787109375, -1.65716552734375, -1.49365234375, -1.33013916015625, -1.1666259765625, -1.00311279296875, -0.839599609375, -0.67608642578125, -0.5125732421875, -0.34906005859375, -0.185546875, -0.02203369140625, 0.1414794921875, 0.30499267578125, 0.468505859375, 0.63201904296875, 0.7955322265625, 0.95904541015625, 1.12255859375, 1.28607177734375, 1.4495849609375, 1.61309814453125, 1.776611328125, 1.94012451171875, 2.1036376953125, 2.26715087890625, 2.4306640625, 2.59417724609375, 2.7576904296875, 2.92120361328125, 3.084716796875, 3.24822998046875, 3.4117431640625, 3.57525634765625, 3.73876953125, 3.90228271484375, 4.0657958984375, 4.22930908203125, 4.392822265625, 4.55633544921875, 4.7198486328125, 4.88336181640625, 5.046875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 2.0, 2.0, 10.0, 6.0, 12.0, 7.0, 20.0, 12.0, 24.0, 25.0, 42.0, 35.0, 26.0, 27.0, 31.0, 40.0, 58.0, 44.0, 46.0, 50.0, 43.0, 39.0, 35.0, 46.0, 40.0, 36.0, 41.0, 42.0, 25.0, 26.0, 22.0, 19.0, 18.0, 6.0, 11.0, 10.0, 4.0, 4.0, 4.0, 7.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.45703125, -7.16815185546875, -6.8792724609375, -6.59039306640625, -6.301513671875, -6.01263427734375, -5.7237548828125, -5.43487548828125, -5.14599609375, -4.85711669921875, -4.5682373046875, -4.27935791015625, -3.990478515625, -3.70159912109375, -3.4127197265625, -3.12384033203125, -2.8349609375, -2.54608154296875, -2.2572021484375, -1.96832275390625, -1.679443359375, -1.39056396484375, -1.1016845703125, -0.81280517578125, -0.52392578125, -0.23504638671875, 0.0538330078125, 0.34271240234375, 0.631591796875, 0.92047119140625, 1.2093505859375, 1.49822998046875, 1.787109375, 2.07598876953125, 2.3648681640625, 2.65374755859375, 2.942626953125, 3.23150634765625, 3.5203857421875, 3.80926513671875, 4.09814453125, 4.38702392578125, 4.6759033203125, 4.96478271484375, 5.253662109375, 5.54254150390625, 5.8314208984375, 6.12030029296875, 6.4091796875, 6.69805908203125, 6.9869384765625, 7.27581787109375, 7.564697265625, 7.85357666015625, 8.1424560546875, 8.43133544921875, 8.72021484375, 9.00909423828125, 9.2979736328125, 9.58685302734375, 9.875732421875, 10.16461181640625, 10.4534912109375, 10.74237060546875, 11.03125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 9.0, 6.0, 12.0, 15.0, 30.0, 48.0, 66.0, 101.0, 141.0, 169.0, 271.0, 374.0, 577.0, 815.0, 1212.0, 1719.0, 2403.0, 3515.0, 5317.0, 7698.0, 11323.0, 17106.0, 25332.0, 37988.0, 58628.0, 98526.0, 245013.0, 254221.0, 99043.0, 59401.0, 38626.0, 25346.0, 17137.0, 11512.0, 7859.0, 5329.0, 3607.0, 2461.0, 1687.0, 1181.0, 840.0, 584.0, 396.0, 260.0, 200.0, 141.0, 110.0, 70.0, 48.0, 32.0, 18.0, 16.0, 7.0, 8.0, 2.0, 3.0, 2.0], "bins": [-3.91015625, -3.795196533203125, -3.68023681640625, -3.565277099609375, -3.4503173828125, -3.335357666015625, -3.22039794921875, -3.105438232421875, -2.990478515625, -2.875518798828125, -2.76055908203125, -2.645599365234375, -2.5306396484375, -2.415679931640625, -2.30072021484375, -2.185760498046875, -2.07080078125, -1.955841064453125, -1.84088134765625, -1.725921630859375, -1.6109619140625, -1.496002197265625, -1.38104248046875, -1.266082763671875, -1.151123046875, -1.036163330078125, -0.92120361328125, -0.806243896484375, -0.6912841796875, -0.576324462890625, -0.46136474609375, -0.346405029296875, -0.2314453125, -0.116485595703125, -0.00152587890625, 0.113433837890625, 0.2283935546875, 0.343353271484375, 0.45831298828125, 0.573272705078125, 0.688232421875, 0.803192138671875, 0.91815185546875, 1.033111572265625, 1.1480712890625, 1.263031005859375, 1.37799072265625, 1.492950439453125, 1.60791015625, 1.722869873046875, 1.83782958984375, 1.952789306640625, 2.0677490234375, 2.182708740234375, 2.29766845703125, 2.412628173828125, 2.527587890625, 2.642547607421875, 2.75750732421875, 2.872467041015625, 2.9874267578125, 3.102386474609375, 3.21734619140625, 3.332305908203125, 3.447265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 8.0, 5.0, 8.0, 13.0, 10.0, 7.0, 13.0, 13.0, 15.0, 27.0, 18.0, 38.0, 17.0, 25.0, 27.0, 27.0, 29.0, 42.0, 39.0, 35.0, 21.0, 40.0, 40.0, 40.0, 46.0, 34.0, 31.0, 22.0, 35.0, 25.0, 26.0, 23.0, 28.0, 23.0, 17.0, 26.0, 14.0, 12.0, 14.0, 13.0, 9.0, 11.0, 7.0, 10.0, 6.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0], "bins": [-5.05859375, -4.90966796875, -4.7607421875, -4.61181640625, -4.462890625, -4.31396484375, -4.1650390625, -4.01611328125, -3.8671875, -3.71826171875, -3.5693359375, -3.42041015625, -3.271484375, -3.12255859375, -2.9736328125, -2.82470703125, -2.67578125, -2.52685546875, -2.3779296875, -2.22900390625, -2.080078125, -1.93115234375, -1.7822265625, -1.63330078125, -1.484375, -1.33544921875, -1.1865234375, -1.03759765625, -0.888671875, -0.73974609375, -0.5908203125, -0.44189453125, -0.29296875, -0.14404296875, 0.0048828125, 0.15380859375, 0.302734375, 0.45166015625, 0.6005859375, 0.74951171875, 0.8984375, 1.04736328125, 1.1962890625, 1.34521484375, 1.494140625, 1.64306640625, 1.7919921875, 1.94091796875, 2.08984375, 2.23876953125, 2.3876953125, 2.53662109375, 2.685546875, 2.83447265625, 2.9833984375, 3.13232421875, 3.28125, 3.43017578125, 3.5791015625, 3.72802734375, 3.876953125, 4.02587890625, 4.1748046875, 4.32373046875, 4.47265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 9.0, 7.0, 14.0, 20.0, 21.0, 54.0, 55.0, 66.0, 114.0, 156.0, 244.0, 358.0, 519.0, 777.0, 1314.0, 1988.0, 3362.0, 5657.0, 9862.0, 17956.0, 33383.0, 68662.0, 155106.0, 289483.0, 239899.0, 109505.0, 50615.0, 25560.0, 13875.0, 7909.0, 4556.0, 2721.0, 1680.0, 1005.0, 687.0, 425.0, 254.0, 212.0, 135.0, 102.0, 60.0, 55.0, 35.0, 27.0, 17.0, 15.0, 12.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.012451171875, -0.012093305587768555, -0.01173543930053711, -0.011377573013305664, -0.011019706726074219, -0.010661840438842773, -0.010303974151611328, -0.009946107864379883, -0.009588241577148438, -0.009230375289916992, -0.008872509002685547, -0.008514642715454102, -0.008156776428222656, -0.007798910140991211, -0.007441043853759766, -0.00708317756652832, -0.006725311279296875, -0.00636744499206543, -0.006009578704833984, -0.005651712417602539, -0.005293846130371094, -0.0049359798431396484, -0.004578113555908203, -0.004220247268676758, -0.0038623809814453125, -0.003504514694213867, -0.003146648406982422, -0.0027887821197509766, -0.0024309158325195312, -0.002073049545288086, -0.0017151832580566406, -0.0013573169708251953, -0.00099945068359375, -0.0006415843963623047, -0.0002837181091308594, 7.414817810058594e-05, 0.00043201446533203125, 0.0007898807525634766, 0.0011477470397949219, 0.0015056133270263672, 0.0018634796142578125, 0.002221345901489258, 0.002579212188720703, 0.0029370784759521484, 0.0032949447631835938, 0.003652811050415039, 0.004010677337646484, 0.00436854362487793, 0.004726409912109375, 0.00508427619934082, 0.005442142486572266, 0.005800008773803711, 0.006157875061035156, 0.0065157413482666016, 0.006873607635498047, 0.007231473922729492, 0.0075893402099609375, 0.007947206497192383, 0.008305072784423828, 0.008662939071655273, 0.009020805358886719, 0.009378671646118164, 0.00973653793334961, 0.010094404220581055, 0.0104522705078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 6.0, 6.0, 5.0, 10.0, 9.0, 15.0, 20.0, 18.0, 21.0, 21.0, 22.0, 31.0, 41.0, 36.0, 30.0, 46.0, 51.0, 45.0, 55.0, 45.0, 68.0, 48.0, 36.0, 38.0, 42.0, 35.0, 41.0, 27.0, 21.0, 14.0, 24.0, 17.0, 8.0, 11.0, 12.0, 6.0, 6.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.841255187988281e-06, -5.653128027915955e-06, -5.465000867843628e-06, -5.276873707771301e-06, -5.088746547698975e-06, -4.900619387626648e-06, -4.712492227554321e-06, -4.524365067481995e-06, -4.336237907409668e-06, -4.148110747337341e-06, -3.959983587265015e-06, -3.771856427192688e-06, -3.5837292671203613e-06, -3.3956021070480347e-06, -3.207474946975708e-06, -3.0193477869033813e-06, -2.8312206268310547e-06, -2.643093466758728e-06, -2.4549663066864014e-06, -2.2668391466140747e-06, -2.078711986541748e-06, -1.8905848264694214e-06, -1.7024576663970947e-06, -1.514330506324768e-06, -1.3262033462524414e-06, -1.1380761861801147e-06, -9.499490261077881e-07, -7.618218660354614e-07, -5.736947059631348e-07, -3.855675458908081e-07, -1.9744038581848145e-07, -9.313225746154785e-09, 1.7881393432617188e-07, 3.6694109439849854e-07, 5.550682544708252e-07, 7.431954145431519e-07, 9.313225746154785e-07, 1.1194497346878052e-06, 1.3075768947601318e-06, 1.4957040548324585e-06, 1.6838312149047852e-06, 1.8719583749771118e-06, 2.0600855350494385e-06, 2.248212695121765e-06, 2.436339855194092e-06, 2.6244670152664185e-06, 2.812594175338745e-06, 3.0007213354110718e-06, 3.1888484954833984e-06, 3.376975655555725e-06, 3.5651028156280518e-06, 3.7532299757003784e-06, 3.941357135772705e-06, 4.129484295845032e-06, 4.317611455917358e-06, 4.505738615989685e-06, 4.693865776062012e-06, 4.881992936134338e-06, 5.070120096206665e-06, 5.258247256278992e-06, 5.446374416351318e-06, 5.634501576423645e-06, 5.822628736495972e-06, 6.010755896568298e-06, 6.198883056640625e-06]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 7.0, 8.0, 6.0, 9.0, 16.0, 23.0, 38.0, 75.0, 82.0, 194.0, 288.0, 449.0, 685.0, 1283.0, 2040.0, 3718.0, 6529.0, 12068.0, 22789.0, 47504.0, 108222.0, 245407.0, 301037.0, 160657.0, 68230.0, 31511.0, 15914.0, 8374.0, 4604.0, 2760.0, 1614.0, 947.0, 576.0, 339.0, 216.0, 117.0, 83.0, 55.0, 29.0, 16.0, 18.0, 6.0, 10.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.014373779296875, -0.013965725898742676, -0.013557672500610352, -0.013149619102478027, -0.012741565704345703, -0.012333512306213379, -0.011925458908081055, -0.01151740550994873, -0.011109352111816406, -0.010701298713684082, -0.010293245315551758, -0.009885191917419434, -0.00947713851928711, -0.009069085121154785, -0.008661031723022461, -0.008252978324890137, -0.007844924926757812, -0.007436871528625488, -0.007028818130493164, -0.00662076473236084, -0.006212711334228516, -0.005804657936096191, -0.005396604537963867, -0.004988551139831543, -0.004580497741699219, -0.0041724443435668945, -0.0037643909454345703, -0.003356337547302246, -0.002948284149169922, -0.0025402307510375977, -0.0021321773529052734, -0.0017241239547729492, -0.001316070556640625, -0.0009080171585083008, -0.0004999637603759766, -9.191036224365234e-05, 0.0003161430358886719, 0.0007241964340209961, 0.0011322498321533203, 0.0015403032302856445, 0.0019483566284179688, 0.002356410026550293, 0.002764463424682617, 0.0031725168228149414, 0.0035805702209472656, 0.00398862361907959, 0.004396677017211914, 0.004804730415344238, 0.0052127838134765625, 0.005620837211608887, 0.006028890609741211, 0.006436944007873535, 0.006844997406005859, 0.007253050804138184, 0.007661104202270508, 0.008069157600402832, 0.008477210998535156, 0.00888526439666748, 0.009293317794799805, 0.009701371192932129, 0.010109424591064453, 0.010517477989196777, 0.010925531387329102, 0.011333584785461426, 0.01174163818359375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 6.0, 7.0, 5.0, 6.0, 14.0, 18.0, 31.0, 37.0, 53.0, 70.0, 81.0, 100.0, 111.0, 102.0, 94.0, 67.0, 52.0, 41.0, 26.0, 15.0, 14.0, 11.0, 2.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00461578369140625, -0.004463136196136475, -0.004310488700866699, -0.004157841205596924, -0.0040051937103271484, -0.003852546215057373, -0.0036998987197875977, -0.0035472512245178223, -0.003394603729248047, -0.0032419562339782715, -0.003089308738708496, -0.0029366612434387207, -0.0027840137481689453, -0.00263136625289917, -0.0024787187576293945, -0.002326071262359619, -0.0021734237670898438, -0.0020207762718200684, -0.001868128776550293, -0.0017154812812805176, -0.0015628337860107422, -0.0014101862907409668, -0.0012575387954711914, -0.001104891300201416, -0.0009522438049316406, -0.0007995963096618652, -0.0006469488143920898, -0.0004943013191223145, -0.00034165382385253906, -0.00018900632858276367, -3.635883331298828e-05, 0.00011628866195678711, 0.0002689361572265625, 0.0004215836524963379, 0.0005742311477661133, 0.0007268786430358887, 0.0008795261383056641, 0.0010321736335754395, 0.0011848211288452148, 0.0013374686241149902, 0.0014901161193847656, 0.001642763614654541, 0.0017954111099243164, 0.0019480586051940918, 0.002100706100463867, 0.0022533535957336426, 0.002406001091003418, 0.0025586485862731934, 0.0027112960815429688, 0.002863943576812744, 0.0030165910720825195, 0.003169238567352295, 0.0033218860626220703, 0.0034745335578918457, 0.003627181053161621, 0.0037798285484313965, 0.003932476043701172, 0.004085123538970947, 0.004237771034240723, 0.004390418529510498, 0.0045430660247802734, 0.004695713520050049, 0.004848361015319824, 0.0050010085105896, 0.005153656005859375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 9.0, 12.0, 8.0, 14.0, 18.0, 25.0, 12.0, 22.0, 35.0, 30.0, 34.0, 42.0, 46.0, 51.0, 55.0, 55.0, 63.0, 47.0, 49.0, 53.0, 44.0, 42.0, 49.0, 37.0, 26.0, 20.0, 24.0, 16.0, 18.0, 11.0, 3.0, 4.0, 4.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.819305896759033, -7.551950454711914, -7.284595012664795, -7.017239570617676, -6.749884128570557, -6.4825286865234375, -6.21517276763916, -5.947817802429199, -5.680461883544922, -5.413106441497803, -5.145750999450684, -4.8783955574035645, -4.611040115356445, -4.343684673309326, -4.076329231262207, -3.808973550796509, -3.5416183471679688, -3.2742629051208496, -3.0069074630737305, -2.7395520210266113, -2.472196578979492, -2.204841136932373, -1.9374854564666748, -1.6701300144195557, -1.4027745723724365, -1.1354191303253174, -0.8680636286735535, -0.6007081270217896, -0.3333526849746704, -0.06599724292755127, 0.20135831832885742, 0.46871376037597656, 0.7360687255859375, 1.0034241676330566, 1.2707796096801758, 1.5381351709365845, 1.8054906129837036, 2.072845935821533, 2.3402016162872314, 2.6075570583343506, 2.8749125003814697, 3.142267942428589, 3.409623384475708, 3.6769790649414062, 3.9443345069885254, 4.2116899490356445, 4.479045391082764, 4.746400833129883, 5.013756275177002, 5.281111717224121, 5.54846715927124, 5.815822601318359, 6.0831780433654785, 6.350533485412598, 6.617889404296875, 6.885244369506836, 7.152600288391113, 7.419955730438232, 7.687311172485352, 7.954666614532471, 8.22202205657959, 8.489377975463867, 8.756732940673828, 9.024088859558105, 9.291443824768066]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 9.0, 8.0, 5.0, 10.0, 6.0, 16.0, 19.0, 26.0, 25.0, 26.0, 43.0, 35.0, 29.0, 26.0, 34.0, 47.0, 40.0, 37.0, 51.0, 44.0, 46.0, 39.0, 36.0, 49.0, 43.0, 38.0, 33.0, 28.0, 26.0, 19.0, 17.0, 17.0, 16.0, 6.0, 7.0, 14.0, 9.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.766287326812744, -7.497143268585205, -7.227999210357666, -6.958855152130127, -6.689711093902588, -6.420567035675049, -6.151422500610352, -5.8822784423828125, -5.613134384155273, -5.343990325927734, -5.074846267700195, -4.805702209472656, -4.536558151245117, -4.267414093017578, -3.99826979637146, -3.729125738143921, -3.459981918334961, -3.190837860107422, -2.921693801879883, -2.6525497436523438, -2.3834056854248047, -2.1142616271972656, -1.8451173305511475, -1.5759732723236084, -1.3068292140960693, -1.0376851558685303, -0.7685410380363464, -0.4993969202041626, -0.23025286197662354, 0.03889119625091553, 0.30803537368774414, 0.5771794319152832, 0.8463239669799805, 1.1154680252075195, 1.3846120834350586, 1.6537562608718872, 1.9229003190994263, 2.192044258117676, 2.461188554763794, 2.730332612991333, 2.999476671218872, 3.268620729446411, 3.53776478767395, 3.8069090843200684, 4.076053142547607, 4.3451972007751465, 4.6143412590026855, 4.883485317230225, 5.152629375457764, 5.421773433685303, 5.690917491912842, 5.960061550140381, 6.22920560836792, 6.498349666595459, 6.767494201660156, 7.036638259887695, 7.305782318115234, 7.574926376342773, 7.8440704345703125, 8.113214492797852, 8.38235855102539, 8.65150260925293, 8.920646667480469, 9.189790725708008, 9.458934783935547]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 9.0, 11.0, 26.0, 35.0, 61.0, 107.0, 190.0, 253.0, 448.0, 671.0, 1089.0, 1776.0, 2848.0, 4497.0, 7155.0, 11907.0, 18571.0, 30001.0, 45457.0, 67839.0, 95904.0, 122410.0, 137808.0, 134123.0, 113613.0, 85384.0, 59504.0, 39802.0, 24966.0, 15953.0, 9916.0, 6123.0, 3847.0, 2327.0, 1452.0, 936.0, 572.0, 372.0, 225.0, 143.0, 84.0, 47.0, 30.0, 16.0, 17.0, 11.0, 4.0, 2.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.40625, -8.14208984375, -7.8779296875, -7.61376953125, -7.349609375, -7.08544921875, -6.8212890625, -6.55712890625, -6.29296875, -6.02880859375, -5.7646484375, -5.50048828125, -5.236328125, -4.97216796875, -4.7080078125, -4.44384765625, -4.1796875, -3.91552734375, -3.6513671875, -3.38720703125, -3.123046875, -2.85888671875, -2.5947265625, -2.33056640625, -2.06640625, -1.80224609375, -1.5380859375, -1.27392578125, -1.009765625, -0.74560546875, -0.4814453125, -0.21728515625, 0.046875, 0.31103515625, 0.5751953125, 0.83935546875, 1.103515625, 1.36767578125, 1.6318359375, 1.89599609375, 2.16015625, 2.42431640625, 2.6884765625, 2.95263671875, 3.216796875, 3.48095703125, 3.7451171875, 4.00927734375, 4.2734375, 4.53759765625, 4.8017578125, 5.06591796875, 5.330078125, 5.59423828125, 5.8583984375, 6.12255859375, 6.38671875, 6.65087890625, 6.9150390625, 7.17919921875, 7.443359375, 7.70751953125, 7.9716796875, 8.23583984375, 8.5]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 7.0, 6.0, 7.0, 8.0, 12.0, 14.0, 22.0, 26.0, 24.0, 29.0, 39.0, 34.0, 37.0, 48.0, 34.0, 41.0, 43.0, 40.0, 44.0, 61.0, 39.0, 48.0, 41.0, 43.0, 39.0, 44.0, 23.0, 27.0, 21.0, 18.0, 16.0, 19.0, 7.0, 9.0, 8.0, 8.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.734375, -8.4552001953125, -8.176025390625, -7.8968505859375, -7.61767578125, -7.3385009765625, -7.059326171875, -6.7801513671875, -6.5009765625, -6.2218017578125, -5.942626953125, -5.6634521484375, -5.38427734375, -5.1051025390625, -4.825927734375, -4.5467529296875, -4.267578125, -3.9884033203125, -3.709228515625, -3.4300537109375, -3.15087890625, -2.8717041015625, -2.592529296875, -2.3133544921875, -2.0341796875, -1.7550048828125, -1.475830078125, -1.1966552734375, -0.91748046875, -0.6383056640625, -0.359130859375, -0.0799560546875, 0.19921875, 0.4783935546875, 0.757568359375, 1.0367431640625, 1.31591796875, 1.5950927734375, 1.874267578125, 2.1534423828125, 2.4326171875, 2.7117919921875, 2.990966796875, 3.2701416015625, 3.54931640625, 3.8284912109375, 4.107666015625, 4.3868408203125, 4.666015625, 4.9451904296875, 5.224365234375, 5.5035400390625, 5.78271484375, 6.0618896484375, 6.341064453125, 6.6202392578125, 6.8994140625, 7.1785888671875, 7.457763671875, 7.7369384765625, 8.01611328125, 8.2952880859375, 8.574462890625, 8.8536376953125, 9.1328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 8.0, 14.0, 21.0, 41.0, 66.0, 81.0, 145.0, 233.0, 361.0, 643.0, 1004.0, 1622.0, 2649.0, 4195.0, 6941.0, 11224.0, 17832.0, 28396.0, 44402.0, 67843.0, 95834.0, 124921.0, 141445.0, 137263.0, 115353.0, 85219.0, 58707.0, 38046.0, 24072.0, 15073.0, 9501.0, 5882.0, 3654.0, 2185.0, 1443.0, 857.0, 511.0, 349.0, 207.0, 97.0, 65.0, 65.0, 34.0, 17.0, 19.0, 9.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4609375, -8.195068359375, -7.92919921875, -7.663330078125, -7.3974609375, -7.131591796875, -6.86572265625, -6.599853515625, -6.333984375, -6.068115234375, -5.80224609375, -5.536376953125, -5.2705078125, -5.004638671875, -4.73876953125, -4.472900390625, -4.20703125, -3.941162109375, -3.67529296875, -3.409423828125, -3.1435546875, -2.877685546875, -2.61181640625, -2.345947265625, -2.080078125, -1.814208984375, -1.54833984375, -1.282470703125, -1.0166015625, -0.750732421875, -0.48486328125, -0.218994140625, 0.046875, 0.312744140625, 0.57861328125, 0.844482421875, 1.1103515625, 1.376220703125, 1.64208984375, 1.907958984375, 2.173828125, 2.439697265625, 2.70556640625, 2.971435546875, 3.2373046875, 3.503173828125, 3.76904296875, 4.034912109375, 4.30078125, 4.566650390625, 4.83251953125, 5.098388671875, 5.3642578125, 5.630126953125, 5.89599609375, 6.161865234375, 6.427734375, 6.693603515625, 6.95947265625, 7.225341796875, 7.4912109375, 7.757080078125, 8.02294921875, 8.288818359375, 8.5546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 7.0, 10.0, 10.0, 7.0, 8.0, 9.0, 18.0, 14.0, 17.0, 21.0, 21.0, 30.0, 31.0, 45.0, 35.0, 41.0, 33.0, 34.0, 42.0, 45.0, 36.0, 35.0, 49.0, 41.0, 39.0, 39.0, 39.0, 22.0, 23.0, 35.0, 25.0, 21.0, 12.0, 20.0, 12.0, 6.0, 14.0, 10.0, 8.0, 11.0, 8.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.24609375, -4.09100341796875, -3.9359130859375, -3.78082275390625, -3.625732421875, -3.47064208984375, -3.3155517578125, -3.16046142578125, -3.00537109375, -2.85028076171875, -2.6951904296875, -2.54010009765625, -2.385009765625, -2.22991943359375, -2.0748291015625, -1.91973876953125, -1.7646484375, -1.60955810546875, -1.4544677734375, -1.29937744140625, -1.144287109375, -0.98919677734375, -0.8341064453125, -0.67901611328125, -0.52392578125, -0.36883544921875, -0.2137451171875, -0.05865478515625, 0.096435546875, 0.25152587890625, 0.4066162109375, 0.56170654296875, 0.716796875, 0.87188720703125, 1.0269775390625, 1.18206787109375, 1.337158203125, 1.49224853515625, 1.6473388671875, 1.80242919921875, 1.95751953125, 2.11260986328125, 2.2677001953125, 2.42279052734375, 2.577880859375, 2.73297119140625, 2.8880615234375, 3.04315185546875, 3.1982421875, 3.35333251953125, 3.5084228515625, 3.66351318359375, 3.818603515625, 3.97369384765625, 4.1287841796875, 4.28387451171875, 4.43896484375, 4.59405517578125, 4.7491455078125, 4.90423583984375, 5.059326171875, 5.21441650390625, 5.3695068359375, 5.52459716796875, 5.6796875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 16.0, 14.0, 22.0, 29.0, 41.0, 55.0, 93.0, 131.0, 160.0, 259.0, 380.0, 567.0, 890.0, 1382.0, 2199.0, 3617.0, 6328.0, 11131.0, 19988.0, 37121.0, 66288.0, 110432.0, 155656.0, 178888.0, 163565.0, 119829.0, 74293.0, 42150.0, 22647.0, 12626.0, 6884.0, 4021.0, 2416.0, 1524.0, 992.0, 625.0, 421.0, 252.0, 193.0, 135.0, 80.0, 55.0, 55.0, 30.0, 15.0, 15.0, 10.0, 13.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-1.818359375, -1.7608184814453125, -1.703277587890625, -1.6457366943359375, -1.58819580078125, -1.5306549072265625, -1.473114013671875, -1.4155731201171875, -1.3580322265625, -1.3004913330078125, -1.242950439453125, -1.1854095458984375, -1.12786865234375, -1.0703277587890625, -1.012786865234375, -0.9552459716796875, -0.897705078125, -0.8401641845703125, -0.782623291015625, -0.7250823974609375, -0.66754150390625, -0.6100006103515625, -0.552459716796875, -0.4949188232421875, -0.4373779296875, -0.3798370361328125, -0.322296142578125, -0.2647552490234375, -0.20721435546875, -0.1496734619140625, -0.092132568359375, -0.0345916748046875, 0.02294921875, 0.0804901123046875, 0.138031005859375, 0.1955718994140625, 0.25311279296875, 0.3106536865234375, 0.368194580078125, 0.4257354736328125, 0.4832763671875, 0.5408172607421875, 0.598358154296875, 0.6558990478515625, 0.71343994140625, 0.7709808349609375, 0.828521728515625, 0.8860626220703125, 0.943603515625, 1.0011444091796875, 1.058685302734375, 1.1162261962890625, 1.17376708984375, 1.2313079833984375, 1.288848876953125, 1.3463897705078125, 1.4039306640625, 1.4614715576171875, 1.519012451171875, 1.5765533447265625, 1.63409423828125, 1.6916351318359375, 1.749176025390625, 1.8067169189453125, 1.8642578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 2.0, 8.0, 4.0, 14.0, 10.0, 13.0, 13.0, 15.0, 22.0, 29.0, 31.0, 39.0, 39.0, 42.0, 56.0, 47.0, 64.0, 53.0, 48.0, 58.0, 55.0, 51.0, 39.0, 36.0, 35.0, 30.0, 19.0, 29.0, 21.0, 18.0, 10.0, 13.0, 5.0, 5.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.0002033710479736328, -0.00019766390323638916, -0.0001919567584991455, -0.00018624961376190186, -0.0001805424690246582, -0.00017483532428741455, -0.0001691281795501709, -0.00016342103481292725, -0.0001577138900756836, -0.00015200674533843994, -0.0001462996006011963, -0.00014059245586395264, -0.00013488531112670898, -0.00012917816638946533, -0.00012347102165222168, -0.00011776387691497803, -0.00011205673217773438, -0.00010634958744049072, -0.00010064244270324707, -9.493529796600342e-05, -8.922815322875977e-05, -8.352100849151611e-05, -7.781386375427246e-05, -7.210671901702881e-05, -6.639957427978516e-05, -6.0692429542541504e-05, -5.498528480529785e-05, -4.92781400680542e-05, -4.357099533081055e-05, -3.7863850593566895e-05, -3.215670585632324e-05, -2.644956111907959e-05, -2.0742416381835938e-05, -1.5035271644592285e-05, -9.328126907348633e-06, -3.6209821701049805e-06, 2.086162567138672e-06, 7.793307304382324e-06, 1.3500452041625977e-05, 1.920759677886963e-05, 2.491474151611328e-05, 3.0621886253356934e-05, 3.6329030990600586e-05, 4.203617572784424e-05, 4.774332046508789e-05, 5.345046520233154e-05, 5.9157609939575195e-05, 6.486475467681885e-05, 7.05718994140625e-05, 7.627904415130615e-05, 8.19861888885498e-05, 8.769333362579346e-05, 9.340047836303711e-05, 9.910762310028076e-05, 0.00010481476783752441, 0.00011052191257476807, 0.00011622905731201172, 0.00012193620204925537, 0.00012764334678649902, 0.00013335049152374268, 0.00013905763626098633, 0.00014476478099822998, 0.00015047192573547363, 0.00015617907047271729, 0.00016188621520996094]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 7.0, 9.0, 17.0, 25.0, 44.0, 52.0, 73.0, 106.0, 166.0, 241.0, 355.0, 576.0, 939.0, 1595.0, 2726.0, 4911.0, 9401.0, 18417.0, 37699.0, 74090.0, 131905.0, 188881.0, 204704.0, 163085.0, 100536.0, 53156.0, 26215.0, 13093.0, 6518.0, 3626.0, 2035.0, 1224.0, 741.0, 485.0, 304.0, 193.0, 130.0, 74.0, 76.0, 44.0, 28.0, 18.0, 9.0, 9.0, 7.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.072265625, -2.003753662109375, -1.93524169921875, -1.866729736328125, -1.7982177734375, -1.729705810546875, -1.66119384765625, -1.592681884765625, -1.524169921875, -1.455657958984375, -1.38714599609375, -1.318634033203125, -1.2501220703125, -1.181610107421875, -1.11309814453125, -1.044586181640625, -0.97607421875, -0.907562255859375, -0.83905029296875, -0.770538330078125, -0.7020263671875, -0.633514404296875, -0.56500244140625, -0.496490478515625, -0.427978515625, -0.359466552734375, -0.29095458984375, -0.222442626953125, -0.1539306640625, -0.085418701171875, -0.01690673828125, 0.051605224609375, 0.1201171875, 0.188629150390625, 0.25714111328125, 0.325653076171875, 0.3941650390625, 0.462677001953125, 0.53118896484375, 0.599700927734375, 0.668212890625, 0.736724853515625, 0.80523681640625, 0.873748779296875, 0.9422607421875, 1.010772705078125, 1.07928466796875, 1.147796630859375, 1.21630859375, 1.284820556640625, 1.35333251953125, 1.421844482421875, 1.4903564453125, 1.558868408203125, 1.62738037109375, 1.695892333984375, 1.764404296875, 1.832916259765625, 1.90142822265625, 1.969940185546875, 2.0384521484375, 2.106964111328125, 2.17547607421875, 2.243988037109375, 2.3125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 7.0, 2.0, 3.0, 5.0, 8.0, 7.0, 18.0, 20.0, 18.0, 30.0, 33.0, 25.0, 39.0, 39.0, 38.0, 45.0, 47.0, 54.0, 57.0, 65.0, 52.0, 56.0, 55.0, 41.0, 45.0, 45.0, 35.0, 30.0, 18.0, 12.0, 19.0, 11.0, 8.0, 7.0, 2.0, 0.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8173828125, -0.793304443359375, -0.76922607421875, -0.745147705078125, -0.7210693359375, -0.696990966796875, -0.67291259765625, -0.648834228515625, -0.624755859375, -0.600677490234375, -0.57659912109375, -0.552520751953125, -0.5284423828125, -0.504364013671875, -0.48028564453125, -0.456207275390625, -0.43212890625, -0.408050537109375, -0.38397216796875, -0.359893798828125, -0.3358154296875, -0.311737060546875, -0.28765869140625, -0.263580322265625, -0.239501953125, -0.215423583984375, -0.19134521484375, -0.167266845703125, -0.1431884765625, -0.119110107421875, -0.09503173828125, -0.070953369140625, -0.046875, -0.022796630859375, 0.00128173828125, 0.025360107421875, 0.0494384765625, 0.073516845703125, 0.09759521484375, 0.121673583984375, 0.145751953125, 0.169830322265625, 0.19390869140625, 0.217987060546875, 0.2420654296875, 0.266143798828125, 0.29022216796875, 0.314300537109375, 0.33837890625, 0.362457275390625, 0.38653564453125, 0.410614013671875, 0.4346923828125, 0.458770751953125, 0.48284912109375, 0.506927490234375, 0.531005859375, 0.555084228515625, 0.57916259765625, 0.603240966796875, 0.6273193359375, 0.651397705078125, 0.67547607421875, 0.699554443359375, 0.7236328125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 12.0, 11.0, 7.0, 14.0, 21.0, 12.0, 25.0, 27.0, 35.0, 30.0, 45.0, 40.0, 42.0, 51.0, 58.0, 49.0, 44.0, 50.0, 45.0, 46.0, 42.0, 45.0, 47.0, 37.0, 28.0, 24.0, 18.0, 23.0, 12.0, 15.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.23851490020752, -7.989044189453125, -7.7395734786987305, -7.490102767944336, -7.240632057189941, -6.991161346435547, -6.741690635681152, -6.492219924926758, -6.242749214172363, -5.993278503417969, -5.743807792663574, -5.49433708190918, -5.244866371154785, -4.995395660400391, -4.745924949645996, -4.496454238891602, -4.246984004974365, -3.9975132942199707, -3.748042583465576, -3.4985718727111816, -3.249101161956787, -2.9996304512023926, -2.750159978866577, -2.5006892681121826, -2.251218557357788, -2.0017478466033936, -1.752277135848999, -1.502806544303894, -1.2533358335494995, -1.003865122795105, -0.75439453125, -0.5049238204956055, -0.25545310974121094, -0.005982428789138794, 0.24348825216293335, 0.4929589033126831, 0.7424296140670776, 0.9919003248214722, 1.2413709163665771, 1.4908416271209717, 1.7403123378753662, 1.9897830486297607, 2.2392537593841553, 2.4887242317199707, 2.7381949424743652, 2.9876656532287598, 3.2371363639831543, 3.486607074737549, 3.7360777854919434, 3.985548496246338, 4.235019207000732, 4.484489917755127, 4.7339606285095215, 4.983431339263916, 5.232901573181152, 5.482372283935547, 5.731842994689941, 5.981313705444336, 6.2307844161987305, 6.480255126953125, 6.7297258377075195, 6.979196548461914, 7.228667259216309, 7.478137969970703, 7.727608680725098]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [5.0, 2.0, 5.0, 9.0, 4.0, 3.0, 9.0, 12.0, 8.0, 13.0, 15.0, 16.0, 18.0, 24.0, 23.0, 24.0, 36.0, 22.0, 39.0, 35.0, 41.0, 36.0, 36.0, 41.0, 50.0, 32.0, 45.0, 32.0, 44.0, 40.0, 36.0, 39.0, 22.0, 24.0, 36.0, 21.0, 21.0, 22.0, 13.0, 7.0, 12.0, 7.0, 10.0, 3.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.392923831939697, -6.135748863220215, -5.878574371337891, -5.621399402618408, -5.364224433898926, -5.107049942016602, -4.849874973297119, -4.592700004577637, -4.3355255126953125, -4.07835054397583, -3.8211758136749268, -3.5640010833740234, -3.306826114654541, -3.0496513843536377, -2.7924766540527344, -2.535301685333252, -2.2781267166137695, -2.020951986312866, -1.7637770175933838, -1.5066022872924805, -1.2494274377822876, -0.9922525882720947, -0.7350778579711914, -0.47790300846099854, -0.22072815895080566, 0.03644666075706482, 0.2936214804649353, 0.5507962703704834, 0.8079711198806763, 1.0651459693908691, 1.3223206996917725, 1.5794955492019653, 1.836669921875, 2.0938446521759033, 2.3510196208953857, 2.608194351196289, 2.8653693199157715, 3.122544050216675, 3.379718780517578, 3.6368937492370605, 3.894068479537964, 4.151243209838867, 4.40841817855835, 4.665593147277832, 4.922767639160156, 5.179942607879639, 5.437117576599121, 5.694292068481445, 5.951467037200928, 6.20864200592041, 6.465816497802734, 6.722991466522217, 6.980166435241699, 7.237340927124023, 7.494515895843506, 7.751690864562988, 8.008865356445312, 8.266039848327637, 8.523215293884277, 8.780389785766602, 9.037564277648926, 9.294739723205566, 9.55191421508789, 9.809088706970215, 10.066264152526855]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 11.0, 14.0, 24.0, 34.0, 48.0, 85.0, 125.0, 190.0, 275.0, 516.0, 893.0, 1521.0, 2707.0, 4306.0, 7882.0, 13786.0, 24889.0, 44979.0, 81942.0, 150127.0, 268605.0, 456949.0, 677510.0, 778119.0, 659979.0, 438925.0, 256081.0, 142908.0, 79248.0, 44040.0, 24667.0, 13827.0, 7961.0, 4490.0, 2697.0, 1513.0, 916.0, 580.0, 353.0, 215.0, 125.0, 74.0, 47.0, 32.0, 13.0, 23.0, 12.0, 9.0, 2.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-9.234375, -8.9407958984375, -8.647216796875, -8.3536376953125, -8.06005859375, -7.7664794921875, -7.472900390625, -7.1793212890625, -6.8857421875, -6.5921630859375, -6.298583984375, -6.0050048828125, -5.71142578125, -5.4178466796875, -5.124267578125, -4.8306884765625, -4.537109375, -4.2435302734375, -3.949951171875, -3.6563720703125, -3.36279296875, -3.0692138671875, -2.775634765625, -2.4820556640625, -2.1884765625, -1.8948974609375, -1.601318359375, -1.3077392578125, -1.01416015625, -0.7205810546875, -0.427001953125, -0.1334228515625, 0.16015625, 0.4537353515625, 0.747314453125, 1.0408935546875, 1.33447265625, 1.6280517578125, 1.921630859375, 2.2152099609375, 2.5087890625, 2.8023681640625, 3.095947265625, 3.3895263671875, 3.68310546875, 3.9766845703125, 4.270263671875, 4.5638427734375, 4.857421875, 5.1510009765625, 5.444580078125, 5.7381591796875, 6.03173828125, 6.3253173828125, 6.618896484375, 6.9124755859375, 7.2060546875, 7.4996337890625, 7.793212890625, 8.0867919921875, 8.38037109375, 8.6739501953125, 8.967529296875, 9.2611083984375, 9.5546875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 6.0, 9.0, 12.0, 7.0, 7.0, 7.0, 11.0, 15.0, 15.0, 7.0, 11.0, 24.0, 31.0, 39.0, 27.0, 24.0, 35.0, 33.0, 29.0, 36.0, 46.0, 43.0, 36.0, 34.0, 45.0, 34.0, 46.0, 40.0, 31.0, 39.0, 28.0, 27.0, 29.0, 18.0, 22.0, 16.0, 14.0, 9.0, 5.0, 10.0, 10.0, 9.0, 11.0, 7.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.05078125, -5.83331298828125, -5.6158447265625, -5.39837646484375, -5.180908203125, -4.96343994140625, -4.7459716796875, -4.52850341796875, -4.31103515625, -4.09356689453125, -3.8760986328125, -3.65863037109375, -3.441162109375, -3.22369384765625, -3.0062255859375, -2.78875732421875, -2.5712890625, -2.35382080078125, -2.1363525390625, -1.91888427734375, -1.701416015625, -1.48394775390625, -1.2664794921875, -1.04901123046875, -0.83154296875, -0.61407470703125, -0.3966064453125, -0.17913818359375, 0.038330078125, 0.25579833984375, 0.4732666015625, 0.69073486328125, 0.908203125, 1.12567138671875, 1.3431396484375, 1.56060791015625, 1.778076171875, 1.99554443359375, 2.2130126953125, 2.43048095703125, 2.64794921875, 2.86541748046875, 3.0828857421875, 3.30035400390625, 3.517822265625, 3.73529052734375, 3.9527587890625, 4.17022705078125, 4.3876953125, 4.60516357421875, 4.8226318359375, 5.04010009765625, 5.257568359375, 5.47503662109375, 5.6925048828125, 5.90997314453125, 6.12744140625, 6.34490966796875, 6.5623779296875, 6.77984619140625, 6.997314453125, 7.21478271484375, 7.4322509765625, 7.64971923828125, 7.8671875]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 3.0, 7.0, 10.0, 13.0, 34.0, 45.0, 78.0, 148.0, 237.0, 383.0, 664.0, 1014.0, 1906.0, 3144.0, 5228.0, 8693.0, 14729.0, 24858.0, 40403.0, 65586.0, 105865.0, 164246.0, 242344.0, 341280.0, 439412.0, 512816.0, 527917.0, 480297.0, 388184.0, 286118.0, 198317.0, 130225.0, 82277.0, 51374.0, 30686.0, 18389.0, 11159.0, 6566.0, 3952.0, 2236.0, 1377.0, 823.0, 520.0, 294.0, 169.0, 97.0, 80.0, 34.0, 24.0, 15.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-7.328125, -7.10760498046875, -6.8870849609375, -6.66656494140625, -6.446044921875, -6.22552490234375, -6.0050048828125, -5.78448486328125, -5.56396484375, -5.34344482421875, -5.1229248046875, -4.90240478515625, -4.681884765625, -4.46136474609375, -4.2408447265625, -4.02032470703125, -3.7998046875, -3.57928466796875, -3.3587646484375, -3.13824462890625, -2.917724609375, -2.69720458984375, -2.4766845703125, -2.25616455078125, -2.03564453125, -1.81512451171875, -1.5946044921875, -1.37408447265625, -1.153564453125, -0.93304443359375, -0.7125244140625, -0.49200439453125, -0.271484375, -0.05096435546875, 0.1695556640625, 0.39007568359375, 0.610595703125, 0.83111572265625, 1.0516357421875, 1.27215576171875, 1.49267578125, 1.71319580078125, 1.9337158203125, 2.15423583984375, 2.374755859375, 2.59527587890625, 2.8157958984375, 3.03631591796875, 3.2568359375, 3.47735595703125, 3.6978759765625, 3.91839599609375, 4.138916015625, 4.35943603515625, 4.5799560546875, 4.80047607421875, 5.02099609375, 5.24151611328125, 5.4620361328125, 5.68255615234375, 5.903076171875, 6.12359619140625, 6.3441162109375, 6.56463623046875, 6.78515625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [7.0, 2.0, 0.0, 3.0, 2.0, 4.0, 9.0, 10.0, 5.0, 15.0, 19.0, 18.0, 23.0, 23.0, 42.0, 49.0, 60.0, 48.0, 71.0, 80.0, 82.0, 105.0, 136.0, 139.0, 156.0, 193.0, 192.0, 182.0, 195.0, 215.0, 231.0, 196.0, 195.0, 183.0, 152.0, 156.0, 142.0, 103.0, 96.0, 88.0, 70.0, 61.0, 60.0, 51.0, 34.0, 33.0, 37.0, 25.0, 15.0, 17.0, 17.0, 9.0, 11.0, 4.0, 11.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.98828125, -2.88720703125, -2.7861328125, -2.68505859375, -2.583984375, -2.48291015625, -2.3818359375, -2.28076171875, -2.1796875, -2.07861328125, -1.9775390625, -1.87646484375, -1.775390625, -1.67431640625, -1.5732421875, -1.47216796875, -1.37109375, -1.27001953125, -1.1689453125, -1.06787109375, -0.966796875, -0.86572265625, -0.7646484375, -0.66357421875, -0.5625, -0.46142578125, -0.3603515625, -0.25927734375, -0.158203125, -0.05712890625, 0.0439453125, 0.14501953125, 0.24609375, 0.34716796875, 0.4482421875, 0.54931640625, 0.650390625, 0.75146484375, 0.8525390625, 0.95361328125, 1.0546875, 1.15576171875, 1.2568359375, 1.35791015625, 1.458984375, 1.56005859375, 1.6611328125, 1.76220703125, 1.86328125, 1.96435546875, 2.0654296875, 2.16650390625, 2.267578125, 2.36865234375, 2.4697265625, 2.57080078125, 2.671875, 2.77294921875, 2.8740234375, 2.97509765625, 3.076171875, 3.17724609375, 3.2783203125, 3.37939453125, 3.48046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 9.0, 5.0, 9.0, 7.0, 11.0, 7.0, 14.0, 9.0, 22.0, 16.0, 23.0, 21.0, 23.0, 32.0, 43.0, 35.0, 56.0, 49.0, 39.0, 50.0, 49.0, 55.0, 41.0, 43.0, 34.0, 31.0, 37.0, 33.0, 22.0, 27.0, 25.0, 15.0, 15.0, 10.0, 11.0, 14.0, 10.0, 9.0, 6.0, 12.0, 5.0, 1.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-7.132905960083008, -6.912222385406494, -6.691538333892822, -6.470854759216309, -6.250171184539795, -6.029487609863281, -5.808803558349609, -5.588119983673096, -5.367436408996582, -5.146752834320068, -4.9260687828063965, -4.705385208129883, -4.484701633453369, -4.2640180587768555, -4.043334007263184, -3.82265043258667, -3.601966381072998, -3.3812825679779053, -3.1605989933013916, -2.939915180206299, -2.719231605529785, -2.4985477924346924, -2.2778639793395996, -2.057180404663086, -1.8364965915679932, -1.61581289768219, -1.3951292037963867, -1.174445390701294, -0.9537616968154907, -0.7330780029296875, -0.5123941898345947, -0.2917104959487915, -0.07102632522583008, 0.14965739846229553, 0.37034112215042114, 0.5910248756408691, 0.8117085695266724, 1.0323922634124756, 1.2530760765075684, 1.4737597703933716, 1.6944434642791748, 1.915127158164978, 2.1358108520507812, 2.356494665145874, 2.577178478240967, 2.7978620529174805, 3.0185458660125732, 3.239229679107666, 3.4599132537841797, 3.6805970668792725, 3.901280641555786, 4.121964454650879, 4.342648029327393, 4.563331604003906, 4.784015655517578, 5.004699230194092, 5.2253828048706055, 5.446066379547119, 5.666750431060791, 5.887434005737305, 6.108117580413818, 6.328801155090332, 6.549485206604004, 6.770168781280518, 6.9908528327941895]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 6.0, 9.0, 8.0, 12.0, 15.0, 14.0, 23.0, 17.0, 27.0, 26.0, 19.0, 41.0, 40.0, 32.0, 31.0, 40.0, 48.0, 49.0, 42.0, 46.0, 32.0, 41.0, 38.0, 48.0, 42.0, 33.0, 35.0, 24.0, 28.0, 24.0, 20.0, 17.0, 8.0, 13.0, 11.0, 7.0, 12.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.792871952056885, -7.5218424797058105, -7.250812530517578, -6.979783058166504, -6.70875358581543, -6.437723636627197, -6.166694164276123, -5.895664215087891, -5.624634742736816, -5.353605270385742, -5.08257532119751, -4.8115458488464355, -4.540515899658203, -4.269486427307129, -3.9984569549560547, -3.7274272441864014, -3.456397533416748, -3.1853678226470947, -2.9143381118774414, -2.643308639526367, -2.372278928756714, -2.1012492179870605, -1.8302196264266968, -1.559190034866333, -1.2881603240966797, -1.0171306133270264, -0.7461010217666626, -0.47507137060165405, -0.2040417194366455, 0.06698799133300781, 0.3380175828933716, 0.6090471744537354, 0.8800773620605469, 1.1511070728302002, 1.422136664390564, 1.6931662559509277, 1.964195966720581, 2.2352256774902344, 2.5062551498413086, 2.777284860610962, 3.0483145713806152, 3.3193442821502686, 3.590373992919922, 3.861403465270996, 4.13243293762207, 4.403462886810303, 4.674492359161377, 4.945522308349609, 5.216551780700684, 5.487581253051758, 5.75861120223999, 6.0296406745910645, 6.300670623779297, 6.571700096130371, 6.842729568481445, 7.1137590408325195, 7.384788990020752, 7.655818462371826, 7.926848411560059, 8.197877883911133, 8.468907356262207, 8.739936828613281, 9.010967254638672, 9.281996726989746, 9.55302619934082]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 15.0, 12.0, 20.0, 37.0, 53.0, 79.0, 141.0, 204.0, 285.0, 508.0, 707.0, 1078.0, 1698.0, 2509.0, 3893.0, 5727.0, 8868.0, 14086.0, 22299.0, 36178.0, 61732.0, 113816.0, 313928.0, 224243.0, 95615.0, 53702.0, 31824.0, 19668.0, 12321.0, 8022.0, 5210.0, 3412.0, 2277.0, 1540.0, 1004.0, 635.0, 437.0, 268.0, 177.0, 109.0, 78.0, 50.0, 27.0, 21.0, 16.0, 11.0, 3.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.1328125, -4.007080078125, -3.88134765625, -3.755615234375, -3.6298828125, -3.504150390625, -3.37841796875, -3.252685546875, -3.126953125, -3.001220703125, -2.87548828125, -2.749755859375, -2.6240234375, -2.498291015625, -2.37255859375, -2.246826171875, -2.12109375, -1.995361328125, -1.86962890625, -1.743896484375, -1.6181640625, -1.492431640625, -1.36669921875, -1.240966796875, -1.115234375, -0.989501953125, -0.86376953125, -0.738037109375, -0.6123046875, -0.486572265625, -0.36083984375, -0.235107421875, -0.109375, 0.016357421875, 0.14208984375, 0.267822265625, 0.3935546875, 0.519287109375, 0.64501953125, 0.770751953125, 0.896484375, 1.022216796875, 1.14794921875, 1.273681640625, 1.3994140625, 1.525146484375, 1.65087890625, 1.776611328125, 1.90234375, 2.028076171875, 2.15380859375, 2.279541015625, 2.4052734375, 2.531005859375, 2.65673828125, 2.782470703125, 2.908203125, 3.033935546875, 3.15966796875, 3.285400390625, 3.4111328125, 3.536865234375, 3.66259765625, 3.788330078125, 3.9140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 0.0, 3.0, 1.0, 7.0, 9.0, 9.0, 10.0, 17.0, 14.0, 22.0, 17.0, 22.0, 26.0, 25.0, 28.0, 36.0, 36.0, 36.0, 41.0, 44.0, 43.0, 46.0, 42.0, 45.0, 42.0, 36.0, 44.0, 32.0, 35.0, 42.0, 35.0, 26.0, 17.0, 20.0, 17.0, 15.0, 19.0, 10.0, 5.0, 8.0, 8.0, 6.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1328125, -7.8548583984375, -7.576904296875, -7.2989501953125, -7.02099609375, -6.7430419921875, -6.465087890625, -6.1871337890625, -5.9091796875, -5.6312255859375, -5.353271484375, -5.0753173828125, -4.79736328125, -4.5194091796875, -4.241455078125, -3.9635009765625, -3.685546875, -3.4075927734375, -3.129638671875, -2.8516845703125, -2.57373046875, -2.2957763671875, -2.017822265625, -1.7398681640625, -1.4619140625, -1.1839599609375, -0.906005859375, -0.6280517578125, -0.35009765625, -0.0721435546875, 0.205810546875, 0.4837646484375, 0.76171875, 1.0396728515625, 1.317626953125, 1.5955810546875, 1.87353515625, 2.1514892578125, 2.429443359375, 2.7073974609375, 2.9853515625, 3.2633056640625, 3.541259765625, 3.8192138671875, 4.09716796875, 4.3751220703125, 4.653076171875, 4.9310302734375, 5.208984375, 5.4869384765625, 5.764892578125, 6.0428466796875, 6.32080078125, 6.5987548828125, 6.876708984375, 7.1546630859375, 7.4326171875, 7.7105712890625, 7.988525390625, 8.2664794921875, 8.54443359375, 8.8223876953125, 9.100341796875, 9.3782958984375, 9.65625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 12.0, 17.0, 29.0, 38.0, 67.0, 95.0, 134.0, 185.0, 263.0, 355.0, 516.0, 736.0, 1075.0, 1543.0, 2236.0, 3200.0, 4759.0, 6972.0, 10397.0, 15616.0, 23335.0, 35168.0, 53679.0, 88575.0, 190379.0, 309769.0, 110958.0, 64201.0, 41002.0, 27256.0, 18190.0, 11898.0, 8181.0, 5590.0, 3731.0, 2634.0, 1745.0, 1199.0, 866.0, 582.0, 406.0, 269.0, 200.0, 148.0, 118.0, 81.0, 61.0, 29.0, 18.0, 15.0, 3.0, 6.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.451171875, -3.34051513671875, -3.2298583984375, -3.11920166015625, -3.008544921875, -2.89788818359375, -2.7872314453125, -2.67657470703125, -2.56591796875, -2.45526123046875, -2.3446044921875, -2.23394775390625, -2.123291015625, -2.01263427734375, -1.9019775390625, -1.79132080078125, -1.6806640625, -1.57000732421875, -1.4593505859375, -1.34869384765625, -1.238037109375, -1.12738037109375, -1.0167236328125, -0.90606689453125, -0.79541015625, -0.68475341796875, -0.5740966796875, -0.46343994140625, -0.352783203125, -0.24212646484375, -0.1314697265625, -0.02081298828125, 0.08984375, 0.20050048828125, 0.3111572265625, 0.42181396484375, 0.532470703125, 0.64312744140625, 0.7537841796875, 0.86444091796875, 0.97509765625, 1.08575439453125, 1.1964111328125, 1.30706787109375, 1.417724609375, 1.52838134765625, 1.6390380859375, 1.74969482421875, 1.8603515625, 1.97100830078125, 2.0816650390625, 2.19232177734375, 2.302978515625, 2.41363525390625, 2.5242919921875, 2.63494873046875, 2.74560546875, 2.85626220703125, 2.9669189453125, 3.07757568359375, 3.188232421875, 3.29888916015625, 3.4095458984375, 3.52020263671875, 3.630859375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 14.0, 10.0, 10.0, 15.0, 16.0, 25.0, 19.0, 23.0, 30.0, 26.0, 22.0, 23.0, 27.0, 31.0, 27.0, 29.0, 37.0, 40.0, 28.0, 42.0, 47.0, 38.0, 38.0, 33.0, 27.0, 35.0, 40.0, 24.0, 16.0, 24.0, 29.0, 22.0, 14.0, 16.0, 18.0, 9.0, 10.0, 6.0, 9.0, 9.0, 6.0, 2.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.4453125, -4.30242919921875, -4.1595458984375, -4.01666259765625, -3.873779296875, -3.73089599609375, -3.5880126953125, -3.44512939453125, -3.30224609375, -3.15936279296875, -3.0164794921875, -2.87359619140625, -2.730712890625, -2.58782958984375, -2.4449462890625, -2.30206298828125, -2.1591796875, -2.01629638671875, -1.8734130859375, -1.73052978515625, -1.587646484375, -1.44476318359375, -1.3018798828125, -1.15899658203125, -1.01611328125, -0.87322998046875, -0.7303466796875, -0.58746337890625, -0.444580078125, -0.30169677734375, -0.1588134765625, -0.01593017578125, 0.126953125, 0.26983642578125, 0.4127197265625, 0.55560302734375, 0.698486328125, 0.84136962890625, 0.9842529296875, 1.12713623046875, 1.27001953125, 1.41290283203125, 1.5557861328125, 1.69866943359375, 1.841552734375, 1.98443603515625, 2.1273193359375, 2.27020263671875, 2.4130859375, 2.55596923828125, 2.6988525390625, 2.84173583984375, 2.984619140625, 3.12750244140625, 3.2703857421875, 3.41326904296875, 3.55615234375, 3.69903564453125, 3.8419189453125, 3.98480224609375, 4.127685546875, 4.27056884765625, 4.4134521484375, 4.55633544921875, 4.69921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 13.0, 8.0, 17.0, 37.0, 42.0, 68.0, 84.0, 139.0, 186.0, 289.0, 445.0, 706.0, 1084.0, 1547.0, 2365.0, 3906.0, 6370.0, 10290.0, 17817.0, 32261.0, 62544.0, 131645.0, 244312.0, 248769.0, 138216.0, 65201.0, 33344.0, 18471.0, 10698.0, 6369.0, 4039.0, 2539.0, 1654.0, 1022.0, 656.0, 459.0, 320.0, 195.0, 148.0, 91.0, 60.0, 38.0, 36.0, 19.0, 10.0, 9.0, 8.0, 8.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.009033203125, -0.008742094039916992, -0.008450984954833984, -0.008159875869750977, -0.007868766784667969, -0.007577657699584961, -0.007286548614501953, -0.006995439529418945, -0.0067043304443359375, -0.00641322135925293, -0.006122112274169922, -0.005831003189086914, -0.005539894104003906, -0.0052487850189208984, -0.004957675933837891, -0.004666566848754883, -0.004375457763671875, -0.004084348678588867, -0.0037932395935058594, -0.0035021305084228516, -0.0032110214233398438, -0.002919912338256836, -0.002628803253173828, -0.0023376941680908203, -0.0020465850830078125, -0.0017554759979248047, -0.0014643669128417969, -0.001173257827758789, -0.0008821487426757812, -0.0005910396575927734, -0.0002999305725097656, -8.821487426757812e-06, 0.00028228759765625, 0.0005733966827392578, 0.0008645057678222656, 0.0011556148529052734, 0.0014467239379882812, 0.001737833023071289, 0.002028942108154297, 0.0023200511932373047, 0.0026111602783203125, 0.0029022693634033203, 0.003193378448486328, 0.003484487533569336, 0.0037755966186523438, 0.0040667057037353516, 0.004357814788818359, 0.004648923873901367, 0.004940032958984375, 0.005231142044067383, 0.005522251129150391, 0.0058133602142333984, 0.006104469299316406, 0.006395578384399414, 0.006686687469482422, 0.00697779655456543, 0.0072689056396484375, 0.007560014724731445, 0.007851123809814453, 0.008142232894897461, 0.008433341979980469, 0.008724451065063477, 0.009015560150146484, 0.009306669235229492, 0.0095977783203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 7.0, 3.0, 8.0, 12.0, 9.0, 23.0, 35.0, 20.0, 29.0, 23.0, 34.0, 38.0, 48.0, 56.0, 38.0, 65.0, 42.0, 70.0, 52.0, 52.0, 39.0, 42.0, 58.0, 30.0, 45.0, 21.0, 27.0, 7.0, 17.0, 13.0, 10.0, 7.0, 3.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.662441253662109e-06, -5.45848160982132e-06, -5.25452196598053e-06, -5.05056232213974e-06, -4.84660267829895e-06, -4.64264303445816e-06, -4.438683390617371e-06, -4.234723746776581e-06, -4.030764102935791e-06, -3.826804459095001e-06, -3.6228448152542114e-06, -3.4188851714134216e-06, -3.214925527572632e-06, -3.010965883731842e-06, -2.8070062398910522e-06, -2.6030465960502625e-06, -2.3990869522094727e-06, -2.195127308368683e-06, -1.991167664527893e-06, -1.7872080206871033e-06, -1.5832483768463135e-06, -1.3792887330055237e-06, -1.1753290891647339e-06, -9.71369445323944e-07, -7.674098014831543e-07, -5.634501576423645e-07, -3.594905138015747e-07, -1.555308699607849e-07, 4.842877388000488e-08, 2.523884177207947e-07, 4.5634806156158447e-07, 6.603077054023743e-07, 8.642673492431641e-07, 1.0682269930839539e-06, 1.2721866369247437e-06, 1.4761462807655334e-06, 1.6801059246063232e-06, 1.884065568447113e-06, 2.088025212287903e-06, 2.2919848561286926e-06, 2.4959444999694824e-06, 2.6999041438102722e-06, 2.903863787651062e-06, 3.107823431491852e-06, 3.3117830753326416e-06, 3.5157427191734314e-06, 3.719702363014221e-06, 3.923662006855011e-06, 4.127621650695801e-06, 4.3315812945365906e-06, 4.53554093837738e-06, 4.73950058221817e-06, 4.94346022605896e-06, 5.14741986989975e-06, 5.3513795137405396e-06, 5.555339157581329e-06, 5.759298801422119e-06, 5.963258445262909e-06, 6.167218089103699e-06, 6.3711777329444885e-06, 6.575137376785278e-06, 6.779097020626068e-06, 6.983056664466858e-06, 7.187016308307648e-06, 7.3909759521484375e-06]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 6.0, 4.0, 11.0, 11.0, 19.0, 29.0, 37.0, 65.0, 101.0, 129.0, 206.0, 309.0, 460.0, 714.0, 1038.0, 1603.0, 2539.0, 3979.0, 6288.0, 10284.0, 16756.0, 28107.0, 49513.0, 92854.0, 164880.0, 221884.0, 188432.0, 112420.0, 60156.0, 33894.0, 19739.0, 11775.0, 7305.0, 4530.0, 3005.0, 1836.0, 1244.0, 803.0, 504.0, 364.0, 242.0, 168.0, 109.0, 68.0, 50.0, 22.0, 30.0, 14.0, 9.0, 9.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.007442474365234375, -0.007182776927947998, -0.006923079490661621, -0.006663382053375244, -0.006403684616088867, -0.00614398717880249, -0.005884289741516113, -0.005624592304229736, -0.005364894866943359, -0.005105197429656982, -0.0048454999923706055, -0.0045858025550842285, -0.0043261051177978516, -0.004066407680511475, -0.0038067102432250977, -0.0035470128059387207, -0.0032873153686523438, -0.003027617931365967, -0.00276792049407959, -0.002508223056793213, -0.002248525619506836, -0.001988828182220459, -0.001729130744934082, -0.001469433307647705, -0.0012097358703613281, -0.0009500384330749512, -0.0006903409957885742, -0.00043064355850219727, -0.0001709461212158203, 8.875131607055664e-05, 0.0003484487533569336, 0.0006081461906433105, 0.0008678436279296875, 0.0011275410652160645, 0.0013872385025024414, 0.0016469359397888184, 0.0019066333770751953, 0.0021663308143615723, 0.0024260282516479492, 0.002685725688934326, 0.002945423126220703, 0.00320512056350708, 0.003464818000793457, 0.003724515438079834, 0.003984212875366211, 0.004243910312652588, 0.004503607749938965, 0.004763305187225342, 0.005023002624511719, 0.005282700061798096, 0.005542397499084473, 0.00580209493637085, 0.0060617923736572266, 0.0063214898109436035, 0.0065811872482299805, 0.006840884685516357, 0.007100582122802734, 0.007360279560089111, 0.007619976997375488, 0.007879674434661865, 0.008139371871948242, 0.00839906930923462, 0.008658766746520996, 0.008918464183807373, 0.00917816162109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 12.0, 10.0, 7.0, 20.0, 20.0, 20.0, 38.0, 42.0, 44.0, 66.0, 72.0, 90.0, 98.0, 81.0, 71.0, 50.0, 62.0, 45.0, 29.0, 27.0, 22.0, 8.0, 10.0, 11.0, 5.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.003936767578125, -0.003811657428741455, -0.00368654727935791, -0.0035614371299743652, -0.0034363269805908203, -0.0033112168312072754, -0.0031861066818237305, -0.0030609965324401855, -0.0029358863830566406, -0.0028107762336730957, -0.0026856660842895508, -0.002560555934906006, -0.002435445785522461, -0.002310335636138916, -0.002185225486755371, -0.002060115337371826, -0.0019350051879882812, -0.0018098950386047363, -0.0016847848892211914, -0.0015596747398376465, -0.0014345645904541016, -0.0013094544410705566, -0.0011843442916870117, -0.0010592341423034668, -0.0009341239929199219, -0.000809013843536377, -0.000683903694152832, -0.0005587935447692871, -0.0004336833953857422, -0.00030857324600219727, -0.00018346309661865234, -5.835294723510742e-05, 6.67572021484375e-05, 0.00019186735153198242, 0.00031697750091552734, 0.00044208765029907227, 0.0005671977996826172, 0.0006923079490661621, 0.000817418098449707, 0.000942528247833252, 0.0010676383972167969, 0.0011927485466003418, 0.0013178586959838867, 0.0014429688453674316, 0.0015680789947509766, 0.0016931891441345215, 0.0018182992935180664, 0.0019434094429016113, 0.0020685195922851562, 0.002193629741668701, 0.002318739891052246, 0.002443850040435791, 0.002568960189819336, 0.002694070339202881, 0.0028191804885864258, 0.0029442906379699707, 0.0030694007873535156, 0.0031945109367370605, 0.0033196210861206055, 0.0034447312355041504, 0.0035698413848876953, 0.0036949515342712402, 0.003820061683654785, 0.00394517183303833, 0.004070281982421875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 9.0, 7.0, 7.0, 9.0, 11.0, 11.0, 17.0, 14.0, 17.0, 23.0, 24.0, 27.0, 33.0, 34.0, 36.0, 50.0, 50.0, 43.0, 46.0, 48.0, 46.0, 40.0, 43.0, 35.0, 41.0, 34.0, 29.0, 28.0, 27.0, 18.0, 18.0, 17.0, 14.0, 12.0, 13.0, 10.0, 9.0, 7.0, 9.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-6.744120121002197, -6.5294084548950195, -6.314696788787842, -6.099985122680664, -5.885273456573486, -5.670561790466309, -5.455850601196289, -5.241138458251953, -5.026427268981934, -4.811715602874756, -4.597003936767578, -4.3822922706604, -4.167580604553223, -3.952868938446045, -3.7381575107574463, -3.5234458446502686, -3.3087339401245117, -3.094022274017334, -2.8793106079101562, -2.6645989418029785, -2.449887275695801, -2.235175609588623, -2.0204641819000244, -1.8057525157928467, -1.591040849685669, -1.3763291835784912, -1.1616175174713135, -0.9469059705734253, -0.7321943044662476, -0.5174826383590698, -0.30277109146118164, -0.0880594253540039, 0.12665271759033203, 0.3413643538951874, 0.5560759902000427, 0.7707875967025757, 0.9854992628097534, 1.2002109289169312, 1.4149224758148193, 1.629634141921997, 1.8443458080291748, 2.0590574741363525, 2.2737691402435303, 2.488480567932129, 2.7031922340393066, 2.9179039001464844, 3.132615566253662, 3.34732723236084, 3.5620388984680176, 3.7767505645751953, 3.991462230682373, 4.206173896789551, 4.4208855628967285, 4.635597229003906, 4.850308418273926, 5.065020561218262, 5.279731750488281, 5.494443416595459, 5.709155082702637, 5.9238667488098145, 6.138578414916992, 6.35329008102417, 6.568001747131348, 6.782712936401367, 6.997425079345703]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 7.0, 8.0, 9.0, 12.0, 15.0, 15.0, 20.0, 19.0, 27.0, 27.0, 19.0, 40.0, 40.0, 31.0, 31.0, 42.0, 47.0, 47.0, 43.0, 47.0, 32.0, 41.0, 38.0, 48.0, 42.0, 32.0, 36.0, 22.0, 26.0, 28.0, 19.0, 17.0, 10.0, 12.0, 11.0, 7.0, 11.0, 10.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.787393569946289, -7.517526149749756, -7.247659206390381, -6.977791786193848, -6.7079243659973145, -6.438056945800781, -6.168190002441406, -5.898322582244873, -5.62845516204834, -5.358587741851807, -5.088720798492432, -4.818853378295898, -4.548985958099365, -4.279118537902832, -4.009251594543457, -3.739384174346924, -3.469517230987549, -3.1996500492095947, -2.9297826290130615, -2.6599154472351074, -2.390048027038574, -2.12018084526062, -1.850313663482666, -1.5804463624954224, -1.3105790615081787, -1.040711760520935, -0.7708445191383362, -0.5009772777557373, -0.23110997676849365, 0.03875732421875, 0.3086245059967041, 0.5784918069839478, 0.8483591079711914, 1.118226408958435, 1.3880937099456787, 1.6579608917236328, 1.9278281927108765, 2.19769549369812, 2.467562675476074, 2.7374300956726074, 3.0072972774505615, 3.2771644592285156, 3.547031879425049, 3.816899061203003, 4.086766242980957, 4.35663366317749, 4.626501083374023, 4.896368026733398, 5.166235446929932, 5.436102867126465, 5.70596981048584, 5.975837230682373, 6.245704650878906, 6.515571594238281, 6.7854390144348145, 7.055306434631348, 7.325173377990723, 7.595040798187256, 7.864907741546631, 8.134775161743164, 8.404642105102539, 8.67451000213623, 8.944376945495605, 9.21424388885498, 9.484111785888672]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 13.0, 16.0, 30.0, 52.0, 88.0, 130.0, 238.0, 432.0, 637.0, 1164.0, 1854.0, 2935.0, 4775.0, 7918.0, 12696.0, 20012.0, 31518.0, 48924.0, 72517.0, 100565.0, 126385.0, 138443.0, 132160.0, 109809.0, 81015.0, 56220.0, 36802.0, 23275.0, 14471.0, 8950.0, 5672.0, 3467.0, 2115.0, 1269.0, 800.0, 485.0, 288.0, 179.0, 96.0, 40.0, 37.0, 20.0, 17.0, 7.0, 6.0, 6.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.40625, -7.1478271484375, -6.889404296875, -6.6309814453125, -6.37255859375, -6.1141357421875, -5.855712890625, -5.5972900390625, -5.3388671875, -5.0804443359375, -4.822021484375, -4.5635986328125, -4.30517578125, -4.0467529296875, -3.788330078125, -3.5299072265625, -3.271484375, -3.0130615234375, -2.754638671875, -2.4962158203125, -2.23779296875, -1.9793701171875, -1.720947265625, -1.4625244140625, -1.2041015625, -0.9456787109375, -0.687255859375, -0.4288330078125, -0.17041015625, 0.0880126953125, 0.346435546875, 0.6048583984375, 0.86328125, 1.1217041015625, 1.380126953125, 1.6385498046875, 1.89697265625, 2.1553955078125, 2.413818359375, 2.6722412109375, 2.9306640625, 3.1890869140625, 3.447509765625, 3.7059326171875, 3.96435546875, 4.2227783203125, 4.481201171875, 4.7396240234375, 4.998046875, 5.2564697265625, 5.514892578125, 5.7733154296875, 6.03173828125, 6.2901611328125, 6.548583984375, 6.8070068359375, 7.0654296875, 7.3238525390625, 7.582275390625, 7.8406982421875, 8.09912109375, 8.3575439453125, 8.615966796875, 8.8743896484375, 9.1328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 5.0, 6.0, 6.0, 16.0, 10.0, 10.0, 13.0, 12.0, 15.0, 14.0, 15.0, 27.0, 32.0, 33.0, 31.0, 35.0, 35.0, 37.0, 37.0, 55.0, 38.0, 41.0, 39.0, 52.0, 43.0, 30.0, 38.0, 34.0, 39.0, 33.0, 23.0, 21.0, 30.0, 17.0, 15.0, 15.0, 4.0, 14.0, 7.0, 11.0, 10.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76171875, -6.49859619140625, -6.2354736328125, -5.97235107421875, -5.709228515625, -5.44610595703125, -5.1829833984375, -4.91986083984375, -4.65673828125, -4.39361572265625, -4.1304931640625, -3.86737060546875, -3.604248046875, -3.34112548828125, -3.0780029296875, -2.81488037109375, -2.5517578125, -2.28863525390625, -2.0255126953125, -1.76239013671875, -1.499267578125, -1.23614501953125, -0.9730224609375, -0.70989990234375, -0.44677734375, -0.18365478515625, 0.0794677734375, 0.34259033203125, 0.605712890625, 0.86883544921875, 1.1319580078125, 1.39508056640625, 1.658203125, 1.92132568359375, 2.1844482421875, 2.44757080078125, 2.710693359375, 2.97381591796875, 3.2369384765625, 3.50006103515625, 3.76318359375, 4.02630615234375, 4.2894287109375, 4.55255126953125, 4.815673828125, 5.07879638671875, 5.3419189453125, 5.60504150390625, 5.8681640625, 6.13128662109375, 6.3944091796875, 6.65753173828125, 6.920654296875, 7.18377685546875, 7.4468994140625, 7.71002197265625, 7.97314453125, 8.23626708984375, 8.4993896484375, 8.76251220703125, 9.025634765625, 9.28875732421875, 9.5518798828125, 9.81500244140625, 10.078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 11.0, 14.0, 32.0, 39.0, 53.0, 98.0, 150.0, 234.0, 340.0, 484.0, 759.0, 1141.0, 1761.0, 2584.0, 3775.0, 5620.0, 8546.0, 12690.0, 18498.0, 27331.0, 38200.0, 53220.0, 70702.0, 88396.0, 102958.0, 110379.0, 108136.0, 97822.0, 80539.0, 62990.0, 46609.0, 33031.0, 23230.0, 15534.0, 10789.0, 7218.0, 4852.0, 3265.0, 2243.0, 1461.0, 951.0, 614.0, 430.0, 295.0, 184.0, 135.0, 82.0, 45.0, 29.0, 23.0, 11.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0], "bins": [-6.71875, -6.50738525390625, -6.2960205078125, -6.08465576171875, -5.873291015625, -5.66192626953125, -5.4505615234375, -5.23919677734375, -5.02783203125, -4.81646728515625, -4.6051025390625, -4.39373779296875, -4.182373046875, -3.97100830078125, -3.7596435546875, -3.54827880859375, -3.3369140625, -3.12554931640625, -2.9141845703125, -2.70281982421875, -2.491455078125, -2.28009033203125, -2.0687255859375, -1.85736083984375, -1.64599609375, -1.43463134765625, -1.2232666015625, -1.01190185546875, -0.800537109375, -0.58917236328125, -0.3778076171875, -0.16644287109375, 0.044921875, 0.25628662109375, 0.4676513671875, 0.67901611328125, 0.890380859375, 1.10174560546875, 1.3131103515625, 1.52447509765625, 1.73583984375, 1.94720458984375, 2.1585693359375, 2.36993408203125, 2.581298828125, 2.79266357421875, 3.0040283203125, 3.21539306640625, 3.4267578125, 3.63812255859375, 3.8494873046875, 4.06085205078125, 4.272216796875, 4.48358154296875, 4.6949462890625, 4.90631103515625, 5.11767578125, 5.32904052734375, 5.5404052734375, 5.75177001953125, 5.963134765625, 6.17449951171875, 6.3858642578125, 6.59722900390625, 6.80859375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 6.0, 2.0, 4.0, 2.0, 8.0, 4.0, 6.0, 4.0, 6.0, 9.0, 8.0, 16.0, 18.0, 18.0, 25.0, 32.0, 24.0, 22.0, 29.0, 39.0, 30.0, 46.0, 37.0, 40.0, 35.0, 28.0, 44.0, 23.0, 40.0, 41.0, 32.0, 38.0, 40.0, 26.0, 22.0, 20.0, 22.0, 28.0, 19.0, 24.0, 14.0, 13.0, 12.0, 10.0, 5.0, 8.0, 8.0, 7.0, 2.0, 6.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.70703125, -4.5538330078125, -4.400634765625, -4.2474365234375, -4.09423828125, -3.9410400390625, -3.787841796875, -3.6346435546875, -3.4814453125, -3.3282470703125, -3.175048828125, -3.0218505859375, -2.86865234375, -2.7154541015625, -2.562255859375, -2.4090576171875, -2.255859375, -2.1026611328125, -1.949462890625, -1.7962646484375, -1.64306640625, -1.4898681640625, -1.336669921875, -1.1834716796875, -1.0302734375, -0.8770751953125, -0.723876953125, -0.5706787109375, -0.41748046875, -0.2642822265625, -0.111083984375, 0.0421142578125, 0.1953125, 0.3485107421875, 0.501708984375, 0.6549072265625, 0.80810546875, 0.9613037109375, 1.114501953125, 1.2677001953125, 1.4208984375, 1.5740966796875, 1.727294921875, 1.8804931640625, 2.03369140625, 2.1868896484375, 2.340087890625, 2.4932861328125, 2.646484375, 2.7996826171875, 2.952880859375, 3.1060791015625, 3.25927734375, 3.4124755859375, 3.565673828125, 3.7188720703125, 3.8720703125, 4.0252685546875, 4.178466796875, 4.3316650390625, 4.48486328125, 4.6380615234375, 4.791259765625, 4.9444580078125, 5.09765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 5.0, 9.0, 9.0, 17.0, 20.0, 51.0, 60.0, 109.0, 150.0, 213.0, 322.0, 490.0, 795.0, 1152.0, 1951.0, 2990.0, 4929.0, 8365.0, 13937.0, 23032.0, 37852.0, 59753.0, 86356.0, 114111.0, 134035.0, 138590.0, 125339.0, 100405.0, 71682.0, 47441.0, 29310.0, 17758.0, 10583.0, 6305.0, 3890.0, 2386.0, 1507.0, 895.0, 580.0, 378.0, 279.0, 159.0, 112.0, 68.0, 57.0, 38.0, 20.0, 24.0, 11.0, 9.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.5185546875, -1.4714508056640625, -1.424346923828125, -1.3772430419921875, -1.33013916015625, -1.2830352783203125, -1.235931396484375, -1.1888275146484375, -1.1417236328125, -1.0946197509765625, -1.047515869140625, -1.0004119873046875, -0.95330810546875, -0.9062042236328125, -0.859100341796875, -0.8119964599609375, -0.764892578125, -0.7177886962890625, -0.670684814453125, -0.6235809326171875, -0.57647705078125, -0.5293731689453125, -0.482269287109375, -0.4351654052734375, -0.3880615234375, -0.3409576416015625, -0.293853759765625, -0.2467498779296875, -0.19964599609375, -0.1525421142578125, -0.105438232421875, -0.0583343505859375, -0.01123046875, 0.0358734130859375, 0.082977294921875, 0.1300811767578125, 0.17718505859375, 0.2242889404296875, 0.271392822265625, 0.3184967041015625, 0.3656005859375, 0.4127044677734375, 0.459808349609375, 0.5069122314453125, 0.55401611328125, 0.6011199951171875, 0.648223876953125, 0.6953277587890625, 0.742431640625, 0.7895355224609375, 0.836639404296875, 0.8837432861328125, 0.93084716796875, 0.9779510498046875, 1.025054931640625, 1.0721588134765625, 1.1192626953125, 1.1663665771484375, 1.213470458984375, 1.2605743408203125, 1.30767822265625, 1.3547821044921875, 1.401885986328125, 1.4489898681640625, 1.49609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 6.0, 3.0, 7.0, 6.0, 4.0, 5.0, 6.0, 7.0, 17.0, 18.0, 14.0, 21.0, 25.0, 20.0, 30.0, 17.0, 21.0, 32.0, 29.0, 39.0, 46.0, 42.0, 28.0, 47.0, 44.0, 54.0, 61.0, 38.0, 39.0, 39.0, 36.0, 35.0, 34.0, 24.0, 12.0, 18.0, 13.0, 14.0, 10.0, 7.0, 8.0, 9.0, 5.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012612342834472656, -0.0001216307282447815, -0.00011713802814483643, -0.00011264532804489136, -0.00010815262794494629, -0.00010365992784500122, -9.916722774505615e-05, -9.467452764511108e-05, -9.018182754516602e-05, -8.568912744522095e-05, -8.119642734527588e-05, -7.670372724533081e-05, -7.221102714538574e-05, -6.771832704544067e-05, -6.32256269454956e-05, -5.873292684555054e-05, -5.424022674560547e-05, -4.97475266456604e-05, -4.525482654571533e-05, -4.0762126445770264e-05, -3.6269426345825195e-05, -3.177672624588013e-05, -2.728402614593506e-05, -2.279132604598999e-05, -1.8298625946044922e-05, -1.3805925846099854e-05, -9.313225746154785e-06, -4.820525646209717e-06, -3.2782554626464844e-07, 4.16487455368042e-06, 8.657574653625488e-06, 1.3150274753570557e-05, 1.7642974853515625e-05, 2.2135674953460693e-05, 2.6628375053405762e-05, 3.112107515335083e-05, 3.56137752532959e-05, 4.010647535324097e-05, 4.4599175453186035e-05, 4.9091875553131104e-05, 5.358457565307617e-05, 5.807727575302124e-05, 6.256997585296631e-05, 6.706267595291138e-05, 7.155537605285645e-05, 7.604807615280151e-05, 8.054077625274658e-05, 8.503347635269165e-05, 8.952617645263672e-05, 9.401887655258179e-05, 9.851157665252686e-05, 0.00010300427675247192, 0.00010749697685241699, 0.00011198967695236206, 0.00011648237705230713, 0.0001209750771522522, 0.00012546777725219727, 0.00012996047735214233, 0.0001344531774520874, 0.00013894587755203247, 0.00014343857765197754, 0.0001479312777519226, 0.00015242397785186768, 0.00015691667795181274, 0.0001614093780517578]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 1.0, 7.0, 7.0, 7.0, 15.0, 16.0, 29.0, 52.0, 56.0, 87.0, 118.0, 150.0, 261.0, 372.0, 598.0, 951.0, 1448.0, 2414.0, 3987.0, 6574.0, 11157.0, 19584.0, 33144.0, 54368.0, 83532.0, 115311.0, 141659.0, 148386.0, 133780.0, 104358.0, 72473.0, 45942.0, 27617.0, 16349.0, 9506.0, 5564.0, 3253.0, 1976.0, 1203.0, 716.0, 520.0, 305.0, 214.0, 158.0, 99.0, 56.0, 59.0, 40.0, 26.0, 14.0, 13.0, 11.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.5830078125, -1.532470703125, -1.48193359375, -1.431396484375, -1.380859375, -1.330322265625, -1.27978515625, -1.229248046875, -1.1787109375, -1.128173828125, -1.07763671875, -1.027099609375, -0.9765625, -0.926025390625, -0.87548828125, -0.824951171875, -0.7744140625, -0.723876953125, -0.67333984375, -0.622802734375, -0.572265625, -0.521728515625, -0.47119140625, -0.420654296875, -0.3701171875, -0.319580078125, -0.26904296875, -0.218505859375, -0.16796875, -0.117431640625, -0.06689453125, -0.016357421875, 0.0341796875, 0.084716796875, 0.13525390625, 0.185791015625, 0.236328125, 0.286865234375, 0.33740234375, 0.387939453125, 0.4384765625, 0.489013671875, 0.53955078125, 0.590087890625, 0.640625, 0.691162109375, 0.74169921875, 0.792236328125, 0.8427734375, 0.893310546875, 0.94384765625, 0.994384765625, 1.044921875, 1.095458984375, 1.14599609375, 1.196533203125, 1.2470703125, 1.297607421875, 1.34814453125, 1.398681640625, 1.44921875, 1.499755859375, 1.55029296875, 1.600830078125, 1.6513671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 13.0, 10.0, 15.0, 20.0, 35.0, 39.0, 45.0, 48.0, 62.0, 64.0, 63.0, 70.0, 69.0, 57.0, 54.0, 57.0, 46.0, 45.0, 31.0, 39.0, 31.0, 18.0, 14.0, 19.0, 6.0, 3.0, 9.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.955078125, -0.9252700805664062, -0.8954620361328125, -0.8656539916992188, -0.835845947265625, -0.8060379028320312, -0.7762298583984375, -0.7464218139648438, -0.71661376953125, -0.6868057250976562, -0.6569976806640625, -0.6271896362304688, -0.597381591796875, -0.5675735473632812, -0.5377655029296875, -0.5079574584960938, -0.4781494140625, -0.44834136962890625, -0.4185333251953125, -0.38872528076171875, -0.358917236328125, -0.32910919189453125, -0.2993011474609375, -0.26949310302734375, -0.23968505859375, -0.20987701416015625, -0.1800689697265625, -0.15026092529296875, -0.120452880859375, -0.09064483642578125, -0.0608367919921875, -0.03102874755859375, -0.001220703125, 0.02858734130859375, 0.0583953857421875, 0.08820343017578125, 0.118011474609375, 0.14781951904296875, 0.1776275634765625, 0.20743560791015625, 0.23724365234375, 0.26705169677734375, 0.2968597412109375, 0.32666778564453125, 0.356475830078125, 0.38628387451171875, 0.4160919189453125, 0.44589996337890625, 0.4757080078125, 0.5055160522460938, 0.5353240966796875, 0.5651321411132812, 0.594940185546875, 0.6247482299804688, 0.6545562744140625, 0.6843643188476562, 0.71417236328125, 0.7439804077148438, 0.7737884521484375, 0.8035964965820312, 0.833404541015625, 0.8632125854492188, 0.8930206298828125, 0.9228286743164062, 0.95263671875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 4.0, 7.0, 4.0, 10.0, 14.0, 10.0, 10.0, 14.0, 11.0, 18.0, 14.0, 25.0, 35.0, 43.0, 36.0, 38.0, 49.0, 39.0, 48.0, 49.0, 45.0, 54.0, 38.0, 42.0, 37.0, 31.0, 32.0, 30.0, 12.0, 33.0, 22.0, 24.0, 23.0, 19.0, 11.0, 9.0, 6.0, 9.0, 7.0, 12.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.669055461883545, -6.456001281738281, -6.242947578430176, -6.02989387512207, -5.816839694976807, -5.603785514831543, -5.3907318115234375, -5.177678108215332, -4.964623928070068, -4.751569747924805, -4.538516044616699, -4.325462341308594, -4.11240816116333, -3.8993542194366455, -3.686300277709961, -3.4732463359832764, -3.260192394256592, -3.0471384525299072, -2.8340845108032227, -2.621030569076538, -2.4079766273498535, -2.194922685623169, -1.9818687438964844, -1.7688148021697998, -1.5557608604431152, -1.3427069187164307, -1.129652976989746, -0.9165990352630615, -0.703545093536377, -0.4904911518096924, -0.2774372100830078, -0.06438326835632324, 0.14867115020751953, 0.3617250919342041, 0.5747790336608887, 0.7878329753875732, 1.0008869171142578, 1.2139408588409424, 1.426994800567627, 1.6400487422943115, 1.853102684020996, 2.0661566257476807, 2.2792105674743652, 2.49226450920105, 2.7053184509277344, 2.918372392654419, 3.1314263343811035, 3.344480276107788, 3.5575342178344727, 3.7705881595611572, 3.983642101287842, 4.1966962814331055, 4.409749984741211, 4.622803688049316, 4.83585786819458, 5.048912048339844, 5.261965751647949, 5.475019454956055, 5.688073635101318, 5.901127815246582, 6.1141815185546875, 6.327235221862793, 6.540289402008057, 6.75334358215332, 6.966397285461426]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 9.0, 5.0, 12.0, 8.0, 16.0, 16.0, 26.0, 22.0, 20.0, 26.0, 20.0, 40.0, 25.0, 51.0, 36.0, 66.0, 43.0, 52.0, 47.0, 37.0, 42.0, 40.0, 42.0, 41.0, 40.0, 35.0, 31.0, 21.0, 27.0, 21.0, 17.0, 13.0, 9.0, 13.0, 4.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.204326629638672, -8.905534744262695, -8.606742858886719, -8.307950973510742, -8.009159088134766, -7.710367679595947, -7.411576271057129, -7.112784385681152, -6.813992500305176, -6.515200614929199, -6.216408729553223, -5.917617321014404, -5.618825435638428, -5.320033550262451, -5.021242141723633, -4.722450256347656, -4.42365837097168, -4.124866485595703, -3.8260748386383057, -3.527283191680908, -3.2284913063049316, -2.929699420928955, -2.6309077739715576, -2.33211612701416, -2.0333242416381836, -1.7345324754714966, -1.4357407093048096, -1.1369489431381226, -0.8381571769714355, -0.5393654108047485, -0.24057364463806152, 0.05821800231933594, 0.3570108413696289, 0.6558026075363159, 0.9545943737030029, 1.25338613986969, 1.552177906036377, 1.850969672203064, 2.149761438369751, 2.4485530853271484, 2.747344970703125, 3.0461368560791016, 3.344928503036499, 3.6437201499938965, 3.942512035369873, 4.24130392074585, 4.540095329284668, 4.8388872146606445, 5.137679100036621, 5.436470985412598, 5.735262870788574, 6.034054279327393, 6.332846164703369, 6.631638050079346, 6.930429458618164, 7.229221343994141, 7.528013229370117, 7.826805114746094, 8.12559700012207, 8.424388885498047, 8.723180770874023, 9.021971702575684, 9.32076358795166, 9.619555473327637, 9.918347358703613]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 8.0, 14.0, 7.0, 20.0, 43.0, 53.0, 94.0, 143.0, 233.0, 434.0, 599.0, 1056.0, 1773.0, 2792.0, 4523.0, 7778.0, 12818.0, 21484.0, 36478.0, 61411.0, 104017.0, 173897.0, 283895.0, 431743.0, 580220.0, 652811.0, 597395.0, 455998.0, 303843.0, 187670.0, 112712.0, 65912.0, 38469.0, 22140.0, 12999.0, 7735.0, 4416.0, 2708.0, 1521.0, 949.0, 570.0, 346.0, 247.0, 119.0, 81.0, 52.0, 25.0, 22.0, 7.0, 4.0, 6.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.0625, -7.80712890625, -7.5517578125, -7.29638671875, -7.041015625, -6.78564453125, -6.5302734375, -6.27490234375, -6.01953125, -5.76416015625, -5.5087890625, -5.25341796875, -4.998046875, -4.74267578125, -4.4873046875, -4.23193359375, -3.9765625, -3.72119140625, -3.4658203125, -3.21044921875, -2.955078125, -2.69970703125, -2.4443359375, -2.18896484375, -1.93359375, -1.67822265625, -1.4228515625, -1.16748046875, -0.912109375, -0.65673828125, -0.4013671875, -0.14599609375, 0.109375, 0.36474609375, 0.6201171875, 0.87548828125, 1.130859375, 1.38623046875, 1.6416015625, 1.89697265625, 2.15234375, 2.40771484375, 2.6630859375, 2.91845703125, 3.173828125, 3.42919921875, 3.6845703125, 3.93994140625, 4.1953125, 4.45068359375, 4.7060546875, 4.96142578125, 5.216796875, 5.47216796875, 5.7275390625, 5.98291015625, 6.23828125, 6.49365234375, 6.7490234375, 7.00439453125, 7.259765625, 7.51513671875, 7.7705078125, 8.02587890625, 8.28125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 6.0, 6.0, 9.0, 8.0, 11.0, 10.0, 16.0, 14.0, 11.0, 15.0, 24.0, 29.0, 26.0, 34.0, 42.0, 28.0, 42.0, 49.0, 43.0, 41.0, 42.0, 45.0, 39.0, 33.0, 34.0, 48.0, 29.0, 34.0, 35.0, 31.0, 28.0, 14.0, 21.0, 19.0, 15.0, 16.0, 11.0, 10.0, 9.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.14453125, -6.90313720703125, -6.6617431640625, -6.42034912109375, -6.178955078125, -5.93756103515625, -5.6961669921875, -5.45477294921875, -5.21337890625, -4.97198486328125, -4.7305908203125, -4.48919677734375, -4.247802734375, -4.00640869140625, -3.7650146484375, -3.52362060546875, -3.2822265625, -3.04083251953125, -2.7994384765625, -2.55804443359375, -2.316650390625, -2.07525634765625, -1.8338623046875, -1.59246826171875, -1.35107421875, -1.10968017578125, -0.8682861328125, -0.62689208984375, -0.385498046875, -0.14410400390625, 0.0972900390625, 0.33868408203125, 0.580078125, 0.82147216796875, 1.0628662109375, 1.30426025390625, 1.545654296875, 1.78704833984375, 2.0284423828125, 2.26983642578125, 2.51123046875, 2.75262451171875, 2.9940185546875, 3.23541259765625, 3.476806640625, 3.71820068359375, 3.9595947265625, 4.20098876953125, 4.4423828125, 4.68377685546875, 4.9251708984375, 5.16656494140625, 5.407958984375, 5.64935302734375, 5.8907470703125, 6.13214111328125, 6.37353515625, 6.61492919921875, 6.8563232421875, 7.09771728515625, 7.339111328125, 7.58050537109375, 7.8218994140625, 8.06329345703125, 8.3046875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 19.0, 16.0, 40.0, 61.0, 92.0, 158.0, 225.0, 382.0, 634.0, 1034.0, 1731.0, 2685.0, 4540.0, 7623.0, 12679.0, 20814.0, 34001.0, 55239.0, 87474.0, 135772.0, 199281.0, 281612.0, 368630.0, 444900.0, 488335.0, 483558.0, 430976.0, 350174.0, 262550.0, 185407.0, 125143.0, 79937.0, 50075.0, 31045.0, 18725.0, 11442.0, 6859.0, 4084.0, 2462.0, 1476.0, 924.0, 553.0, 347.0, 216.0, 144.0, 82.0, 46.0, 32.0, 24.0, 10.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.703125, -6.49298095703125, -6.2828369140625, -6.07269287109375, -5.862548828125, -5.65240478515625, -5.4422607421875, -5.23211669921875, -5.02197265625, -4.81182861328125, -4.6016845703125, -4.39154052734375, -4.181396484375, -3.97125244140625, -3.7611083984375, -3.55096435546875, -3.3408203125, -3.13067626953125, -2.9205322265625, -2.71038818359375, -2.500244140625, -2.29010009765625, -2.0799560546875, -1.86981201171875, -1.65966796875, -1.44952392578125, -1.2393798828125, -1.02923583984375, -0.819091796875, -0.60894775390625, -0.3988037109375, -0.18865966796875, 0.021484375, 0.23162841796875, 0.4417724609375, 0.65191650390625, 0.862060546875, 1.07220458984375, 1.2823486328125, 1.49249267578125, 1.70263671875, 1.91278076171875, 2.1229248046875, 2.33306884765625, 2.543212890625, 2.75335693359375, 2.9635009765625, 3.17364501953125, 3.3837890625, 3.59393310546875, 3.8040771484375, 4.01422119140625, 4.224365234375, 4.43450927734375, 4.6446533203125, 4.85479736328125, 5.06494140625, 5.27508544921875, 5.4852294921875, 5.69537353515625, 5.905517578125, 6.11566162109375, 6.3258056640625, 6.53594970703125, 6.74609375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 4.0, 3.0, 6.0, 4.0, 11.0, 21.0, 17.0, 15.0, 29.0, 34.0, 52.0, 53.0, 62.0, 94.0, 107.0, 112.0, 148.0, 133.0, 196.0, 196.0, 210.0, 223.0, 222.0, 221.0, 234.0, 193.0, 213.0, 193.0, 168.0, 148.0, 163.0, 131.0, 92.0, 85.0, 57.0, 54.0, 26.0, 38.0, 24.0, 19.0, 19.0, 14.0, 10.0, 6.0, 6.0, 9.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.908203125, -3.787384033203125, -3.66656494140625, -3.545745849609375, -3.4249267578125, -3.304107666015625, -3.18328857421875, -3.062469482421875, -2.941650390625, -2.820831298828125, -2.70001220703125, -2.579193115234375, -2.4583740234375, -2.337554931640625, -2.21673583984375, -2.095916748046875, -1.97509765625, -1.854278564453125, -1.73345947265625, -1.612640380859375, -1.4918212890625, -1.371002197265625, -1.25018310546875, -1.129364013671875, -1.008544921875, -0.887725830078125, -0.76690673828125, -0.646087646484375, -0.5252685546875, -0.404449462890625, -0.28363037109375, -0.162811279296875, -0.0419921875, 0.078826904296875, 0.19964599609375, 0.320465087890625, 0.4412841796875, 0.562103271484375, 0.68292236328125, 0.803741455078125, 0.924560546875, 1.045379638671875, 1.16619873046875, 1.287017822265625, 1.4078369140625, 1.528656005859375, 1.64947509765625, 1.770294189453125, 1.89111328125, 2.011932373046875, 2.13275146484375, 2.253570556640625, 2.3743896484375, 2.495208740234375, 2.61602783203125, 2.736846923828125, 2.857666015625, 2.978485107421875, 3.09930419921875, 3.220123291015625, 3.3409423828125, 3.461761474609375, 3.58258056640625, 3.703399658203125, 3.82421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 2.0, 6.0, 6.0, 6.0, 9.0, 7.0, 15.0, 16.0, 12.0, 14.0, 27.0, 16.0, 30.0, 27.0, 31.0, 29.0, 37.0, 45.0, 41.0, 62.0, 44.0, 52.0, 47.0, 34.0, 46.0, 30.0, 33.0, 34.0, 35.0, 19.0, 23.0, 33.0, 22.0, 18.0, 14.0, 19.0, 12.0, 7.0, 7.0, 10.0, 9.0, 4.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.2608256340026855, -7.035211086273193, -6.809596061706543, -6.583981513977051, -6.358366966247559, -6.132751941680908, -5.907137393951416, -5.681522369384766, -5.455907821655273, -5.230293273925781, -5.004678249359131, -4.779063701629639, -4.553448677062988, -4.327834129333496, -4.102219581604004, -3.8766047954559326, -3.6509900093078613, -3.42537522315979, -3.1997604370117188, -2.9741458892822266, -2.7485311031341553, -2.522916316986084, -2.297301769256592, -2.0716869831085205, -1.8460721969604492, -1.620457410812378, -1.3948427438735962, -1.1692280769348145, -0.9436132907867432, -0.7179985046386719, -0.49238383769989014, -0.2667691707611084, -0.04115486145019531, 0.1844598650932312, 0.4100745916366577, 0.6356893181800842, 0.8613040447235107, 1.086918830871582, 1.3125334978103638, 1.5381481647491455, 1.7637629508972168, 1.989377737045288, 2.2149925231933594, 2.4406070709228516, 2.666221857070923, 2.891836643218994, 3.1174511909484863, 3.3430659770965576, 3.568680763244629, 3.7942955493927, 4.0199103355407715, 4.245524883270264, 4.471139907836914, 4.696754455566406, 4.922369003295898, 5.147983551025391, 5.373598575592041, 5.599213123321533, 5.824828147888184, 6.050442695617676, 6.276057243347168, 6.501672267913818, 6.7272868156433105, 6.952901840209961, 7.178516387939453]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 5.0, 4.0, 2.0, 3.0, 8.0, 5.0, 8.0, 11.0, 11.0, 14.0, 20.0, 14.0, 28.0, 24.0, 26.0, 28.0, 37.0, 38.0, 28.0, 34.0, 39.0, 36.0, 33.0, 43.0, 41.0, 45.0, 35.0, 44.0, 33.0, 48.0, 33.0, 29.0, 24.0, 23.0, 31.0, 23.0, 18.0, 19.0, 14.0, 13.0, 8.0, 4.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.454634666442871, -8.189760208129883, -7.924886226654053, -7.660012245178223, -7.395137786865234, -7.130263328552246, -6.865389347076416, -6.600515365600586, -6.335640907287598, -6.070766448974609, -5.805892467498779, -5.541018486022949, -5.276144027709961, -5.011269569396973, -4.746395587921143, -4.4815216064453125, -4.216647148132324, -3.951772928237915, -3.686898708343506, -3.4220244884490967, -3.1571502685546875, -2.8922760486602783, -2.627401828765869, -2.36252760887146, -2.097653388977051, -1.8327791690826416, -1.5679049491882324, -1.3030307292938232, -1.038156509399414, -0.7732822895050049, -0.5084080696105957, -0.24353384971618652, 0.021340370178222656, 0.28621459007263184, 0.551088809967041, 0.8159630298614502, 1.0808372497558594, 1.3457114696502686, 1.6105856895446777, 1.875459909439087, 2.140334129333496, 2.4052083492279053, 2.6700825691223145, 2.9349567890167236, 3.199831008911133, 3.464705228805542, 3.729579448699951, 3.9944536685943604, 4.2593278884887695, 4.524202346801758, 4.789076328277588, 5.053950309753418, 5.318824768066406, 5.5836992263793945, 5.848573207855225, 6.113447189331055, 6.378321647644043, 6.643196105957031, 6.908070087432861, 7.172944068908691, 7.43781852722168, 7.702692985534668, 7.967566967010498, 8.232440948486328, 8.497315406799316]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 12.0, 20.0, 13.0, 26.0, 38.0, 50.0, 87.0, 132.0, 195.0, 287.0, 453.0, 596.0, 918.0, 1543.0, 2294.0, 3552.0, 5814.0, 9391.0, 15657.0, 26488.0, 46407.0, 86541.0, 191749.0, 369534.0, 130299.0, 65709.0, 36315.0, 21117.0, 12460.0, 7627.0, 4702.0, 3039.0, 1846.0, 1233.0, 828.0, 498.0, 352.0, 227.0, 174.0, 135.0, 68.0, 37.0, 34.0, 19.0, 13.0, 16.0, 9.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.640625, -4.49688720703125, -4.3531494140625, -4.20941162109375, -4.065673828125, -3.92193603515625, -3.7781982421875, -3.63446044921875, -3.49072265625, -3.34698486328125, -3.2032470703125, -3.05950927734375, -2.915771484375, -2.77203369140625, -2.6282958984375, -2.48455810546875, -2.3408203125, -2.19708251953125, -2.0533447265625, -1.90960693359375, -1.765869140625, -1.62213134765625, -1.4783935546875, -1.33465576171875, -1.19091796875, -1.04718017578125, -0.9034423828125, -0.75970458984375, -0.615966796875, -0.47222900390625, -0.3284912109375, -0.18475341796875, -0.041015625, 0.10272216796875, 0.2464599609375, 0.39019775390625, 0.533935546875, 0.67767333984375, 0.8214111328125, 0.96514892578125, 1.10888671875, 1.25262451171875, 1.3963623046875, 1.54010009765625, 1.683837890625, 1.82757568359375, 1.9713134765625, 2.11505126953125, 2.2587890625, 2.40252685546875, 2.5462646484375, 2.69000244140625, 2.833740234375, 2.97747802734375, 3.1212158203125, 3.26495361328125, 3.40869140625, 3.55242919921875, 3.6961669921875, 3.83990478515625, 3.983642578125, 4.12738037109375, 4.2711181640625, 4.41485595703125, 4.55859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 6.0, 8.0, 6.0, 11.0, 7.0, 5.0, 18.0, 17.0, 21.0, 27.0, 23.0, 25.0, 33.0, 40.0, 34.0, 50.0, 39.0, 35.0, 41.0, 44.0, 47.0, 44.0, 44.0, 50.0, 37.0, 33.0, 26.0, 34.0, 36.0, 23.0, 30.0, 26.0, 16.0, 16.0, 12.0, 11.0, 5.0, 3.0, 2.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.2578125, -8.9674072265625, -8.677001953125, -8.3865966796875, -8.09619140625, -7.8057861328125, -7.515380859375, -7.2249755859375, -6.9345703125, -6.6441650390625, -6.353759765625, -6.0633544921875, -5.77294921875, -5.4825439453125, -5.192138671875, -4.9017333984375, -4.611328125, -4.3209228515625, -4.030517578125, -3.7401123046875, -3.44970703125, -3.1593017578125, -2.868896484375, -2.5784912109375, -2.2880859375, -1.9976806640625, -1.707275390625, -1.4168701171875, -1.12646484375, -0.8360595703125, -0.545654296875, -0.2552490234375, 0.03515625, 0.3255615234375, 0.615966796875, 0.9063720703125, 1.19677734375, 1.4871826171875, 1.777587890625, 2.0679931640625, 2.3583984375, 2.6488037109375, 2.939208984375, 3.2296142578125, 3.52001953125, 3.8104248046875, 4.100830078125, 4.3912353515625, 4.681640625, 4.9720458984375, 5.262451171875, 5.5528564453125, 5.84326171875, 6.1336669921875, 6.424072265625, 6.7144775390625, 7.0048828125, 7.2952880859375, 7.585693359375, 7.8760986328125, 8.16650390625, 8.4569091796875, 8.747314453125, 9.0377197265625, 9.328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 12.0, 14.0, 29.0, 42.0, 40.0, 89.0, 114.0, 173.0, 265.0, 350.0, 578.0, 814.0, 1221.0, 1750.0, 2700.0, 3987.0, 5902.0, 9222.0, 14030.0, 21455.0, 33454.0, 52565.0, 89002.0, 183889.0, 324845.0, 118228.0, 66559.0, 41000.0, 26096.0, 17167.0, 11000.0, 7365.0, 4845.0, 3194.0, 2073.0, 1437.0, 983.0, 655.0, 492.0, 253.0, 214.0, 139.0, 96.0, 78.0, 57.0, 25.0, 26.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.10546875, -3.97808837890625, -3.8507080078125, -3.72332763671875, -3.595947265625, -3.46856689453125, -3.3411865234375, -3.21380615234375, -3.08642578125, -2.95904541015625, -2.8316650390625, -2.70428466796875, -2.576904296875, -2.44952392578125, -2.3221435546875, -2.19476318359375, -2.0673828125, -1.94000244140625, -1.8126220703125, -1.68524169921875, -1.557861328125, -1.43048095703125, -1.3031005859375, -1.17572021484375, -1.04833984375, -0.92095947265625, -0.7935791015625, -0.66619873046875, -0.538818359375, -0.41143798828125, -0.2840576171875, -0.15667724609375, -0.029296875, 0.09808349609375, 0.2254638671875, 0.35284423828125, 0.480224609375, 0.60760498046875, 0.7349853515625, 0.86236572265625, 0.98974609375, 1.11712646484375, 1.2445068359375, 1.37188720703125, 1.499267578125, 1.62664794921875, 1.7540283203125, 1.88140869140625, 2.0087890625, 2.13616943359375, 2.2635498046875, 2.39093017578125, 2.518310546875, 2.64569091796875, 2.7730712890625, 2.90045166015625, 3.02783203125, 3.15521240234375, 3.2825927734375, 3.40997314453125, 3.537353515625, 3.66473388671875, 3.7921142578125, 3.91949462890625, 4.046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 0.0, 2.0, 5.0, 4.0, 12.0, 9.0, 9.0, 14.0, 12.0, 16.0, 21.0, 21.0, 28.0, 21.0, 28.0, 22.0, 31.0, 31.0, 38.0, 29.0, 34.0, 38.0, 37.0, 47.0, 34.0, 40.0, 28.0, 51.0, 43.0, 29.0, 39.0, 28.0, 25.0, 28.0, 23.0, 17.0, 19.0, 20.0, 8.0, 13.0, 11.0, 9.0, 6.0, 8.0, 6.0, 5.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.34375, -5.17779541015625, -5.0118408203125, -4.84588623046875, -4.679931640625, -4.51397705078125, -4.3480224609375, -4.18206787109375, -4.01611328125, -3.85015869140625, -3.6842041015625, -3.51824951171875, -3.352294921875, -3.18634033203125, -3.0203857421875, -2.85443115234375, -2.6884765625, -2.52252197265625, -2.3565673828125, -2.19061279296875, -2.024658203125, -1.85870361328125, -1.6927490234375, -1.52679443359375, -1.36083984375, -1.19488525390625, -1.0289306640625, -0.86297607421875, -0.697021484375, -0.53106689453125, -0.3651123046875, -0.19915771484375, -0.033203125, 0.13275146484375, 0.2987060546875, 0.46466064453125, 0.630615234375, 0.79656982421875, 0.9625244140625, 1.12847900390625, 1.29443359375, 1.46038818359375, 1.6263427734375, 1.79229736328125, 1.958251953125, 2.12420654296875, 2.2901611328125, 2.45611572265625, 2.6220703125, 2.78802490234375, 2.9539794921875, 3.11993408203125, 3.285888671875, 3.45184326171875, 3.6177978515625, 3.78375244140625, 3.94970703125, 4.11566162109375, 4.2816162109375, 4.44757080078125, 4.613525390625, 4.77947998046875, 4.9454345703125, 5.11138916015625, 5.27734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 4.0, 13.0, 15.0, 22.0, 31.0, 49.0, 78.0, 148.0, 195.0, 279.0, 405.0, 647.0, 943.0, 1497.0, 2416.0, 3728.0, 6036.0, 9975.0, 17355.0, 31233.0, 60598.0, 129794.0, 244108.0, 254807.0, 139003.0, 65545.0, 33718.0, 18216.0, 10463.0, 6229.0, 3888.0, 2467.0, 1565.0, 1070.0, 701.0, 441.0, 316.0, 191.0, 140.0, 79.0, 48.0, 34.0, 24.0, 14.0, 7.0, 10.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0104522705078125, -0.010145306587219238, -0.009838342666625977, -0.009531378746032715, -0.009224414825439453, -0.008917450904846191, -0.00861048698425293, -0.008303523063659668, -0.007996559143066406, -0.0076895952224731445, -0.007382631301879883, -0.007075667381286621, -0.006768703460693359, -0.006461739540100098, -0.006154775619506836, -0.005847811698913574, -0.0055408477783203125, -0.005233883857727051, -0.004926919937133789, -0.004619956016540527, -0.004312992095947266, -0.004006028175354004, -0.003699064254760742, -0.0033921003341674805, -0.0030851364135742188, -0.002778172492980957, -0.0024712085723876953, -0.0021642446517944336, -0.0018572807312011719, -0.0015503168106079102, -0.0012433528900146484, -0.0009363889694213867, -0.000629425048828125, -0.0003224611282348633, -1.5497207641601562e-05, 0.00029146671295166016, 0.0005984306335449219, 0.0009053945541381836, 0.0012123584747314453, 0.001519322395324707, 0.0018262863159179688, 0.0021332502365112305, 0.002440214157104492, 0.002747178077697754, 0.0030541419982910156, 0.0033611059188842773, 0.003668069839477539, 0.003975033760070801, 0.0042819976806640625, 0.004588961601257324, 0.004895925521850586, 0.005202889442443848, 0.005509853363037109, 0.005816817283630371, 0.006123781204223633, 0.0064307451248168945, 0.006737709045410156, 0.007044672966003418, 0.00735163688659668, 0.007658600807189941, 0.007965564727783203, 0.008272528648376465, 0.008579492568969727, 0.008886456489562988, 0.00919342041015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 4.0, 8.0, 7.0, 9.0, 11.0, 12.0, 16.0, 15.0, 25.0, 25.0, 31.0, 24.0, 37.0, 51.0, 45.0, 60.0, 50.0, 60.0, 47.0, 59.0, 40.0, 65.0, 56.0, 30.0, 34.0, 33.0, 26.0, 16.0, 19.0, 24.0, 10.0, 11.0, 10.0, 10.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.198883056640625e-06, -5.986541509628296e-06, -5.774199962615967e-06, -5.561858415603638e-06, -5.349516868591309e-06, -5.1371753215789795e-06, -4.92483377456665e-06, -4.712492227554321e-06, -4.500150680541992e-06, -4.287809133529663e-06, -4.075467586517334e-06, -3.863126039505005e-06, -3.6507844924926758e-06, -3.4384429454803467e-06, -3.2261013984680176e-06, -3.0137598514556885e-06, -2.8014183044433594e-06, -2.5890767574310303e-06, -2.376735210418701e-06, -2.164393663406372e-06, -1.952052116394043e-06, -1.7397105693817139e-06, -1.5273690223693848e-06, -1.3150274753570557e-06, -1.1026859283447266e-06, -8.903443813323975e-07, -6.780028343200684e-07, -4.6566128730773926e-07, -2.5331974029541016e-07, -4.0978193283081055e-08, 1.7136335372924805e-07, 3.8370490074157715e-07, 5.960464477539062e-07, 8.083879947662354e-07, 1.0207295417785645e-06, 1.2330710887908936e-06, 1.4454126358032227e-06, 1.6577541828155518e-06, 1.8700957298278809e-06, 2.08243727684021e-06, 2.294778823852539e-06, 2.507120370864868e-06, 2.7194619178771973e-06, 2.9318034648895264e-06, 3.1441450119018555e-06, 3.3564865589141846e-06, 3.5688281059265137e-06, 3.7811696529388428e-06, 3.993511199951172e-06, 4.205852746963501e-06, 4.41819429397583e-06, 4.630535840988159e-06, 4.842877388000488e-06, 5.055218935012817e-06, 5.2675604820251465e-06, 5.479902029037476e-06, 5.692243576049805e-06, 5.904585123062134e-06, 6.116926670074463e-06, 6.329268217086792e-06, 6.541609764099121e-06, 6.75395131111145e-06, 6.966292858123779e-06, 7.178634405136108e-06, 7.3909759521484375e-06]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 9.0, 8.0, 13.0, 18.0, 24.0, 28.0, 55.0, 64.0, 80.0, 137.0, 209.0, 299.0, 432.0, 722.0, 1214.0, 1870.0, 2942.0, 4930.0, 8102.0, 13984.0, 25423.0, 47433.0, 95520.0, 184801.0, 250767.0, 193733.0, 101655.0, 50405.0, 26731.0, 14955.0, 8661.0, 4933.0, 3065.0, 1934.0, 1202.0, 734.0, 476.0, 333.0, 217.0, 127.0, 98.0, 67.0, 50.0, 41.0, 20.0, 12.0, 10.0, 9.0, 8.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.00980377197265625, -0.009502530097961426, -0.009201288223266602, -0.008900046348571777, -0.008598804473876953, -0.008297562599182129, -0.007996320724487305, -0.0076950788497924805, -0.007393836975097656, -0.007092595100402832, -0.006791353225708008, -0.006490111351013184, -0.006188869476318359, -0.005887627601623535, -0.005586385726928711, -0.005285143852233887, -0.0049839019775390625, -0.004682660102844238, -0.004381418228149414, -0.00408017635345459, -0.0037789344787597656, -0.0034776926040649414, -0.003176450729370117, -0.002875208854675293, -0.0025739669799804688, -0.0022727251052856445, -0.0019714832305908203, -0.001670241355895996, -0.0013689994812011719, -0.0010677576065063477, -0.0007665157318115234, -0.0004652738571166992, -0.000164031982421875, 0.00013720989227294922, 0.00043845176696777344, 0.0007396936416625977, 0.0010409355163574219, 0.001342177391052246, 0.0016434192657470703, 0.0019446611404418945, 0.0022459030151367188, 0.002547144889831543, 0.002848386764526367, 0.0031496286392211914, 0.0034508705139160156, 0.00375211238861084, 0.004053354263305664, 0.004354596138000488, 0.0046558380126953125, 0.004957079887390137, 0.005258321762084961, 0.005559563636779785, 0.005860805511474609, 0.006162047386169434, 0.006463289260864258, 0.006764531135559082, 0.007065773010253906, 0.0073670148849487305, 0.007668256759643555, 0.007969498634338379, 0.008270740509033203, 0.008571982383728027, 0.008873224258422852, 0.009174466133117676, 0.0094757080078125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 11.0, 6.0, 11.0, 13.0, 33.0, 45.0, 81.0, 92.0, 136.0, 138.0, 130.0, 107.0, 70.0, 43.0, 31.0, 20.0, 12.0, 5.0, 5.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00614166259765625, -0.005968213081359863, -0.0057947635650634766, -0.00562131404876709, -0.005447864532470703, -0.005274415016174316, -0.00510096549987793, -0.004927515983581543, -0.004754066467285156, -0.0045806169509887695, -0.004407167434692383, -0.004233717918395996, -0.004060268402099609, -0.0038868188858032227, -0.003713369369506836, -0.0035399198532104492, -0.0033664703369140625, -0.0031930208206176758, -0.003019571304321289, -0.0028461217880249023, -0.0026726722717285156, -0.002499222755432129, -0.002325773239135742, -0.0021523237228393555, -0.0019788742065429688, -0.001805424690246582, -0.0016319751739501953, -0.0014585256576538086, -0.0012850761413574219, -0.0011116266250610352, -0.0009381771087646484, -0.0007647275924682617, -0.000591278076171875, -0.0004178285598754883, -0.00024437904357910156, -7.092952728271484e-05, 0.00010251998901367188, 0.0002759695053100586, 0.0004494190216064453, 0.000622868537902832, 0.0007963180541992188, 0.0009697675704956055, 0.0011432170867919922, 0.001316666603088379, 0.0014901161193847656, 0.0016635656356811523, 0.001837015151977539, 0.0020104646682739258, 0.0021839141845703125, 0.0023573637008666992, 0.002530813217163086, 0.0027042627334594727, 0.0028777122497558594, 0.003051161766052246, 0.003224611282348633, 0.0033980607986450195, 0.0035715103149414062, 0.003744959831237793, 0.00391840934753418, 0.004091858863830566, 0.004265308380126953, 0.00443875789642334, 0.0046122074127197266, 0.004785656929016113, 0.0049591064453125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 4.0, 7.0, 6.0, 12.0, 8.0, 11.0, 12.0, 17.0, 14.0, 20.0, 19.0, 28.0, 25.0, 35.0, 31.0, 37.0, 44.0, 42.0, 45.0, 54.0, 50.0, 43.0, 36.0, 44.0, 30.0, 39.0, 36.0, 36.0, 25.0, 17.0, 30.0, 22.0, 19.0, 18.0, 19.0, 15.0, 7.0, 6.0, 11.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.329930305480957, -7.104283809661865, -6.878636837005615, -6.652990341186523, -6.427343845367432, -6.20169734954834, -5.97605037689209, -5.750403881072998, -5.524757385253906, -5.2991108894348145, -5.0734639167785645, -4.847817420959473, -4.622170925140381, -4.396524429321289, -4.170877456665039, -3.9452309608459473, -3.7195839881896973, -3.4939372539520264, -3.2682907581329346, -3.0426440238952637, -2.816997528076172, -2.591350793838501, -2.36570405960083, -2.1400575637817383, -1.9144108295440674, -1.688764214515686, -1.4631175994873047, -1.2374708652496338, -1.0118242502212524, -0.7861776351928711, -0.5605309009552002, -0.33488428592681885, -0.1092371940612793, 0.11640945076942444, 0.3420560956001282, 0.5677027702331543, 0.7933493852615356, 1.018996000289917, 1.244642734527588, 1.4702893495559692, 1.6959359645843506, 1.921582579612732, 2.1472291946411133, 2.372875928878784, 2.598522663116455, 2.824169158935547, 3.0498158931732178, 3.2754626274108887, 3.5011091232299805, 3.7267558574676514, 3.952402353286743, 4.178049087524414, 4.403695583343506, 4.629342079162598, 4.854989051818848, 5.0806355476379395, 5.306282043457031, 5.531928539276123, 5.757575511932373, 5.983222007751465, 6.208868503570557, 6.434514999389648, 6.660161972045898, 6.88580846786499, 7.11145544052124]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 5.0, 4.0, 2.0, 3.0, 8.0, 4.0, 8.0, 11.0, 13.0, 13.0, 19.0, 14.0, 29.0, 22.0, 27.0, 26.0, 36.0, 42.0, 28.0, 33.0, 39.0, 35.0, 30.0, 47.0, 41.0, 44.0, 36.0, 44.0, 30.0, 48.0, 35.0, 30.0, 23.0, 25.0, 26.0, 27.0, 17.0, 20.0, 15.0, 12.0, 9.0, 4.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.410799980163574, -8.146383285522461, -7.881966590881348, -7.617549896240234, -7.353133201599121, -7.088716506958008, -6.8242998123168945, -6.559883117675781, -6.295466423034668, -6.031049728393555, -5.766633033752441, -5.502216339111328, -5.237799644470215, -4.973382949829102, -4.708966255187988, -4.444549560546875, -4.1801323890686035, -3.9157156944274902, -3.651298999786377, -3.3868823051452637, -3.1224656105041504, -2.858048915863037, -2.5936319828033447, -2.3292152881622314, -2.064798593521118, -1.8003818988800049, -1.5359652042388916, -1.2715483903884888, -1.0071316957473755, -0.7427150011062622, -0.4782981872558594, -0.2138814926147461, 0.05053520202636719, 0.31495192646980286, 0.5793686509132385, 0.8437854051589966, 1.1082020998001099, 1.3726187944412231, 1.637035608291626, 1.9014523029327393, 2.1658689975738525, 2.430285692214966, 2.694702386856079, 2.9591193199157715, 3.2235360145568848, 3.487952709197998, 3.7523694038391113, 4.016786098480225, 4.281202793121338, 4.545619487762451, 4.8100361824035645, 5.074452877044678, 5.338869571685791, 5.603286266326904, 5.867703437805176, 6.132120132446289, 6.396536827087402, 6.660953521728516, 6.925370216369629, 7.189786911010742, 7.4542036056518555, 7.718620300292969, 7.983036994934082, 8.247453689575195, 8.511870384216309]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 11.0, 21.0, 29.0, 43.0, 79.0, 103.0, 150.0, 246.0, 357.0, 539.0, 921.0, 1374.0, 2065.0, 3295.0, 5062.0, 7967.0, 12462.0, 19334.0, 28849.0, 43369.0, 61829.0, 83225.0, 104892.0, 119558.0, 123209.0, 112497.0, 93149.0, 71373.0, 51305.0, 35166.0, 23412.0, 15234.0, 9751.0, 6281.0, 4009.0, 2650.0, 1612.0, 1101.0, 684.0, 456.0, 307.0, 210.0, 129.0, 92.0, 59.0, 30.0, 20.0, 13.0, 11.0, 6.0, 4.0, 2.0, 2.0, 3.0], "bins": [-7.8515625, -7.6221923828125, -7.392822265625, -7.1634521484375, -6.93408203125, -6.7047119140625, -6.475341796875, -6.2459716796875, -6.0166015625, -5.7872314453125, -5.557861328125, -5.3284912109375, -5.09912109375, -4.8697509765625, -4.640380859375, -4.4110107421875, -4.181640625, -3.9522705078125, -3.722900390625, -3.4935302734375, -3.26416015625, -3.0347900390625, -2.805419921875, -2.5760498046875, -2.3466796875, -2.1173095703125, -1.887939453125, -1.6585693359375, -1.42919921875, -1.1998291015625, -0.970458984375, -0.7410888671875, -0.51171875, -0.2823486328125, -0.052978515625, 0.1763916015625, 0.40576171875, 0.6351318359375, 0.864501953125, 1.0938720703125, 1.3232421875, 1.5526123046875, 1.781982421875, 2.0113525390625, 2.24072265625, 2.4700927734375, 2.699462890625, 2.9288330078125, 3.158203125, 3.3875732421875, 3.616943359375, 3.8463134765625, 4.07568359375, 4.3050537109375, 4.534423828125, 4.7637939453125, 4.9931640625, 5.2225341796875, 5.451904296875, 5.6812744140625, 5.91064453125, 6.1400146484375, 6.369384765625, 6.5987548828125, 6.828125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 7.0, 3.0, 1.0, 6.0, 7.0, 6.0, 5.0, 8.0, 10.0, 16.0, 16.0, 23.0, 24.0, 24.0, 22.0, 24.0, 29.0, 31.0, 30.0, 52.0, 26.0, 38.0, 35.0, 49.0, 49.0, 46.0, 26.0, 42.0, 43.0, 42.0, 28.0, 34.0, 24.0, 26.0, 35.0, 15.0, 27.0, 20.0, 11.0, 12.0, 9.0, 9.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.671875, -8.4085693359375, -8.145263671875, -7.8819580078125, -7.61865234375, -7.3553466796875, -7.092041015625, -6.8287353515625, -6.5654296875, -6.3021240234375, -6.038818359375, -5.7755126953125, -5.51220703125, -5.2489013671875, -4.985595703125, -4.7222900390625, -4.458984375, -4.1956787109375, -3.932373046875, -3.6690673828125, -3.40576171875, -3.1424560546875, -2.879150390625, -2.6158447265625, -2.3525390625, -2.0892333984375, -1.825927734375, -1.5626220703125, -1.29931640625, -1.0360107421875, -0.772705078125, -0.5093994140625, -0.24609375, 0.0172119140625, 0.280517578125, 0.5438232421875, 0.80712890625, 1.0704345703125, 1.333740234375, 1.5970458984375, 1.8603515625, 2.1236572265625, 2.386962890625, 2.6502685546875, 2.91357421875, 3.1768798828125, 3.440185546875, 3.7034912109375, 3.966796875, 4.2301025390625, 4.493408203125, 4.7567138671875, 5.02001953125, 5.2833251953125, 5.546630859375, 5.8099365234375, 6.0732421875, 6.3365478515625, 6.599853515625, 6.8631591796875, 7.12646484375, 7.3897705078125, 7.653076171875, 7.9163818359375, 8.1796875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 8.0, 8.0, 10.0, 17.0, 32.0, 47.0, 76.0, 100.0, 148.0, 232.0, 370.0, 645.0, 974.0, 1430.0, 2262.0, 3384.0, 5186.0, 7966.0, 12248.0, 18082.0, 26908.0, 37856.0, 53224.0, 71127.0, 89975.0, 105769.0, 114229.0, 110687.0, 98775.0, 81362.0, 62427.0, 45551.0, 31738.0, 22004.0, 15128.0, 9768.0, 6510.0, 4317.0, 2841.0, 1809.0, 1195.0, 726.0, 474.0, 338.0, 207.0, 131.0, 108.0, 56.0, 47.0, 21.0, 12.0, 5.0, 8.0, 3.0, 1.0, 4.0, 1.0, 1.0], "bins": [-6.921875, -6.7105712890625, -6.499267578125, -6.2879638671875, -6.07666015625, -5.8653564453125, -5.654052734375, -5.4427490234375, -5.2314453125, -5.0201416015625, -4.808837890625, -4.5975341796875, -4.38623046875, -4.1749267578125, -3.963623046875, -3.7523193359375, -3.541015625, -3.3297119140625, -3.118408203125, -2.9071044921875, -2.69580078125, -2.4844970703125, -2.273193359375, -2.0618896484375, -1.8505859375, -1.6392822265625, -1.427978515625, -1.2166748046875, -1.00537109375, -0.7940673828125, -0.582763671875, -0.3714599609375, -0.16015625, 0.0511474609375, 0.262451171875, 0.4737548828125, 0.68505859375, 0.8963623046875, 1.107666015625, 1.3189697265625, 1.5302734375, 1.7415771484375, 1.952880859375, 2.1641845703125, 2.37548828125, 2.5867919921875, 2.798095703125, 3.0093994140625, 3.220703125, 3.4320068359375, 3.643310546875, 3.8546142578125, 4.06591796875, 4.2772216796875, 4.488525390625, 4.6998291015625, 4.9111328125, 5.1224365234375, 5.333740234375, 5.5450439453125, 5.75634765625, 5.9676513671875, 6.178955078125, 6.3902587890625, 6.6015625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 6.0, 6.0, 4.0, 9.0, 12.0, 14.0, 16.0, 11.0, 18.0, 22.0, 15.0, 26.0, 34.0, 27.0, 26.0, 36.0, 34.0, 38.0, 37.0, 23.0, 37.0, 30.0, 51.0, 30.0, 39.0, 31.0, 39.0, 32.0, 28.0, 30.0, 27.0, 34.0, 29.0, 25.0, 21.0, 15.0, 13.0, 15.0, 14.0, 11.0, 7.0, 5.0, 4.0, 9.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.3046875, -5.14483642578125, -4.9849853515625, -4.82513427734375, -4.665283203125, -4.50543212890625, -4.3455810546875, -4.18572998046875, -4.02587890625, -3.86602783203125, -3.7061767578125, -3.54632568359375, -3.386474609375, -3.22662353515625, -3.0667724609375, -2.90692138671875, -2.7470703125, -2.58721923828125, -2.4273681640625, -2.26751708984375, -2.107666015625, -1.94781494140625, -1.7879638671875, -1.62811279296875, -1.46826171875, -1.30841064453125, -1.1485595703125, -0.98870849609375, -0.828857421875, -0.66900634765625, -0.5091552734375, -0.34930419921875, -0.189453125, -0.02960205078125, 0.1302490234375, 0.29010009765625, 0.449951171875, 0.60980224609375, 0.7696533203125, 0.92950439453125, 1.08935546875, 1.24920654296875, 1.4090576171875, 1.56890869140625, 1.728759765625, 1.88861083984375, 2.0484619140625, 2.20831298828125, 2.3681640625, 2.52801513671875, 2.6878662109375, 2.84771728515625, 3.007568359375, 3.16741943359375, 3.3272705078125, 3.48712158203125, 3.64697265625, 3.80682373046875, 3.9666748046875, 4.12652587890625, 4.286376953125, 4.44622802734375, 4.6060791015625, 4.76593017578125, 4.92578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 9.0, 12.0, 19.0, 24.0, 44.0, 61.0, 115.0, 147.0, 226.0, 332.0, 457.0, 723.0, 1201.0, 1922.0, 2932.0, 4752.0, 7955.0, 12845.0, 20370.0, 32434.0, 48352.0, 69240.0, 91634.0, 111533.0, 122503.0, 121246.0, 109448.0, 89607.0, 67397.0, 47432.0, 31199.0, 19891.0, 12343.0, 7480.0, 4806.0, 2903.0, 1792.0, 1119.0, 718.0, 439.0, 296.0, 222.0, 131.0, 87.0, 57.0, 31.0, 17.0, 22.0, 6.0, 4.0, 8.0, 2.0, 5.0, 3.0, 4.0], "bins": [-1.4638671875, -1.4207611083984375, -1.377655029296875, -1.3345489501953125, -1.29144287109375, -1.2483367919921875, -1.205230712890625, -1.1621246337890625, -1.1190185546875, -1.0759124755859375, -1.032806396484375, -0.9897003173828125, -0.94659423828125, -0.9034881591796875, -0.860382080078125, -0.8172760009765625, -0.774169921875, -0.7310638427734375, -0.687957763671875, -0.6448516845703125, -0.60174560546875, -0.5586395263671875, -0.515533447265625, -0.4724273681640625, -0.4293212890625, -0.3862152099609375, -0.343109130859375, -0.3000030517578125, -0.25689697265625, -0.2137908935546875, -0.170684814453125, -0.1275787353515625, -0.08447265625, -0.0413665771484375, 0.001739501953125, 0.0448455810546875, 0.08795166015625, 0.1310577392578125, 0.174163818359375, 0.2172698974609375, 0.2603759765625, 0.3034820556640625, 0.346588134765625, 0.3896942138671875, 0.43280029296875, 0.4759063720703125, 0.519012451171875, 0.5621185302734375, 0.605224609375, 0.6483306884765625, 0.691436767578125, 0.7345428466796875, 0.77764892578125, 0.8207550048828125, 0.863861083984375, 0.9069671630859375, 0.9500732421875, 0.9931793212890625, 1.036285400390625, 1.0793914794921875, 1.12249755859375, 1.1656036376953125, 1.208709716796875, 1.2518157958984375, 1.294921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 6.0, 12.0, 3.0, 13.0, 24.0, 21.0, 17.0, 24.0, 23.0, 23.0, 27.0, 41.0, 25.0, 29.0, 45.0, 40.0, 43.0, 39.0, 39.0, 39.0, 30.0, 49.0, 40.0, 31.0, 47.0, 36.0, 33.0, 26.0, 20.0, 16.0, 22.0, 19.0, 13.0, 15.0, 15.0, 6.0, 8.0, 9.0, 8.0, 4.0, 2.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001342296600341797, -0.0001297593116760254, -0.0001252889633178711, -0.0001208186149597168, -0.0001163482666015625, -0.0001118779182434082, -0.0001074075698852539, -0.00010293722152709961, -9.846687316894531e-05, -9.399652481079102e-05, -8.952617645263672e-05, -8.505582809448242e-05, -8.058547973632812e-05, -7.611513137817383e-05, -7.164478302001953e-05, -6.717443466186523e-05, -6.270408630371094e-05, -5.823373794555664e-05, -5.3763389587402344e-05, -4.929304122924805e-05, -4.482269287109375e-05, -4.035234451293945e-05, -3.5881996154785156e-05, -3.141164779663086e-05, -2.6941299438476562e-05, -2.2470951080322266e-05, -1.800060272216797e-05, -1.3530254364013672e-05, -9.059906005859375e-06, -4.589557647705078e-06, -1.1920928955078125e-07, 4.351139068603516e-06, 8.821487426757812e-06, 1.329183578491211e-05, 1.7762184143066406e-05, 2.2232532501220703e-05, 2.6702880859375e-05, 3.11732292175293e-05, 3.5643577575683594e-05, 4.011392593383789e-05, 4.458427429199219e-05, 4.9054622650146484e-05, 5.352497100830078e-05, 5.799531936645508e-05, 6.246566772460938e-05, 6.693601608276367e-05, 7.140636444091797e-05, 7.587671279907227e-05, 8.034706115722656e-05, 8.481740951538086e-05, 8.928775787353516e-05, 9.375810623168945e-05, 9.822845458984375e-05, 0.00010269880294799805, 0.00010716915130615234, 0.00011163949966430664, 0.00011610984802246094, 0.00012058019638061523, 0.00012505054473876953, 0.00012952089309692383, 0.00013399124145507812, 0.00013846158981323242, 0.00014293193817138672, 0.00014740228652954102, 0.0001518726348876953]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 7.0, 13.0, 22.0, 22.0, 30.0, 47.0, 89.0, 133.0, 193.0, 321.0, 552.0, 904.0, 1451.0, 2401.0, 4163.0, 7341.0, 12963.0, 22539.0, 38552.0, 60964.0, 89253.0, 118561.0, 139245.0, 142888.0, 127175.0, 99470.0, 69975.0, 44952.0, 27338.0, 15853.0, 8769.0, 5051.0, 2886.0, 1664.0, 1021.0, 658.0, 387.0, 237.0, 160.0, 104.0, 63.0, 52.0, 31.0, 23.0, 12.0, 10.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 4.0], "bins": [-1.7158203125, -1.6656036376953125, -1.615386962890625, -1.5651702880859375, -1.51495361328125, -1.4647369384765625, -1.414520263671875, -1.3643035888671875, -1.3140869140625, -1.2638702392578125, -1.213653564453125, -1.1634368896484375, -1.11322021484375, -1.0630035400390625, -1.012786865234375, -0.9625701904296875, -0.912353515625, -0.8621368408203125, -0.811920166015625, -0.7617034912109375, -0.71148681640625, -0.6612701416015625, -0.611053466796875, -0.5608367919921875, -0.5106201171875, -0.4604034423828125, -0.410186767578125, -0.3599700927734375, -0.30975341796875, -0.2595367431640625, -0.209320068359375, -0.1591033935546875, -0.10888671875, -0.0586700439453125, -0.008453369140625, 0.0417633056640625, 0.09197998046875, 0.1421966552734375, 0.192413330078125, 0.2426300048828125, 0.2928466796875, 0.3430633544921875, 0.393280029296875, 0.4434967041015625, 0.49371337890625, 0.5439300537109375, 0.594146728515625, 0.6443634033203125, 0.694580078125, 0.7447967529296875, 0.795013427734375, 0.8452301025390625, 0.89544677734375, 0.9456634521484375, 0.995880126953125, 1.0460968017578125, 1.0963134765625, 1.1465301513671875, 1.196746826171875, 1.2469635009765625, 1.29718017578125, 1.3473968505859375, 1.397613525390625, 1.4478302001953125, 1.498046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 4.0, 5.0, 5.0, 5.0, 9.0, 8.0, 14.0, 18.0, 12.0, 19.0, 26.0, 27.0, 29.0, 39.0, 42.0, 34.0, 49.0, 46.0, 42.0, 42.0, 49.0, 37.0, 42.0, 43.0, 47.0, 34.0, 37.0, 41.0, 36.0, 30.0, 18.0, 21.0, 19.0, 13.0, 15.0, 15.0, 7.0, 5.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.64453125, -0.6227188110351562, -0.6009063720703125, -0.5790939331054688, -0.557281494140625, -0.5354690551757812, -0.5136566162109375, -0.49184417724609375, -0.47003173828125, -0.44821929931640625, -0.4264068603515625, -0.40459442138671875, -0.382781982421875, -0.36096954345703125, -0.3391571044921875, -0.31734466552734375, -0.2955322265625, -0.27371978759765625, -0.2519073486328125, -0.23009490966796875, -0.208282470703125, -0.18647003173828125, -0.1646575927734375, -0.14284515380859375, -0.12103271484375, -0.09922027587890625, -0.0774078369140625, -0.05559539794921875, -0.033782958984375, -0.01197052001953125, 0.0098419189453125, 0.03165435791015625, 0.053466796875, 0.07527923583984375, 0.0970916748046875, 0.11890411376953125, 0.140716552734375, 0.16252899169921875, 0.1843414306640625, 0.20615386962890625, 0.22796630859375, 0.24977874755859375, 0.2715911865234375, 0.29340362548828125, 0.315216064453125, 0.33702850341796875, 0.3588409423828125, 0.38065338134765625, 0.4024658203125, 0.42427825927734375, 0.4460906982421875, 0.46790313720703125, 0.489715576171875, 0.5115280151367188, 0.5333404541015625, 0.5551528930664062, 0.57696533203125, 0.5987777709960938, 0.6205902099609375, 0.6424026489257812, 0.664215087890625, 0.6860275268554688, 0.7078399658203125, 0.7296524047851562, 0.75146484375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 8.0, 7.0, 5.0, 9.0, 15.0, 13.0, 19.0, 17.0, 22.0, 20.0, 30.0, 32.0, 33.0, 47.0, 50.0, 47.0, 40.0, 38.0, 46.0, 63.0, 43.0, 44.0, 45.0, 37.0, 40.0, 26.0, 28.0, 21.0, 25.0, 13.0, 23.0, 21.0, 13.0, 12.0, 10.0, 7.0, 5.0, 2.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.115194797515869, -6.883185863494873, -6.651176452636719, -6.419167518615723, -6.187158107757568, -5.955149173736572, -5.723139762878418, -5.491130828857422, -5.259121894836426, -5.02711296081543, -4.795103549957275, -4.563094615936279, -4.331085205078125, -4.099076271057129, -3.8670670986175537, -3.6350579261779785, -3.403048515319824, -3.171039342880249, -2.939030170440674, -2.7070212364196777, -2.4750118255615234, -2.2430028915405273, -2.010993719100952, -1.778984546661377, -1.5469753742218018, -1.3149662017822266, -1.0829570293426514, -0.8509479761123657, -0.6189388036727905, -0.38692963123321533, -0.1549205780029297, 0.07708859443664551, 0.3090982437133789, 0.5411074161529541, 0.7731165289878845, 1.005125641822815, 1.2371348142623901, 1.4691439867019653, 1.701153039932251, 1.9331622123718262, 2.1651713848114014, 2.3971805572509766, 2.6291897296905518, 2.861198902130127, 3.093207836151123, 3.3252172470092773, 3.5572261810302734, 3.7892353534698486, 4.021244525909424, 4.25325345993042, 4.485262870788574, 4.71727180480957, 4.949281215667725, 5.181290149688721, 5.413299560546875, 5.645308494567871, 5.877317428588867, 6.109326362609863, 6.341335773468018, 6.573344707489014, 6.805354118347168, 7.037363052368164, 7.26937198638916, 7.5013813972473145, 7.733390808105469]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 3.0, 4.0, 8.0, 8.0, 14.0, 13.0, 10.0, 16.0, 22.0, 17.0, 26.0, 18.0, 37.0, 42.0, 31.0, 41.0, 30.0, 41.0, 41.0, 35.0, 35.0, 46.0, 39.0, 38.0, 41.0, 33.0, 38.0, 33.0, 40.0, 23.0, 29.0, 23.0, 28.0, 19.0, 16.0, 17.0, 13.0, 6.0, 10.0, 6.0, 6.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.047165870666504, -8.762916564941406, -8.478668212890625, -8.194418907165527, -7.910170555114746, -7.625921249389648, -7.341672420501709, -7.0574235916137695, -6.77317476272583, -6.488925933837891, -6.204677104949951, -5.920428276062012, -5.636178970336914, -5.351930618286133, -5.067681312561035, -4.783432483673096, -4.499183654785156, -4.214934825897217, -3.9306859970092773, -3.646436929702759, -3.3621881008148193, -3.07793927192688, -2.7936902046203613, -2.509441375732422, -2.2251925468444824, -1.940943717956543, -1.656694769859314, -1.372445821762085, -1.0881969928741455, -0.803948163986206, -0.519699215888977, -0.23545026779174805, 0.048798561096191406, 0.33304744958877563, 0.6172963380813599, 0.9015452265739441, 1.1857941150665283, 1.4700429439544678, 1.7542918920516968, 2.038540840148926, 2.3227896690368652, 2.6070384979248047, 2.891287326812744, 3.1755363941192627, 3.459785223007202, 3.7440340518951416, 4.02828311920166, 4.3125319480896, 4.596780776977539, 4.8810296058654785, 5.165278434753418, 5.449527263641357, 5.733776092529297, 6.0180253982543945, 6.302274227142334, 6.586523056030273, 6.870771884918213, 7.155020713806152, 7.439269542694092, 7.723518371582031, 8.007767677307129, 8.29201602935791, 8.576265335083008, 8.860513687133789, 9.144762992858887]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 17.0, 11.0, 31.0, 38.0, 45.0, 89.0, 139.0, 226.0, 344.0, 530.0, 800.0, 1248.0, 1922.0, 3027.0, 4781.0, 7505.0, 12100.0, 18806.0, 29733.0, 46969.0, 74423.0, 114633.0, 174313.0, 254142.0, 349549.0, 445403.0, 508349.0, 514910.0, 460969.0, 369096.0, 270976.0, 188153.0, 124706.0, 80074.0, 50839.0, 32173.0, 20093.0, 12323.0, 7707.0, 4854.0, 3039.0, 1863.0, 1189.0, 745.0, 480.0, 318.0, 208.0, 144.0, 97.0, 64.0, 31.0, 25.0, 17.0, 10.0, 8.0, 1.0, 2.0, 2.0], "bins": [-7.203125, -6.9854736328125, -6.767822265625, -6.5501708984375, -6.33251953125, -6.1148681640625, -5.897216796875, -5.6795654296875, -5.4619140625, -5.2442626953125, -5.026611328125, -4.8089599609375, -4.59130859375, -4.3736572265625, -4.156005859375, -3.9383544921875, -3.720703125, -3.5030517578125, -3.285400390625, -3.0677490234375, -2.85009765625, -2.6324462890625, -2.414794921875, -2.1971435546875, -1.9794921875, -1.7618408203125, -1.544189453125, -1.3265380859375, -1.10888671875, -0.8912353515625, -0.673583984375, -0.4559326171875, -0.23828125, -0.0206298828125, 0.197021484375, 0.4146728515625, 0.63232421875, 0.8499755859375, 1.067626953125, 1.2852783203125, 1.5029296875, 1.7205810546875, 1.938232421875, 2.1558837890625, 2.37353515625, 2.5911865234375, 2.808837890625, 3.0264892578125, 3.244140625, 3.4617919921875, 3.679443359375, 3.8970947265625, 4.11474609375, 4.3323974609375, 4.550048828125, 4.7677001953125, 4.9853515625, 5.2030029296875, 5.420654296875, 5.6383056640625, 5.85595703125, 6.0736083984375, 6.291259765625, 6.5089111328125, 6.7265625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 6.0, 5.0, 9.0, 8.0, 13.0, 8.0, 14.0, 13.0, 19.0, 15.0, 33.0, 31.0, 37.0, 33.0, 46.0, 40.0, 24.0, 43.0, 40.0, 44.0, 49.0, 49.0, 38.0, 37.0, 34.0, 42.0, 26.0, 32.0, 31.0, 25.0, 37.0, 16.0, 15.0, 28.0, 18.0, 8.0, 8.0, 11.0, 6.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68359375, -7.42108154296875, -7.1585693359375, -6.89605712890625, -6.633544921875, -6.37103271484375, -6.1085205078125, -5.84600830078125, -5.58349609375, -5.32098388671875, -5.0584716796875, -4.79595947265625, -4.533447265625, -4.27093505859375, -4.0084228515625, -3.74591064453125, -3.4833984375, -3.22088623046875, -2.9583740234375, -2.69586181640625, -2.433349609375, -2.17083740234375, -1.9083251953125, -1.64581298828125, -1.38330078125, -1.12078857421875, -0.8582763671875, -0.59576416015625, -0.333251953125, -0.07073974609375, 0.1917724609375, 0.45428466796875, 0.716796875, 0.97930908203125, 1.2418212890625, 1.50433349609375, 1.766845703125, 2.02935791015625, 2.2918701171875, 2.55438232421875, 2.81689453125, 3.07940673828125, 3.3419189453125, 3.60443115234375, 3.866943359375, 4.12945556640625, 4.3919677734375, 4.65447998046875, 4.9169921875, 5.17950439453125, 5.4420166015625, 5.70452880859375, 5.967041015625, 6.22955322265625, 6.4920654296875, 6.75457763671875, 7.01708984375, 7.27960205078125, 7.5421142578125, 7.80462646484375, 8.067138671875, 8.32965087890625, 8.5921630859375, 8.85467529296875, 9.1171875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 10.0, 16.0, 37.0, 35.0, 64.0, 132.0, 222.0, 342.0, 589.0, 930.0, 1651.0, 2731.0, 4696.0, 7996.0, 13839.0, 23591.0, 39756.0, 66825.0, 106454.0, 166956.0, 244693.0, 334781.0, 425781.0, 487176.0, 504508.0, 470646.0, 394251.0, 304534.0, 216696.0, 144079.0, 92306.0, 56476.0, 33821.0, 19843.0, 11358.0, 6791.0, 3963.0, 2248.0, 1323.0, 845.0, 501.0, 306.0, 190.0, 123.0, 57.0, 43.0, 27.0, 14.0, 12.0, 13.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0], "bins": [-7.3828125, -7.15447998046875, -6.9261474609375, -6.69781494140625, -6.469482421875, -6.24114990234375, -6.0128173828125, -5.78448486328125, -5.55615234375, -5.32781982421875, -5.0994873046875, -4.87115478515625, -4.642822265625, -4.41448974609375, -4.1861572265625, -3.95782470703125, -3.7294921875, -3.50115966796875, -3.2728271484375, -3.04449462890625, -2.816162109375, -2.58782958984375, -2.3594970703125, -2.13116455078125, -1.90283203125, -1.67449951171875, -1.4461669921875, -1.21783447265625, -0.989501953125, -0.76116943359375, -0.5328369140625, -0.30450439453125, -0.076171875, 0.15216064453125, 0.3804931640625, 0.60882568359375, 0.837158203125, 1.06549072265625, 1.2938232421875, 1.52215576171875, 1.75048828125, 1.97882080078125, 2.2071533203125, 2.43548583984375, 2.663818359375, 2.89215087890625, 3.1204833984375, 3.34881591796875, 3.5771484375, 3.80548095703125, 4.0338134765625, 4.26214599609375, 4.490478515625, 4.71881103515625, 4.9471435546875, 5.17547607421875, 5.40380859375, 5.63214111328125, 5.8604736328125, 6.08880615234375, 6.317138671875, 6.54547119140625, 6.7738037109375, 7.00213623046875, 7.23046875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 4.0, 8.0, 4.0, 11.0, 10.0, 17.0, 14.0, 26.0, 42.0, 46.0, 57.0, 81.0, 73.0, 112.0, 117.0, 149.0, 165.0, 193.0, 213.0, 233.0, 232.0, 233.0, 248.0, 248.0, 237.0, 192.0, 179.0, 177.0, 162.0, 132.0, 93.0, 83.0, 68.0, 55.0, 40.0, 34.0, 23.0, 19.0, 14.0, 5.0, 10.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.98828125, -3.84979248046875, -3.7113037109375, -3.57281494140625, -3.434326171875, -3.29583740234375, -3.1573486328125, -3.01885986328125, -2.88037109375, -2.74188232421875, -2.6033935546875, -2.46490478515625, -2.326416015625, -2.18792724609375, -2.0494384765625, -1.91094970703125, -1.7724609375, -1.63397216796875, -1.4954833984375, -1.35699462890625, -1.218505859375, -1.08001708984375, -0.9415283203125, -0.80303955078125, -0.66455078125, -0.52606201171875, -0.3875732421875, -0.24908447265625, -0.110595703125, 0.02789306640625, 0.1663818359375, 0.30487060546875, 0.443359375, 0.58184814453125, 0.7203369140625, 0.85882568359375, 0.997314453125, 1.13580322265625, 1.2742919921875, 1.41278076171875, 1.55126953125, 1.68975830078125, 1.8282470703125, 1.96673583984375, 2.105224609375, 2.24371337890625, 2.3822021484375, 2.52069091796875, 2.6591796875, 2.79766845703125, 2.9361572265625, 3.07464599609375, 3.213134765625, 3.35162353515625, 3.4901123046875, 3.62860107421875, 3.76708984375, 3.90557861328125, 4.0440673828125, 4.18255615234375, 4.321044921875, 4.45953369140625, 4.5980224609375, 4.73651123046875, 4.875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 5.0, 7.0, 12.0, 8.0, 15.0, 16.0, 23.0, 24.0, 30.0, 33.0, 35.0, 41.0, 44.0, 42.0, 44.0, 50.0, 53.0, 53.0, 52.0, 61.0, 46.0, 50.0, 41.0, 30.0, 32.0, 26.0, 21.0, 20.0, 19.0, 14.0, 6.0, 8.0, 6.0, 12.0, 7.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.519721984863281, -8.25348949432373, -7.98725700378418, -7.721024513244629, -7.454792022705078, -7.188559532165527, -6.922327518463135, -6.656095027923584, -6.389862537384033, -6.123630046844482, -5.857397556304932, -5.591165065765381, -5.324933052062988, -5.0587005615234375, -4.792468070983887, -4.526235580444336, -4.260003089904785, -3.9937705993652344, -3.7275381088256836, -3.461305856704712, -3.195073366165161, -2.9288408756256104, -2.6626086235046387, -2.396376132965088, -2.130143642425537, -1.8639111518859863, -1.597678780555725, -1.3314464092254639, -1.065213918685913, -0.7989814281463623, -0.5327490568161011, -0.26651668548583984, -0.0002841949462890625, 0.26594823598861694, 0.532180666923523, 0.798413097858429, 1.064645528793335, 1.3308780193328857, 1.597110390663147, 1.8633427619934082, 2.129575252532959, 2.3958077430725098, 2.6620402336120605, 2.9282724857330322, 3.194504976272583, 3.460737466812134, 3.7269697189331055, 3.9932022094726562, 4.259434700012207, 4.525667190551758, 4.791899681091309, 5.058132171630859, 5.32436466217041, 5.590597152709961, 5.8568291664123535, 6.123061656951904, 6.389294147491455, 6.655526638031006, 6.921759128570557, 7.187991619110107, 7.4542236328125, 7.720456123352051, 7.986688613891602, 8.252921104431152, 8.519153594970703]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 1.0, 7.0, 8.0, 7.0, 6.0, 10.0, 12.0, 11.0, 21.0, 18.0, 32.0, 22.0, 29.0, 38.0, 33.0, 42.0, 43.0, 40.0, 42.0, 35.0, 46.0, 46.0, 37.0, 37.0, 41.0, 42.0, 28.0, 28.0, 30.0, 26.0, 36.0, 31.0, 20.0, 14.0, 23.0, 15.0, 6.0, 16.0, 5.0, 6.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.36882209777832, -9.075923919677734, -8.783026695251465, -8.490128517150879, -8.197230339050293, -7.904332637786865, -7.6114349365234375, -7.318536758422852, -7.025639057159424, -6.732741355895996, -6.43984317779541, -6.146945476531982, -5.854047775268555, -5.561149597167969, -5.268251895904541, -4.975354194641113, -4.682456016540527, -4.3895583152771, -4.096660137176514, -3.803762435913086, -3.510864496231079, -3.2179665565490723, -2.9250688552856445, -2.6321709156036377, -2.339272975921631, -2.046375036239624, -1.7534772157669067, -1.4605793952941895, -1.1676814556121826, -0.8747835159301758, -0.5818856954574585, -0.2889878749847412, 0.003910064697265625, 0.2968079447746277, 0.5897058248519897, 0.8826037049293518, 1.1755015850067139, 1.4683995246887207, 1.761297345161438, 2.0541951656341553, 2.347093105316162, 2.639991044998169, 2.932888984680176, 3.2257866859436035, 3.5186846256256104, 3.811582565307617, 4.104480266571045, 4.397377967834473, 4.690276145935059, 4.983173847198486, 5.276072025299072, 5.5689697265625, 5.861867904663086, 6.154765605926514, 6.447663307189941, 6.740561485290527, 7.033459186553955, 7.326356887817383, 7.619255065917969, 7.9121527671813965, 8.205050468444824, 8.49794864654541, 8.790846824645996, 9.083744049072266, 9.376642227172852]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 2.0, 1.0, 4.0, 4.0, 12.0, 11.0, 15.0, 28.0, 51.0, 62.0, 75.0, 103.0, 167.0, 206.0, 321.0, 494.0, 694.0, 1028.0, 1505.0, 2170.0, 3323.0, 5238.0, 8143.0, 12644.0, 20653.0, 33320.0, 57143.0, 103204.0, 236833.0, 290394.0, 112963.0, 61398.0, 36008.0, 21803.0, 13594.0, 8465.0, 5508.0, 3588.0, 2365.0, 1572.0, 1055.0, 773.0, 517.0, 324.0, 214.0, 160.0, 128.0, 87.0, 73.0, 37.0, 26.0, 14.0, 11.0, 10.0, 7.0, 7.0, 1.0, 2.0, 4.0, 2.0, 3.0], "bins": [-4.625, -4.48077392578125, -4.3365478515625, -4.19232177734375, -4.048095703125, -3.90386962890625, -3.7596435546875, -3.61541748046875, -3.47119140625, -3.32696533203125, -3.1827392578125, -3.03851318359375, -2.894287109375, -2.75006103515625, -2.6058349609375, -2.46160888671875, -2.3173828125, -2.17315673828125, -2.0289306640625, -1.88470458984375, -1.740478515625, -1.59625244140625, -1.4520263671875, -1.30780029296875, -1.16357421875, -1.01934814453125, -0.8751220703125, -0.73089599609375, -0.586669921875, -0.44244384765625, -0.2982177734375, -0.15399169921875, -0.009765625, 0.13446044921875, 0.2786865234375, 0.42291259765625, 0.567138671875, 0.71136474609375, 0.8555908203125, 0.99981689453125, 1.14404296875, 1.28826904296875, 1.4324951171875, 1.57672119140625, 1.720947265625, 1.86517333984375, 2.0093994140625, 2.15362548828125, 2.2978515625, 2.44207763671875, 2.5863037109375, 2.73052978515625, 2.874755859375, 3.01898193359375, 3.1632080078125, 3.30743408203125, 3.45166015625, 3.59588623046875, 3.7401123046875, 3.88433837890625, 4.028564453125, 4.17279052734375, 4.3170166015625, 4.46124267578125, 4.60546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 4.0, 8.0, 5.0, 6.0, 12.0, 13.0, 12.0, 22.0, 33.0, 21.0, 36.0, 33.0, 43.0, 31.0, 51.0, 45.0, 38.0, 39.0, 39.0, 39.0, 52.0, 45.0, 36.0, 37.0, 37.0, 36.0, 31.0, 30.0, 26.0, 29.0, 19.0, 23.0, 15.0, 12.0, 4.0, 6.0, 10.0, 9.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.265625, -9.9464111328125, -9.627197265625, -9.3079833984375, -8.98876953125, -8.6695556640625, -8.350341796875, -8.0311279296875, -7.7119140625, -7.3927001953125, -7.073486328125, -6.7542724609375, -6.43505859375, -6.1158447265625, -5.796630859375, -5.4774169921875, -5.158203125, -4.8389892578125, -4.519775390625, -4.2005615234375, -3.88134765625, -3.5621337890625, -3.242919921875, -2.9237060546875, -2.6044921875, -2.2852783203125, -1.966064453125, -1.6468505859375, -1.32763671875, -1.0084228515625, -0.689208984375, -0.3699951171875, -0.05078125, 0.2684326171875, 0.587646484375, 0.9068603515625, 1.22607421875, 1.5452880859375, 1.864501953125, 2.1837158203125, 2.5029296875, 2.8221435546875, 3.141357421875, 3.4605712890625, 3.77978515625, 4.0989990234375, 4.418212890625, 4.7374267578125, 5.056640625, 5.3758544921875, 5.695068359375, 6.0142822265625, 6.33349609375, 6.6527099609375, 6.971923828125, 7.2911376953125, 7.6103515625, 7.9295654296875, 8.248779296875, 8.5679931640625, 8.88720703125, 9.2064208984375, 9.525634765625, 9.8448486328125, 10.1640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 21.0, 19.0, 25.0, 53.0, 53.0, 97.0, 139.0, 213.0, 296.0, 425.0, 631.0, 915.0, 1425.0, 2081.0, 3199.0, 4887.0, 7292.0, 11319.0, 17856.0, 28444.0, 46261.0, 80007.0, 162258.0, 362113.0, 134369.0, 70543.0, 41454.0, 25637.0, 16256.0, 10443.0, 6747.0, 4277.0, 2899.0, 1939.0, 1289.0, 857.0, 583.0, 373.0, 287.0, 188.0, 147.0, 74.0, 60.0, 27.0, 29.0, 13.0, 10.0, 14.0, 5.0, 4.0, 4.0, 0.0, 3.0], "bins": [-5.02734375, -4.88116455078125, -4.7349853515625, -4.58880615234375, -4.442626953125, -4.29644775390625, -4.1502685546875, -4.00408935546875, -3.85791015625, -3.71173095703125, -3.5655517578125, -3.41937255859375, -3.273193359375, -3.12701416015625, -2.9808349609375, -2.83465576171875, -2.6884765625, -2.54229736328125, -2.3961181640625, -2.24993896484375, -2.103759765625, -1.95758056640625, -1.8114013671875, -1.66522216796875, -1.51904296875, -1.37286376953125, -1.2266845703125, -1.08050537109375, -0.934326171875, -0.78814697265625, -0.6419677734375, -0.49578857421875, -0.349609375, -0.20343017578125, -0.0572509765625, 0.08892822265625, 0.235107421875, 0.38128662109375, 0.5274658203125, 0.67364501953125, 0.81982421875, 0.96600341796875, 1.1121826171875, 1.25836181640625, 1.404541015625, 1.55072021484375, 1.6968994140625, 1.84307861328125, 1.9892578125, 2.13543701171875, 2.2816162109375, 2.42779541015625, 2.573974609375, 2.72015380859375, 2.8663330078125, 3.01251220703125, 3.15869140625, 3.30487060546875, 3.4510498046875, 3.59722900390625, 3.743408203125, 3.88958740234375, 4.0357666015625, 4.18194580078125, 4.328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1.0, 2.0, 8.0, 2.0, 3.0, 8.0, 5.0, 8.0, 13.0, 9.0, 15.0, 18.0, 21.0, 15.0, 23.0, 33.0, 37.0, 38.0, 33.0, 41.0, 34.0, 39.0, 37.0, 51.0, 38.0, 45.0, 41.0, 52.0, 24.0, 47.0, 40.0, 29.0, 26.0, 19.0, 21.0, 23.0, 17.0, 16.0, 18.0, 14.0, 8.0, 8.0, 7.0, 8.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-6.53515625, -6.3447265625, -6.154296875, -5.9638671875, -5.7734375, -5.5830078125, -5.392578125, -5.2021484375, -5.01171875, -4.8212890625, -4.630859375, -4.4404296875, -4.25, -4.0595703125, -3.869140625, -3.6787109375, -3.48828125, -3.2978515625, -3.107421875, -2.9169921875, -2.7265625, -2.5361328125, -2.345703125, -2.1552734375, -1.96484375, -1.7744140625, -1.583984375, -1.3935546875, -1.203125, -1.0126953125, -0.822265625, -0.6318359375, -0.44140625, -0.2509765625, -0.060546875, 0.1298828125, 0.3203125, 0.5107421875, 0.701171875, 0.8916015625, 1.08203125, 1.2724609375, 1.462890625, 1.6533203125, 1.84375, 2.0341796875, 2.224609375, 2.4150390625, 2.60546875, 2.7958984375, 2.986328125, 3.1767578125, 3.3671875, 3.5576171875, 3.748046875, 3.9384765625, 4.12890625, 4.3193359375, 4.509765625, 4.7001953125, 4.890625, 5.0810546875, 5.271484375, 5.4619140625, 5.65234375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 1.0, 2.0, 5.0, 7.0, 10.0, 21.0, 11.0, 22.0, 48.0, 51.0, 60.0, 89.0, 120.0, 168.0, 240.0, 452.0, 626.0, 1075.0, 1625.0, 2695.0, 4581.0, 8050.0, 14292.0, 27558.0, 57696.0, 140675.0, 302881.0, 268983.0, 114108.0, 48804.0, 23641.0, 12529.0, 6804.0, 4054.0, 2369.0, 1443.0, 1000.0, 557.0, 403.0, 253.0, 168.0, 111.0, 77.0, 62.0, 30.0, 29.0, 24.0, 19.0, 10.0, 8.0, 9.0, 6.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.011993408203125, -0.01159214973449707, -0.01119089126586914, -0.010789632797241211, -0.010388374328613281, -0.009987115859985352, -0.009585857391357422, -0.009184598922729492, -0.008783340454101562, -0.008382081985473633, -0.007980823516845703, -0.0075795650482177734, -0.007178306579589844, -0.006777048110961914, -0.006375789642333984, -0.005974531173706055, -0.005573272705078125, -0.005172014236450195, -0.004770755767822266, -0.004369497299194336, -0.003968238830566406, -0.0035669803619384766, -0.003165721893310547, -0.002764463424682617, -0.0023632049560546875, -0.001961946487426758, -0.0015606880187988281, -0.0011594295501708984, -0.0007581710815429688, -0.00035691261291503906, 4.4345855712890625e-05, 0.0004456043243408203, 0.00084686279296875, 0.0012481212615966797, 0.0016493797302246094, 0.002050638198852539, 0.0024518966674804688, 0.0028531551361083984, 0.003254413604736328, 0.003655672073364258, 0.0040569305419921875, 0.004458189010620117, 0.004859447479248047, 0.0052607059478759766, 0.005661964416503906, 0.006063222885131836, 0.006464481353759766, 0.006865739822387695, 0.007266998291015625, 0.007668256759643555, 0.008069515228271484, 0.008470773696899414, 0.008872032165527344, 0.009273290634155273, 0.009674549102783203, 0.010075807571411133, 0.010477066040039062, 0.010878324508666992, 0.011279582977294922, 0.011680841445922852, 0.012082099914550781, 0.012483358383178711, 0.01288461685180664, 0.01328587532043457, 0.0136871337890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 12.0, 11.0, 22.0, 23.0, 21.0, 22.0, 26.0, 49.0, 39.0, 35.0, 46.0, 50.0, 76.0, 49.0, 55.0, 51.0, 70.0, 56.0, 62.0, 31.0, 35.0, 32.0, 29.0, 25.0, 18.0, 11.0, 11.0, 7.0, 7.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.973743438720703e-06, -6.724148988723755e-06, -6.474554538726807e-06, -6.224960088729858e-06, -5.97536563873291e-06, -5.725771188735962e-06, -5.476176738739014e-06, -5.2265822887420654e-06, -4.976987838745117e-06, -4.727393388748169e-06, -4.477798938751221e-06, -4.2282044887542725e-06, -3.978610038757324e-06, -3.729015588760376e-06, -3.4794211387634277e-06, -3.2298266887664795e-06, -2.9802322387695312e-06, -2.730637788772583e-06, -2.4810433387756348e-06, -2.2314488887786865e-06, -1.9818544387817383e-06, -1.73225998878479e-06, -1.4826655387878418e-06, -1.2330710887908936e-06, -9.834766387939453e-07, -7.338821887969971e-07, -4.842877388000488e-07, -2.3469328880310059e-07, 1.4901161193847656e-08, 2.644956111907959e-07, 5.140900611877441e-07, 7.636845111846924e-07, 1.0132789611816406e-06, 1.2628734111785889e-06, 1.5124678611755371e-06, 1.7620623111724854e-06, 2.0116567611694336e-06, 2.261251211166382e-06, 2.51084566116333e-06, 2.7604401111602783e-06, 3.0100345611572266e-06, 3.259629011154175e-06, 3.509223461151123e-06, 3.7588179111480713e-06, 4.0084123611450195e-06, 4.258006811141968e-06, 4.507601261138916e-06, 4.757195711135864e-06, 5.0067901611328125e-06, 5.256384611129761e-06, 5.505979061126709e-06, 5.755573511123657e-06, 6.0051679611206055e-06, 6.254762411117554e-06, 6.504356861114502e-06, 6.75395131111145e-06, 7.0035457611083984e-06, 7.253140211105347e-06, 7.502734661102295e-06, 7.752329111099243e-06, 8.001923561096191e-06, 8.25151801109314e-06, 8.501112461090088e-06, 8.750706911087036e-06, 9.000301361083984e-06]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 7.0, 15.0, 24.0, 24.0, 41.0, 83.0, 81.0, 103.0, 168.0, 240.0, 357.0, 466.0, 668.0, 927.0, 1344.0, 1975.0, 2847.0, 4384.0, 6803.0, 10977.0, 18291.0, 31781.0, 58895.0, 116566.0, 214105.0, 242122.0, 155110.0, 78307.0, 40789.0, 22538.0, 13757.0, 8200.0, 5368.0, 3456.0, 2306.0, 1573.0, 1129.0, 807.0, 557.0, 417.0, 304.0, 177.0, 156.0, 96.0, 69.0, 39.0, 35.0, 27.0, 15.0, 12.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0], "bins": [-0.0108795166015625, -0.010551929473876953, -0.010224342346191406, -0.00989675521850586, -0.009569168090820312, -0.009241580963134766, -0.008913993835449219, -0.008586406707763672, -0.008258819580078125, -0.007931232452392578, -0.007603645324707031, -0.007276058197021484, -0.0069484710693359375, -0.006620883941650391, -0.006293296813964844, -0.005965709686279297, -0.00563812255859375, -0.005310535430908203, -0.004982948303222656, -0.004655361175537109, -0.0043277740478515625, -0.004000186920166016, -0.0036725997924804688, -0.003345012664794922, -0.003017425537109375, -0.002689838409423828, -0.0023622512817382812, -0.0020346641540527344, -0.0017070770263671875, -0.0013794898986816406, -0.0010519027709960938, -0.0007243156433105469, -0.000396728515625, -6.914138793945312e-05, 0.00025844573974609375, 0.0005860328674316406, 0.0009136199951171875, 0.0012412071228027344, 0.0015687942504882812, 0.0018963813781738281, 0.002223968505859375, 0.002551555633544922, 0.0028791427612304688, 0.0032067298889160156, 0.0035343170166015625, 0.0038619041442871094, 0.004189491271972656, 0.004517078399658203, 0.00484466552734375, 0.005172252655029297, 0.005499839782714844, 0.005827426910400391, 0.0061550140380859375, 0.006482601165771484, 0.006810188293457031, 0.007137775421142578, 0.007465362548828125, 0.007792949676513672, 0.008120536804199219, 0.008448123931884766, 0.008775711059570312, 0.00910329818725586, 0.009430885314941406, 0.009758472442626953, 0.0100860595703125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 11.0, 6.0, 11.0, 17.0, 18.0, 23.0, 38.0, 47.0, 65.0, 80.0, 86.0, 116.0, 101.0, 84.0, 64.0, 53.0, 34.0, 36.0, 8.0, 22.0, 12.0, 8.0, 7.0, 5.0, 7.0, 4.0, 7.0, 6.0, 3.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0051116943359375, -0.0049250125885009766, -0.004738330841064453, -0.00455164909362793, -0.004364967346191406, -0.004178285598754883, -0.003991603851318359, -0.003804922103881836, -0.0036182403564453125, -0.003431558609008789, -0.0032448768615722656, -0.003058195114135742, -0.0028715133666992188, -0.0026848316192626953, -0.002498149871826172, -0.0023114681243896484, -0.002124786376953125, -0.0019381046295166016, -0.0017514228820800781, -0.0015647411346435547, -0.0013780593872070312, -0.0011913776397705078, -0.0010046958923339844, -0.0008180141448974609, -0.0006313323974609375, -0.00044465065002441406, -0.0002579689025878906, -7.128715515136719e-05, 0.00011539459228515625, 0.0003020763397216797, 0.0004887580871582031, 0.0006754398345947266, 0.00086212158203125, 0.0010488033294677734, 0.0012354850769042969, 0.0014221668243408203, 0.0016088485717773438, 0.0017955303192138672, 0.0019822120666503906, 0.002168893814086914, 0.0023555755615234375, 0.002542257308959961, 0.0027289390563964844, 0.002915620803833008, 0.0031023025512695312, 0.0032889842987060547, 0.003475666046142578, 0.0036623477935791016, 0.003849029541015625, 0.0040357112884521484, 0.004222393035888672, 0.004409074783325195, 0.004595756530761719, 0.004782438278198242, 0.004969120025634766, 0.005155801773071289, 0.0053424835205078125, 0.005529165267944336, 0.005715847015380859, 0.005902528762817383, 0.006089210510253906, 0.00627589225769043, 0.006462574005126953, 0.0066492557525634766, 0.0068359375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 8.0, 9.0, 11.0, 10.0, 13.0, 19.0, 20.0, 25.0, 40.0, 34.0, 37.0, 48.0, 44.0, 40.0, 52.0, 48.0, 51.0, 62.0, 57.0, 50.0, 46.0, 49.0, 31.0, 36.0, 26.0, 18.0, 21.0, 19.0, 15.0, 12.0, 10.0, 7.0, 9.0, 6.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.70928955078125, -8.44082260131836, -8.172355651855469, -7.903888702392578, -7.6354217529296875, -7.366954803466797, -7.098487854003906, -6.830020904541016, -6.561553955078125, -6.293087005615234, -6.024620056152344, -5.756153106689453, -5.4876861572265625, -5.219219207763672, -4.950752258300781, -4.682285308837891, -4.413818836212158, -4.145351886749268, -3.876884937286377, -3.6084179878234863, -3.3399510383605957, -3.071484088897705, -2.8030173778533936, -2.534550428390503, -2.2660834789276123, -1.9976165294647217, -1.729149580001831, -1.46068274974823, -1.1922158002853394, -0.9237488508224487, -0.6552820205688477, -0.38681507110595703, -0.1183481216430664, 0.15011879801750183, 0.41858571767807007, 0.6870526075363159, 0.9555195569992065, 1.2239865064620972, 1.4924533367156982, 1.7609202861785889, 2.0293872356414795, 2.29785418510437, 2.5663211345672607, 2.8347878456115723, 3.103254795074463, 3.3717217445373535, 3.640188694000244, 3.9086556434631348, 4.177122592926025, 4.445589542388916, 4.714056491851807, 4.982523441314697, 5.250990390777588, 5.5194573402404785, 5.787923812866211, 6.056390762329102, 6.324857711791992, 6.593324661254883, 6.861791610717773, 7.130258560180664, 7.398725509643555, 7.667192459106445, 7.935659408569336, 8.204126358032227, 8.472593307495117]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 1.0, 7.0, 8.0, 7.0, 5.0, 10.0, 13.0, 11.0, 21.0, 18.0, 31.0, 24.0, 29.0, 39.0, 34.0, 42.0, 40.0, 41.0, 42.0, 32.0, 49.0, 46.0, 39.0, 35.0, 39.0, 43.0, 26.0, 30.0, 31.0, 26.0, 38.0, 27.0, 21.0, 15.0, 22.0, 15.0, 6.0, 17.0, 4.0, 6.0, 7.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.395456314086914, -9.103449821472168, -8.811442375183105, -8.51943588256836, -8.227428436279297, -7.935421466827393, -7.643414497375488, -7.351408004760742, -7.05940055847168, -6.767393589019775, -6.475386619567871, -6.183379650115967, -5.8913726806640625, -5.599365711212158, -5.307358741760254, -5.015352249145508, -4.7233452796936035, -4.431338310241699, -4.139331340789795, -3.8473243713378906, -3.5553174018859863, -3.263310432434082, -2.971303701400757, -2.6792967319488525, -2.3872897624969482, -2.095282793045044, -1.8032758235931396, -1.511268973350525, -1.2192620038986206, -0.9272550344467163, -0.6352481842041016, -0.34324121475219727, -0.05123424530029297, 0.24077269434928894, 0.5327796339988708, 0.8247865438461304, 1.1167935132980347, 1.408800482749939, 1.7008073329925537, 1.992814302444458, 2.2848212718963623, 2.5768282413482666, 2.868835210800171, 3.160841941833496, 3.4528489112854004, 3.7448558807373047, 4.036862850189209, 4.328869819641113, 4.620876789093018, 4.912883758544922, 5.204890727996826, 5.4968976974487305, 5.788904666900635, 6.080911636352539, 6.372918128967285, 6.664925575256348, 6.956932067871094, 7.248939037322998, 7.540946006774902, 7.832952976226807, 8.124959945678711, 8.416966438293457, 8.70897388458252, 9.000980377197266, 9.292987823486328]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 11.0, 14.0, 22.0, 22.0, 53.0, 99.0, 135.0, 217.0, 306.0, 493.0, 826.0, 1265.0, 1982.0, 3091.0, 4985.0, 8025.0, 12626.0, 19469.0, 29712.0, 44322.0, 63290.0, 84603.0, 106350.0, 120347.0, 122993.0, 112079.0, 92727.0, 70523.0, 50505.0, 34512.0, 22945.0, 14631.0, 9377.0, 5957.0, 3645.0, 2466.0, 1417.0, 913.0, 603.0, 370.0, 210.0, 147.0, 92.0, 71.0, 44.0, 24.0, 16.0, 12.0, 8.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.88671875, -6.66583251953125, -6.4449462890625, -6.22406005859375, -6.003173828125, -5.78228759765625, -5.5614013671875, -5.34051513671875, -5.11962890625, -4.89874267578125, -4.6778564453125, -4.45697021484375, -4.236083984375, -4.01519775390625, -3.7943115234375, -3.57342529296875, -3.3525390625, -3.13165283203125, -2.9107666015625, -2.68988037109375, -2.468994140625, -2.24810791015625, -2.0272216796875, -1.80633544921875, -1.58544921875, -1.36456298828125, -1.1436767578125, -0.92279052734375, -0.701904296875, -0.48101806640625, -0.2601318359375, -0.03924560546875, 0.181640625, 0.40252685546875, 0.6234130859375, 0.84429931640625, 1.065185546875, 1.28607177734375, 1.5069580078125, 1.72784423828125, 1.94873046875, 2.16961669921875, 2.3905029296875, 2.61138916015625, 2.832275390625, 3.05316162109375, 3.2740478515625, 3.49493408203125, 3.7158203125, 3.93670654296875, 4.1575927734375, 4.37847900390625, 4.599365234375, 4.82025146484375, 5.0411376953125, 5.26202392578125, 5.48291015625, 5.70379638671875, 5.9246826171875, 6.14556884765625, 6.366455078125, 6.58734130859375, 6.8082275390625, 7.02911376953125, 7.25]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 3.0, 5.0, 7.0, 7.0, 11.0, 12.0, 9.0, 16.0, 28.0, 15.0, 26.0, 30.0, 19.0, 29.0, 41.0, 46.0, 42.0, 33.0, 49.0, 42.0, 32.0, 49.0, 45.0, 36.0, 30.0, 41.0, 31.0, 28.0, 25.0, 36.0, 26.0, 25.0, 19.0, 24.0, 16.0, 19.0, 10.0, 7.0, 8.0, 4.0, 9.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.515625, -8.232177734375, -7.94873046875, -7.665283203125, -7.3818359375, -7.098388671875, -6.81494140625, -6.531494140625, -6.248046875, -5.964599609375, -5.68115234375, -5.397705078125, -5.1142578125, -4.830810546875, -4.54736328125, -4.263916015625, -3.98046875, -3.697021484375, -3.41357421875, -3.130126953125, -2.8466796875, -2.563232421875, -2.27978515625, -1.996337890625, -1.712890625, -1.429443359375, -1.14599609375, -0.862548828125, -0.5791015625, -0.295654296875, -0.01220703125, 0.271240234375, 0.5546875, 0.838134765625, 1.12158203125, 1.405029296875, 1.6884765625, 1.971923828125, 2.25537109375, 2.538818359375, 2.822265625, 3.105712890625, 3.38916015625, 3.672607421875, 3.9560546875, 4.239501953125, 4.52294921875, 4.806396484375, 5.08984375, 5.373291015625, 5.65673828125, 5.940185546875, 6.2236328125, 6.507080078125, 6.79052734375, 7.073974609375, 7.357421875, 7.640869140625, 7.92431640625, 8.207763671875, 8.4912109375, 8.774658203125, 9.05810546875, 9.341552734375, 9.625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 11.0, 12.0, 31.0, 50.0, 67.0, 118.0, 162.0, 236.0, 382.0, 627.0, 993.0, 1552.0, 2356.0, 3761.0, 5827.0, 8722.0, 13663.0, 20977.0, 30866.0, 44994.0, 63384.0, 83859.0, 103408.0, 117054.0, 118193.0, 109075.0, 91718.0, 70277.0, 51388.0, 35714.0, 23964.0, 16027.0, 10349.0, 6791.0, 4250.0, 2784.0, 1755.0, 1171.0, 706.0, 458.0, 286.0, 172.0, 147.0, 79.0, 54.0, 31.0, 22.0, 14.0, 8.0, 5.0, 2.0, 5.0, 4.0, 0.0, 1.0], "bins": [-7.25390625, -7.0352783203125, -6.816650390625, -6.5980224609375, -6.37939453125, -6.1607666015625, -5.942138671875, -5.7235107421875, -5.5048828125, -5.2862548828125, -5.067626953125, -4.8489990234375, -4.63037109375, -4.4117431640625, -4.193115234375, -3.9744873046875, -3.755859375, -3.5372314453125, -3.318603515625, -3.0999755859375, -2.88134765625, -2.6627197265625, -2.444091796875, -2.2254638671875, -2.0068359375, -1.7882080078125, -1.569580078125, -1.3509521484375, -1.13232421875, -0.9136962890625, -0.695068359375, -0.4764404296875, -0.2578125, -0.0391845703125, 0.179443359375, 0.3980712890625, 0.61669921875, 0.8353271484375, 1.053955078125, 1.2725830078125, 1.4912109375, 1.7098388671875, 1.928466796875, 2.1470947265625, 2.36572265625, 2.5843505859375, 2.802978515625, 3.0216064453125, 3.240234375, 3.4588623046875, 3.677490234375, 3.8961181640625, 4.11474609375, 4.3333740234375, 4.552001953125, 4.7706298828125, 4.9892578125, 5.2078857421875, 5.426513671875, 5.6451416015625, 5.86376953125, 6.0823974609375, 6.301025390625, 6.5196533203125, 6.73828125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 8.0, 8.0, 5.0, 6.0, 8.0, 12.0, 23.0, 16.0, 22.0, 27.0, 27.0, 35.0, 26.0, 40.0, 41.0, 45.0, 46.0, 44.0, 48.0, 56.0, 39.0, 41.0, 37.0, 39.0, 34.0, 32.0, 36.0, 30.0, 28.0, 28.0, 27.0, 19.0, 15.0, 15.0, 6.0, 8.0, 8.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5546875, -5.35919189453125, -5.1636962890625, -4.96820068359375, -4.772705078125, -4.57720947265625, -4.3817138671875, -4.18621826171875, -3.99072265625, -3.79522705078125, -3.5997314453125, -3.40423583984375, -3.208740234375, -3.01324462890625, -2.8177490234375, -2.62225341796875, -2.4267578125, -2.23126220703125, -2.0357666015625, -1.84027099609375, -1.644775390625, -1.44927978515625, -1.2537841796875, -1.05828857421875, -0.86279296875, -0.66729736328125, -0.4718017578125, -0.27630615234375, -0.080810546875, 0.11468505859375, 0.3101806640625, 0.50567626953125, 0.701171875, 0.89666748046875, 1.0921630859375, 1.28765869140625, 1.483154296875, 1.67864990234375, 1.8741455078125, 2.06964111328125, 2.26513671875, 2.46063232421875, 2.6561279296875, 2.85162353515625, 3.047119140625, 3.24261474609375, 3.4381103515625, 3.63360595703125, 3.8291015625, 4.02459716796875, 4.2200927734375, 4.41558837890625, 4.611083984375, 4.80657958984375, 5.0020751953125, 5.19757080078125, 5.39306640625, 5.58856201171875, 5.7840576171875, 5.97955322265625, 6.175048828125, 6.37054443359375, 6.5660400390625, 6.76153564453125, 6.95703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 9.0, 12.0, 17.0, 20.0, 41.0, 59.0, 119.0, 159.0, 317.0, 527.0, 954.0, 1615.0, 2863.0, 5153.0, 8944.0, 15751.0, 26452.0, 42135.0, 63466.0, 87959.0, 111377.0, 126799.0, 129324.0, 119498.0, 98951.0, 74247.0, 51438.0, 33233.0, 19955.0, 11790.0, 6783.0, 3784.0, 2065.0, 1138.0, 669.0, 366.0, 175.0, 143.0, 94.0, 56.0, 31.0, 20.0, 18.0, 13.0, 6.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.58203125, -1.5329437255859375, -1.483856201171875, -1.4347686767578125, -1.38568115234375, -1.3365936279296875, -1.287506103515625, -1.2384185791015625, -1.1893310546875, -1.1402435302734375, -1.091156005859375, -1.0420684814453125, -0.99298095703125, -0.9438934326171875, -0.894805908203125, -0.8457183837890625, -0.796630859375, -0.7475433349609375, -0.698455810546875, -0.6493682861328125, -0.60028076171875, -0.5511932373046875, -0.502105712890625, -0.4530181884765625, -0.4039306640625, -0.3548431396484375, -0.305755615234375, -0.2566680908203125, -0.20758056640625, -0.1584930419921875, -0.109405517578125, -0.0603179931640625, -0.01123046875, 0.0378570556640625, 0.086944580078125, 0.1360321044921875, 0.18511962890625, 0.2342071533203125, 0.283294677734375, 0.3323822021484375, 0.3814697265625, 0.4305572509765625, 0.479644775390625, 0.5287322998046875, 0.57781982421875, 0.6269073486328125, 0.675994873046875, 0.7250823974609375, 0.774169921875, 0.8232574462890625, 0.872344970703125, 0.9214324951171875, 0.97052001953125, 1.0196075439453125, 1.068695068359375, 1.1177825927734375, 1.1668701171875, 1.2159576416015625, 1.265045166015625, 1.3141326904296875, 1.36322021484375, 1.4123077392578125, 1.461395263671875, 1.5104827880859375, 1.5595703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 8.0, 12.0, 6.0, 18.0, 17.0, 21.0, 15.0, 23.0, 24.0, 32.0, 30.0, 33.0, 39.0, 42.0, 46.0, 51.0, 45.0, 38.0, 51.0, 49.0, 45.0, 34.0, 36.0, 39.0, 39.0, 35.0, 24.0, 21.0, 22.0, 20.0, 22.0, 16.0, 10.0, 12.0, 5.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.00020432472229003906, -0.00019904226064682007, -0.00019375979900360107, -0.00018847733736038208, -0.00018319487571716309, -0.0001779124140739441, -0.0001726299524307251, -0.0001673474907875061, -0.0001620650291442871, -0.00015678256750106812, -0.00015150010585784912, -0.00014621764421463013, -0.00014093518257141113, -0.00013565272092819214, -0.00013037025928497314, -0.00012508779764175415, -0.00011980533599853516, -0.00011452287435531616, -0.00010924041271209717, -0.00010395795106887817, -9.867548942565918e-05, -9.339302778244019e-05, -8.811056613922119e-05, -8.28281044960022e-05, -7.75456428527832e-05, -7.226318120956421e-05, -6.698071956634521e-05, -6.169825792312622e-05, -5.6415796279907227e-05, -5.113333463668823e-05, -4.585087299346924e-05, -4.0568411350250244e-05, -3.528594970703125e-05, -3.0003488063812256e-05, -2.4721026420593262e-05, -1.9438564777374268e-05, -1.4156103134155273e-05, -8.87364149093628e-06, -3.591179847717285e-06, 1.691281795501709e-06, 6.973743438720703e-06, 1.2256205081939697e-05, 1.753866672515869e-05, 2.2821128368377686e-05, 2.810359001159668e-05, 3.3386051654815674e-05, 3.866851329803467e-05, 4.395097494125366e-05, 4.9233436584472656e-05, 5.451589822769165e-05, 5.9798359870910645e-05, 6.508082151412964e-05, 7.036328315734863e-05, 7.564574480056763e-05, 8.092820644378662e-05, 8.621066808700562e-05, 9.149312973022461e-05, 9.67755913734436e-05, 0.0001020580530166626, 0.00010734051465988159, 0.00011262297630310059, 0.00011790543794631958, 0.00012318789958953857, 0.00012847036123275757, 0.00013375282287597656]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 4.0, 7.0, 13.0, 19.0, 26.0, 38.0, 78.0, 91.0, 163.0, 236.0, 412.0, 717.0, 1025.0, 1645.0, 2759.0, 4289.0, 6874.0, 11157.0, 17720.0, 26536.0, 37733.0, 52422.0, 69197.0, 85492.0, 99286.0, 106387.0, 107133.0, 98957.0, 85698.0, 69119.0, 52280.0, 37857.0, 26146.0, 17264.0, 11027.0, 7117.0, 4295.0, 2752.0, 1782.0, 1022.0, 642.0, 436.0, 249.0, 180.0, 96.0, 59.0, 40.0, 19.0, 20.0, 20.0, 11.0, 4.0, 5.0, 1.0, 2.0, 3.0], "bins": [-1.388671875, -1.3478240966796875, -1.306976318359375, -1.2661285400390625, -1.22528076171875, -1.1844329833984375, -1.143585205078125, -1.1027374267578125, -1.0618896484375, -1.0210418701171875, -0.980194091796875, -0.9393463134765625, -0.89849853515625, -0.8576507568359375, -0.816802978515625, -0.7759552001953125, -0.735107421875, -0.6942596435546875, -0.653411865234375, -0.6125640869140625, -0.57171630859375, -0.5308685302734375, -0.490020751953125, -0.4491729736328125, -0.4083251953125, -0.3674774169921875, -0.326629638671875, -0.2857818603515625, -0.24493408203125, -0.2040863037109375, -0.163238525390625, -0.1223907470703125, -0.08154296875, -0.0406951904296875, 0.000152587890625, 0.0410003662109375, 0.08184814453125, 0.1226959228515625, 0.163543701171875, 0.2043914794921875, 0.2452392578125, 0.2860870361328125, 0.326934814453125, 0.3677825927734375, 0.40863037109375, 0.4494781494140625, 0.490325927734375, 0.5311737060546875, 0.572021484375, 0.6128692626953125, 0.653717041015625, 0.6945648193359375, 0.73541259765625, 0.7762603759765625, 0.817108154296875, 0.8579559326171875, 0.8988037109375, 0.9396514892578125, 0.980499267578125, 1.0213470458984375, 1.06219482421875, 1.1030426025390625, 1.143890380859375, 1.1847381591796875, 1.2255859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 7.0, 12.0, 11.0, 11.0, 10.0, 17.0, 18.0, 16.0, 18.0, 23.0, 24.0, 26.0, 28.0, 33.0, 42.0, 43.0, 38.0, 38.0, 51.0, 44.0, 35.0, 31.0, 38.0, 29.0, 44.0, 40.0, 30.0, 29.0, 25.0, 23.0, 22.0, 28.0, 11.0, 18.0, 11.0, 10.0, 10.0, 10.0, 8.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6025390625, -0.5822982788085938, -0.5620574951171875, -0.5418167114257812, -0.521575927734375, -0.5013351440429688, -0.4810943603515625, -0.46085357666015625, -0.44061279296875, -0.42037200927734375, -0.4001312255859375, -0.37989044189453125, -0.359649658203125, -0.33940887451171875, -0.3191680908203125, -0.29892730712890625, -0.2786865234375, -0.25844573974609375, -0.2382049560546875, -0.21796417236328125, -0.197723388671875, -0.17748260498046875, -0.1572418212890625, -0.13700103759765625, -0.11676025390625, -0.09651947021484375, -0.0762786865234375, -0.05603790283203125, -0.035797119140625, -0.01555633544921875, 0.0046844482421875, 0.02492523193359375, 0.045166015625, 0.06540679931640625, 0.0856475830078125, 0.10588836669921875, 0.126129150390625, 0.14636993408203125, 0.1666107177734375, 0.18685150146484375, 0.20709228515625, 0.22733306884765625, 0.2475738525390625, 0.26781463623046875, 0.288055419921875, 0.30829620361328125, 0.3285369873046875, 0.34877777099609375, 0.3690185546875, 0.38925933837890625, 0.4095001220703125, 0.42974090576171875, 0.449981689453125, 0.47022247314453125, 0.4904632568359375, 0.5107040405273438, 0.53094482421875, 0.5511856079101562, 0.5714263916015625, 0.5916671752929688, 0.611907958984375, 0.6321487426757812, 0.6523895263671875, 0.6726303100585938, 0.69287109375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 9.0, 6.0, 8.0, 9.0, 7.0, 10.0, 21.0, 25.0, 25.0, 25.0, 30.0, 38.0, 36.0, 36.0, 47.0, 41.0, 50.0, 60.0, 47.0, 41.0, 68.0, 51.0, 53.0, 33.0, 28.0, 24.0, 29.0, 28.0, 18.0, 25.0, 19.0, 10.0, 10.0, 8.0, 9.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.250895500183105, -7.987729072570801, -7.724562644958496, -7.461395740509033, -7.1982293128967285, -6.935062885284424, -6.671895980834961, -6.408729553222656, -6.145563125610352, -5.882396697998047, -5.619230270385742, -5.356063365936279, -5.092896938323975, -4.82973051071167, -4.566563606262207, -4.303397178649902, -4.040230751037598, -3.777064323425293, -3.513897657394409, -3.2507309913635254, -2.9875645637512207, -2.724398136138916, -2.4612314701080322, -2.1980648040771484, -1.9348983764648438, -1.6717318296432495, -1.4085652828216553, -1.145398736000061, -0.8822321891784668, -0.6190656423568726, -0.3558990955352783, -0.09273254871368408, 0.17043495178222656, 0.4336014986038208, 0.696768045425415, 0.9599345922470093, 1.2231011390686035, 1.4862676858901978, 1.749434232711792, 2.012600898742676, 2.2757673263549805, 2.538933753967285, 2.802100419998169, 3.0652670860290527, 3.3284335136413574, 3.591599941253662, 3.854766607284546, 4.11793327331543, 4.381099700927734, 4.644266128540039, 4.907432556152344, 5.170599460601807, 5.433765888214111, 5.696932315826416, 5.960099220275879, 6.223265647888184, 6.486432075500488, 6.749598503112793, 7.012764930725098, 7.2759318351745605, 7.539098262786865, 7.80226469039917, 8.065431594848633, 8.328598022460938, 8.591764450073242]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 6.0, 1.0, 7.0, 7.0, 7.0, 8.0, 16.0, 11.0, 20.0, 11.0, 33.0, 15.0, 30.0, 23.0, 34.0, 31.0, 43.0, 45.0, 42.0, 40.0, 33.0, 44.0, 47.0, 42.0, 50.0, 36.0, 35.0, 33.0, 29.0, 27.0, 33.0, 23.0, 30.0, 20.0, 16.0, 18.0, 5.0, 15.0, 8.0, 9.0, 7.0, 10.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.381034851074219, -8.079608917236328, -7.778183460235596, -7.476758003234863, -7.175332069396973, -6.873906135559082, -6.57248067855835, -6.271055221557617, -5.969629287719727, -5.668203353881836, -5.3667778968811035, -5.065352439880371, -4.7639265060424805, -4.46250057220459, -4.161075115203857, -3.859649419784546, -3.5582237243652344, -3.256798028945923, -2.9553723335266113, -2.6539466381073, -2.3525209426879883, -2.0510952472686768, -1.7496695518493652, -1.4482438564300537, -1.1468181610107422, -0.8453924655914307, -0.5439667701721191, -0.24254107475280762, 0.058884620666503906, 0.36031031608581543, 0.661736011505127, 0.9631617069244385, 1.26458740234375, 1.5660130977630615, 1.867438793182373, 2.1688644886016846, 2.470290184020996, 2.7717158794403076, 3.073141574859619, 3.3745672702789307, 3.675992965698242, 3.9774186611175537, 4.278844356536865, 4.580269813537598, 4.881695747375488, 5.183121681213379, 5.484547138214111, 5.785972595214844, 6.087398529052734, 6.388824462890625, 6.690249919891357, 6.99167537689209, 7.2931013107299805, 7.594527244567871, 7.8959527015686035, 8.197378158569336, 8.498804092407227, 8.800230026245117, 9.101655960083008, 9.403080940246582, 9.704506874084473, 10.005932807922363, 10.307357788085938, 10.608783721923828, 10.910209655761719]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 10.0, 30.0, 39.0, 68.0, 105.0, 216.0, 395.0, 690.0, 1280.0, 2285.0, 4277.0, 7716.0, 14234.0, 25901.0, 47670.0, 86563.0, 152071.0, 254158.0, 396451.0, 544618.0, 641038.0, 624785.0, 509970.0, 358678.0, 225940.0, 132320.0, 73987.0, 40615.0, 21773.0, 11756.0, 6482.0, 3608.0, 1992.0, 1075.0, 609.0, 332.0, 204.0, 123.0, 89.0, 52.0, 29.0, 16.0, 12.0, 12.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.4375, -8.145263671875, -7.85302734375, -7.560791015625, -7.2685546875, -6.976318359375, -6.68408203125, -6.391845703125, -6.099609375, -5.807373046875, -5.51513671875, -5.222900390625, -4.9306640625, -4.638427734375, -4.34619140625, -4.053955078125, -3.76171875, -3.469482421875, -3.17724609375, -2.885009765625, -2.5927734375, -2.300537109375, -2.00830078125, -1.716064453125, -1.423828125, -1.131591796875, -0.83935546875, -0.547119140625, -0.2548828125, 0.037353515625, 0.32958984375, 0.621826171875, 0.9140625, 1.206298828125, 1.49853515625, 1.790771484375, 2.0830078125, 2.375244140625, 2.66748046875, 2.959716796875, 3.251953125, 3.544189453125, 3.83642578125, 4.128662109375, 4.4208984375, 4.713134765625, 5.00537109375, 5.297607421875, 5.58984375, 5.882080078125, 6.17431640625, 6.466552734375, 6.7587890625, 7.051025390625, 7.34326171875, 7.635498046875, 7.927734375, 8.219970703125, 8.51220703125, 8.804443359375, 9.0966796875, 9.388916015625, 9.68115234375, 9.973388671875, 10.265625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 2.0, 1.0, 6.0, 8.0, 11.0, 11.0, 19.0, 19.0, 20.0, 26.0, 21.0, 19.0, 35.0, 37.0, 41.0, 35.0, 42.0, 52.0, 40.0, 23.0, 43.0, 47.0, 45.0, 42.0, 33.0, 38.0, 33.0, 32.0, 32.0, 27.0, 21.0, 27.0, 28.0, 12.0, 12.0, 11.0, 14.0, 9.0, 9.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.62109375, -7.35260009765625, -7.0841064453125, -6.81561279296875, -6.547119140625, -6.27862548828125, -6.0101318359375, -5.74163818359375, -5.47314453125, -5.20465087890625, -4.9361572265625, -4.66766357421875, -4.399169921875, -4.13067626953125, -3.8621826171875, -3.59368896484375, -3.3251953125, -3.05670166015625, -2.7882080078125, -2.51971435546875, -2.251220703125, -1.98272705078125, -1.7142333984375, -1.44573974609375, -1.17724609375, -0.90875244140625, -0.6402587890625, -0.37176513671875, -0.103271484375, 0.16522216796875, 0.4337158203125, 0.70220947265625, 0.970703125, 1.23919677734375, 1.5076904296875, 1.77618408203125, 2.044677734375, 2.31317138671875, 2.5816650390625, 2.85015869140625, 3.11865234375, 3.38714599609375, 3.6556396484375, 3.92413330078125, 4.192626953125, 4.46112060546875, 4.7296142578125, 4.99810791015625, 5.2666015625, 5.53509521484375, 5.8035888671875, 6.07208251953125, 6.340576171875, 6.60906982421875, 6.8775634765625, 7.14605712890625, 7.41455078125, 7.68304443359375, 7.9515380859375, 8.22003173828125, 8.488525390625, 8.75701904296875, 9.0255126953125, 9.29400634765625, 9.5625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 7.0, 4.0, 6.0, 12.0, 39.0, 31.0, 63.0, 94.0, 198.0, 260.0, 374.0, 697.0, 1071.0, 1804.0, 2966.0, 4916.0, 8240.0, 13737.0, 22801.0, 37005.0, 59781.0, 94623.0, 142338.0, 207341.0, 283045.0, 359894.0, 425462.0, 463193.0, 458776.0, 418196.0, 349650.0, 271493.0, 197050.0, 135472.0, 89118.0, 56128.0, 35077.0, 21020.0, 12733.0, 7753.0, 4617.0, 2747.0, 1715.0, 1068.0, 628.0, 407.0, 225.0, 146.0, 104.0, 58.0, 43.0, 26.0, 14.0, 10.0, 4.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-6.84375, -6.62249755859375, -6.4012451171875, -6.17999267578125, -5.958740234375, -5.73748779296875, -5.5162353515625, -5.29498291015625, -5.07373046875, -4.85247802734375, -4.6312255859375, -4.40997314453125, -4.188720703125, -3.96746826171875, -3.7462158203125, -3.52496337890625, -3.3037109375, -3.08245849609375, -2.8612060546875, -2.63995361328125, -2.418701171875, -2.19744873046875, -1.9761962890625, -1.75494384765625, -1.53369140625, -1.31243896484375, -1.0911865234375, -0.86993408203125, -0.648681640625, -0.42742919921875, -0.2061767578125, 0.01507568359375, 0.236328125, 0.45758056640625, 0.6788330078125, 0.90008544921875, 1.121337890625, 1.34259033203125, 1.5638427734375, 1.78509521484375, 2.00634765625, 2.22760009765625, 2.4488525390625, 2.67010498046875, 2.891357421875, 3.11260986328125, 3.3338623046875, 3.55511474609375, 3.7763671875, 3.99761962890625, 4.2188720703125, 4.44012451171875, 4.661376953125, 4.88262939453125, 5.1038818359375, 5.32513427734375, 5.54638671875, 5.76763916015625, 5.9888916015625, 6.21014404296875, 6.431396484375, 6.65264892578125, 6.8739013671875, 7.09515380859375, 7.31640625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 8.0, 10.0, 13.0, 19.0, 28.0, 21.0, 28.0, 32.0, 49.0, 50.0, 51.0, 53.0, 110.0, 125.0, 124.0, 152.0, 160.0, 181.0, 166.0, 197.0, 202.0, 202.0, 226.0, 186.0, 191.0, 201.0, 183.0, 173.0, 148.0, 142.0, 99.0, 103.0, 90.0, 67.0, 62.0, 38.0, 46.0, 28.0, 22.0, 22.0, 18.0, 15.0, 4.0, 10.0, 2.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.62890625, -3.5079345703125, -3.386962890625, -3.2659912109375, -3.14501953125, -3.0240478515625, -2.903076171875, -2.7821044921875, -2.6611328125, -2.5401611328125, -2.419189453125, -2.2982177734375, -2.17724609375, -2.0562744140625, -1.935302734375, -1.8143310546875, -1.693359375, -1.5723876953125, -1.451416015625, -1.3304443359375, -1.20947265625, -1.0885009765625, -0.967529296875, -0.8465576171875, -0.7255859375, -0.6046142578125, -0.483642578125, -0.3626708984375, -0.24169921875, -0.1207275390625, 0.000244140625, 0.1212158203125, 0.2421875, 0.3631591796875, 0.484130859375, 0.6051025390625, 0.72607421875, 0.8470458984375, 0.968017578125, 1.0889892578125, 1.2099609375, 1.3309326171875, 1.451904296875, 1.5728759765625, 1.69384765625, 1.8148193359375, 1.935791015625, 2.0567626953125, 2.177734375, 2.2987060546875, 2.419677734375, 2.5406494140625, 2.66162109375, 2.7825927734375, 2.903564453125, 3.0245361328125, 3.1455078125, 3.2664794921875, 3.387451171875, 3.5084228515625, 3.62939453125, 3.7503662109375, 3.871337890625, 3.9923095703125, 4.11328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 10.0, 5.0, 5.0, 11.0, 9.0, 18.0, 24.0, 22.0, 27.0, 46.0, 39.0, 31.0, 45.0, 57.0, 52.0, 50.0, 43.0, 58.0, 49.0, 56.0, 44.0, 40.0, 44.0, 42.0, 39.0, 27.0, 25.0, 11.0, 15.0, 13.0, 10.0, 9.0, 12.0, 1.0, 6.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.79105281829834, -9.502177238464355, -9.213300704956055, -8.92442512512207, -8.63554859161377, -8.346673011779785, -8.057796478271484, -7.7689208984375, -7.480044364929199, -7.191168308258057, -6.902292251586914, -6.6134161949157715, -6.324540138244629, -6.035664081573486, -5.746788024902344, -5.457912445068359, -5.169036388397217, -4.880160331726074, -4.591284275054932, -4.302408218383789, -4.0135321617126465, -3.724656105041504, -3.4357802867889404, -3.146904230117798, -2.8580281734466553, -2.5691521167755127, -2.28027606010437, -1.991400122642517, -1.7025240659713745, -1.413648009300232, -1.124772071838379, -0.8358960151672363, -0.5470199584960938, -0.25814393162727356, 0.03073209524154663, 0.31960809230804443, 0.608484148979187, 0.8973602056503296, 1.1862361431121826, 1.4751121997833252, 1.7639882564544678, 2.0528643131256104, 2.341740369796753, 2.6306161880493164, 2.919492244720459, 3.2083683013916016, 3.497244358062744, 3.7861204147338867, 4.074996471405029, 4.363872528076172, 4.6527485847473145, 4.941624641418457, 5.2305006980896, 5.519376754760742, 5.808252334594727, 6.097128868103027, 6.386004447937012, 6.674880504608154, 6.963756561279297, 7.2526326179504395, 7.541508674621582, 7.830384731292725, 8.119260787963867, 8.408136367797852, 8.697012901306152]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 6.0, 5.0, 5.0, 6.0, 7.0, 6.0, 12.0, 19.0, 18.0, 29.0, 27.0, 21.0, 35.0, 26.0, 21.0, 34.0, 47.0, 36.0, 40.0, 43.0, 32.0, 37.0, 42.0, 51.0, 51.0, 44.0, 34.0, 30.0, 31.0, 33.0, 25.0, 26.0, 18.0, 26.0, 18.0, 10.0, 19.0, 6.0, 5.0, 4.0, 1.0, 7.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.165173530578613, -8.860442161560059, -8.55571174621582, -8.250980377197266, -7.946249485015869, -7.641518592834473, -7.336787223815918, -7.0320563316345215, -6.727325439453125, -6.4225945472717285, -6.117863655090332, -5.813132286071777, -5.508401393890381, -5.203670501708984, -4.89893913269043, -4.594208240509033, -4.289477348327637, -3.9847464561462402, -3.6800153255462646, -3.375284194946289, -3.0705533027648926, -2.765822410583496, -2.4610912799835205, -2.156360149383545, -1.8516292572021484, -1.5468982458114624, -1.2421672344207764, -0.9374362230300903, -0.6327052116394043, -0.32797420024871826, -0.023243188858032227, 0.28148794174194336, 0.5862197875976562, 0.8909507989883423, 1.1956818103790283, 1.5004128217697144, 1.8051438331604004, 2.109874725341797, 2.4146058559417725, 2.719336986541748, 3.0240678787231445, 3.328798770904541, 3.6335299015045166, 3.938261032104492, 4.242991924285889, 4.547722816467285, 4.85245418548584, 5.157185077667236, 5.461915969848633, 5.766646862030029, 6.071377754211426, 6.3761091232299805, 6.680840015411377, 6.985570907592773, 7.290302276611328, 7.595033168792725, 7.899764060974121, 8.204495429992676, 8.509225845336914, 8.813957214355469, 9.118688583374023, 9.423418998718262, 9.728150367736816, 10.032880783081055, 10.33761215209961]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 10.0, 9.0, 18.0, 21.0, 36.0, 57.0, 86.0, 120.0, 210.0, 320.0, 515.0, 827.0, 1485.0, 2483.0, 4542.0, 8117.0, 15377.0, 30355.0, 62762.0, 152133.0, 462756.0, 169205.0, 68286.0, 32494.0, 16369.0, 8829.0, 4732.0, 2527.0, 1524.0, 886.0, 557.0, 345.0, 214.0, 113.0, 78.0, 57.0, 34.0, 19.0, 18.0, 11.0, 10.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.70703125, -6.49444580078125, -6.2818603515625, -6.06927490234375, -5.856689453125, -5.64410400390625, -5.4315185546875, -5.21893310546875, -5.00634765625, -4.79376220703125, -4.5811767578125, -4.36859130859375, -4.156005859375, -3.94342041015625, -3.7308349609375, -3.51824951171875, -3.3056640625, -3.09307861328125, -2.8804931640625, -2.66790771484375, -2.455322265625, -2.24273681640625, -2.0301513671875, -1.81756591796875, -1.60498046875, -1.39239501953125, -1.1798095703125, -0.96722412109375, -0.754638671875, -0.54205322265625, -0.3294677734375, -0.11688232421875, 0.095703125, 0.30828857421875, 0.5208740234375, 0.73345947265625, 0.946044921875, 1.15863037109375, 1.3712158203125, 1.58380126953125, 1.79638671875, 2.00897216796875, 2.2215576171875, 2.43414306640625, 2.646728515625, 2.85931396484375, 3.0718994140625, 3.28448486328125, 3.4970703125, 3.70965576171875, 3.9222412109375, 4.13482666015625, 4.347412109375, 4.55999755859375, 4.7725830078125, 4.98516845703125, 5.19775390625, 5.41033935546875, 5.6229248046875, 5.83551025390625, 6.048095703125, 6.26068115234375, 6.4732666015625, 6.68585205078125, 6.8984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 7.0, 9.0, 7.0, 7.0, 6.0, 10.0, 18.0, 20.0, 16.0, 34.0, 35.0, 22.0, 43.0, 30.0, 36.0, 57.0, 44.0, 40.0, 49.0, 63.0, 49.0, 55.0, 38.0, 34.0, 51.0, 31.0, 31.0, 30.0, 27.0, 15.0, 18.0, 19.0, 13.0, 8.0, 10.0, 11.0, 2.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.03125, -9.6727294921875, -9.314208984375, -8.9556884765625, -8.59716796875, -8.2386474609375, -7.880126953125, -7.5216064453125, -7.1630859375, -6.8045654296875, -6.446044921875, -6.0875244140625, -5.72900390625, -5.3704833984375, -5.011962890625, -4.6534423828125, -4.294921875, -3.9364013671875, -3.577880859375, -3.2193603515625, -2.86083984375, -2.5023193359375, -2.143798828125, -1.7852783203125, -1.4267578125, -1.0682373046875, -0.709716796875, -0.3511962890625, 0.00732421875, 0.3658447265625, 0.724365234375, 1.0828857421875, 1.44140625, 1.7999267578125, 2.158447265625, 2.5169677734375, 2.87548828125, 3.2340087890625, 3.592529296875, 3.9510498046875, 4.3095703125, 4.6680908203125, 5.026611328125, 5.3851318359375, 5.74365234375, 6.1021728515625, 6.460693359375, 6.8192138671875, 7.177734375, 7.5362548828125, 7.894775390625, 8.2532958984375, 8.61181640625, 8.9703369140625, 9.328857421875, 9.6873779296875, 10.0458984375, 10.4044189453125, 10.762939453125, 11.1214599609375, 11.47998046875, 11.8385009765625, 12.197021484375, 12.5555419921875, 12.9140625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 9.0, 12.0, 15.0, 21.0, 35.0, 54.0, 85.0, 140.0, 186.0, 280.0, 406.0, 613.0, 965.0, 1460.0, 2281.0, 3551.0, 5693.0, 8915.0, 14344.0, 23307.0, 38671.0, 66254.0, 127183.0, 362322.0, 182459.0, 85287.0, 48007.0, 28566.0, 17587.0, 10912.0, 6738.0, 4262.0, 2770.0, 1794.0, 1153.0, 767.0, 503.0, 322.0, 218.0, 137.0, 103.0, 55.0, 43.0, 20.0, 19.0, 13.0, 10.0, 9.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.87890625, -4.72503662109375, -4.5711669921875, -4.41729736328125, -4.263427734375, -4.10955810546875, -3.9556884765625, -3.80181884765625, -3.64794921875, -3.49407958984375, -3.3402099609375, -3.18634033203125, -3.032470703125, -2.87860107421875, -2.7247314453125, -2.57086181640625, -2.4169921875, -2.26312255859375, -2.1092529296875, -1.95538330078125, -1.801513671875, -1.64764404296875, -1.4937744140625, -1.33990478515625, -1.18603515625, -1.03216552734375, -0.8782958984375, -0.72442626953125, -0.570556640625, -0.41668701171875, -0.2628173828125, -0.10894775390625, 0.044921875, 0.19879150390625, 0.3526611328125, 0.50653076171875, 0.660400390625, 0.81427001953125, 0.9681396484375, 1.12200927734375, 1.27587890625, 1.42974853515625, 1.5836181640625, 1.73748779296875, 1.891357421875, 2.04522705078125, 2.1990966796875, 2.35296630859375, 2.5068359375, 2.66070556640625, 2.8145751953125, 2.96844482421875, 3.122314453125, 3.27618408203125, 3.4300537109375, 3.58392333984375, 3.73779296875, 3.89166259765625, 4.0455322265625, 4.19940185546875, 4.353271484375, 4.50714111328125, 4.6610107421875, 4.81488037109375, 4.96875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 7.0, 5.0, 7.0, 13.0, 10.0, 11.0, 16.0, 16.0, 17.0, 28.0, 30.0, 24.0, 33.0, 27.0, 44.0, 38.0, 39.0, 52.0, 48.0, 46.0, 45.0, 26.0, 48.0, 43.0, 46.0, 40.0, 31.0, 36.0, 30.0, 20.0, 22.0, 23.0, 17.0, 14.0, 12.0, 12.0, 7.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.37890625, -6.1788330078125, -5.978759765625, -5.7786865234375, -5.57861328125, -5.3785400390625, -5.178466796875, -4.9783935546875, -4.7783203125, -4.5782470703125, -4.378173828125, -4.1781005859375, -3.97802734375, -3.7779541015625, -3.577880859375, -3.3778076171875, -3.177734375, -2.9776611328125, -2.777587890625, -2.5775146484375, -2.37744140625, -2.1773681640625, -1.977294921875, -1.7772216796875, -1.5771484375, -1.3770751953125, -1.177001953125, -0.9769287109375, -0.77685546875, -0.5767822265625, -0.376708984375, -0.1766357421875, 0.0234375, 0.2235107421875, 0.423583984375, 0.6236572265625, 0.82373046875, 1.0238037109375, 1.223876953125, 1.4239501953125, 1.6240234375, 1.8240966796875, 2.024169921875, 2.2242431640625, 2.42431640625, 2.6243896484375, 2.824462890625, 3.0245361328125, 3.224609375, 3.4246826171875, 3.624755859375, 3.8248291015625, 4.02490234375, 4.2249755859375, 4.425048828125, 4.6251220703125, 4.8251953125, 5.0252685546875, 5.225341796875, 5.4254150390625, 5.62548828125, 5.8255615234375, 6.025634765625, 6.2257080078125, 6.42578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 4.0, 7.0, 7.0, 8.0, 12.0, 13.0, 27.0, 43.0, 42.0, 63.0, 109.0, 145.0, 173.0, 301.0, 407.0, 557.0, 739.0, 1135.0, 1618.0, 2241.0, 3223.0, 4963.0, 7308.0, 11146.0, 18114.0, 28940.0, 51831.0, 100384.0, 185849.0, 239262.0, 173881.0, 91517.0, 47615.0, 27392.0, 16896.0, 10638.0, 6859.0, 4627.0, 3126.0, 2154.0, 1482.0, 1064.0, 827.0, 508.0, 377.0, 243.0, 194.0, 138.0, 109.0, 75.0, 59.0, 53.0, 22.0, 7.0, 9.0, 8.0, 3.0, 3.0, 2.0, 3.0, 3.0], "bins": [-0.00881195068359375, -0.00854027271270752, -0.008268594741821289, -0.007996916770935059, -0.007725238800048828, -0.007453560829162598, -0.007181882858276367, -0.006910204887390137, -0.006638526916503906, -0.006366848945617676, -0.006095170974731445, -0.005823493003845215, -0.005551815032958984, -0.005280137062072754, -0.0050084590911865234, -0.004736781120300293, -0.0044651031494140625, -0.004193425178527832, -0.0039217472076416016, -0.003650069236755371, -0.0033783912658691406, -0.00310671329498291, -0.0028350353240966797, -0.0025633573532104492, -0.0022916793823242188, -0.0020200014114379883, -0.0017483234405517578, -0.0014766454696655273, -0.0012049674987792969, -0.0009332895278930664, -0.0006616115570068359, -0.00038993358612060547, -0.000118255615234375, 0.00015342235565185547, 0.00042510032653808594, 0.0006967782974243164, 0.0009684562683105469, 0.0012401342391967773, 0.0015118122100830078, 0.0017834901809692383, 0.0020551681518554688, 0.0023268461227416992, 0.0025985240936279297, 0.00287020206451416, 0.0031418800354003906, 0.003413558006286621, 0.0036852359771728516, 0.003956913948059082, 0.0042285919189453125, 0.004500269889831543, 0.0047719478607177734, 0.005043625831604004, 0.005315303802490234, 0.005586981773376465, 0.005858659744262695, 0.006130337715148926, 0.006402015686035156, 0.006673693656921387, 0.006945371627807617, 0.007217049598693848, 0.007488727569580078, 0.007760405540466309, 0.008032083511352539, 0.00830376148223877, 0.008575439453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 4.0, 7.0, 7.0, 8.0, 8.0, 12.0, 10.0, 21.0, 22.0, 31.0, 30.0, 38.0, 32.0, 39.0, 61.0, 34.0, 46.0, 39.0, 43.0, 52.0, 60.0, 50.0, 51.0, 41.0, 49.0, 34.0, 25.0, 23.0, 15.0, 17.0, 22.0, 12.0, 8.0, 10.0, 13.0, 3.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-7.68899917602539e-06, -7.479451596736908e-06, -7.269904017448425e-06, -7.060356438159943e-06, -6.85080885887146e-06, -6.641261279582977e-06, -6.431713700294495e-06, -6.222166121006012e-06, -6.012618541717529e-06, -5.803070962429047e-06, -5.593523383140564e-06, -5.383975803852081e-06, -5.174428224563599e-06, -4.964880645275116e-06, -4.755333065986633e-06, -4.545785486698151e-06, -4.336237907409668e-06, -4.126690328121185e-06, -3.917142748832703e-06, -3.70759516954422e-06, -3.4980475902557373e-06, -3.2885000109672546e-06, -3.078952431678772e-06, -2.8694048523902893e-06, -2.6598572731018066e-06, -2.450309693813324e-06, -2.2407621145248413e-06, -2.0312145352363586e-06, -1.821666955947876e-06, -1.6121193766593933e-06, -1.4025717973709106e-06, -1.193024218082428e-06, -9.834766387939453e-07, -7.739290595054626e-07, -5.6438148021698e-07, -3.548339009284973e-07, -1.4528632164001465e-07, 6.426125764846802e-08, 2.738088369369507e-07, 4.833564162254333e-07, 6.92903995513916e-07, 9.024515748023987e-07, 1.1119991540908813e-06, 1.321546733379364e-06, 1.5310943126678467e-06, 1.7406418919563293e-06, 1.950189471244812e-06, 2.1597370505332947e-06, 2.3692846298217773e-06, 2.57883220911026e-06, 2.7883797883987427e-06, 2.9979273676872253e-06, 3.207474946975708e-06, 3.4170225262641907e-06, 3.6265701055526733e-06, 3.836117684841156e-06, 4.045665264129639e-06, 4.255212843418121e-06, 4.464760422706604e-06, 4.674308001995087e-06, 4.883855581283569e-06, 5.093403160572052e-06, 5.302950739860535e-06, 5.512498319149017e-06, 5.7220458984375e-06]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 9.0, 12.0, 21.0, 27.0, 43.0, 64.0, 101.0, 150.0, 184.0, 318.0, 460.0, 686.0, 1071.0, 1730.0, 2788.0, 4691.0, 7597.0, 12687.0, 22866.0, 43139.0, 88781.0, 180788.0, 263950.0, 202602.0, 102786.0, 49555.0, 25580.0, 14323.0, 8249.0, 4904.0, 3019.0, 1960.0, 1192.0, 820.0, 488.0, 305.0, 207.0, 122.0, 78.0, 73.0, 43.0, 24.0, 21.0, 15.0, 16.0, 8.0, 1.0, 6.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.01184844970703125, -0.011505961418151855, -0.011163473129272461, -0.010820984840393066, -0.010478496551513672, -0.010136008262634277, -0.009793519973754883, -0.009451031684875488, -0.009108543395996094, -0.0087660551071167, -0.008423566818237305, -0.00808107852935791, -0.007738590240478516, -0.007396101951599121, -0.0070536136627197266, -0.006711125373840332, -0.0063686370849609375, -0.006026148796081543, -0.0056836605072021484, -0.005341172218322754, -0.004998683929443359, -0.004656195640563965, -0.00431370735168457, -0.003971219062805176, -0.0036287307739257812, -0.0032862424850463867, -0.002943754196166992, -0.0026012659072875977, -0.002258777618408203, -0.0019162893295288086, -0.001573801040649414, -0.0012313127517700195, -0.000888824462890625, -0.0005463361740112305, -0.00020384788513183594, 0.0001386404037475586, 0.0004811286926269531, 0.0008236169815063477, 0.0011661052703857422, 0.0015085935592651367, 0.0018510818481445312, 0.0021935701370239258, 0.0025360584259033203, 0.002878546714782715, 0.0032210350036621094, 0.003563523292541504, 0.0039060115814208984, 0.004248499870300293, 0.0045909881591796875, 0.004933476448059082, 0.0052759647369384766, 0.005618453025817871, 0.005960941314697266, 0.00630342960357666, 0.006645917892456055, 0.006988406181335449, 0.007330894470214844, 0.007673382759094238, 0.008015871047973633, 0.008358359336853027, 0.008700847625732422, 0.009043335914611816, 0.009385824203491211, 0.009728312492370605, 0.01007080078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 7.0, 1.0, 6.0, 6.0, 5.0, 11.0, 13.0, 16.0, 29.0, 29.0, 41.0, 49.0, 47.0, 87.0, 87.0, 73.0, 89.0, 80.0, 60.0, 49.0, 54.0, 31.0, 32.0, 22.0, 13.0, 7.0, 8.0, 10.0, 10.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.003963470458984375, -0.003838956356048584, -0.003714442253112793, -0.003589928150177002, -0.003465414047241211, -0.00334089994430542, -0.003216385841369629, -0.003091871738433838, -0.002967357635498047, -0.002842843532562256, -0.002718329429626465, -0.002593815326690674, -0.002469301223754883, -0.002344787120819092, -0.0022202730178833008, -0.0020957589149475098, -0.0019712448120117188, -0.0018467307090759277, -0.0017222166061401367, -0.0015977025032043457, -0.0014731884002685547, -0.0013486742973327637, -0.0012241601943969727, -0.0010996460914611816, -0.0009751319885253906, -0.0008506178855895996, -0.0007261037826538086, -0.0006015896797180176, -0.00047707557678222656, -0.00035256147384643555, -0.00022804737091064453, -0.00010353326797485352, 2.09808349609375e-05, 0.00014549493789672852, 0.00027000904083251953, 0.00039452314376831055, 0.0005190372467041016, 0.0006435513496398926, 0.0007680654525756836, 0.0008925795555114746, 0.0010170936584472656, 0.0011416077613830566, 0.0012661218643188477, 0.0013906359672546387, 0.0015151500701904297, 0.0016396641731262207, 0.0017641782760620117, 0.0018886923789978027, 0.0020132064819335938, 0.0021377205848693848, 0.0022622346878051758, 0.002386748790740967, 0.002511262893676758, 0.002635776996612549, 0.00276029109954834, 0.002884805202484131, 0.003009319305419922, 0.003133833408355713, 0.003258347511291504, 0.003382861614227295, 0.003507375717163086, 0.003631889820098877, 0.003756403923034668, 0.003880918025970459, 0.00400543212890625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 12.0, 4.0, 6.0, 11.0, 16.0, 15.0, 27.0, 29.0, 35.0, 50.0, 30.0, 52.0, 49.0, 48.0, 55.0, 51.0, 53.0, 48.0, 50.0, 52.0, 49.0, 49.0, 31.0, 42.0, 24.0, 25.0, 20.0, 14.0, 8.0, 13.0, 9.0, 8.0, 4.0, 5.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.153491020202637, -9.855945587158203, -9.558401107788086, -9.260855674743652, -8.963310241699219, -8.665764808654785, -8.368219375610352, -8.070674896240234, -7.773129463195801, -7.475584030151367, -7.178039073944092, -6.880494117736816, -6.582948684692383, -6.285403251647949, -5.987858295440674, -5.690313339233398, -5.392767906188965, -5.095222473144531, -4.797677516937256, -4.5001325607299805, -4.202587127685547, -3.9050419330596924, -3.607496738433838, -3.3099515438079834, -3.012406349182129, -2.7148611545562744, -2.41731595993042, -2.1197707653045654, -1.822225570678711, -1.5246803760528564, -1.227135181427002, -0.9295899868011475, -0.632044792175293, -0.3344995975494385, -0.036954402923583984, 0.2605907917022705, 0.558135986328125, 0.8556811809539795, 1.153226375579834, 1.4507715702056885, 1.748316764831543, 2.0458619594573975, 2.343407154083252, 2.6409523487091064, 2.938497543334961, 3.2360427379608154, 3.53358793258667, 3.8311331272125244, 4.128678321838379, 4.4262237548828125, 4.723768711090088, 5.021313667297363, 5.318859100341797, 5.6164045333862305, 5.913949489593506, 6.211494445800781, 6.509039878845215, 6.806585311889648, 7.104130268096924, 7.401675224304199, 7.699220657348633, 7.996766090393066, 8.2943115234375, 8.591856002807617, 8.88940143585205]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 6.0, 5.0, 5.0, 6.0, 7.0, 7.0, 13.0, 17.0, 19.0, 29.0, 28.0, 20.0, 34.0, 28.0, 19.0, 33.0, 48.0, 37.0, 40.0, 43.0, 34.0, 33.0, 44.0, 52.0, 48.0, 45.0, 34.0, 31.0, 30.0, 34.0, 25.0, 24.0, 20.0, 26.0, 18.0, 10.0, 18.0, 6.0, 5.0, 4.0, 1.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.184959411621094, -8.879925727844238, -8.574891090393066, -8.269857406616211, -7.964823246002197, -7.659789085388184, -7.354755401611328, -7.0497212409973145, -6.744687080383301, -6.439652919769287, -6.134618759155273, -5.829585075378418, -5.524550914764404, -5.219516754150391, -4.914483070373535, -4.6094489097595215, -4.304414749145508, -3.999380588531494, -3.6943466663360596, -3.389312744140625, -3.0842785835266113, -2.7792444229125977, -2.474210500717163, -2.1691765785217285, -1.8641424179077148, -1.5591083765029907, -1.2540743350982666, -0.9490402936935425, -0.6440062522888184, -0.33897221088409424, -0.03393816947937012, 0.27109575271606445, 0.5761299133300781, 0.8811639547348022, 1.1861979961395264, 1.4912320375442505, 1.7962660789489746, 2.1013002395629883, 2.406334161758423, 2.7113680839538574, 3.016402244567871, 3.3214364051818848, 3.6264703273773193, 3.931504249572754, 4.236538410186768, 4.541572570800781, 4.846606254577637, 5.15164041519165, 5.456674575805664, 5.761708736419678, 6.066742897033691, 6.371776580810547, 6.6768107414245605, 6.981844902038574, 7.28687858581543, 7.591912746429443, 7.896946907043457, 8.201980590820312, 8.507015228271484, 8.81204891204834, 9.117082595825195, 9.422117233276367, 9.727150917053223, 10.032184600830078, 10.33721923828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 7.0, 5.0, 9.0, 18.0, 33.0, 42.0, 69.0, 98.0, 133.0, 208.0, 291.0, 460.0, 761.0, 1109.0, 1748.0, 2653.0, 3989.0, 6358.0, 9609.0, 14113.0, 20957.0, 30773.0, 43661.0, 60434.0, 78941.0, 96705.0, 110060.0, 112386.0, 106957.0, 92308.0, 73998.0, 55580.0, 40080.0, 27732.0, 18962.0, 12690.0, 8563.0, 5504.0, 3552.0, 2295.0, 1583.0, 1088.0, 708.0, 447.0, 315.0, 217.0, 134.0, 76.0, 48.0, 35.0, 24.0, 12.0, 9.0, 9.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-6.57421875, -6.3646240234375, -6.155029296875, -5.9454345703125, -5.73583984375, -5.5262451171875, -5.316650390625, -5.1070556640625, -4.8974609375, -4.6878662109375, -4.478271484375, -4.2686767578125, -4.05908203125, -3.8494873046875, -3.639892578125, -3.4302978515625, -3.220703125, -3.0111083984375, -2.801513671875, -2.5919189453125, -2.38232421875, -2.1727294921875, -1.963134765625, -1.7535400390625, -1.5439453125, -1.3343505859375, -1.124755859375, -0.9151611328125, -0.70556640625, -0.4959716796875, -0.286376953125, -0.0767822265625, 0.1328125, 0.3424072265625, 0.552001953125, 0.7615966796875, 0.97119140625, 1.1807861328125, 1.390380859375, 1.5999755859375, 1.8095703125, 2.0191650390625, 2.228759765625, 2.4383544921875, 2.64794921875, 2.8575439453125, 3.067138671875, 3.2767333984375, 3.486328125, 3.6959228515625, 3.905517578125, 4.1151123046875, 4.32470703125, 4.5343017578125, 4.743896484375, 4.9534912109375, 5.1630859375, 5.3726806640625, 5.582275390625, 5.7918701171875, 6.00146484375, 6.2110595703125, 6.420654296875, 6.6302490234375, 6.83984375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 2.0, 4.0, 8.0, 13.0, 6.0, 6.0, 10.0, 15.0, 17.0, 21.0, 19.0, 19.0, 29.0, 26.0, 25.0, 32.0, 42.0, 34.0, 37.0, 53.0, 29.0, 39.0, 35.0, 46.0, 49.0, 47.0, 38.0, 37.0, 36.0, 44.0, 28.0, 22.0, 14.0, 20.0, 21.0, 18.0, 19.0, 8.0, 6.0, 9.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.6484375, -8.3402099609375, -8.031982421875, -7.7237548828125, -7.41552734375, -7.1072998046875, -6.799072265625, -6.4908447265625, -6.1826171875, -5.8743896484375, -5.566162109375, -5.2579345703125, -4.94970703125, -4.6414794921875, -4.333251953125, -4.0250244140625, -3.716796875, -3.4085693359375, -3.100341796875, -2.7921142578125, -2.48388671875, -2.1756591796875, -1.867431640625, -1.5592041015625, -1.2509765625, -0.9427490234375, -0.634521484375, -0.3262939453125, -0.01806640625, 0.2901611328125, 0.598388671875, 0.9066162109375, 1.21484375, 1.5230712890625, 1.831298828125, 2.1395263671875, 2.44775390625, 2.7559814453125, 3.064208984375, 3.3724365234375, 3.6806640625, 3.9888916015625, 4.297119140625, 4.6053466796875, 4.91357421875, 5.2218017578125, 5.530029296875, 5.8382568359375, 6.146484375, 6.4547119140625, 6.762939453125, 7.0711669921875, 7.37939453125, 7.6876220703125, 7.995849609375, 8.3040771484375, 8.6123046875, 8.9205322265625, 9.228759765625, 9.5369873046875, 9.84521484375, 10.1534423828125, 10.461669921875, 10.7698974609375, 11.078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 13.0, 19.0, 35.0, 46.0, 93.0, 135.0, 199.0, 309.0, 514.0, 840.0, 1329.0, 2160.0, 3576.0, 5504.0, 8673.0, 14038.0, 21917.0, 34447.0, 52009.0, 74776.0, 100491.0, 122083.0, 131584.0, 126306.0, 106507.0, 80367.0, 56856.0, 37949.0, 24320.0, 15387.0, 9675.0, 6150.0, 3898.0, 2357.0, 1451.0, 965.0, 560.0, 344.0, 266.0, 165.0, 89.0, 70.0, 33.0, 23.0, 8.0, 11.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.99609375, -7.75091552734375, -7.5057373046875, -7.26055908203125, -7.015380859375, -6.77020263671875, -6.5250244140625, -6.27984619140625, -6.03466796875, -5.78948974609375, -5.5443115234375, -5.29913330078125, -5.053955078125, -4.80877685546875, -4.5635986328125, -4.31842041015625, -4.0732421875, -3.82806396484375, -3.5828857421875, -3.33770751953125, -3.092529296875, -2.84735107421875, -2.6021728515625, -2.35699462890625, -2.11181640625, -1.86663818359375, -1.6214599609375, -1.37628173828125, -1.131103515625, -0.88592529296875, -0.6407470703125, -0.39556884765625, -0.150390625, 0.09478759765625, 0.3399658203125, 0.58514404296875, 0.830322265625, 1.07550048828125, 1.3206787109375, 1.56585693359375, 1.81103515625, 2.05621337890625, 2.3013916015625, 2.54656982421875, 2.791748046875, 3.03692626953125, 3.2821044921875, 3.52728271484375, 3.7724609375, 4.01763916015625, 4.2628173828125, 4.50799560546875, 4.753173828125, 4.99835205078125, 5.2435302734375, 5.48870849609375, 5.73388671875, 5.97906494140625, 6.2242431640625, 6.46942138671875, 6.714599609375, 6.95977783203125, 7.2049560546875, 7.45013427734375, 7.6953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 9.0, 5.0, 6.0, 7.0, 13.0, 11.0, 11.0, 11.0, 17.0, 12.0, 25.0, 23.0, 27.0, 26.0, 18.0, 44.0, 44.0, 44.0, 37.0, 45.0, 46.0, 53.0, 45.0, 37.0, 35.0, 38.0, 45.0, 32.0, 29.0, 30.0, 20.0, 21.0, 31.0, 26.0, 23.0, 12.0, 9.0, 11.0, 5.0, 3.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.578125, -6.3734130859375, -6.168701171875, -5.9639892578125, -5.75927734375, -5.5545654296875, -5.349853515625, -5.1451416015625, -4.9404296875, -4.7357177734375, -4.531005859375, -4.3262939453125, -4.12158203125, -3.9168701171875, -3.712158203125, -3.5074462890625, -3.302734375, -3.0980224609375, -2.893310546875, -2.6885986328125, -2.48388671875, -2.2791748046875, -2.074462890625, -1.8697509765625, -1.6650390625, -1.4603271484375, -1.255615234375, -1.0509033203125, -0.84619140625, -0.6414794921875, -0.436767578125, -0.2320556640625, -0.02734375, 0.1773681640625, 0.382080078125, 0.5867919921875, 0.79150390625, 0.9962158203125, 1.200927734375, 1.4056396484375, 1.6103515625, 1.8150634765625, 2.019775390625, 2.2244873046875, 2.42919921875, 2.6339111328125, 2.838623046875, 3.0433349609375, 3.248046875, 3.4527587890625, 3.657470703125, 3.8621826171875, 4.06689453125, 4.2716064453125, 4.476318359375, 4.6810302734375, 4.8857421875, 5.0904541015625, 5.295166015625, 5.4998779296875, 5.70458984375, 5.9093017578125, 6.114013671875, 6.3187255859375, 6.5234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 15.0, 12.0, 26.0, 68.0, 76.0, 95.0, 195.0, 298.0, 470.0, 768.0, 1241.0, 1950.0, 2999.0, 4797.0, 7342.0, 10636.0, 16134.0, 23399.0, 32853.0, 44457.0, 57538.0, 71015.0, 83071.0, 92944.0, 96635.0, 94798.0, 88215.0, 77153.0, 64632.0, 50783.0, 38216.0, 27829.0, 19433.0, 13301.0, 8896.0, 5863.0, 3813.0, 2430.0, 1545.0, 967.0, 626.0, 380.0, 257.0, 137.0, 97.0, 60.0, 33.0, 17.0, 15.0, 12.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.283203125, -1.2440185546875, -1.204833984375, -1.1656494140625, -1.12646484375, -1.0872802734375, -1.048095703125, -1.0089111328125, -0.9697265625, -0.9305419921875, -0.891357421875, -0.8521728515625, -0.81298828125, -0.7738037109375, -0.734619140625, -0.6954345703125, -0.65625, -0.6170654296875, -0.577880859375, -0.5386962890625, -0.49951171875, -0.4603271484375, -0.421142578125, -0.3819580078125, -0.3427734375, -0.3035888671875, -0.264404296875, -0.2252197265625, -0.18603515625, -0.1468505859375, -0.107666015625, -0.0684814453125, -0.029296875, 0.0098876953125, 0.049072265625, 0.0882568359375, 0.12744140625, 0.1666259765625, 0.205810546875, 0.2449951171875, 0.2841796875, 0.3233642578125, 0.362548828125, 0.4017333984375, 0.44091796875, 0.4801025390625, 0.519287109375, 0.5584716796875, 0.59765625, 0.6368408203125, 0.676025390625, 0.7152099609375, 0.75439453125, 0.7935791015625, 0.832763671875, 0.8719482421875, 0.9111328125, 0.9503173828125, 0.989501953125, 1.0286865234375, 1.06787109375, 1.1070556640625, 1.146240234375, 1.1854248046875, 1.224609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 8.0, 9.0, 14.0, 18.0, 23.0, 27.0, 29.0, 23.0, 29.0, 31.0, 36.0, 44.0, 46.0, 45.0, 53.0, 48.0, 56.0, 44.0, 53.0, 47.0, 38.0, 39.0, 38.0, 27.0, 24.0, 23.0, 27.0, 18.0, 17.0, 16.0, 5.0, 8.0, 12.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00021266937255859375, -0.00020658783614635468, -0.0002005062997341156, -0.00019442476332187653, -0.00018834322690963745, -0.00018226169049739838, -0.0001761801540851593, -0.00017009861767292023, -0.00016401708126068115, -0.00015793554484844208, -0.000151854008436203, -0.00014577247202396393, -0.00013969093561172485, -0.00013360939919948578, -0.0001275278627872467, -0.00012144632637500763, -0.00011536478996276855, -0.00010928325355052948, -0.0001032017171382904, -9.712018072605133e-05, -9.103864431381226e-05, -8.495710790157318e-05, -7.88755714893341e-05, -7.279403507709503e-05, -6.671249866485596e-05, -6.063096225261688e-05, -5.454942584037781e-05, -4.846788942813873e-05, -4.238635301589966e-05, -3.6304816603660583e-05, -3.022328019142151e-05, -2.4141743779182434e-05, -1.806020736694336e-05, -1.1978670954704285e-05, -5.89713454246521e-06, 1.8440186977386475e-07, 6.2659382820129395e-06, 1.2347474694252014e-05, 1.842901110649109e-05, 2.4510547518730164e-05, 3.059208393096924e-05, 3.667362034320831e-05, 4.275515675544739e-05, 4.883669316768646e-05, 5.491822957992554e-05, 6.099976599216461e-05, 6.708130240440369e-05, 7.316283881664276e-05, 7.924437522888184e-05, 8.532591164112091e-05, 9.140744805335999e-05, 9.748898446559906e-05, 0.00010357052087783813, 0.00010965205729007721, 0.00011573359370231628, 0.00012181513011455536, 0.00012789666652679443, 0.0001339782029390335, 0.00014005973935127258, 0.00014614127576351166, 0.00015222281217575073, 0.0001583043485879898, 0.00016438588500022888, 0.00017046742141246796, 0.00017654895782470703]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 15.0, 14.0, 26.0, 51.0, 73.0, 97.0, 188.0, 278.0, 458.0, 754.0, 1181.0, 1856.0, 3074.0, 4859.0, 7455.0, 11368.0, 17129.0, 24832.0, 35558.0, 47721.0, 62126.0, 76411.0, 89828.0, 98670.0, 100293.0, 96642.0, 87121.0, 73789.0, 59486.0, 45639.0, 32910.0, 23446.0, 16081.0, 10554.0, 6830.0, 4305.0, 2773.0, 1791.0, 1047.0, 719.0, 414.0, 274.0, 173.0, 106.0, 47.0, 35.0, 22.0, 16.0, 13.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2470703125, -1.2060546875, -1.1650390625, -1.1240234375, -1.0830078125, -1.0419921875, -1.0009765625, -0.9599609375, -0.9189453125, -0.8779296875, -0.8369140625, -0.7958984375, -0.7548828125, -0.7138671875, -0.6728515625, -0.6318359375, -0.5908203125, -0.5498046875, -0.5087890625, -0.4677734375, -0.4267578125, -0.3857421875, -0.3447265625, -0.3037109375, -0.2626953125, -0.2216796875, -0.1806640625, -0.1396484375, -0.0986328125, -0.0576171875, -0.0166015625, 0.0244140625, 0.0654296875, 0.1064453125, 0.1474609375, 0.1884765625, 0.2294921875, 0.2705078125, 0.3115234375, 0.3525390625, 0.3935546875, 0.4345703125, 0.4755859375, 0.5166015625, 0.5576171875, 0.5986328125, 0.6396484375, 0.6806640625, 0.7216796875, 0.7626953125, 0.8037109375, 0.8447265625, 0.8857421875, 0.9267578125, 0.9677734375, 1.0087890625, 1.0498046875, 1.0908203125, 1.1318359375, 1.1728515625, 1.2138671875, 1.2548828125, 1.2958984375, 1.3369140625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 0.0, 7.0, 3.0, 7.0, 7.0, 11.0, 10.0, 9.0, 17.0, 13.0, 23.0, 19.0, 37.0, 43.0, 30.0, 37.0, 49.0, 45.0, 39.0, 34.0, 49.0, 44.0, 45.0, 46.0, 50.0, 51.0, 42.0, 27.0, 38.0, 36.0, 29.0, 14.0, 12.0, 14.0, 16.0, 13.0, 10.0, 4.0, 4.0, 4.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.81005859375, -0.784881591796875, -0.75970458984375, -0.734527587890625, -0.7093505859375, -0.684173583984375, -0.65899658203125, -0.633819580078125, -0.608642578125, -0.583465576171875, -0.55828857421875, -0.533111572265625, -0.5079345703125, -0.482757568359375, -0.45758056640625, -0.432403564453125, -0.4072265625, -0.382049560546875, -0.35687255859375, -0.331695556640625, -0.3065185546875, -0.281341552734375, -0.25616455078125, -0.230987548828125, -0.205810546875, -0.180633544921875, -0.15545654296875, -0.130279541015625, -0.1051025390625, -0.079925537109375, -0.05474853515625, -0.029571533203125, -0.00439453125, 0.020782470703125, 0.04595947265625, 0.071136474609375, 0.0963134765625, 0.121490478515625, 0.14666748046875, 0.171844482421875, 0.197021484375, 0.222198486328125, 0.24737548828125, 0.272552490234375, 0.2977294921875, 0.322906494140625, 0.34808349609375, 0.373260498046875, 0.3984375, 0.423614501953125, 0.44879150390625, 0.473968505859375, 0.4991455078125, 0.524322509765625, 0.54949951171875, 0.574676513671875, 0.599853515625, 0.625030517578125, 0.65020751953125, 0.675384521484375, 0.7005615234375, 0.725738525390625, 0.75091552734375, 0.776092529296875, 0.80126953125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 5.0, 2.0, 13.0, 9.0, 16.0, 14.0, 13.0, 11.0, 26.0, 26.0, 25.0, 34.0, 39.0, 30.0, 35.0, 40.0, 40.0, 51.0, 45.0, 44.0, 44.0, 49.0, 45.0, 52.0, 40.0, 39.0, 27.0, 29.0, 27.0, 31.0, 19.0, 17.0, 15.0, 9.0, 7.0, 9.0, 5.0, 5.0, 5.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.529717445373535, -8.2735595703125, -8.017402648925781, -7.761244773864746, -7.505087375640869, -7.248929977416992, -6.992772102355957, -6.73661470413208, -6.480457305908203, -6.224299907684326, -5.968142509460449, -5.711984634399414, -5.455827236175537, -5.19966983795166, -4.943511962890625, -4.687354564666748, -4.431197166442871, -4.175039768218994, -3.918882131576538, -3.662724494934082, -3.406567096710205, -3.150409698486328, -2.894252061843872, -2.638094425201416, -2.381937026977539, -2.125779628753662, -1.869621992111206, -1.6134644746780396, -1.357306957244873, -1.1011494398117065, -0.84499192237854, -0.5888344049453735, -0.33267641067504883, -0.07651889324188232, 0.17963862419128418, 0.4357961416244507, 0.6919536590576172, 0.9481111764907837, 1.2042686939239502, 1.4604262113571167, 1.7165837287902832, 1.9727412462234497, 2.228898763656616, 2.4850564002990723, 2.741213798522949, 2.997371196746826, 3.2535288333892822, 3.5096864700317383, 3.7658438682556152, 4.022001266479492, 4.278159141540527, 4.534316539764404, 4.790473937988281, 5.046631336212158, 5.302788734436035, 5.55894660949707, 5.815104007720947, 6.071261405944824, 6.327419281005859, 6.583576679229736, 6.839734077453613, 7.09589147567749, 7.352048873901367, 7.608206748962402, 7.864364147186279]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 9.0, 9.0, 10.0, 12.0, 12.0, 11.0, 21.0, 12.0, 24.0, 18.0, 17.0, 36.0, 33.0, 24.0, 27.0, 37.0, 35.0, 37.0, 31.0, 35.0, 50.0, 33.0, 36.0, 46.0, 30.0, 30.0, 31.0, 26.0, 25.0, 41.0, 28.0, 30.0, 19.0, 22.0, 16.0, 15.0, 12.0, 11.0, 15.0, 3.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-9.399365425109863, -9.111756324768066, -8.824146270751953, -8.536537170410156, -8.24892807006836, -7.9613189697265625, -7.673709392547607, -7.386099815368652, -7.0984907150268555, -6.810881614685059, -6.5232720375061035, -6.235662460327148, -5.948053359985352, -5.660444259643555, -5.3728346824646, -5.0852251052856445, -4.797616004943848, -4.510006904602051, -4.222397327423096, -3.9347879886627197, -3.6471786499023438, -3.3595693111419678, -3.071959972381592, -2.784350633621216, -2.49674129486084, -2.209131956100464, -1.921522617340088, -1.633913278579712, -1.346303939819336, -1.05869460105896, -0.771085262298584, -0.483475923538208, -0.19586658477783203, 0.09174275398254395, 0.3793520927429199, 0.6669614315032959, 0.9545707702636719, 1.2421801090240479, 1.5297894477844238, 1.8173987865447998, 2.105008125305176, 2.3926174640655518, 2.6802268028259277, 2.9678361415863037, 3.2554454803466797, 3.5430548191070557, 3.8306641578674316, 4.118273735046387, 4.405882835388184, 4.6934919357299805, 4.9811015129089355, 5.268711090087891, 5.5563201904296875, 5.843929290771484, 6.1315388679504395, 6.4191484451293945, 6.706757545471191, 6.994366645812988, 7.281976222991943, 7.569585800170898, 7.857194900512695, 8.144804000854492, 8.432413101196289, 8.720023155212402, 9.0076322555542]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 11.0, 12.0, 11.0, 40.0, 37.0, 63.0, 115.0, 198.0, 300.0, 542.0, 911.0, 1732.0, 2872.0, 5178.0, 9105.0, 16568.0, 30453.0, 53977.0, 95796.0, 165758.0, 265484.0, 394569.0, 521733.0, 598797.0, 589191.0, 497055.0, 364201.0, 241759.0, 145083.0, 85210.0, 47214.0, 26368.0, 14781.0, 8133.0, 4643.0, 2611.0, 1521.0, 901.0, 521.0, 326.0, 194.0, 127.0, 73.0, 38.0, 24.0, 13.0, 15.0, 9.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-9.65625, -9.3626708984375, -9.069091796875, -8.7755126953125, -8.48193359375, -8.1883544921875, -7.894775390625, -7.6011962890625, -7.3076171875, -7.0140380859375, -6.720458984375, -6.4268798828125, -6.13330078125, -5.8397216796875, -5.546142578125, -5.2525634765625, -4.958984375, -4.6654052734375, -4.371826171875, -4.0782470703125, -3.78466796875, -3.4910888671875, -3.197509765625, -2.9039306640625, -2.6103515625, -2.3167724609375, -2.023193359375, -1.7296142578125, -1.43603515625, -1.1424560546875, -0.848876953125, -0.5552978515625, -0.26171875, 0.0318603515625, 0.325439453125, 0.6190185546875, 0.91259765625, 1.2061767578125, 1.499755859375, 1.7933349609375, 2.0869140625, 2.3804931640625, 2.674072265625, 2.9676513671875, 3.26123046875, 3.5548095703125, 3.848388671875, 4.1419677734375, 4.435546875, 4.7291259765625, 5.022705078125, 5.3162841796875, 5.60986328125, 5.9034423828125, 6.197021484375, 6.4906005859375, 6.7841796875, 7.0777587890625, 7.371337890625, 7.6649169921875, 7.95849609375, 8.2520751953125, 8.545654296875, 8.8392333984375, 9.1328125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 2.0, 3.0, 3.0, 14.0, 14.0, 11.0, 9.0, 15.0, 13.0, 15.0, 22.0, 21.0, 19.0, 18.0, 26.0, 36.0, 41.0, 28.0, 40.0, 43.0, 38.0, 30.0, 37.0, 40.0, 41.0, 39.0, 36.0, 40.0, 27.0, 35.0, 17.0, 36.0, 28.0, 19.0, 25.0, 20.0, 24.0, 12.0, 11.0, 13.0, 11.0, 5.0, 1.0, 3.0, 5.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.265625, -8.003662109375, -7.74169921875, -7.479736328125, -7.2177734375, -6.955810546875, -6.69384765625, -6.431884765625, -6.169921875, -5.907958984375, -5.64599609375, -5.384033203125, -5.1220703125, -4.860107421875, -4.59814453125, -4.336181640625, -4.07421875, -3.812255859375, -3.55029296875, -3.288330078125, -3.0263671875, -2.764404296875, -2.50244140625, -2.240478515625, -1.978515625, -1.716552734375, -1.45458984375, -1.192626953125, -0.9306640625, -0.668701171875, -0.40673828125, -0.144775390625, 0.1171875, 0.379150390625, 0.64111328125, 0.903076171875, 1.1650390625, 1.427001953125, 1.68896484375, 1.950927734375, 2.212890625, 2.474853515625, 2.73681640625, 2.998779296875, 3.2607421875, 3.522705078125, 3.78466796875, 4.046630859375, 4.30859375, 4.570556640625, 4.83251953125, 5.094482421875, 5.3564453125, 5.618408203125, 5.88037109375, 6.142333984375, 6.404296875, 6.666259765625, 6.92822265625, 7.190185546875, 7.4521484375, 7.714111328125, 7.97607421875, 8.238037109375, 8.5]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 7.0, 6.0, 16.0, 24.0, 39.0, 65.0, 112.0, 199.0, 308.0, 567.0, 929.0, 1474.0, 2521.0, 4456.0, 7571.0, 13018.0, 22817.0, 39777.0, 67080.0, 111315.0, 174291.0, 257734.0, 353512.0, 441575.0, 501377.0, 511953.0, 468975.0, 387680.0, 293358.0, 203029.0, 132048.0, 81443.0, 48554.0, 28069.0, 16018.0, 9219.0, 5288.0, 3169.0, 1939.0, 1112.0, 677.0, 416.0, 232.0, 124.0, 78.0, 45.0, 31.0, 20.0, 13.0, 10.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.59765625, -7.33734130859375, -7.0770263671875, -6.81671142578125, -6.556396484375, -6.29608154296875, -6.0357666015625, -5.77545166015625, -5.51513671875, -5.25482177734375, -4.9945068359375, -4.73419189453125, -4.473876953125, -4.21356201171875, -3.9532470703125, -3.69293212890625, -3.4326171875, -3.17230224609375, -2.9119873046875, -2.65167236328125, -2.391357421875, -2.13104248046875, -1.8707275390625, -1.61041259765625, -1.35009765625, -1.08978271484375, -0.8294677734375, -0.56915283203125, -0.308837890625, -0.04852294921875, 0.2117919921875, 0.47210693359375, 0.732421875, 0.99273681640625, 1.2530517578125, 1.51336669921875, 1.773681640625, 2.03399658203125, 2.2943115234375, 2.55462646484375, 2.81494140625, 3.07525634765625, 3.3355712890625, 3.59588623046875, 3.856201171875, 4.11651611328125, 4.3768310546875, 4.63714599609375, 4.8974609375, 5.15777587890625, 5.4180908203125, 5.67840576171875, 5.938720703125, 6.19903564453125, 6.4593505859375, 6.71966552734375, 6.97998046875, 7.24029541015625, 7.5006103515625, 7.76092529296875, 8.021240234375, 8.28155517578125, 8.5418701171875, 8.80218505859375, 9.0625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 4.0, 6.0, 6.0, 6.0, 16.0, 10.0, 21.0, 25.0, 32.0, 24.0, 42.0, 51.0, 65.0, 70.0, 77.0, 93.0, 111.0, 116.0, 152.0, 168.0, 187.0, 190.0, 203.0, 196.0, 230.0, 200.0, 202.0, 189.0, 167.0, 168.0, 138.0, 155.0, 110.0, 111.0, 90.0, 91.0, 58.0, 71.0, 37.0, 48.0, 31.0, 28.0, 20.0, 12.0, 12.0, 8.0, 4.0, 3.0, 2.0, 5.0, 7.0, 3.0, 0.0, 2.0], "bins": [-4.38671875, -4.25994873046875, -4.1331787109375, -4.00640869140625, -3.879638671875, -3.75286865234375, -3.6260986328125, -3.49932861328125, -3.37255859375, -3.24578857421875, -3.1190185546875, -2.99224853515625, -2.865478515625, -2.73870849609375, -2.6119384765625, -2.48516845703125, -2.3583984375, -2.23162841796875, -2.1048583984375, -1.97808837890625, -1.851318359375, -1.72454833984375, -1.5977783203125, -1.47100830078125, -1.34423828125, -1.21746826171875, -1.0906982421875, -0.96392822265625, -0.837158203125, -0.71038818359375, -0.5836181640625, -0.45684814453125, -0.330078125, -0.20330810546875, -0.0765380859375, 0.05023193359375, 0.177001953125, 0.30377197265625, 0.4305419921875, 0.55731201171875, 0.68408203125, 0.81085205078125, 0.9376220703125, 1.06439208984375, 1.191162109375, 1.31793212890625, 1.4447021484375, 1.57147216796875, 1.6982421875, 1.82501220703125, 1.9517822265625, 2.07855224609375, 2.205322265625, 2.33209228515625, 2.4588623046875, 2.58563232421875, 2.71240234375, 2.83917236328125, 2.9659423828125, 3.09271240234375, 3.219482421875, 3.34625244140625, 3.4730224609375, 3.59979248046875, 3.7265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 10.0, 4.0, 8.0, 10.0, 19.0, 19.0, 23.0, 18.0, 32.0, 34.0, 36.0, 36.0, 38.0, 48.0, 51.0, 49.0, 60.0, 52.0, 44.0, 43.0, 58.0, 44.0, 39.0, 39.0, 33.0, 27.0, 28.0, 23.0, 18.0, 17.0, 12.0, 10.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.636021614074707, -10.33125114440918, -10.026480674743652, -9.721710205078125, -9.416940689086914, -9.112170219421387, -8.80739974975586, -8.502629280090332, -8.197858810424805, -7.893088340759277, -7.58831787109375, -7.283547878265381, -6.9787774085998535, -6.674006938934326, -6.369236946105957, -6.06446647644043, -5.759696006774902, -5.454925537109375, -5.150155067443848, -4.8453850746154785, -4.540614604949951, -4.235844135284424, -3.9310739040374756, -3.6263036727905273, -3.321533203125, -3.0167627334594727, -2.7119925022125244, -2.407222270965576, -2.102451801300049, -1.797681450843811, -1.4929111003875732, -1.188140869140625, -0.8833713531494141, -0.5786010026931763, -0.2738306522369385, 0.030939698219299316, 0.3357100486755371, 0.6404803991317749, 0.9452507495880127, 1.250020980834961, 1.5547914505004883, 1.859561800956726, 2.164332151412964, 2.469102382659912, 2.7738728523254395, 3.078643321990967, 3.383413553237915, 3.6881837844848633, 3.9929542541503906, 4.297724723815918, 4.602495193481445, 4.9072651863098145, 5.212035655975342, 5.516806125640869, 5.821576118469238, 6.126346588134766, 6.431117057800293, 6.73588752746582, 7.040657997131348, 7.345427989959717, 7.650198459625244, 7.9549689292907715, 8.25973892211914, 8.564509391784668, 8.869279861450195]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 5.0, 6.0, 11.0, 10.0, 9.0, 11.0, 16.0, 9.0, 17.0, 16.0, 23.0, 14.0, 25.0, 30.0, 35.0, 38.0, 32.0, 34.0, 34.0, 46.0, 50.0, 39.0, 50.0, 32.0, 45.0, 43.0, 45.0, 34.0, 39.0, 21.0, 33.0, 30.0, 15.0, 17.0, 18.0, 17.0, 9.0, 8.0, 15.0, 11.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.722511291503906, -10.401338577270508, -10.08016586303711, -9.758992195129395, -9.437819480895996, -9.116646766662598, -8.795473098754883, -8.474300384521484, -8.153127670288086, -7.8319549560546875, -7.510781764984131, -7.189608573913574, -6.868435859680176, -6.547263145446777, -6.226089954376221, -5.904916763305664, -5.583744049072266, -5.262571334838867, -4.9413981437683105, -4.620224952697754, -4.2990522384643555, -3.977879285812378, -3.6567063331604004, -3.335533380508423, -3.0143604278564453, -2.6931874752044678, -2.3720145225524902, -2.0508415699005127, -1.7296686172485352, -1.4084956645965576, -1.08732271194458, -0.7661497592926025, -0.4449758529663086, -0.12380290031433105, 0.19737005233764648, 0.518543004989624, 0.8397159576416016, 1.160888910293579, 1.4820618629455566, 1.8032348155975342, 2.1244077682495117, 2.4455807209014893, 2.766753673553467, 3.0879266262054443, 3.409099578857422, 3.7302725315093994, 4.051445484161377, 4.372618675231934, 4.693791389465332, 5.0149641036987305, 5.336137294769287, 5.657310485839844, 5.978483200073242, 6.299655914306641, 6.620829105377197, 6.942002296447754, 7.263175010681152, 7.584347724914551, 7.905520915985107, 8.226694107055664, 8.547866821289062, 8.869039535522461, 9.19021224975586, 9.511385917663574, 9.832558631896973]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 10.0, 11.0, 27.0, 26.0, 57.0, 58.0, 121.0, 161.0, 215.0, 349.0, 569.0, 803.0, 1170.0, 1737.0, 2359.0, 3316.0, 5001.0, 7253.0, 11073.0, 16493.0, 25627.0, 40470.0, 67018.0, 126375.0, 338850.0, 176925.0, 83631.0, 48842.0, 30391.0, 19570.0, 12721.0, 8638.0, 5813.0, 3989.0, 2689.0, 1906.0, 1398.0, 971.0, 612.0, 440.0, 299.0, 198.0, 120.0, 85.0, 51.0, 42.0, 40.0, 14.0, 8.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-4.58984375, -4.449462890625, -4.30908203125, -4.168701171875, -4.0283203125, -3.887939453125, -3.74755859375, -3.607177734375, -3.466796875, -3.326416015625, -3.18603515625, -3.045654296875, -2.9052734375, -2.764892578125, -2.62451171875, -2.484130859375, -2.34375, -2.203369140625, -2.06298828125, -1.922607421875, -1.7822265625, -1.641845703125, -1.50146484375, -1.361083984375, -1.220703125, -1.080322265625, -0.93994140625, -0.799560546875, -0.6591796875, -0.518798828125, -0.37841796875, -0.238037109375, -0.09765625, 0.042724609375, 0.18310546875, 0.323486328125, 0.4638671875, 0.604248046875, 0.74462890625, 0.885009765625, 1.025390625, 1.165771484375, 1.30615234375, 1.446533203125, 1.5869140625, 1.727294921875, 1.86767578125, 2.008056640625, 2.1484375, 2.288818359375, 2.42919921875, 2.569580078125, 2.7099609375, 2.850341796875, 2.99072265625, 3.131103515625, 3.271484375, 3.411865234375, 3.55224609375, 3.692626953125, 3.8330078125, 3.973388671875, 4.11376953125, 4.254150390625, 4.39453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 5.0, 3.0, 3.0, 8.0, 6.0, 9.0, 8.0, 2.0, 13.0, 8.0, 17.0, 14.0, 26.0, 11.0, 20.0, 22.0, 28.0, 29.0, 22.0, 31.0, 30.0, 36.0, 38.0, 55.0, 39.0, 43.0, 37.0, 40.0, 39.0, 29.0, 34.0, 34.0, 33.0, 38.0, 25.0, 28.0, 22.0, 14.0, 20.0, 15.0, 12.0, 10.0, 9.0, 5.0, 8.0, 10.0, 5.0, 4.0, 7.0, 2.0, 2.0, 2.0, 2.0], "bins": [-10.8125, -10.514404296875, -10.21630859375, -9.918212890625, -9.6201171875, -9.322021484375, -9.02392578125, -8.725830078125, -8.427734375, -8.129638671875, -7.83154296875, -7.533447265625, -7.2353515625, -6.937255859375, -6.63916015625, -6.341064453125, -6.04296875, -5.744873046875, -5.44677734375, -5.148681640625, -4.8505859375, -4.552490234375, -4.25439453125, -3.956298828125, -3.658203125, -3.360107421875, -3.06201171875, -2.763916015625, -2.4658203125, -2.167724609375, -1.86962890625, -1.571533203125, -1.2734375, -0.975341796875, -0.67724609375, -0.379150390625, -0.0810546875, 0.217041015625, 0.51513671875, 0.813232421875, 1.111328125, 1.409423828125, 1.70751953125, 2.005615234375, 2.3037109375, 2.601806640625, 2.89990234375, 3.197998046875, 3.49609375, 3.794189453125, 4.09228515625, 4.390380859375, 4.6884765625, 4.986572265625, 5.28466796875, 5.582763671875, 5.880859375, 6.178955078125, 6.47705078125, 6.775146484375, 7.0732421875, 7.371337890625, 7.66943359375, 7.967529296875, 8.265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 9.0, 8.0, 15.0, 28.0, 29.0, 51.0, 72.0, 100.0, 161.0, 236.0, 370.0, 554.0, 858.0, 1304.0, 2119.0, 3343.0, 5242.0, 8484.0, 13913.0, 22727.0, 37947.0, 64451.0, 119766.0, 356990.0, 194258.0, 88020.0, 50227.0, 29733.0, 18055.0, 10982.0, 6791.0, 4228.0, 2625.0, 1674.0, 1114.0, 714.0, 476.0, 298.0, 198.0, 131.0, 93.0, 61.0, 31.0, 24.0, 14.0, 12.0, 9.0, 6.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.97265625, -4.80560302734375, -4.6385498046875, -4.47149658203125, -4.304443359375, -4.13739013671875, -3.9703369140625, -3.80328369140625, -3.63623046875, -3.46917724609375, -3.3021240234375, -3.13507080078125, -2.968017578125, -2.80096435546875, -2.6339111328125, -2.46685791015625, -2.2998046875, -2.13275146484375, -1.9656982421875, -1.79864501953125, -1.631591796875, -1.46453857421875, -1.2974853515625, -1.13043212890625, -0.96337890625, -0.79632568359375, -0.6292724609375, -0.46221923828125, -0.295166015625, -0.12811279296875, 0.0389404296875, 0.20599365234375, 0.373046875, 0.54010009765625, 0.7071533203125, 0.87420654296875, 1.041259765625, 1.20831298828125, 1.3753662109375, 1.54241943359375, 1.70947265625, 1.87652587890625, 2.0435791015625, 2.21063232421875, 2.377685546875, 2.54473876953125, 2.7117919921875, 2.87884521484375, 3.0458984375, 3.21295166015625, 3.3800048828125, 3.54705810546875, 3.714111328125, 3.88116455078125, 4.0482177734375, 4.21527099609375, 4.38232421875, 4.54937744140625, 4.7164306640625, 4.88348388671875, 5.050537109375, 5.21759033203125, 5.3846435546875, 5.55169677734375, 5.71875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 7.0, 6.0, 7.0, 9.0, 12.0, 13.0, 19.0, 21.0, 20.0, 33.0, 24.0, 33.0, 32.0, 33.0, 41.0, 45.0, 39.0, 52.0, 49.0, 39.0, 48.0, 40.0, 35.0, 40.0, 38.0, 44.0, 31.0, 33.0, 30.0, 21.0, 21.0, 25.0, 13.0, 8.0, 8.0, 13.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.32452392578125, -6.1060791015625, -5.88763427734375, -5.669189453125, -5.45074462890625, -5.2322998046875, -5.01385498046875, -4.79541015625, -4.57696533203125, -4.3585205078125, -4.14007568359375, -3.921630859375, -3.70318603515625, -3.4847412109375, -3.26629638671875, -3.0478515625, -2.82940673828125, -2.6109619140625, -2.39251708984375, -2.174072265625, -1.95562744140625, -1.7371826171875, -1.51873779296875, -1.30029296875, -1.08184814453125, -0.8634033203125, -0.64495849609375, -0.426513671875, -0.20806884765625, 0.0103759765625, 0.22882080078125, 0.447265625, 0.66571044921875, 0.8841552734375, 1.10260009765625, 1.321044921875, 1.53948974609375, 1.7579345703125, 1.97637939453125, 2.19482421875, 2.41326904296875, 2.6317138671875, 2.85015869140625, 3.068603515625, 3.28704833984375, 3.5054931640625, 3.72393798828125, 3.9423828125, 4.16082763671875, 4.3792724609375, 4.59771728515625, 4.816162109375, 5.03460693359375, 5.2530517578125, 5.47149658203125, 5.68994140625, 5.90838623046875, 6.1268310546875, 6.34527587890625, 6.563720703125, 6.78216552734375, 7.0006103515625, 7.21905517578125, 7.4375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 10.0, 9.0, 12.0, 13.0, 21.0, 32.0, 43.0, 62.0, 80.0, 104.0, 160.0, 231.0, 313.0, 443.0, 623.0, 860.0, 1338.0, 1918.0, 2845.0, 4409.0, 6784.0, 10837.0, 17953.0, 31326.0, 59132.0, 125784.0, 247249.0, 255184.0, 134103.0, 62849.0, 32894.0, 18853.0, 11171.0, 6929.0, 4481.0, 3009.0, 1897.0, 1400.0, 944.0, 643.0, 439.0, 315.0, 245.0, 163.0, 151.0, 97.0, 67.0, 47.0, 33.0, 20.0, 14.0, 9.0, 7.0, 2.0, 1.0, 5.0, 2.0, 2.0], "bins": [-0.0126953125, -0.012311100959777832, -0.011926889419555664, -0.011542677879333496, -0.011158466339111328, -0.01077425479888916, -0.010390043258666992, -0.010005831718444824, -0.009621620178222656, -0.009237408638000488, -0.00885319709777832, -0.008468985557556152, -0.008084774017333984, -0.007700562477111816, -0.0073163509368896484, -0.0069321393966674805, -0.0065479278564453125, -0.0061637163162231445, -0.0057795047760009766, -0.005395293235778809, -0.005011081695556641, -0.004626870155334473, -0.004242658615112305, -0.0038584470748901367, -0.0034742355346679688, -0.0030900239944458008, -0.002705812454223633, -0.002321600914001465, -0.0019373893737792969, -0.001553177833557129, -0.001168966293334961, -0.000784754753112793, -0.000400543212890625, -1.633167266845703e-05, 0.00036787986755371094, 0.0007520914077758789, 0.0011363029479980469, 0.0015205144882202148, 0.0019047260284423828, 0.0022889375686645508, 0.0026731491088867188, 0.0030573606491088867, 0.0034415721893310547, 0.0038257837295532227, 0.004209995269775391, 0.004594206809997559, 0.0049784183502197266, 0.0053626298904418945, 0.0057468414306640625, 0.0061310529708862305, 0.0065152645111083984, 0.006899476051330566, 0.007283687591552734, 0.007667899131774902, 0.00805211067199707, 0.008436322212219238, 0.008820533752441406, 0.009204745292663574, 0.009588956832885742, 0.00997316837310791, 0.010357379913330078, 0.010741591453552246, 0.011125802993774414, 0.011510014533996582, 0.01189422607421875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 9.0, 9.0, 5.0, 10.0, 9.0, 11.0, 10.0, 30.0, 32.0, 34.0, 30.0, 45.0, 40.0, 51.0, 44.0, 62.0, 55.0, 65.0, 70.0, 47.0, 55.0, 34.0, 34.0, 32.0, 40.0, 28.0, 24.0, 18.0, 12.0, 5.0, 11.0, 5.0, 7.0, 5.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.285045623779297e-06, -8.015893399715424e-06, -7.74674117565155e-06, -7.477588951587677e-06, -7.208436727523804e-06, -6.93928450345993e-06, -6.670132279396057e-06, -6.400980055332184e-06, -6.1318278312683105e-06, -5.862675607204437e-06, -5.593523383140564e-06, -5.324371159076691e-06, -5.055218935012817e-06, -4.786066710948944e-06, -4.516914486885071e-06, -4.2477622628211975e-06, -3.978610038757324e-06, -3.709457814693451e-06, -3.4403055906295776e-06, -3.1711533665657043e-06, -2.902001142501831e-06, -2.6328489184379578e-06, -2.3636966943740845e-06, -2.094544470310211e-06, -1.8253922462463379e-06, -1.5562400221824646e-06, -1.2870877981185913e-06, -1.017935574054718e-06, -7.487833499908447e-07, -4.796311259269714e-07, -2.1047890186309814e-07, 5.8673322200775146e-08, 3.2782554626464844e-07, 5.969777703285217e-07, 8.66129994392395e-07, 1.1352822184562683e-06, 1.4044344425201416e-06, 1.6735866665840149e-06, 1.942738890647888e-06, 2.2118911147117615e-06, 2.4810433387756348e-06, 2.750195562839508e-06, 3.0193477869033813e-06, 3.2885000109672546e-06, 3.557652235031128e-06, 3.826804459095001e-06, 4.0959566831588745e-06, 4.365108907222748e-06, 4.634261131286621e-06, 4.903413355350494e-06, 5.172565579414368e-06, 5.441717803478241e-06, 5.710870027542114e-06, 5.9800222516059875e-06, 6.249174475669861e-06, 6.518326699733734e-06, 6.787478923797607e-06, 7.056631147861481e-06, 7.325783371925354e-06, 7.594935595989227e-06, 7.8640878200531e-06, 8.133240044116974e-06, 8.402392268180847e-06, 8.67154449224472e-06, 8.940696716308594e-06]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 1.0, 13.0, 18.0, 22.0, 34.0, 58.0, 79.0, 105.0, 147.0, 205.0, 295.0, 434.0, 592.0, 881.0, 1264.0, 1904.0, 2861.0, 4580.0, 7233.0, 12210.0, 20869.0, 38371.0, 76206.0, 159956.0, 264170.0, 220384.0, 111729.0, 53773.0, 28230.0, 15862.0, 9323.0, 5799.0, 3571.0, 2347.0, 1600.0, 1044.0, 723.0, 498.0, 346.0, 243.0, 187.0, 117.0, 84.0, 54.0, 39.0, 26.0, 20.0, 14.0, 14.0, 7.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0133056640625, -0.012886643409729004, -0.012467622756958008, -0.012048602104187012, -0.011629581451416016, -0.01121056079864502, -0.010791540145874023, -0.010372519493103027, -0.009953498840332031, -0.009534478187561035, -0.009115457534790039, -0.008696436882019043, -0.008277416229248047, -0.00785839557647705, -0.007439374923706055, -0.007020354270935059, -0.0066013336181640625, -0.006182312965393066, -0.00576329231262207, -0.005344271659851074, -0.004925251007080078, -0.004506230354309082, -0.004087209701538086, -0.00366818904876709, -0.0032491683959960938, -0.0028301477432250977, -0.0024111270904541016, -0.0019921064376831055, -0.0015730857849121094, -0.0011540651321411133, -0.0007350444793701172, -0.0003160238265991211, 0.000102996826171875, 0.0005220174789428711, 0.0009410381317138672, 0.0013600587844848633, 0.0017790794372558594, 0.0021981000900268555, 0.0026171207427978516, 0.0030361413955688477, 0.0034551620483398438, 0.00387418270111084, 0.004293203353881836, 0.004712224006652832, 0.005131244659423828, 0.005550265312194824, 0.00596928596496582, 0.006388306617736816, 0.0068073272705078125, 0.007226347923278809, 0.007645368576049805, 0.0080643892288208, 0.008483409881591797, 0.008902430534362793, 0.009321451187133789, 0.009740471839904785, 0.010159492492675781, 0.010578513145446777, 0.010997533798217773, 0.01141655445098877, 0.011835575103759766, 0.012254595756530762, 0.012673616409301758, 0.013092637062072754, 0.01351165771484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 5.0, 7.0, 8.0, 8.0, 5.0, 5.0, 13.0, 17.0, 17.0, 30.0, 43.0, 53.0, 58.0, 91.0, 75.0, 98.0, 92.0, 88.0, 55.0, 45.0, 41.0, 33.0, 22.0, 11.0, 14.0, 12.0, 9.0, 4.0, 12.0, 5.0, 5.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0052032470703125, -0.005016028881072998, -0.004828810691833496, -0.004641592502593994, -0.004454374313354492, -0.00426715612411499, -0.004079937934875488, -0.0038927197456359863, -0.0037055015563964844, -0.0035182833671569824, -0.0033310651779174805, -0.0031438469886779785, -0.0029566287994384766, -0.0027694106101989746, -0.0025821924209594727, -0.0023949742317199707, -0.0022077560424804688, -0.002020537853240967, -0.0018333196640014648, -0.0016461014747619629, -0.001458883285522461, -0.001271665096282959, -0.001084446907043457, -0.0008972287178039551, -0.0007100105285644531, -0.0005227923393249512, -0.0003355741500854492, -0.00014835596084594727, 3.886222839355469e-05, 0.00022608041763305664, 0.0004132986068725586, 0.0006005167961120605, 0.0007877349853515625, 0.0009749531745910645, 0.0011621713638305664, 0.0013493895530700684, 0.0015366077423095703, 0.0017238259315490723, 0.0019110441207885742, 0.002098262310028076, 0.002285480499267578, 0.00247269868850708, 0.002659916877746582, 0.002847135066986084, 0.003034353256225586, 0.003221571445465088, 0.00340878963470459, 0.003596007823944092, 0.0037832260131835938, 0.003970444202423096, 0.004157662391662598, 0.0043448805809021, 0.0045320987701416016, 0.0047193169593811035, 0.0049065351486206055, 0.005093753337860107, 0.005280971527099609, 0.005468189716339111, 0.005655407905578613, 0.005842626094818115, 0.006029844284057617, 0.006217062473297119, 0.006404280662536621, 0.006591498851776123, 0.006778717041015625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 4.0, 1.0, 6.0, 8.0, 9.0, 8.0, 18.0, 20.0, 19.0, 19.0, 26.0, 38.0, 29.0, 31.0, 38.0, 44.0, 42.0, 46.0, 49.0, 54.0, 47.0, 43.0, 51.0, 49.0, 41.0, 43.0, 31.0, 29.0, 33.0, 24.0, 25.0, 18.0, 14.0, 11.0, 10.0, 7.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.467933654785156, -10.181836128234863, -9.895737648010254, -9.609640121459961, -9.323541641235352, -9.037444114685059, -8.751346588134766, -8.465248107910156, -8.179150581359863, -7.893052577972412, -7.606954574584961, -7.320857048034668, -7.034759044647217, -6.748661041259766, -6.4625630378723145, -6.176465034484863, -5.890367031097412, -5.604269027709961, -5.31817102432251, -5.032073020935059, -4.745975494384766, -4.4598774909973145, -4.173779487609863, -3.887681722640991, -3.60158371925354, -3.315485715866089, -3.029387950897217, -2.7432899475097656, -2.4571919441223145, -2.1710941791534424, -1.8849961757659912, -1.5988984107971191, -1.3128008842468262, -1.0267030000686646, -0.7406050562858582, -0.45450711250305176, -0.16840922832489014, 0.11768865585327148, 0.40378665924072266, 0.6898844242095947, 0.9759824275970459, 1.2620803117752075, 1.5481781959533691, 1.8342761993408203, 2.1203742027282715, 2.4064719676971436, 2.6925699710845947, 2.978667736053467, 3.264765739440918, 3.550863742828369, 3.836961507797241, 4.123059272766113, 4.4091572761535645, 4.695255279541016, 4.981353282928467, 5.267451286315918, 5.553548812866211, 5.839646816253662, 6.125744819641113, 6.411842346191406, 6.697940349578857, 6.984038352966309, 7.27013635635376, 7.556234359741211, 7.842332363128662]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 7.0, 10.0, 10.0, 10.0, 10.0, 17.0, 9.0, 16.0, 17.0, 22.0, 15.0, 26.0, 30.0, 35.0, 36.0, 34.0, 35.0, 35.0, 43.0, 51.0, 39.0, 51.0, 30.0, 47.0, 43.0, 44.0, 33.0, 38.0, 20.0, 35.0, 29.0, 17.0, 18.0, 16.0, 16.0, 10.0, 8.0, 14.0, 11.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.691352844238281, -10.370362281799316, -10.049371719360352, -9.728381156921387, -9.407390594482422, -9.086400985717773, -8.765409469604492, -8.444419860839844, -8.123429298400879, -7.802438735961914, -7.481448173522949, -7.160457611083984, -6.839467525482178, -6.518476963043213, -6.197486400604248, -5.876496315002441, -5.555505275726318, -5.2345147132873535, -4.913524150848389, -4.592534065246582, -4.271543502807617, -3.9505529403686523, -3.6295623779296875, -3.3085720539093018, -2.987581491470337, -2.666590929031372, -2.3456006050109863, -2.0246100425720215, -1.7036195993423462, -1.382629156112671, -1.061638593673706, -0.7406482696533203, -0.41965770721435547, -0.09866723418235779, 0.2223232388496399, 0.54331374168396, 0.8643041849136353, 1.1852946281433105, 1.5062851905822754, 1.8272755146026611, 2.148266077041626, 2.469256639480591, 2.7902469635009766, 3.1112375259399414, 3.4322280883789062, 3.753218412399292, 4.074209213256836, 4.395199298858643, 4.716189861297607, 5.037180423736572, 5.358170986175537, 5.679161071777344, 6.000151634216309, 6.321142196655273, 6.642132759094238, 6.963123321533203, 7.284113883972168, 7.605104446411133, 7.926095008850098, 8.247085571289062, 8.568076133728027, 8.889066696166992, 9.21005630493164, 9.531046867370605, 9.85203742980957]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 9.0, 9.0, 18.0, 19.0, 51.0, 42.0, 77.0, 149.0, 218.0, 312.0, 533.0, 830.0, 1309.0, 2100.0, 3180.0, 5530.0, 8704.0, 14480.0, 23026.0, 35928.0, 54551.0, 78933.0, 105547.0, 126321.0, 133707.0, 125785.0, 103264.0, 77277.0, 53503.0, 34868.0, 22135.0, 13786.0, 8548.0, 5342.0, 3176.0, 2023.0, 1204.0, 749.0, 500.0, 305.0, 180.0, 112.0, 83.0, 50.0, 31.0, 18.0, 13.0, 11.0, 7.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.671875, -7.42803955078125, -7.1842041015625, -6.94036865234375, -6.696533203125, -6.45269775390625, -6.2088623046875, -5.96502685546875, -5.72119140625, -5.47735595703125, -5.2335205078125, -4.98968505859375, -4.745849609375, -4.50201416015625, -4.2581787109375, -4.01434326171875, -3.7705078125, -3.52667236328125, -3.2828369140625, -3.03900146484375, -2.795166015625, -2.55133056640625, -2.3074951171875, -2.06365966796875, -1.81982421875, -1.57598876953125, -1.3321533203125, -1.08831787109375, -0.844482421875, -0.60064697265625, -0.3568115234375, -0.11297607421875, 0.130859375, 0.37469482421875, 0.6185302734375, 0.86236572265625, 1.106201171875, 1.35003662109375, 1.5938720703125, 1.83770751953125, 2.08154296875, 2.32537841796875, 2.5692138671875, 2.81304931640625, 3.056884765625, 3.30072021484375, 3.5445556640625, 3.78839111328125, 4.0322265625, 4.27606201171875, 4.5198974609375, 4.76373291015625, 5.007568359375, 5.25140380859375, 5.4952392578125, 5.73907470703125, 5.98291015625, 6.22674560546875, 6.4705810546875, 6.71441650390625, 6.958251953125, 7.20208740234375, 7.4459228515625, 7.68975830078125, 7.93359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 12.0, 10.0, 12.0, 13.0, 15.0, 14.0, 19.0, 22.0, 21.0, 30.0, 36.0, 33.0, 37.0, 39.0, 52.0, 43.0, 41.0, 44.0, 50.0, 51.0, 51.0, 51.0, 34.0, 26.0, 42.0, 31.0, 24.0, 28.0, 25.0, 23.0, 12.0, 11.0, 9.0, 9.0, 7.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.625, -11.2764892578125, -10.927978515625, -10.5794677734375, -10.23095703125, -9.8824462890625, -9.533935546875, -9.1854248046875, -8.8369140625, -8.4884033203125, -8.139892578125, -7.7913818359375, -7.44287109375, -7.0943603515625, -6.745849609375, -6.3973388671875, -6.048828125, -5.7003173828125, -5.351806640625, -5.0032958984375, -4.65478515625, -4.3062744140625, -3.957763671875, -3.6092529296875, -3.2607421875, -2.9122314453125, -2.563720703125, -2.2152099609375, -1.86669921875, -1.5181884765625, -1.169677734375, -0.8211669921875, -0.47265625, -0.1241455078125, 0.224365234375, 0.5728759765625, 0.92138671875, 1.2698974609375, 1.618408203125, 1.9669189453125, 2.3154296875, 2.6639404296875, 3.012451171875, 3.3609619140625, 3.70947265625, 4.0579833984375, 4.406494140625, 4.7550048828125, 5.103515625, 5.4520263671875, 5.800537109375, 6.1490478515625, 6.49755859375, 6.8460693359375, 7.194580078125, 7.5430908203125, 7.8916015625, 8.2401123046875, 8.588623046875, 8.9371337890625, 9.28564453125, 9.6341552734375, 9.982666015625, 10.3311767578125, 10.6796875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 12.0, 21.0, 25.0, 37.0, 66.0, 93.0, 138.0, 231.0, 387.0, 608.0, 971.0, 1537.0, 2461.0, 4034.0, 6713.0, 11119.0, 18096.0, 29393.0, 46277.0, 70396.0, 100148.0, 127998.0, 143613.0, 137618.0, 113447.0, 83013.0, 56355.0, 36076.0, 22084.0, 13856.0, 8347.0, 5017.0, 3089.0, 1986.0, 1198.0, 720.0, 506.0, 306.0, 203.0, 116.0, 74.0, 46.0, 41.0, 31.0, 18.0, 13.0, 7.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.83984375, -7.58465576171875, -7.3294677734375, -7.07427978515625, -6.819091796875, -6.56390380859375, -6.3087158203125, -6.05352783203125, -5.79833984375, -5.54315185546875, -5.2879638671875, -5.03277587890625, -4.777587890625, -4.52239990234375, -4.2672119140625, -4.01202392578125, -3.7568359375, -3.50164794921875, -3.2464599609375, -2.99127197265625, -2.736083984375, -2.48089599609375, -2.2257080078125, -1.97052001953125, -1.71533203125, -1.46014404296875, -1.2049560546875, -0.94976806640625, -0.694580078125, -0.43939208984375, -0.1842041015625, 0.07098388671875, 0.326171875, 0.58135986328125, 0.8365478515625, 1.09173583984375, 1.346923828125, 1.60211181640625, 1.8572998046875, 2.11248779296875, 2.36767578125, 2.62286376953125, 2.8780517578125, 3.13323974609375, 3.388427734375, 3.64361572265625, 3.8988037109375, 4.15399169921875, 4.4091796875, 4.66436767578125, 4.9195556640625, 5.17474365234375, 5.429931640625, 5.68511962890625, 5.9403076171875, 6.19549560546875, 6.45068359375, 6.70587158203125, 6.9610595703125, 7.21624755859375, 7.471435546875, 7.72662353515625, 7.9818115234375, 8.23699951171875, 8.4921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 13.0, 7.0, 4.0, 7.0, 11.0, 14.0, 14.0, 19.0, 22.0, 27.0, 28.0, 30.0, 35.0, 33.0, 32.0, 43.0, 43.0, 50.0, 30.0, 54.0, 46.0, 43.0, 40.0, 40.0, 42.0, 44.0, 37.0, 31.0, 22.0, 27.0, 28.0, 20.0, 18.0, 13.0, 8.0, 6.0, 7.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3515625, -6.13385009765625, -5.9161376953125, -5.69842529296875, -5.480712890625, -5.26300048828125, -5.0452880859375, -4.82757568359375, -4.60986328125, -4.39215087890625, -4.1744384765625, -3.95672607421875, -3.739013671875, -3.52130126953125, -3.3035888671875, -3.08587646484375, -2.8681640625, -2.65045166015625, -2.4327392578125, -2.21502685546875, -1.997314453125, -1.77960205078125, -1.5618896484375, -1.34417724609375, -1.12646484375, -0.90875244140625, -0.6910400390625, -0.47332763671875, -0.255615234375, -0.03790283203125, 0.1798095703125, 0.39752197265625, 0.615234375, 0.83294677734375, 1.0506591796875, 1.26837158203125, 1.486083984375, 1.70379638671875, 1.9215087890625, 2.13922119140625, 2.35693359375, 2.57464599609375, 2.7923583984375, 3.01007080078125, 3.227783203125, 3.44549560546875, 3.6632080078125, 3.88092041015625, 4.0986328125, 4.31634521484375, 4.5340576171875, 4.75177001953125, 4.969482421875, 5.18719482421875, 5.4049072265625, 5.62261962890625, 5.84033203125, 6.05804443359375, 6.2757568359375, 6.49346923828125, 6.711181640625, 6.92889404296875, 7.1466064453125, 7.36431884765625, 7.58203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 9.0, 14.0, 22.0, 39.0, 56.0, 89.0, 142.0, 230.0, 331.0, 552.0, 872.0, 1387.0, 2326.0, 3805.0, 6105.0, 9839.0, 15996.0, 24704.0, 37508.0, 53999.0, 74428.0, 94417.0, 111796.0, 118328.0, 116046.0, 103141.0, 83989.0, 62766.0, 44219.0, 29939.0, 19225.0, 12513.0, 7567.0, 4598.0, 2838.0, 1872.0, 1086.0, 642.0, 426.0, 238.0, 190.0, 107.0, 63.0, 45.0, 18.0, 12.0, 9.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.8984375, -1.838592529296875, -1.77874755859375, -1.718902587890625, -1.6590576171875, -1.599212646484375, -1.53936767578125, -1.479522705078125, -1.419677734375, -1.359832763671875, -1.29998779296875, -1.240142822265625, -1.1802978515625, -1.120452880859375, -1.06060791015625, -1.000762939453125, -0.94091796875, -0.881072998046875, -0.82122802734375, -0.761383056640625, -0.7015380859375, -0.641693115234375, -0.58184814453125, -0.522003173828125, -0.462158203125, -0.402313232421875, -0.34246826171875, -0.282623291015625, -0.2227783203125, -0.162933349609375, -0.10308837890625, -0.043243408203125, 0.0166015625, 0.076446533203125, 0.13629150390625, 0.196136474609375, 0.2559814453125, 0.315826416015625, 0.37567138671875, 0.435516357421875, 0.495361328125, 0.555206298828125, 0.61505126953125, 0.674896240234375, 0.7347412109375, 0.794586181640625, 0.85443115234375, 0.914276123046875, 0.97412109375, 1.033966064453125, 1.09381103515625, 1.153656005859375, 1.2135009765625, 1.273345947265625, 1.33319091796875, 1.393035888671875, 1.452880859375, 1.512725830078125, 1.57257080078125, 1.632415771484375, 1.6922607421875, 1.752105712890625, 1.81195068359375, 1.871795654296875, 1.931640625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 9.0, 6.0, 12.0, 11.0, 9.0, 16.0, 17.0, 18.0, 30.0, 18.0, 24.0, 29.0, 28.0, 32.0, 49.0, 44.0, 39.0, 41.0, 59.0, 50.0, 45.0, 47.0, 43.0, 40.0, 39.0, 35.0, 30.0, 40.0, 25.0, 21.0, 19.0, 17.0, 13.0, 12.0, 10.0, 8.0, 8.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001951456069946289, -0.000188460573554039, -0.0001817755401134491, -0.0001750905066728592, -0.0001684054732322693, -0.00016172043979167938, -0.00015503540635108948, -0.00014835037291049957, -0.00014166533946990967, -0.00013498030602931976, -0.00012829527258872986, -0.00012161023914813995, -0.00011492520570755005, -0.00010824017226696014, -0.00010155513882637024, -9.487010538578033e-05, -8.818507194519043e-05, -8.150003850460052e-05, -7.481500506401062e-05, -6.812997162342072e-05, -6.144493818283081e-05, -5.4759904742240906e-05, -4.8074871301651e-05, -4.1389837861061096e-05, -3.470480442047119e-05, -2.8019770979881287e-05, -2.1334737539291382e-05, -1.4649704098701477e-05, -7.964670658111572e-06, -1.2796372175216675e-06, 5.405396223068237e-06, 1.2090429663658142e-05, 1.8775463104248047e-05, 2.546049654483795e-05, 3.2145529985427856e-05, 3.883056342601776e-05, 4.5515596866607666e-05, 5.220063030719757e-05, 5.8885663747787476e-05, 6.557069718837738e-05, 7.225573062896729e-05, 7.894076406955719e-05, 8.56257975101471e-05, 9.2310830950737e-05, 9.89958643913269e-05, 0.00010568089783191681, 0.00011236593127250671, 0.00011905096471309662, 0.00012573599815368652, 0.00013242103159427643, 0.00013910606503486633, 0.00014579109847545624, 0.00015247613191604614, 0.00015916116535663605, 0.00016584619879722595, 0.00017253123223781586, 0.00017921626567840576, 0.00018590129911899567, 0.00019258633255958557, 0.00019927136600017548, 0.00020595639944076538, 0.00021264143288135529, 0.0002193264663219452, 0.0002260114997625351, 0.000232696533203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 8.0, 3.0, 15.0, 21.0, 34.0, 38.0, 64.0, 112.0, 137.0, 260.0, 413.0, 629.0, 1054.0, 1632.0, 2637.0, 4208.0, 6984.0, 10963.0, 17242.0, 26361.0, 39043.0, 55645.0, 74100.0, 92086.0, 106814.0, 113155.0, 110837.0, 99630.0, 82747.0, 64651.0, 46827.0, 32069.0, 21421.0, 13817.0, 8688.0, 5358.0, 3329.0, 2026.0, 1249.0, 818.0, 515.0, 316.0, 211.0, 128.0, 92.0, 57.0, 38.0, 17.0, 32.0, 16.0, 8.0, 7.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7041015625, -1.6468048095703125, -1.589508056640625, -1.5322113037109375, -1.47491455078125, -1.4176177978515625, -1.360321044921875, -1.3030242919921875, -1.2457275390625, -1.1884307861328125, -1.131134033203125, -1.0738372802734375, -1.01654052734375, -0.9592437744140625, -0.901947021484375, -0.8446502685546875, -0.787353515625, -0.7300567626953125, -0.672760009765625, -0.6154632568359375, -0.55816650390625, -0.5008697509765625, -0.443572998046875, -0.3862762451171875, -0.3289794921875, -0.2716827392578125, -0.214385986328125, -0.1570892333984375, -0.09979248046875, -0.0424957275390625, 0.014801025390625, 0.0720977783203125, 0.12939453125, 0.1866912841796875, 0.243988037109375, 0.3012847900390625, 0.35858154296875, 0.4158782958984375, 0.473175048828125, 0.5304718017578125, 0.5877685546875, 0.6450653076171875, 0.702362060546875, 0.7596588134765625, 0.81695556640625, 0.8742523193359375, 0.931549072265625, 0.9888458251953125, 1.046142578125, 1.1034393310546875, 1.160736083984375, 1.2180328369140625, 1.27532958984375, 1.3326263427734375, 1.389923095703125, 1.4472198486328125, 1.5045166015625, 1.5618133544921875, 1.619110107421875, 1.6764068603515625, 1.73370361328125, 1.7910003662109375, 1.848297119140625, 1.9055938720703125, 1.962890625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 3.0, 5.0, 4.0, 7.0, 11.0, 9.0, 17.0, 20.0, 19.0, 16.0, 25.0, 18.0, 31.0, 30.0, 46.0, 31.0, 58.0, 39.0, 48.0, 43.0, 39.0, 41.0, 47.0, 37.0, 30.0, 45.0, 30.0, 34.0, 40.0, 22.0, 31.0, 17.0, 9.0, 20.0, 14.0, 11.0, 14.0, 9.0, 6.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74853515625, -0.7213592529296875, -0.694183349609375, -0.6670074462890625, -0.63983154296875, -0.6126556396484375, -0.585479736328125, -0.5583038330078125, -0.5311279296875, -0.5039520263671875, -0.476776123046875, -0.4496002197265625, -0.42242431640625, -0.3952484130859375, -0.368072509765625, -0.3408966064453125, -0.313720703125, -0.2865447998046875, -0.259368896484375, -0.2321929931640625, -0.20501708984375, -0.1778411865234375, -0.150665283203125, -0.1234893798828125, -0.0963134765625, -0.0691375732421875, -0.041961669921875, -0.0147857666015625, 0.01239013671875, 0.0395660400390625, 0.066741943359375, 0.0939178466796875, 0.12109375, 0.1482696533203125, 0.175445556640625, 0.2026214599609375, 0.22979736328125, 0.2569732666015625, 0.284149169921875, 0.3113250732421875, 0.3385009765625, 0.3656768798828125, 0.392852783203125, 0.4200286865234375, 0.44720458984375, 0.4743804931640625, 0.501556396484375, 0.5287322998046875, 0.555908203125, 0.5830841064453125, 0.610260009765625, 0.6374359130859375, 0.66461181640625, 0.6917877197265625, 0.718963623046875, 0.7461395263671875, 0.7733154296875, 0.8004913330078125, 0.827667236328125, 0.8548431396484375, 0.88201904296875, 0.9091949462890625, 0.936370849609375, 0.9635467529296875, 0.99072265625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 8.0, 7.0, 8.0, 5.0, 10.0, 13.0, 15.0, 22.0, 36.0, 29.0, 35.0, 28.0, 45.0, 42.0, 44.0, 40.0, 46.0, 56.0, 48.0, 53.0, 43.0, 52.0, 47.0, 36.0, 34.0, 32.0, 39.0, 19.0, 29.0, 21.0, 12.0, 10.0, 7.0, 5.0, 9.0, 3.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.993473052978516, -10.703258514404297, -10.413044929504395, -10.122830390930176, -9.832615852355957, -9.542402267456055, -9.252187728881836, -8.961973190307617, -8.671759605407715, -8.381545066833496, -8.091331481933594, -7.801116943359375, -7.5109028816223145, -7.220688819885254, -6.930474281311035, -6.640260219573975, -6.350045680999756, -6.059831619262695, -5.769617080688477, -5.479403018951416, -5.1891889572143555, -4.898974418640137, -4.608760356903076, -4.318546295166016, -4.028331756591797, -3.7381174564361572, -3.4479033946990967, -3.157689094543457, -2.8674750328063965, -2.577260732650757, -2.287046432495117, -1.9968323707580566, -1.7066187858581543, -1.4164046049118042, -1.126190423965454, -0.8359761238098145, -0.5457619428634644, -0.25554776191711426, 0.03466653823852539, 0.32488059997558594, 0.6150949001312256, 0.9053090810775757, 1.1955232620239258, 1.4857375621795654, 1.7759517431259155, 2.0661659240722656, 2.3563802242279053, 2.646594285964966, 2.9368085861206055, 3.227022886276245, 3.5172369480133057, 3.8074512481689453, 4.097665309906006, 4.387879371643066, 4.678093910217285, 4.968307971954346, 5.258522033691406, 5.548736095428467, 5.8389506340026855, 6.129164695739746, 6.419378757476807, 6.709592819213867, 6.999807357788086, 7.2900214195251465, 7.580235958099365]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 9.0, 9.0, 10.0, 12.0, 18.0, 16.0, 14.0, 26.0, 23.0, 31.0, 25.0, 25.0, 27.0, 31.0, 40.0, 41.0, 32.0, 52.0, 40.0, 51.0, 55.0, 40.0, 44.0, 45.0, 51.0, 35.0, 34.0, 25.0, 30.0, 23.0, 24.0, 11.0, 13.0, 13.0, 7.0, 7.0, 8.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0049409866333, -9.630271911621094, -9.25560188293457, -8.880932807922363, -8.50626277923584, -8.131593704223633, -7.756924152374268, -7.382254600524902, -7.007585525512695, -6.63291597366333, -6.258246421813965, -5.883577346801758, -5.508907794952393, -5.134238243103027, -4.759568691253662, -4.384899139404297, -4.010229587554932, -3.6355600357055664, -3.2608907222747803, -2.886221170425415, -2.511551856994629, -2.1368823051452637, -1.7622127532958984, -1.3875434398651123, -1.012873888015747, -0.6382044553756714, -0.2635349631309509, 0.11113452911376953, 0.4858039617538452, 0.8604733943939209, 1.2351429462432861, 1.6098122596740723, 1.9844818115234375, 2.3591513633728027, 2.733820676803589, 3.108490228652954, 3.4831595420837402, 3.8578290939331055, 4.232498645782471, 4.607168197631836, 4.981837272644043, 5.356506824493408, 5.731176376342773, 6.1058454513549805, 6.480515003204346, 6.855184555053711, 7.229854106903076, 7.604523658752441, 7.979193210601807, 8.353862762451172, 8.728531837463379, 9.103201866149902, 9.47787094116211, 9.852540969848633, 10.22721004486084, 10.601879119873047, 10.97654914855957, 11.351218223571777, 11.7258882522583, 12.100557327270508, 12.475227355957031, 12.849896430969238, 13.224565505981445, 13.599235534667969, 13.973904609680176]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 8.0, 10.0, 25.0, 32.0, 29.0, 76.0, 77.0, 136.0, 161.0, 214.0, 316.0, 458.0, 632.0, 820.0, 1151.0, 1551.0, 2027.0, 2878.0, 3980.0, 5494.0, 7366.0, 1002805.0, 5604.0, 3959.0, 2945.0, 2142.0, 1568.0, 1166.0, 793.0, 614.0, 463.0, 322.0, 210.0, 183.0, 132.0, 84.0, 47.0, 35.0, 34.0, 12.0, 14.0, 8.0, 4.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-86.43949890136719, -83.82079315185547, -81.20208740234375, -78.58338165283203, -75.96467590332031, -73.3459701538086, -70.72726440429688, -68.10855865478516, -65.48985290527344, -62.87114715576172, -60.25244140625, -57.63373565673828, -55.01502990722656, -52.396324157714844, -49.777618408203125, -47.158912658691406, -44.54020690917969, -41.92150115966797, -39.30279541015625, -36.68408966064453, -34.06538391113281, -31.446678161621094, -28.827972412109375, -26.209266662597656, -23.590560913085938, -20.97185516357422, -18.3531494140625, -15.734443664550781, -13.115737915039062, -10.497032165527344, -7.878326416015625, -5.259620666503906, -2.6409225463867188, -0.022216796875, 2.5964889526367188, 5.2151947021484375, 7.833900451660156, 10.452606201171875, 13.071311950683594, 15.690017700195312, 18.30872344970703, 20.92742919921875, 23.54613494873047, 26.164840698242188, 28.783546447753906, 31.402252197265625, 34.020957946777344, 36.63966369628906, 39.25836944580078, 41.8770751953125, 44.49578094482422, 47.11448669433594, 49.733192443847656, 52.351898193359375, 54.970603942871094, 57.58930969238281, 60.20801544189453, 62.82672119140625, 65.44542694091797, 68.06413269042969, 70.6828384399414, 73.30154418945312, 75.92024993896484, 78.53895568847656, 81.15766143798828]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 4.0, 6.0, 11.0, 8.0, 15.0, 21.0, 22.0, 37.0, 37.0, 48.0, 54.0, 80.0, 93.0, 156.0, 192.0, 289.0, 420.0, 674.0, 922.0, 1341.0, 1798.0, 2984.0, 7156.0, 16331.0, 25800.0, 28678.0, 31650.0, 51165136.0, 87241.0, 25793.0, 27386.0, 22392.0, 11993.0, 4724.0, 2386.0, 1614.0, 1201.0, 832.0, 498.0, 350.0, 235.0, 180.0, 122.0, 112.0, 76.0, 59.0, 51.0, 41.0, 18.0, 20.0, 21.0, 11.0, 14.0, 9.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-493.5422668457031, -477.50006103515625, -461.4578552246094, -445.4156494140625, -429.3734436035156, -413.33123779296875, -397.2890319824219, -381.246826171875, -365.2046203613281, -349.16241455078125, -333.1202087402344, -317.0780029296875, -301.0357971191406, -284.99359130859375, -268.9513854980469, -252.9091796875, -236.86697387695312, -220.82476806640625, -204.78256225585938, -188.7403564453125, -172.69815063476562, -156.65594482421875, -140.61373901367188, -124.571533203125, -108.52932739257812, -92.48712158203125, -76.44491577148438, -60.4027099609375, -44.360504150390625, -28.31829833984375, -12.276092529296875, 3.76611328125, 19.808349609375, 35.850555419921875, 51.89276123046875, 67.93496704101562, 83.9771728515625, 100.01937866210938, 116.06158447265625, 132.10379028320312, 148.14599609375, 164.18820190429688, 180.23040771484375, 196.27261352539062, 212.3148193359375, 228.35702514648438, 244.39923095703125, 260.4414367675781, 276.483642578125, 292.5258483886719, 308.56805419921875, 324.6102600097656, 340.6524658203125, 356.6946716308594, 372.73687744140625, 388.7790832519531, 404.8212890625, 420.8634948730469, 436.90570068359375, 452.9479064941406, 468.9901123046875, 485.0323181152344, 501.07452392578125, 517.11669921875, 533.158935546875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 11.0, 7.0, 17.0, 29.0, 28.0, 35.0, 66.0, 80.0, 141.0, 235.0, 338.0, 472.0, 689.0, 970.0, 1575.0, 2344.0, 3438.0, 5368.0, 8679.0, 14230.0, 23366.0, 38818.0, 65619.0, 115049.0, 215279.0, 517524.0, 3749840.0, 891103.0, 288303.0, 146322.0, 81837.0, 46509.0, 27982.0, 16868.0, 10374.0, 6557.0, 3964.0, 2452.0, 1617.0, 1060.0, 749.0, 511.0, 322.0, 228.0, 149.0, 100.0, 76.0, 32.0, 36.0, 13.0, 9.0, 6.0, 9.0, 2.0, 1.0, 3.0], "bins": [-10.3671875, -10.068359375, -9.76953125, -9.470703125, -9.171875, -8.873046875, -8.57421875, -8.275390625, -7.9765625, -7.677734375, -7.37890625, -7.080078125, -6.78125, -6.482421875, -6.18359375, -5.884765625, -5.5859375, -5.287109375, -4.98828125, -4.689453125, -4.390625, -4.091796875, -3.79296875, -3.494140625, -3.1953125, -2.896484375, -2.59765625, -2.298828125, -2.0, -1.701171875, -1.40234375, -1.103515625, -0.8046875, -0.505859375, -0.20703125, 0.091796875, 0.390625, 0.689453125, 0.98828125, 1.287109375, 1.5859375, 1.884765625, 2.18359375, 2.482421875, 2.78125, 3.080078125, 3.37890625, 3.677734375, 3.9765625, 4.275390625, 4.57421875, 4.873046875, 5.171875, 5.470703125, 5.76953125, 6.068359375, 6.3671875, 6.666015625, 6.96484375, 7.263671875, 7.5625, 7.861328125, 8.16015625, 8.458984375, 8.7578125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 11.0, 9.0, 16.0, 23.0, 19.0, 33.0, 22.0, 36.0, 25.0, 35.0, 45.0, 48.0, 52.0, 68.0, 125.0, 182.0, 454.0, 237.0, 124.0, 81.0, 53.0, 43.0, 36.0, 44.0, 38.0, 29.0, 19.0, 15.0, 23.0, 17.0, 8.0, 10.0, 9.0, 3.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.2265625, -14.7987060546875, -14.370849609375, -13.9429931640625, -13.51513671875, -13.0872802734375, -12.659423828125, -12.2315673828125, -11.8037109375, -11.3758544921875, -10.947998046875, -10.5201416015625, -10.09228515625, -9.6644287109375, -9.236572265625, -8.8087158203125, -8.380859375, -7.9530029296875, -7.525146484375, -7.0972900390625, -6.66943359375, -6.2415771484375, -5.813720703125, -5.3858642578125, -4.9580078125, -4.5301513671875, -4.102294921875, -3.6744384765625, -3.24658203125, -2.8187255859375, -2.390869140625, -1.9630126953125, -1.53515625, -1.1072998046875, -0.679443359375, -0.2515869140625, 0.17626953125, 0.6041259765625, 1.031982421875, 1.4598388671875, 1.8876953125, 2.3155517578125, 2.743408203125, 3.1712646484375, 3.59912109375, 4.0269775390625, 4.454833984375, 4.8826904296875, 5.310546875, 5.7384033203125, 6.166259765625, 6.5941162109375, 7.02197265625, 7.4498291015625, 7.877685546875, 8.3055419921875, 8.7333984375, 9.1612548828125, 9.589111328125, 10.0169677734375, 10.44482421875, 10.8726806640625, 11.300537109375, 11.7283935546875, 12.15625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [11.0, 3.0, 4.0, 12.0, 2.0, 6.0, 27.0, 19.0, 35.0, 44.0, 71.0, 70.0, 127.0, 202.0, 291.0, 406.0, 554.0, 978.0, 1547.0, 2377.0, 4110.0, 6885.0, 11769.0, 20698.0, 37361.0, 69041.0, 131833.0, 268371.0, 775126.0, 4006499.0, 502000.0, 212169.0, 108834.0, 56750.0, 30834.0, 17288.0, 9926.0, 5826.0, 3358.0, 2068.0, 1461.0, 897.0, 516.0, 316.0, 247.0, 163.0, 95.0, 60.0, 34.0, 35.0, 42.0, 27.0, 6.0, 3.0, 7.0, 1.0, 5.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-7.87890625, -7.61041259765625, -7.3419189453125, -7.07342529296875, -6.804931640625, -6.53643798828125, -6.2679443359375, -5.99945068359375, -5.73095703125, -5.46246337890625, -5.1939697265625, -4.92547607421875, -4.656982421875, -4.38848876953125, -4.1199951171875, -3.85150146484375, -3.5830078125, -3.31451416015625, -3.0460205078125, -2.77752685546875, -2.509033203125, -2.24053955078125, -1.9720458984375, -1.70355224609375, -1.43505859375, -1.16656494140625, -0.8980712890625, -0.62957763671875, -0.361083984375, -0.09259033203125, 0.1759033203125, 0.44439697265625, 0.712890625, 0.98138427734375, 1.2498779296875, 1.51837158203125, 1.786865234375, 2.05535888671875, 2.3238525390625, 2.59234619140625, 2.86083984375, 3.12933349609375, 3.3978271484375, 3.66632080078125, 3.934814453125, 4.20330810546875, 4.4718017578125, 4.74029541015625, 5.0087890625, 5.27728271484375, 5.5457763671875, 5.81427001953125, 6.082763671875, 6.35125732421875, 6.6197509765625, 6.88824462890625, 7.15673828125, 7.42523193359375, 7.6937255859375, 7.96221923828125, 8.230712890625, 8.49920654296875, 8.7677001953125, 9.03619384765625, 9.3046875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 10.0, 13.0, 9.0, 8.0, 12.0, 17.0, 27.0, 36.0, 23.0, 38.0, 50.0, 46.0, 44.0, 66.0, 109.0, 231.0, 556.0, 216.0, 103.0, 64.0, 58.0, 36.0, 44.0, 29.0, 31.0, 27.0, 30.0, 15.0, 24.0, 17.0, 12.0, 7.0, 2.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2265625, -9.8536376953125, -9.480712890625, -9.1077880859375, -8.73486328125, -8.3619384765625, -7.989013671875, -7.6160888671875, -7.2431640625, -6.8702392578125, -6.497314453125, -6.1243896484375, -5.75146484375, -5.3785400390625, -5.005615234375, -4.6326904296875, -4.259765625, -3.8868408203125, -3.513916015625, -3.1409912109375, -2.76806640625, -2.3951416015625, -2.022216796875, -1.6492919921875, -1.2763671875, -0.9034423828125, -0.530517578125, -0.1575927734375, 0.21533203125, 0.5882568359375, 0.961181640625, 1.3341064453125, 1.70703125, 2.0799560546875, 2.452880859375, 2.8258056640625, 3.19873046875, 3.5716552734375, 3.944580078125, 4.3175048828125, 4.6904296875, 5.0633544921875, 5.436279296875, 5.8092041015625, 6.18212890625, 6.5550537109375, 6.927978515625, 7.3009033203125, 7.673828125, 8.0467529296875, 8.419677734375, 8.7926025390625, 9.16552734375, 9.5384521484375, 9.911376953125, 10.2843017578125, 10.6572265625, 11.0301513671875, 11.403076171875, 11.7760009765625, 12.14892578125, 12.5218505859375, 12.894775390625, 13.2677001953125, 13.640625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 2.0, 9.0, 7.0, 1.0, 11.0, 17.0, 12.0, 41.0, 57.0, 72.0, 123.0, 89.0, 119.0, 164.0, 233.0, 386.0, 516.0, 572.0, 919.0, 1333.0, 1967.0, 3442.0, 5979.0, 12513.0, 30083.0, 113894.0, 5944462.0, 115456.0, 30083.0, 12433.0, 6133.0, 3421.0, 2272.0, 1321.0, 908.0, 688.0, 452.0, 326.0, 222.0, 140.0, 122.0, 97.0, 78.0, 68.0, 67.0, 43.0, 29.0, 14.0, 12.0, 3.0, 7.0, 2.0, 0.0, 6.0, 5.0, 3.0, 7.0], "bins": [-21.0625, -20.433837890625, -19.80517578125, -19.176513671875, -18.5478515625, -17.919189453125, -17.29052734375, -16.661865234375, -16.033203125, -15.404541015625, -14.77587890625, -14.147216796875, -13.5185546875, -12.889892578125, -12.26123046875, -11.632568359375, -11.00390625, -10.375244140625, -9.74658203125, -9.117919921875, -8.4892578125, -7.860595703125, -7.23193359375, -6.603271484375, -5.974609375, -5.345947265625, -4.71728515625, -4.088623046875, -3.4599609375, -2.831298828125, -2.20263671875, -1.573974609375, -0.9453125, -0.316650390625, 0.31201171875, 0.940673828125, 1.5693359375, 2.197998046875, 2.82666015625, 3.455322265625, 4.083984375, 4.712646484375, 5.34130859375, 5.969970703125, 6.5986328125, 7.227294921875, 7.85595703125, 8.484619140625, 9.11328125, 9.741943359375, 10.37060546875, 10.999267578125, 11.6279296875, 12.256591796875, 12.88525390625, 13.513916015625, 14.142578125, 14.771240234375, 15.39990234375, 16.028564453125, 16.6572265625, 17.285888671875, 17.91455078125, 18.543212890625, 19.171875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 4.0, 5.0, 6.0, 5.0, 10.0, 6.0, 10.0, 15.0, 12.0, 22.0, 19.0, 29.0, 36.0, 33.0, 35.0, 51.0, 60.0, 77.0, 107.0, 180.0, 502.0, 231.0, 122.0, 75.0, 57.0, 35.0, 35.0, 33.0, 31.0, 34.0, 21.0, 21.0, 22.0, 16.0, 11.0, 15.0, 6.0, 10.0, 10.0, 11.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.109375, -7.86798095703125, -7.6265869140625, -7.38519287109375, -7.143798828125, -6.90240478515625, -6.6610107421875, -6.41961669921875, -6.17822265625, -5.93682861328125, -5.6954345703125, -5.45404052734375, -5.212646484375, -4.97125244140625, -4.7298583984375, -4.48846435546875, -4.2470703125, -4.00567626953125, -3.7642822265625, -3.52288818359375, -3.281494140625, -3.04010009765625, -2.7987060546875, -2.55731201171875, -2.31591796875, -2.07452392578125, -1.8331298828125, -1.59173583984375, -1.350341796875, -1.10894775390625, -0.8675537109375, -0.62615966796875, -0.384765625, -0.14337158203125, 0.0980224609375, 0.33941650390625, 0.580810546875, 0.82220458984375, 1.0635986328125, 1.30499267578125, 1.54638671875, 1.78778076171875, 2.0291748046875, 2.27056884765625, 2.511962890625, 2.75335693359375, 2.9947509765625, 3.23614501953125, 3.4775390625, 3.71893310546875, 3.9603271484375, 4.20172119140625, 4.443115234375, 4.68450927734375, 4.9259033203125, 5.16729736328125, 5.40869140625, 5.65008544921875, 5.8914794921875, 6.13287353515625, 6.374267578125, 6.61566162109375, 6.8570556640625, 7.09844970703125, 7.33984375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 8.0, 17.0, 42.0, 154.0, 508.0, 182.0, 47.0, 23.0, 6.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.06907081604004, -14.678471565246582, -13.287871360778809, -11.897272109985352, -10.506671905517578, -9.116072654724121, -7.725473403930664, -6.334873199462891, -4.944273948669434, -3.5536742210388184, -2.1630747318267822, -0.7724752426147461, 0.6181244850158691, 2.0087242126464844, 3.3993234634399414, 4.789923667907715, 6.180522918701172, 7.571122646331787, 8.961722373962402, 10.35232162475586, 11.742921829223633, 13.13352108001709, 14.524120330810547, 15.91472053527832, 17.305320739746094, 18.695920944213867, 20.086519241333008, 21.47711944580078, 22.867719650268555, 24.258319854736328, 25.64891815185547, 27.039518356323242, 28.430118560791016, 29.82071876525879, 31.21131706237793, 32.6019172668457, 33.992515563964844, 35.38311767578125, 36.77371597290039, 38.16431427001953, 39.55491638183594, 40.94551467895508, 42.336116790771484, 43.726715087890625, 45.117313385009766, 46.50791549682617, 47.89851379394531, 49.28911590576172, 50.679710388183594, 52.070308685302734, 53.46091079711914, 54.85150909423828, 56.24210739135742, 57.63270950317383, 59.02330780029297, 60.413909912109375, 61.804508209228516, 63.195106506347656, 64.58570861816406, 65.97630310058594, 67.36690521240234, 68.75750732421875, 70.14810180664062, 71.53870391845703, 72.92930603027344]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 2.0, 8.0, 9.0, 13.0, 17.0, 10.0, 19.0, 25.0, 13.0, 22.0, 29.0, 32.0, 42.0, 38.0, 35.0, 39.0, 40.0, 51.0, 42.0, 43.0, 43.0, 42.0, 46.0, 35.0, 24.0, 28.0, 35.0, 39.0, 35.0, 26.0, 15.0, 12.0, 20.0, 15.0, 14.0, 15.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.190006256103516, -10.849928855895996, -10.509851455688477, -10.169774055480957, -9.829696655273438, -9.489619255065918, -9.149541854858398, -8.809464454650879, -8.46938705444336, -8.12930965423584, -7.78923225402832, -7.449154853820801, -7.109077453613281, -6.769000053405762, -6.428922653198242, -6.088845252990723, -5.748767375946045, -5.408689975738525, -5.068612575531006, -4.728535175323486, -4.388457775115967, -4.048380374908447, -3.7083027362823486, -3.368225336074829, -3.0281479358673096, -2.68807053565979, -2.3479931354522705, -2.007915496826172, -1.667838215827942, -1.3277608156204224, -0.9876832962036133, -0.6476058959960938, -0.3075284957885742, 0.0325489342212677, 0.3726263642311096, 0.7127038240432739, 1.0527812242507935, 1.392858624458313, 1.732936143875122, 2.0730135440826416, 2.413090944290161, 2.7531683444976807, 3.0932457447052, 3.433323383331299, 3.7734007835388184, 4.113478183746338, 4.453555583953857, 4.793632984161377, 5.1337103843688965, 5.473787784576416, 5.8138651847839355, 6.153942584991455, 6.494019985198975, 6.834097385406494, 7.174175262451172, 7.514252662658691, 7.854330062866211, 8.19440746307373, 8.53448486328125, 8.87456226348877, 9.214639663696289, 9.554717063903809, 9.894794464111328, 10.234871864318848, 10.574949264526367]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 5.0, 5.0, 3.0, 3.0, 5.0, 8.0, 10.0, 6.0, 21.0, 16.0, 18.0, 26.0, 27.0, 45.0, 66.0, 79.0, 80.0, 116.0, 145.0, 186.0, 249.0, 353.0, 507.0, 751.0, 1195.0, 1958.0, 3995.0, 10135.0, 37819.0, 727981.0, 3342614.0, 43292.0, 11575.0, 4608.0, 2312.0, 1324.0, 844.0, 542.0, 379.0, 264.0, 200.0, 130.0, 89.0, 82.0, 52.0, 42.0, 28.0, 27.0, 18.0, 17.0, 10.0, 6.0, 10.0, 5.0, 5.0, 3.0, 1.0], "bins": [-0.0352783203125, -0.034325361251831055, -0.03337240219116211, -0.032419443130493164, -0.03146648406982422, -0.030513525009155273, -0.029560565948486328, -0.028607606887817383, -0.027654647827148438, -0.026701688766479492, -0.025748729705810547, -0.0247957706451416, -0.023842811584472656, -0.02288985252380371, -0.021936893463134766, -0.02098393440246582, -0.020030975341796875, -0.01907801628112793, -0.018125057220458984, -0.01717209815979004, -0.016219139099121094, -0.015266180038452148, -0.014313220977783203, -0.013360261917114258, -0.012407302856445312, -0.011454343795776367, -0.010501384735107422, -0.009548425674438477, -0.008595466613769531, -0.007642507553100586, -0.006689548492431641, -0.005736589431762695, -0.00478363037109375, -0.0038306713104248047, -0.0028777122497558594, -0.001924753189086914, -0.0009717941284179688, -1.8835067749023438e-05, 0.0009341239929199219, 0.0018870830535888672, 0.0028400421142578125, 0.003793001174926758, 0.004745960235595703, 0.0056989192962646484, 0.006651878356933594, 0.007604837417602539, 0.008557796478271484, 0.00951075553894043, 0.010463714599609375, 0.01141667366027832, 0.012369632720947266, 0.013322591781616211, 0.014275550842285156, 0.015228509902954102, 0.016181468963623047, 0.017134428024291992, 0.018087387084960938, 0.019040346145629883, 0.019993305206298828, 0.020946264266967773, 0.02189922332763672, 0.022852182388305664, 0.02380514144897461, 0.024758100509643555, 0.0257110595703125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 5.0, 4.0, 3.0, 5.0, 9.0, 13.0, 6.0, 11.0, 22.0, 13.0, 772.0, 22.0, 9.0, 18.0, 11.0, 5.0, 8.0, 9.0, 3.0, 7.0, 6.0, 7.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.004955291748046875, -0.004811882972717285, -0.004668474197387695, -0.0045250654220581055, -0.004381656646728516, -0.004238247871398926, -0.004094839096069336, -0.003951430320739746, -0.0038080215454101562, -0.0036646127700805664, -0.0035212039947509766, -0.0033777952194213867, -0.003234386444091797, -0.003090977668762207, -0.002947568893432617, -0.0028041601181030273, -0.0026607513427734375, -0.0025173425674438477, -0.002373933792114258, -0.002230525016784668, -0.002087116241455078, -0.0019437074661254883, -0.0018002986907958984, -0.0016568899154663086, -0.0015134811401367188, -0.001370072364807129, -0.001226663589477539, -0.0010832548141479492, -0.0009398460388183594, -0.0007964372634887695, -0.0006530284881591797, -0.0005096197128295898, -0.0003662109375, -0.00022280216217041016, -7.939338684082031e-05, 6.401538848876953e-05, 0.00020742416381835938, 0.0003508329391479492, 0.0004942417144775391, 0.0006376504898071289, 0.0007810592651367188, 0.0009244680404663086, 0.0010678768157958984, 0.0012112855911254883, 0.0013546943664550781, 0.001498103141784668, 0.0016415119171142578, 0.0017849206924438477, 0.0019283294677734375, 0.0020717382431030273, 0.002215147018432617, 0.002358555793762207, 0.002501964569091797, 0.0026453733444213867, 0.0027887821197509766, 0.0029321908950805664, 0.0030755996704101562, 0.003219008445739746, 0.003362417221069336, 0.0035058259963989258, 0.0036492347717285156, 0.0037926435470581055, 0.003936052322387695, 0.004079461097717285, 0.004222869873046875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 2.0, 6.0, 8.0, 4.0, 7.0, 14.0, 18.0, 33.0, 39.0, 52.0, 62.0, 118.0, 212.0, 385.0, 654.0, 1459.0, 3658.0, 16445.0, 303524.0, 3750405.0, 101833.0, 9969.0, 2791.0, 1129.0, 552.0, 310.0, 178.0, 118.0, 83.0, 59.0, 43.0, 25.0, 24.0, 16.0, 14.0, 9.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.046783447265625, -0.04546070098876953, -0.04413795471191406, -0.042815208435058594, -0.041492462158203125, -0.040169715881347656, -0.03884696960449219, -0.03752422332763672, -0.03620147705078125, -0.03487873077392578, -0.03355598449707031, -0.032233238220214844, -0.030910491943359375, -0.029587745666503906, -0.028264999389648438, -0.02694225311279297, -0.0256195068359375, -0.02429676055908203, -0.022974014282226562, -0.021651268005371094, -0.020328521728515625, -0.019005775451660156, -0.017683029174804688, -0.01636028289794922, -0.01503753662109375, -0.013714790344238281, -0.012392044067382812, -0.011069297790527344, -0.009746551513671875, -0.008423805236816406, -0.0071010589599609375, -0.005778312683105469, -0.00445556640625, -0.0031328201293945312, -0.0018100738525390625, -0.00048732757568359375, 0.000835418701171875, 0.0021581649780273438, 0.0034809112548828125, 0.004803657531738281, 0.00612640380859375, 0.007449150085449219, 0.008771896362304688, 0.010094642639160156, 0.011417388916015625, 0.012740135192871094, 0.014062881469726562, 0.015385627746582031, 0.0167083740234375, 0.01803112030029297, 0.019353866577148438, 0.020676612854003906, 0.021999359130859375, 0.023322105407714844, 0.024644851684570312, 0.02596759796142578, 0.02729034423828125, 0.02861309051513672, 0.029935836791992188, 0.031258583068847656, 0.032581329345703125, 0.033904075622558594, 0.03522682189941406, 0.03654956817626953, 0.037872314453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 0.0, 8.0, 10.0, 11.0, 12.0, 12.0, 21.0, 27.0, 36.0, 56.0, 73.0, 110.0, 206.0, 298.0, 480.0, 692.0, 773.0, 433.0, 304.0, 170.0, 102.0, 85.0, 62.0, 24.0, 17.0, 13.0, 8.0, 8.0, 5.0, 8.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00644683837890625, -0.0062247514724731445, -0.006002664566040039, -0.005780577659606934, -0.005558490753173828, -0.005336403846740723, -0.005114316940307617, -0.004892230033874512, -0.004670143127441406, -0.004448056221008301, -0.004225969314575195, -0.00400388240814209, -0.0037817955017089844, -0.003559708595275879, -0.0033376216888427734, -0.003115534782409668, -0.0028934478759765625, -0.002671360969543457, -0.0024492740631103516, -0.002227187156677246, -0.0020051002502441406, -0.0017830133438110352, -0.0015609264373779297, -0.0013388395309448242, -0.0011167526245117188, -0.0008946657180786133, -0.0006725788116455078, -0.00045049190521240234, -0.00022840499877929688, -6.318092346191406e-06, 0.00021576881408691406, 0.00043785572052001953, 0.000659942626953125, 0.0008820295333862305, 0.001104116439819336, 0.0013262033462524414, 0.0015482902526855469, 0.0017703771591186523, 0.001992464065551758, 0.0022145509719848633, 0.0024366378784179688, 0.0026587247848510742, 0.0028808116912841797, 0.003102898597717285, 0.0033249855041503906, 0.003547072410583496, 0.0037691593170166016, 0.003991246223449707, 0.0042133331298828125, 0.004435420036315918, 0.0046575069427490234, 0.004879593849182129, 0.005101680755615234, 0.00532376766204834, 0.005545854568481445, 0.005767941474914551, 0.005990028381347656, 0.006212115287780762, 0.006434202194213867, 0.006656289100646973, 0.006878376007080078, 0.007100462913513184, 0.007322549819946289, 0.0075446367263793945, 0.0077667236328125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 8.0, 12.0, 48.0, 185.0, 367.0, 269.0, 72.0, 22.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.16172388195991516, -0.15854375064373016, -0.15536363422870636, -0.15218350291252136, -0.14900337159633636, -0.14582324028015137, -0.14264312386512756, -0.13946299254894257, -0.13628286123275757, -0.13310272991657257, -0.12992261350154877, -0.12674248218536377, -0.12356235086917877, -0.12038222700357437, -0.11720209568738937, -0.11402197182178497, -0.11084184050559998, -0.10766171663999557, -0.10448158532381058, -0.10130146145820618, -0.09812133014202118, -0.09494120627641678, -0.09176107496023178, -0.08858095109462738, -0.08540082722902298, -0.08222070336341858, -0.07904057204723358, -0.07586044818162918, -0.07268031686544418, -0.06950019299983978, -0.06632006168365479, -0.06313993781805038, -0.05995980277657509, -0.05677967518568039, -0.05359954759478569, -0.05041942000389099, -0.04723929241299629, -0.04405916482210159, -0.04087904095649719, -0.037698909640312195, -0.034518785774707794, -0.031338658183813095, -0.028158530592918396, -0.024978403002023697, -0.021798275411128998, -0.018618149682879448, -0.015438022091984749, -0.01225789450109005, -0.009077765047550201, -0.005897637456655502, -0.0027175103314220905, 0.00046261679381132126, 0.0036427443847060204, 0.006822871044278145, 0.010002998635172844, 0.013183126226067543, 0.016363253816962242, 0.01954338140785694, 0.02272350899875164, 0.02590363472700119, 0.02908376231789589, 0.03226388990879059, 0.03544401749968529, 0.03862414509057999, 0.041804272681474686]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 1.0, 6.0, 3.0, 7.0, 11.0, 12.0, 16.0, 16.0, 21.0, 26.0, 22.0, 32.0, 37.0, 44.0, 55.0, 56.0, 43.0, 54.0, 66.0, 61.0, 56.0, 52.0, 63.0, 38.0, 39.0, 29.0, 25.0, 29.0, 20.0, 11.0, 8.0, 4.0, 4.0, 7.0, 7.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02628767490386963, -0.02539699524641037, -0.02450631745159626, -0.02361563965678215, -0.02272495999932289, -0.021834280341863632, -0.020943602547049522, -0.020052924752235413, -0.019162245094776154, -0.018271565437316895, -0.017380887642502785, -0.016490209847688675, -0.015599530190229416, -0.014708851464092731, -0.013818172737956047, -0.012927494011819363, -0.012036815285682678, -0.011146136559545994, -0.01025545783340931, -0.009364779107272625, -0.00847410038113594, -0.007583421654999256, -0.006692742928862572, -0.005802064202725887, -0.004911385476589203, -0.0040207067504525185, -0.003130028024315834, -0.0022393492981791496, -0.0013486705720424652, -0.0004579918459057808, 0.0004326868802309036, 0.001323365606367588, 0.0022140443325042725, 0.003104723058640957, 0.003995401784777641, 0.004886080510914326, 0.00577675923705101, 0.0066674379631876945, 0.007558116689324379, 0.008448795415461063, 0.009339474141597748, 0.010230152867734432, 0.011120831593871117, 0.012011510320007801, 0.012902189046144485, 0.01379286777228117, 0.014683546498417854, 0.015574225224554539, 0.016464903950691223, 0.017355583608150482, 0.018246261402964592, 0.019136939197778702, 0.02002761885523796, 0.02091829851269722, 0.02180897630751133, 0.02269965410232544, 0.0235903337597847, 0.024481013417243958, 0.025371691212058067, 0.026262369006872177, 0.027153048664331436, 0.028043728321790695, 0.028934406116604805, 0.029825083911418915, 0.030715763568878174]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 4.0, 5.0, 5.0, 2.0, 8.0, 13.0, 7.0, 22.0, 24.0, 33.0, 48.0, 57.0, 76.0, 97.0, 138.0, 184.0, 243.0, 354.0, 480.0, 710.0, 1045.0, 1508.0, 2388.0, 3902.0, 6763.0, 13339.0, 30967.0, 739491.0, 192847.0, 25701.0, 11441.0, 6094.0, 3592.0, 2239.0, 1448.0, 1030.0, 598.0, 480.0, 330.0, 218.0, 129.0, 139.0, 89.0, 84.0, 53.0, 41.0, 14.0, 18.0, 17.0, 7.0, 9.0, 7.0, 3.0, 4.0, 5.0, 6.0, 2.0, 2.0, 3.0, 4.0], "bins": [-0.02996826171875, -0.029028892517089844, -0.028089523315429688, -0.02715015411376953, -0.026210784912109375, -0.02527141571044922, -0.024332046508789062, -0.023392677307128906, -0.02245330810546875, -0.021513938903808594, -0.020574569702148438, -0.01963520050048828, -0.018695831298828125, -0.01775646209716797, -0.016817092895507812, -0.015877723693847656, -0.0149383544921875, -0.013998985290527344, -0.013059616088867188, -0.012120246887207031, -0.011180877685546875, -0.010241508483886719, -0.009302139282226562, -0.008362770080566406, -0.00742340087890625, -0.006484031677246094, -0.0055446624755859375, -0.004605293273925781, -0.003665924072265625, -0.0027265548706054688, -0.0017871856689453125, -0.0008478164672851562, 9.1552734375e-05, 0.0010309219360351562, 0.0019702911376953125, 0.0029096603393554688, 0.003849029541015625, 0.004788398742675781, 0.0057277679443359375, 0.006667137145996094, 0.00760650634765625, 0.008545875549316406, 0.009485244750976562, 0.010424613952636719, 0.011363983154296875, 0.012303352355957031, 0.013242721557617188, 0.014182090759277344, 0.0151214599609375, 0.016060829162597656, 0.017000198364257812, 0.01793956756591797, 0.018878936767578125, 0.01981830596923828, 0.020757675170898438, 0.021697044372558594, 0.02263641357421875, 0.023575782775878906, 0.024515151977539062, 0.02545452117919922, 0.026393890380859375, 0.02733325958251953, 0.028272628784179688, 0.029211997985839844, 0.0301513671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 3.0, 6.0, 7.0, 10.0, 13.0, 17.0, 19.0, 39.0, 349.0, 366.0, 47.0, 18.0, 13.0, 9.0, 9.0, 7.0, 6.0, 8.0, 5.0, 2.0, 6.0, 5.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.004528045654296875, -0.004395127296447754, -0.004262208938598633, -0.004129290580749512, -0.003996372222900391, -0.0038634538650512695, -0.0037305355072021484, -0.0035976171493530273, -0.0034646987915039062, -0.003331780433654785, -0.003198862075805664, -0.003065943717956543, -0.002933025360107422, -0.0028001070022583008, -0.0026671886444091797, -0.0025342702865600586, -0.0024013519287109375, -0.0022684335708618164, -0.0021355152130126953, -0.0020025968551635742, -0.0018696784973144531, -0.001736760139465332, -0.001603841781616211, -0.0014709234237670898, -0.0013380050659179688, -0.0012050867080688477, -0.0010721683502197266, -0.0009392499923706055, -0.0008063316345214844, -0.0006734132766723633, -0.0005404949188232422, -0.0004075765609741211, -0.000274658203125, -0.0001417398452758789, -8.821487426757812e-06, 0.00012409687042236328, 0.0002570152282714844, 0.00038993358612060547, 0.0005228519439697266, 0.0006557703018188477, 0.0007886886596679688, 0.0009216070175170898, 0.001054525375366211, 0.001187443733215332, 0.0013203620910644531, 0.0014532804489135742, 0.0015861988067626953, 0.0017191171646118164, 0.0018520355224609375, 0.0019849538803100586, 0.0021178722381591797, 0.0022507905960083008, 0.002383708953857422, 0.002516627311706543, 0.002649545669555664, 0.002782464027404785, 0.0029153823852539062, 0.0030483007431030273, 0.0031812191009521484, 0.0033141374588012695, 0.0034470558166503906, 0.0035799741744995117, 0.003712892532348633, 0.003845810890197754, 0.003978729248046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 0.0, 8.0, 6.0, 10.0, 10.0, 16.0, 14.0, 16.0, 19.0, 35.0, 59.0, 75.0, 101.0, 133.0, 150.0, 230.0, 361.0, 494.0, 693.0, 1157.0, 1827.0, 3426.0, 7535.0, 26492.0, 336728.0, 614083.0, 36168.0, 8996.0, 3854.0, 2079.0, 1170.0, 766.0, 515.0, 355.0, 259.0, 171.0, 116.0, 97.0, 84.0, 69.0, 52.0, 27.0, 28.0, 25.0, 16.0, 11.0, 7.0, 5.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0482177734375, -0.04671525955200195, -0.045212745666503906, -0.04371023178100586, -0.04220771789550781, -0.040705204010009766, -0.03920269012451172, -0.03770017623901367, -0.036197662353515625, -0.03469514846801758, -0.03319263458251953, -0.031690120697021484, -0.030187606811523438, -0.02868509292602539, -0.027182579040527344, -0.025680065155029297, -0.02417755126953125, -0.022675037384033203, -0.021172523498535156, -0.01967000961303711, -0.018167495727539062, -0.016664981842041016, -0.015162467956542969, -0.013659954071044922, -0.012157440185546875, -0.010654926300048828, -0.009152412414550781, -0.007649898529052734, -0.0061473846435546875, -0.004644870758056641, -0.0031423568725585938, -0.0016398429870605469, -0.0001373291015625, 0.0013651847839355469, 0.0028676986694335938, 0.004370212554931641, 0.0058727264404296875, 0.007375240325927734, 0.008877754211425781, 0.010380268096923828, 0.011882781982421875, 0.013385295867919922, 0.014887809753417969, 0.016390323638916016, 0.017892837524414062, 0.01939535140991211, 0.020897865295410156, 0.022400379180908203, 0.02390289306640625, 0.025405406951904297, 0.026907920837402344, 0.02841043472290039, 0.029912948608398438, 0.031415462493896484, 0.03291797637939453, 0.03442049026489258, 0.035923004150390625, 0.03742551803588867, 0.03892803192138672, 0.040430545806884766, 0.04193305969238281, 0.04343557357788086, 0.044938087463378906, 0.04644060134887695, 0.047943115234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 10.0, 5.0, 11.0, 7.0, 11.0, 13.0, 18.0, 12.0, 24.0, 20.0, 20.0, 34.0, 30.0, 37.0, 32.0, 25.0, 41.0, 41.0, 29.0, 41.0, 35.0, 34.0, 38.0, 43.0, 48.0, 33.0, 33.0, 33.0, 19.0, 27.0, 33.0, 26.0, 16.0, 28.0, 13.0, 12.0, 17.0, 9.0, 7.0, 11.0, 8.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0186767578125, -0.018090248107910156, -0.017503738403320312, -0.01691722869873047, -0.016330718994140625, -0.01574420928955078, -0.015157699584960938, -0.014571189880371094, -0.01398468017578125, -0.013398170471191406, -0.012811660766601562, -0.012225151062011719, -0.011638641357421875, -0.011052131652832031, -0.010465621948242188, -0.009879112243652344, -0.0092926025390625, -0.008706092834472656, -0.008119583129882812, -0.007533073425292969, -0.006946563720703125, -0.006360054016113281, -0.0057735443115234375, -0.005187034606933594, -0.00460052490234375, -0.004014015197753906, -0.0034275054931640625, -0.0028409957885742188, -0.002254486083984375, -0.0016679763793945312, -0.0010814666748046875, -0.0004949569702148438, 9.1552734375e-05, 0.0006780624389648438, 0.0012645721435546875, 0.0018510818481445312, 0.002437591552734375, 0.0030241012573242188, 0.0036106109619140625, 0.004197120666503906, 0.00478363037109375, 0.005370140075683594, 0.0059566497802734375, 0.006543159484863281, 0.007129669189453125, 0.007716178894042969, 0.008302688598632812, 0.008889198303222656, 0.0094757080078125, 0.010062217712402344, 0.010648727416992188, 0.011235237121582031, 0.011821746826171875, 0.012408256530761719, 0.012994766235351562, 0.013581275939941406, 0.01416778564453125, 0.014754295349121094, 0.015340805053710938, 0.01592731475830078, 0.016513824462890625, 0.01710033416748047, 0.017686843872070312, 0.018273353576660156, 0.01885986328125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 6.0, 6.0, 10.0, 13.0, 20.0, 32.0, 60.0, 83.0, 142.0, 267.0, 571.0, 1383.0, 4882.0, 35172.0, 930973.0, 65147.0, 6582.0, 1781.0, 671.0, 330.0, 165.0, 103.0, 55.0, 35.0, 21.0, 13.0, 6.0, 4.0, 9.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046905517578125, -0.04507303237915039, -0.04324054718017578, -0.04140806198120117, -0.03957557678222656, -0.03774309158325195, -0.035910606384277344, -0.034078121185302734, -0.032245635986328125, -0.030413150787353516, -0.028580665588378906, -0.026748180389404297, -0.024915695190429688, -0.023083209991455078, -0.02125072479248047, -0.01941823959350586, -0.01758575439453125, -0.01575326919555664, -0.013920783996582031, -0.012088298797607422, -0.010255813598632812, -0.008423328399658203, -0.006590843200683594, -0.004758358001708984, -0.002925872802734375, -0.0010933876037597656, 0.0007390975952148438, 0.002571582794189453, 0.0044040679931640625, 0.006236553192138672, 0.008069038391113281, 0.00990152359008789, 0.0117340087890625, 0.01356649398803711, 0.015398979187011719, 0.017231464385986328, 0.019063949584960938, 0.020896434783935547, 0.022728919982910156, 0.024561405181884766, 0.026393890380859375, 0.028226375579833984, 0.030058860778808594, 0.0318913459777832, 0.03372383117675781, 0.03555631637573242, 0.03738880157470703, 0.03922128677368164, 0.04105377197265625, 0.04288625717163086, 0.04471874237060547, 0.04655122756958008, 0.04838371276855469, 0.0502161979675293, 0.052048683166503906, 0.053881168365478516, 0.055713653564453125, 0.057546138763427734, 0.059378623962402344, 0.06121110916137695, 0.06304359436035156, 0.06487607955932617, 0.06670856475830078, 0.06854104995727539, 0.07037353515625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 6.0, 3.0, 3.0, 3.0, 11.0, 15.0, 16.0, 13.0, 40.0, 60.0, 88.0, 223.0, 209.0, 118.0, 64.0, 37.0, 22.0, 13.0, 10.0, 4.0, 8.0, 3.0, 8.0, 3.0, 3.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008015632629394531, -0.0007804855704307556, -0.0007594078779220581, -0.0007383301854133606, -0.0007172524929046631, -0.0006961748003959656, -0.0006750971078872681, -0.0006540194153785706, -0.000632941722869873, -0.0006118640303611755, -0.000590786337852478, -0.0005697086453437805, -0.000548630952835083, -0.0005275532603263855, -0.000506475567817688, -0.0004853978753089905, -0.00046432018280029297, -0.00044324249029159546, -0.00042216479778289795, -0.00040108710527420044, -0.00038000941276550293, -0.0003589317202568054, -0.0003378540277481079, -0.0003167763352394104, -0.0002956986427307129, -0.0002746209502220154, -0.00025354325771331787, -0.00023246556520462036, -0.00021138787269592285, -0.00019031018018722534, -0.00016923248767852783, -0.00014815479516983032, -0.0001270771026611328, -0.0001059994101524353, -8.492171764373779e-05, -6.384402513504028e-05, -4.2766332626342773e-05, -2.1688640117645264e-05, -6.109476089477539e-07, 2.0466744899749756e-05, 4.1544437408447266e-05, 6.262212991714478e-05, 8.369982242584229e-05, 0.0001047775149345398, 0.0001258552074432373, 0.00014693289995193481, 0.00016801059246063232, 0.00018908828496932983, 0.00021016597747802734, 0.00023124366998672485, 0.00025232136249542236, 0.0002733990550041199, 0.0002944767475128174, 0.0003155544400215149, 0.0003366321325302124, 0.0003577098250389099, 0.0003787875175476074, 0.00039986521005630493, 0.00042094290256500244, 0.00044202059507369995, 0.00046309828758239746, 0.00048417598009109497, 0.0005052536725997925, 0.00052633136510849, 0.0005474090576171875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 4.0, 7.0, 16.0, 27.0, 27.0, 51.0, 59.0, 115.0, 163.0, 270.0, 516.0, 963.0, 2182.0, 5539.0, 18948.0, 170638.0, 779418.0, 52819.0, 10197.0, 3404.0, 1466.0, 708.0, 364.0, 244.0, 139.0, 77.0, 58.0, 27.0, 36.0, 15.0, 16.0, 4.0, 12.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.041351318359375, -0.04017925262451172, -0.03900718688964844, -0.037835121154785156, -0.036663055419921875, -0.035490989685058594, -0.03431892395019531, -0.03314685821533203, -0.03197479248046875, -0.03080272674560547, -0.029630661010742188, -0.028458595275878906, -0.027286529541015625, -0.026114463806152344, -0.024942398071289062, -0.02377033233642578, -0.0225982666015625, -0.02142620086669922, -0.020254135131835938, -0.019082069396972656, -0.017910003662109375, -0.016737937927246094, -0.015565872192382812, -0.014393806457519531, -0.01322174072265625, -0.012049674987792969, -0.010877609252929688, -0.009705543518066406, -0.008533477783203125, -0.007361412048339844, -0.0061893463134765625, -0.005017280578613281, -0.00384521484375, -0.0026731491088867188, -0.0015010833740234375, -0.00032901763916015625, 0.000843048095703125, 0.0020151138305664062, 0.0031871795654296875, 0.004359245300292969, 0.00553131103515625, 0.006703376770019531, 0.007875442504882812, 0.009047508239746094, 0.010219573974609375, 0.011391639709472656, 0.012563705444335938, 0.013735771179199219, 0.0149078369140625, 0.01607990264892578, 0.017251968383789062, 0.018424034118652344, 0.019596099853515625, 0.020768165588378906, 0.021940231323242188, 0.02311229705810547, 0.02428436279296875, 0.02545642852783203, 0.026628494262695312, 0.027800559997558594, 0.028972625732421875, 0.030144691467285156, 0.03131675720214844, 0.03248882293701172, 0.033660888671875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 4.0, 5.0, 7.0, 10.0, 12.0, 11.0, 16.0, 19.0, 25.0, 31.0, 39.0, 53.0, 81.0, 58.0, 78.0, 87.0, 60.0, 66.0, 67.0, 64.0, 51.0, 36.0, 26.0, 19.0, 22.0, 16.0, 10.0, 4.0, 6.0, 3.0, 7.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0170135498046875, -0.01649165153503418, -0.01596975326538086, -0.015447854995727539, -0.014925956726074219, -0.014404058456420898, -0.013882160186767578, -0.013360261917114258, -0.012838363647460938, -0.012316465377807617, -0.011794567108154297, -0.011272668838500977, -0.010750770568847656, -0.010228872299194336, -0.009706974029541016, -0.009185075759887695, -0.008663177490234375, -0.008141279220581055, -0.007619380950927734, -0.007097482681274414, -0.006575584411621094, -0.0060536861419677734, -0.005531787872314453, -0.005009889602661133, -0.0044879913330078125, -0.003966093063354492, -0.003444194793701172, -0.0029222965240478516, -0.0024003982543945312, -0.001878499984741211, -0.0013566017150878906, -0.0008347034454345703, -0.00031280517578125, 0.0002090930938720703, 0.0007309913635253906, 0.001252889633178711, 0.0017747879028320312, 0.0022966861724853516, 0.002818584442138672, 0.003340482711791992, 0.0038623809814453125, 0.004384279251098633, 0.004906177520751953, 0.0054280757904052734, 0.005949974060058594, 0.006471872329711914, 0.006993770599365234, 0.007515668869018555, 0.008037567138671875, 0.008559465408325195, 0.009081363677978516, 0.009603261947631836, 0.010125160217285156, 0.010647058486938477, 0.011168956756591797, 0.011690855026245117, 0.012212753295898438, 0.012734651565551758, 0.013256549835205078, 0.013778448104858398, 0.014300346374511719, 0.014822244644165039, 0.01534414291381836, 0.01586604118347168, 0.016387939453125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 8.0, 10.0, 17.0, 110.0, 620.0, 162.0, 31.0, 12.0, 12.0, 7.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.9846861362457275, -0.9635157585144043, -0.942345380783081, -0.9211750030517578, -0.9000046849250793, -0.8788343071937561, -0.8576639294624329, -0.8364935517311096, -0.8153232336044312, -0.7941528558731079, -0.7729824781417847, -0.7518121004104614, -0.730641782283783, -0.7094714045524597, -0.6883010268211365, -0.6671306490898132, -0.64596027135849, -0.6247898936271667, -0.6036195158958435, -0.582449197769165, -0.5612788200378418, -0.5401084423065186, -0.5189380645751953, -0.49776768684387207, -0.4765973389148712, -0.455426961183548, -0.4342566132545471, -0.4130862355232239, -0.39191585779190063, -0.3707455098628998, -0.34957513213157654, -0.3284047842025757, -0.30723434686660767, -0.2860639691352844, -0.26489362120628357, -0.24372324347496033, -0.22255288064479828, -0.20138251781463623, -0.180212140083313, -0.15904177725315094, -0.1378714144229889, -0.11670105159282684, -0.0955306813120842, -0.07436031103134155, -0.053189948201179504, -0.032019585371017456, -0.010849207639694214, 0.010321155190467834, 0.03149151802062988, 0.05266188457608223, 0.07383225113153458, 0.09500262141227722, 0.11617298424243927, 0.13734334707260132, 0.15851372480392456, 0.1796840876340866, 0.20085445046424866, 0.2220248132944107, 0.24319517612457275, 0.264365553855896, 0.28553593158721924, 0.3067062795162201, 0.32787665724754333, 0.3490470051765442, 0.37021738290786743]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 5.0, 5.0, 6.0, 9.0, 6.0, 9.0, 18.0, 15.0, 29.0, 42.0, 86.0, 115.0, 140.0, 156.0, 103.0, 72.0, 66.0, 33.0, 17.0, 11.0, 8.0, 6.0, 8.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.37341636419296265, -0.3617608845233917, -0.3501054346561432, -0.33844995498657227, -0.32679450511932373, -0.3151390254497528, -0.3034835457801819, -0.29182809591293335, -0.2801726162433624, -0.2685171365737915, -0.25686168670654297, -0.24520620703697205, -0.23355074226856232, -0.2218952775001526, -0.21023979783058167, -0.19858433306217194, -0.1869288682937622, -0.17527340352535248, -0.16361793875694275, -0.15196245908737183, -0.1403069943189621, -0.12865152955055237, -0.11699605733156204, -0.10534058511257172, -0.09368512034416199, -0.08202965557575226, -0.07037418335676193, -0.058718714863061905, -0.04706324636936188, -0.03540777787566185, -0.023752309381961823, -0.012096837162971497, -0.0004413723945617676, 0.01121409609913826, 0.022869564592838287, 0.034525033086538315, 0.04618050158023834, 0.05783597007393837, 0.0694914385676384, 0.08114691078662872, 0.09280237555503845, 0.10445784032344818, 0.11611331254243851, 0.12776878476142883, 0.13942424952983856, 0.1510797142982483, 0.1627351939678192, 0.17439065873622894, 0.18604612350463867, 0.1977015882730484, 0.20935705304145813, 0.22101253271102905, 0.23266799747943878, 0.2443234622478485, 0.25597894191741943, 0.26763439178466797, 0.2792898714542389, 0.2909453511238098, 0.30260080099105835, 0.3142562806606293, 0.3259117603302002, 0.33756721019744873, 0.34922268986701965, 0.3608781695365906, 0.3725336194038391]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 6.0, 9.0, 5.0, 13.0, 11.0, 18.0, 22.0, 41.0, 60.0, 262.0, 3839.0, 4145431.0, 43515.0, 725.0, 104.0, 42.0, 41.0, 26.0, 20.0, 17.0, 18.0, 6.0, 8.0, 5.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.90625, -2.822662353515625, -2.73907470703125, -2.655487060546875, -2.5718994140625, -2.488311767578125, -2.40472412109375, -2.321136474609375, -2.237548828125, -2.153961181640625, -2.07037353515625, -1.986785888671875, -1.9031982421875, -1.819610595703125, -1.73602294921875, -1.652435302734375, -1.56884765625, -1.485260009765625, -1.40167236328125, -1.318084716796875, -1.2344970703125, -1.150909423828125, -1.06732177734375, -0.983734130859375, -0.900146484375, -0.816558837890625, -0.73297119140625, -0.649383544921875, -0.5657958984375, -0.482208251953125, -0.39862060546875, -0.315032958984375, -0.2314453125, -0.147857666015625, -0.06427001953125, 0.019317626953125, 0.1029052734375, 0.186492919921875, 0.27008056640625, 0.353668212890625, 0.437255859375, 0.520843505859375, 0.60443115234375, 0.688018798828125, 0.7716064453125, 0.855194091796875, 0.93878173828125, 1.022369384765625, 1.10595703125, 1.189544677734375, 1.27313232421875, 1.356719970703125, 1.4403076171875, 1.523895263671875, 1.60748291015625, 1.691070556640625, 1.774658203125, 1.858245849609375, 1.94183349609375, 2.025421142578125, 2.1090087890625, 2.192596435546875, 2.27618408203125, 2.359771728515625, 2.443359375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 8.0, 3.0, 5.0, 4.0, 7.0, 11.0, 12.0, 5.0, 6.0, 11.0, 22.0, 33.0, 78.0, 169.0, 273.0, 173.0, 59.0, 40.0, 8.0, 18.0, 7.0, 12.0, 5.0, 8.0, 1.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025787353515625, -0.002484828233718872, -0.002390921115875244, -0.002297013998031616, -0.0022031068801879883, -0.0021091997623443604, -0.0020152926445007324, -0.0019213855266571045, -0.0018274784088134766, -0.0017335712909698486, -0.0016396641731262207, -0.0015457570552825928, -0.0014518499374389648, -0.001357942819595337, -0.001264035701751709, -0.001170128583908081, -0.0010762214660644531, -0.0009823143482208252, -0.0008884072303771973, -0.0007945001125335693, -0.0007005929946899414, -0.0006066858768463135, -0.0005127787590026855, -0.0004188716411590576, -0.0003249645233154297, -0.00023105740547180176, -0.00013715028762817383, -4.32431697845459e-05, 5.066394805908203e-05, 0.00014457106590270996, 0.0002384781837463379, 0.0003323853015899658, 0.00042629241943359375, 0.0005201995372772217, 0.0006141066551208496, 0.0007080137729644775, 0.0008019208908081055, 0.0008958280086517334, 0.0009897351264953613, 0.0010836422443389893, 0.0011775493621826172, 0.0012714564800262451, 0.001365363597869873, 0.001459270715713501, 0.001553177833557129, 0.0016470849514007568, 0.0017409920692443848, 0.0018348991870880127, 0.0019288063049316406, 0.0020227134227752686, 0.0021166205406188965, 0.0022105276584625244, 0.0023044347763061523, 0.0023983418941497803, 0.002492249011993408, 0.002586156129837036, 0.002680063247680664, 0.002773970365524292, 0.00286787748336792, 0.002961784601211548, 0.0030556917190551758, 0.0031495988368988037, 0.0032435059547424316, 0.0033374130725860596, 0.0034313201904296875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 10.0, 13.0, 17.0, 26.0, 30.0, 42.0, 59.0, 82.0, 121.0, 124.0, 216.0, 391.0, 7389.0, 4181084.0, 3789.0, 299.0, 161.0, 112.0, 84.0, 65.0, 42.0, 34.0, 20.0, 16.0, 12.0, 10.0, 12.0, 1.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.402587890625, -0.3846473693847656, -0.36670684814453125, -0.3487663269042969, -0.3308258056640625, -0.3128852844238281, -0.29494476318359375, -0.2770042419433594, -0.259063720703125, -0.24112319946289062, -0.22318267822265625, -0.20524215698242188, -0.1873016357421875, -0.16936111450195312, -0.15142059326171875, -0.13348007202148438, -0.11553955078125, -0.09759902954101562, -0.07965850830078125, -0.061717987060546875, -0.0437774658203125, -0.025836944580078125, -0.00789642333984375, 0.010044097900390625, 0.027984619140625, 0.045925140380859375, 0.06386566162109375, 0.08180618286132812, 0.0997467041015625, 0.11768722534179688, 0.13562774658203125, 0.15356826782226562, 0.1715087890625, 0.18944931030273438, 0.20738983154296875, 0.22533035278320312, 0.2432708740234375, 0.2612113952636719, 0.27915191650390625, 0.2970924377441406, 0.315032958984375, 0.3329734802246094, 0.35091400146484375, 0.3688545227050781, 0.3867950439453125, 0.4047355651855469, 0.42267608642578125, 0.4406166076660156, 0.45855712890625, 0.4764976501464844, 0.49443817138671875, 0.5123786926269531, 0.5303192138671875, 0.5482597351074219, 0.5662002563476562, 0.5841407775878906, 0.602081298828125, 0.6200218200683594, 0.6379623413085938, 0.6559028625488281, 0.6738433837890625, 0.6917839050292969, 0.7097244262695312, 0.7276649475097656, 0.74560546875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 4.0, 8.0, 14.0, 31.0, 28.0, 36.0, 60.0, 68.0, 106.0, 119.0, 199.0, 254.0, 365.0, 522.0, 664.0, 496.0, 320.0, 218.0, 150.0, 112.0, 82.0, 65.0, 42.0, 26.0, 19.0, 19.0, 12.0, 9.0, 7.0, 4.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003925323486328125, -0.003750920295715332, -0.003576517105102539, -0.003402113914489746, -0.003227710723876953, -0.00305330753326416, -0.002878904342651367, -0.0027045011520385742, -0.0025300979614257812, -0.0023556947708129883, -0.0021812915802001953, -0.0020068883895874023, -0.0018324851989746094, -0.0016580820083618164, -0.0014836788177490234, -0.0013092756271362305, -0.0011348724365234375, -0.0009604692459106445, -0.0007860660552978516, -0.0006116628646850586, -0.0004372596740722656, -0.00026285648345947266, -8.845329284667969e-05, 8.594989776611328e-05, 0.00026035308837890625, 0.0004347562789916992, 0.0006091594696044922, 0.0007835626602172852, 0.0009579658508300781, 0.001132369041442871, 0.001306772232055664, 0.001481175422668457, 0.00165557861328125, 0.001829981803894043, 0.002004384994506836, 0.002178788185119629, 0.002353191375732422, 0.002527594566345215, 0.002701997756958008, 0.0028764009475708008, 0.0030508041381835938, 0.0032252073287963867, 0.0033996105194091797, 0.0035740137100219727, 0.0037484169006347656, 0.003922820091247559, 0.0040972232818603516, 0.0042716264724731445, 0.0044460296630859375, 0.0046204328536987305, 0.0047948360443115234, 0.004969239234924316, 0.005143642425537109, 0.005318045616149902, 0.005492448806762695, 0.005666851997375488, 0.005841255187988281, 0.006015658378601074, 0.006190061569213867, 0.00636446475982666, 0.006538867950439453, 0.006713271141052246, 0.006887674331665039, 0.007062077522277832, 0.007236480712890625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 11.0, 37.0, 160.0, 558.0, 166.0, 40.0, 22.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06724268198013306, -0.06093381717801094, -0.054624952375888824, -0.04831608384847641, -0.04200722277164459, -0.03569835424423218, -0.02938948944211006, -0.023080624639987946, -0.01677175983786583, -0.010462895035743713, -0.004154029302299023, 0.002154836431145668, 0.008463701233267784, 0.01477256789803505, 0.021081432700157166, 0.02739029750227928, 0.0336991623044014, 0.040008027106523514, 0.04631689190864563, 0.052625760436058044, 0.05893462151288986, 0.06524349004030228, 0.0715523511171341, 0.07786121964454651, 0.08417008817195892, 0.09047895669937134, 0.09678781777620316, 0.10309668630361557, 0.10940554738044739, 0.1157144159078598, 0.12202328443527222, 0.12833213806152344, 0.13464100658893585, 0.14094987511634827, 0.14725874364376068, 0.1535675972700119, 0.15987646579742432, 0.16618533432483673, 0.17249420285224915, 0.17880305647850037, 0.18511192500591278, 0.1914207935333252, 0.1977296620607376, 0.20403851568698883, 0.21034738421440125, 0.21665625274181366, 0.22296512126922607, 0.2292739748954773, 0.2355828583240509, 0.24189172685146332, 0.24820059537887573, 0.25450944900512695, 0.26081833243370056, 0.2671271860599518, 0.273436039686203, 0.2797449231147766, 0.28605377674102783, 0.29236263036727905, 0.29867151379585266, 0.3049803674221039, 0.3112892508506775, 0.3175981044769287, 0.32390695810317993, 0.33021584153175354, 0.33652469515800476]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 10.0, 8.0, 12.0, 11.0, 18.0, 10.0, 28.0, 23.0, 31.0, 38.0, 40.0, 47.0, 38.0, 48.0, 57.0, 53.0, 62.0, 52.0, 55.0, 60.0, 39.0, 44.0, 36.0, 36.0, 24.0, 18.0, 18.0, 16.0, 14.0, 12.0, 6.0, 10.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030827701091766357, -0.029587306082248688, -0.028346912935376167, -0.027106519788503647, -0.025866124778985977, -0.024625729769468307, -0.023385336622595787, -0.022144943475723267, -0.020904548466205597, -0.019664153456687927, -0.018423760309815407, -0.017183367162942886, -0.015942972153425217, -0.014702578075230122, -0.013462183997035027, -0.012221789918839931, -0.010981395840644836, -0.009741001762449741, -0.008500607684254646, -0.007260213606059551, -0.006019819527864456, -0.004779425449669361, -0.003539031371474266, -0.002298637293279171, -0.001058243215084076, 0.00018215086311101913, 0.0014225449413061142, 0.0026629390195012093, 0.0039033330976963043, 0.005143727175891399, 0.0063841212540864944, 0.0076245153322815895, 0.008864909410476685, 0.01010530348867178, 0.011345697566866875, 0.01258609164506197, 0.013826485723257065, 0.01506687980145216, 0.016307273879647255, 0.017547667026519775, 0.018788062036037445, 0.020028457045555115, 0.021268850192427635, 0.022509243339300156, 0.023749638348817825, 0.024990033358335495, 0.026230426505208015, 0.027470819652080536, 0.028711214661598206, 0.029951609671115875, 0.031192002817988396, 0.032432395964860916, 0.033672790974378586, 0.034913185983896255, 0.03615357726812363, 0.037393972277641296, 0.038634367287158966, 0.039874762296676636, 0.041115157306194305, 0.04235554859042168, 0.043595943599939346, 0.044836338609457016, 0.04607672989368439, 0.04731712490320206, 0.04855751991271973]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 9.0, 6.0, 11.0, 17.0, 17.0, 36.0, 48.0, 67.0, 94.0, 123.0, 199.0, 263.0, 361.0, 598.0, 871.0, 1234.0, 1869.0, 2891.0, 4528.0, 7498.0, 13629.0, 29214.0, 183785.0, 696934.0, 58242.0, 19272.0, 10034.0, 5864.0, 3657.0, 2281.0, 1503.0, 1107.0, 686.0, 470.0, 347.0, 237.0, 175.0, 110.0, 85.0, 53.0, 29.0, 21.0, 23.0, 15.0, 17.0, 10.0, 7.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.03759765625, -0.03643226623535156, -0.035266876220703125, -0.03410148620605469, -0.03293609619140625, -0.03177070617675781, -0.030605316162109375, -0.029439926147460938, -0.0282745361328125, -0.027109146118164062, -0.025943756103515625, -0.024778366088867188, -0.02361297607421875, -0.022447586059570312, -0.021282196044921875, -0.020116806030273438, -0.018951416015625, -0.017786026000976562, -0.016620635986328125, -0.015455245971679688, -0.01428985595703125, -0.013124465942382812, -0.011959075927734375, -0.010793685913085938, -0.0096282958984375, -0.008462905883789062, -0.007297515869140625, -0.0061321258544921875, -0.00496673583984375, -0.0038013458251953125, -0.002635955810546875, -0.0014705657958984375, -0.00030517578125, 0.0008602142333984375, 0.002025604248046875, 0.0031909942626953125, 0.00435638427734375, 0.0055217742919921875, 0.006687164306640625, 0.007852554321289062, 0.0090179443359375, 0.010183334350585938, 0.011348724365234375, 0.012514114379882812, 0.01367950439453125, 0.014844894409179688, 0.016010284423828125, 0.017175674438476562, 0.018341064453125, 0.019506454467773438, 0.020671844482421875, 0.021837234497070312, 0.02300262451171875, 0.024168014526367188, 0.025333404541015625, 0.026498794555664062, 0.0276641845703125, 0.028829574584960938, 0.029994964599609375, 0.031160354614257812, 0.03232574462890625, 0.03349113464355469, 0.034656524658203125, 0.03582191467285156, 0.0369873046875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 6.0, 7.0, 14.0, 11.0, 8.0, 18.0, 51.0, 76.0, 160.0, 207.0, 157.0, 94.0, 52.0, 25.0, 19.0, 12.0, 9.0, 8.0, 4.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0026760101318359375, -0.002585798501968384, -0.00249558687210083, -0.0024053752422332764, -0.0023151636123657227, -0.002224951982498169, -0.0021347403526306152, -0.0020445287227630615, -0.001954317092895508, -0.001864105463027954, -0.0017738938331604004, -0.0016836822032928467, -0.001593470573425293, -0.0015032589435577393, -0.0014130473136901855, -0.0013228356838226318, -0.0012326240539550781, -0.0011424124240875244, -0.0010522007942199707, -0.000961989164352417, -0.0008717775344848633, -0.0007815659046173096, -0.0006913542747497559, -0.0006011426448822021, -0.0005109310150146484, -0.0004207193851470947, -0.000330507755279541, -0.0002402961254119873, -0.0001500844955444336, -5.987286567687988e-05, 3.0338764190673828e-05, 0.00012055039405822754, 0.00021076202392578125, 0.00030097365379333496, 0.00039118528366088867, 0.0004813969135284424, 0.0005716085433959961, 0.0006618201732635498, 0.0007520318031311035, 0.0008422434329986572, 0.0009324550628662109, 0.0010226666927337646, 0.0011128783226013184, 0.001203089952468872, 0.0012933015823364258, 0.0013835132122039795, 0.0014737248420715332, 0.001563936471939087, 0.0016541481018066406, 0.0017443597316741943, 0.001834571361541748, 0.0019247829914093018, 0.0020149946212768555, 0.002105206251144409, 0.002195417881011963, 0.0022856295108795166, 0.0023758411407470703, 0.002466052770614624, 0.0025562644004821777, 0.0026464760303497314, 0.002736687660217285, 0.002826899290084839, 0.0029171109199523926, 0.0030073225498199463, 0.0030975341796875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 4.0, 5.0, 11.0, 12.0, 16.0, 19.0, 26.0, 25.0, 48.0, 61.0, 110.0, 434.0, 2728.0, 47068.0, 981953.0, 13977.0, 1459.0, 281.0, 96.0, 52.0, 41.0, 23.0, 19.0, 16.0, 20.0, 12.0, 7.0, 5.0, 3.0, 7.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1285400390625, -0.12468433380126953, -0.12082862854003906, -0.1169729232788086, -0.11311721801757812, -0.10926151275634766, -0.10540580749511719, -0.10155010223388672, -0.09769439697265625, -0.09383869171142578, -0.08998298645019531, -0.08612728118896484, -0.08227157592773438, -0.0784158706665039, -0.07456016540527344, -0.07070446014404297, -0.0668487548828125, -0.06299304962158203, -0.05913734436035156, -0.055281639099121094, -0.051425933837890625, -0.047570228576660156, -0.04371452331542969, -0.03985881805419922, -0.03600311279296875, -0.03214740753173828, -0.028291702270507812, -0.024435997009277344, -0.020580291748046875, -0.016724586486816406, -0.012868881225585938, -0.009013175964355469, -0.005157470703125, -0.0013017654418945312, 0.0025539398193359375, 0.006409645080566406, 0.010265350341796875, 0.014121055603027344, 0.017976760864257812, 0.02183246612548828, 0.02568817138671875, 0.02954387664794922, 0.03339958190917969, 0.037255287170410156, 0.041110992431640625, 0.044966697692871094, 0.04882240295410156, 0.05267810821533203, 0.0565338134765625, 0.06038951873779297, 0.06424522399902344, 0.0681009292602539, 0.07195663452148438, 0.07581233978271484, 0.07966804504394531, 0.08352375030517578, 0.08737945556640625, 0.09123516082763672, 0.09509086608886719, 0.09894657135009766, 0.10280227661132812, 0.1066579818725586, 0.11051368713378906, 0.11436939239501953, 0.11822509765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 8.0, 13.0, 19.0, 20.0, 16.0, 18.0, 32.0, 31.0, 32.0, 30.0, 26.0, 25.0, 45.0, 44.0, 43.0, 45.0, 42.0, 50.0, 61.0, 50.0, 42.0, 41.0, 32.0, 23.0, 26.0, 28.0, 28.0, 22.0, 21.0, 16.0, 10.0, 12.0, 12.0, 12.0, 2.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0126800537109375, -0.012332916259765625, -0.01198577880859375, -0.011638641357421875, -0.01129150390625, -0.010944366455078125, -0.01059722900390625, -0.010250091552734375, -0.0099029541015625, -0.009555816650390625, -0.00920867919921875, -0.008861541748046875, -0.008514404296875, -0.008167266845703125, -0.00782012939453125, -0.007472991943359375, -0.0071258544921875, -0.006778717041015625, -0.00643157958984375, -0.006084442138671875, -0.0057373046875, -0.005390167236328125, -0.00504302978515625, -0.004695892333984375, -0.0043487548828125, -0.004001617431640625, -0.00365447998046875, -0.003307342529296875, -0.002960205078125, -0.002613067626953125, -0.00226593017578125, -0.001918792724609375, -0.0015716552734375, -0.001224517822265625, -0.00087738037109375, -0.000530242919921875, -0.00018310546875, 0.000164031982421875, 0.00051116943359375, 0.000858306884765625, 0.0012054443359375, 0.001552581787109375, 0.00189971923828125, 0.002246856689453125, 0.002593994140625, 0.002941131591796875, 0.00328826904296875, 0.003635406494140625, 0.0039825439453125, 0.004329681396484375, 0.00467681884765625, 0.005023956298828125, 0.00537109375, 0.005718231201171875, 0.00606536865234375, 0.006412506103515625, 0.0067596435546875, 0.007106781005859375, 0.00745391845703125, 0.007801055908203125, 0.008148193359375, 0.008495330810546875, 0.00884246826171875, 0.009189605712890625, 0.0095367431640625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 5.0, 11.0, 11.0, 14.0, 36.0, 42.0, 81.0, 152.0, 368.0, 1167.0, 5482.0, 82375.0, 927549.0, 26756.0, 3218.0, 723.0, 269.0, 129.0, 62.0, 26.0, 25.0, 12.0, 17.0, 8.0, 8.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09417724609375, -0.09085369110107422, -0.08753013610839844, -0.08420658111572266, -0.08088302612304688, -0.0775594711303711, -0.07423591613769531, -0.07091236114501953, -0.06758880615234375, -0.06426525115966797, -0.06094169616699219, -0.057618141174316406, -0.054294586181640625, -0.050971031188964844, -0.04764747619628906, -0.04432392120361328, -0.0410003662109375, -0.03767681121826172, -0.03435325622558594, -0.031029701232910156, -0.027706146240234375, -0.024382591247558594, -0.021059036254882812, -0.01773548126220703, -0.01441192626953125, -0.011088371276855469, -0.0077648162841796875, -0.004441261291503906, -0.001117706298828125, 0.0022058486938476562, 0.0055294036865234375, 0.008852958679199219, 0.012176513671875, 0.015500068664550781, 0.018823623657226562, 0.022147178649902344, 0.025470733642578125, 0.028794288635253906, 0.03211784362792969, 0.03544139862060547, 0.03876495361328125, 0.04208850860595703, 0.04541206359863281, 0.048735618591308594, 0.052059173583984375, 0.055382728576660156, 0.05870628356933594, 0.06202983856201172, 0.0653533935546875, 0.06867694854736328, 0.07200050354003906, 0.07532405853271484, 0.07864761352539062, 0.0819711685180664, 0.08529472351074219, 0.08861827850341797, 0.09194183349609375, 0.09526538848876953, 0.09858894348144531, 0.1019124984741211, 0.10523605346679688, 0.10855960845947266, 0.11188316345214844, 0.11520671844482422, 0.1185302734375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 9.0, 10.0, 12.0, 22.0, 19.0, 36.0, 120.0, 432.0, 125.0, 57.0, 34.0, 31.0, 23.0, 13.0, 8.0, 8.0, 5.0, 6.0, 0.0, 5.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.0010728836059570312, -0.0010470673441886902, -0.0010212510824203491, -0.000995434820652008, -0.000969618558883667, -0.0009438022971153259, -0.0009179860353469849, -0.0008921697735786438, -0.0008663535118103027, -0.0008405372500419617, -0.0008147209882736206, -0.0007889047265052795, -0.0007630884647369385, -0.0007372722029685974, -0.0007114559412002563, -0.0006856396794319153, -0.0006598234176635742, -0.0006340071558952332, -0.0006081908941268921, -0.000582374632358551, -0.00055655837059021, -0.0005307421088218689, -0.0005049258470535278, -0.00047910958528518677, -0.0004532933235168457, -0.00042747706174850464, -0.0004016607999801636, -0.0003758445382118225, -0.00035002827644348145, -0.0003242120146751404, -0.0002983957529067993, -0.00027257949113845825, -0.0002467632293701172, -0.00022094696760177612, -0.00019513070583343506, -0.000169314444065094, -0.00014349818229675293, -0.00011768192052841187, -9.18656587600708e-05, -6.604939699172974e-05, -4.023313522338867e-05, -1.4416873455047607e-05, 1.1399388313293457e-05, 3.721565008163452e-05, 6.303191184997559e-05, 8.884817361831665e-05, 0.00011466443538665771, 0.00014048069715499878, 0.00016629695892333984, 0.0001921132206916809, 0.00021792948246002197, 0.00024374574422836304, 0.0002695620059967041, 0.00029537826776504517, 0.00032119452953338623, 0.0003470107913017273, 0.00037282705307006836, 0.0003986433148384094, 0.0004244595766067505, 0.00045027583837509155, 0.0004760921001434326, 0.0005019083619117737, 0.0005277246236801147, 0.0005535408854484558, 0.0005793571472167969]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 5.0, 4.0, 6.0, 6.0, 7.0, 13.0, 13.0, 23.0, 64.0, 156.0, 538.0, 3198.0, 50697.0, 955163.0, 35382.0, 2517.0, 484.0, 144.0, 44.0, 38.0, 10.0, 16.0, 4.0, 9.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11669921875, -0.11321067810058594, -0.10972213745117188, -0.10623359680175781, -0.10274505615234375, -0.09925651550292969, -0.09576797485351562, -0.09227943420410156, -0.0887908935546875, -0.08530235290527344, -0.08181381225585938, -0.07832527160644531, -0.07483673095703125, -0.07134819030761719, -0.06785964965820312, -0.06437110900878906, -0.060882568359375, -0.05739402770996094, -0.053905487060546875, -0.05041694641113281, -0.04692840576171875, -0.04343986511230469, -0.039951324462890625, -0.03646278381347656, -0.0329742431640625, -0.029485702514648438, -0.025997161865234375, -0.022508621215820312, -0.01902008056640625, -0.015531539916992188, -0.012042999267578125, -0.008554458618164062, -0.00506591796875, -0.0015773773193359375, 0.001911163330078125, 0.0053997039794921875, 0.00888824462890625, 0.012376785278320312, 0.015865325927734375, 0.019353866577148438, 0.0228424072265625, 0.026330947875976562, 0.029819488525390625, 0.03330802917480469, 0.03679656982421875, 0.04028511047363281, 0.043773651123046875, 0.04726219177246094, 0.050750732421875, 0.05423927307128906, 0.057727813720703125, 0.06121635437011719, 0.06470489501953125, 0.06819343566894531, 0.07168197631835938, 0.07517051696777344, 0.0786590576171875, 0.08214759826660156, 0.08563613891601562, 0.08912467956542969, 0.09261322021484375, 0.09610176086425781, 0.09959030151367188, 0.10307884216308594, 0.1065673828125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 8.0, 9.0, 13.0, 12.0, 17.0, 20.0, 19.0, 34.0, 41.0, 38.0, 56.0, 73.0, 67.0, 79.0, 75.0, 83.0, 73.0, 59.0, 40.0, 34.0, 39.0, 20.0, 16.0, 14.0, 17.0, 11.0, 5.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.014862060546875, -0.014399409294128418, -0.013936758041381836, -0.013474106788635254, -0.013011455535888672, -0.01254880428314209, -0.012086153030395508, -0.011623501777648926, -0.011160850524902344, -0.010698199272155762, -0.01023554801940918, -0.009772896766662598, -0.009310245513916016, -0.008847594261169434, -0.008384943008422852, -0.00792229175567627, -0.0074596405029296875, -0.0069969892501831055, -0.0065343379974365234, -0.006071686744689941, -0.005609035491943359, -0.005146384239196777, -0.004683732986450195, -0.004221081733703613, -0.0037584304809570312, -0.0032957792282104492, -0.002833127975463867, -0.002370476722717285, -0.0019078254699707031, -0.001445174217224121, -0.000982522964477539, -0.000519871711730957, -5.7220458984375e-05, 0.00040543079376220703, 0.0008680820465087891, 0.001330733299255371, 0.0017933845520019531, 0.002256035804748535, 0.002718687057495117, 0.0031813383102416992, 0.0036439895629882812, 0.004106640815734863, 0.004569292068481445, 0.005031943321228027, 0.005494594573974609, 0.005957245826721191, 0.0064198970794677734, 0.0068825483322143555, 0.0073451995849609375, 0.0078078508377075195, 0.008270502090454102, 0.008733153343200684, 0.009195804595947266, 0.009658455848693848, 0.01012110710144043, 0.010583758354187012, 0.011046409606933594, 0.011509060859680176, 0.011971712112426758, 0.01243436336517334, 0.012897014617919922, 0.013359665870666504, 0.013822317123413086, 0.014284968376159668, 0.01474761962890625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 6.0, 4.0, 6.0, 5.0, 7.0, 7.0, 34.0, 99.0, 309.0, 308.0, 144.0, 35.0, 25.0, 5.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.46810483932495117, -0.45876652002334595, -0.4494282305240631, -0.4400899112224579, -0.43075162172317505, -0.4214133024215698, -0.4120749831199646, -0.4027366638183594, -0.39339837431907654, -0.3840600550174713, -0.3747217655181885, -0.36538344621658325, -0.356045126914978, -0.3467068374156952, -0.33736851811408997, -0.32803022861480713, -0.3186919093132019, -0.3093535900115967, -0.30001530051231384, -0.2906769812107086, -0.2813386917114258, -0.27200037240982056, -0.26266205310821533, -0.2533237338066101, -0.24398544430732727, -0.23464713990688324, -0.2253088355064392, -0.21597051620483398, -0.20663221180438995, -0.19729390740394592, -0.1879555881023407, -0.17861728370189667, -0.16927894949913025, -0.15994064509868622, -0.1506023406982422, -0.14126402139663696, -0.13192571699619293, -0.1225874125957489, -0.11324910074472427, -0.10391078889369965, -0.09457248449325562, -0.08523418009281158, -0.07589586824178696, -0.06655755639076233, -0.0572192519903183, -0.04788094386458397, -0.03854263573884964, -0.029204323887825012, -0.01986601948738098, -0.010527711361646652, -0.001189403235912323, 0.008148904889822006, 0.017487213015556335, 0.026825521141290665, 0.036163829267024994, 0.04550214111804962, 0.05484044551849365, 0.06417874991893768, 0.07351706176996231, 0.08285537362098694, 0.09219367802143097, 0.101531982421875, 0.11087029427289963, 0.12020860612392426, 0.1295469105243683]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 9.0, 11.0, 5.0, 11.0, 11.0, 15.0, 24.0, 29.0, 36.0, 38.0, 60.0, 58.0, 70.0, 85.0, 69.0, 88.0, 71.0, 70.0, 44.0, 40.0, 41.0, 29.0, 18.0, 7.0, 8.0, 14.0, 9.0, 7.0, 1.0, 5.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10187232494354248, -0.09836287796497345, -0.09485343843698502, -0.09134399890899658, -0.08783455193042755, -0.08432510495185852, -0.08081566542387009, -0.07730622589588165, -0.07379677891731262, -0.07028733193874359, -0.06677789241075516, -0.06326845288276672, -0.05975900590419769, -0.05624956265091896, -0.05274011939764023, -0.049230676144361496, -0.045721232891082764, -0.04221178963780403, -0.0387023463845253, -0.03519290313124657, -0.031683459877967834, -0.028174016624689102, -0.02466457337141037, -0.021155130118131638, -0.017645686864852905, -0.014136243611574173, -0.01062680035829544, -0.007117357105016708, -0.003607913851737976, -9.847059845924377e-05, 0.0034109726548194885, 0.006920415908098221, 0.010429859161376953, 0.013939302414655685, 0.017448745667934418, 0.02095818892121315, 0.024467632174491882, 0.027977075427770615, 0.03148651868104935, 0.03499596193432808, 0.03850540518760681, 0.042014848440885544, 0.045524291694164276, 0.04903373494744301, 0.05254317820072174, 0.05605262145400047, 0.059562064707279205, 0.06307150423526764, 0.06658095121383667, 0.0700903981924057, 0.07359983772039413, 0.07710927724838257, 0.0806187242269516, 0.08412817120552063, 0.08763761073350906, 0.0911470502614975, 0.09465649724006653, 0.09816594421863556, 0.10167538374662399, 0.10518482327461243, 0.10869427025318146, 0.11220371723175049, 0.11571315675973892, 0.11922259628772736, 0.12273204326629639]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 4.0, 11.0, 15.0, 16.0, 16.0, 19.0, 16.0, 31.0, 34.0, 390.0, 4189446.0, 3949.0, 87.0, 29.0, 19.0, 19.0, 16.0, 12.0, 21.0, 18.0, 7.0, 13.0, 9.0, 2.0, 8.0, 9.0, 11.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0], "bins": [-1.4169921875, -1.376220703125, -1.33544921875, -1.294677734375, -1.25390625, -1.213134765625, -1.17236328125, -1.131591796875, -1.0908203125, -1.050048828125, -1.00927734375, -0.968505859375, -0.927734375, -0.886962890625, -0.84619140625, -0.805419921875, -0.7646484375, -0.723876953125, -0.68310546875, -0.642333984375, -0.6015625, -0.560791015625, -0.52001953125, -0.479248046875, -0.4384765625, -0.397705078125, -0.35693359375, -0.316162109375, -0.275390625, -0.234619140625, -0.19384765625, -0.153076171875, -0.1123046875, -0.071533203125, -0.03076171875, 0.010009765625, 0.05078125, 0.091552734375, 0.13232421875, 0.173095703125, 0.2138671875, 0.254638671875, 0.29541015625, 0.336181640625, 0.376953125, 0.417724609375, 0.45849609375, 0.499267578125, 0.5400390625, 0.580810546875, 0.62158203125, 0.662353515625, 0.703125, 0.743896484375, 0.78466796875, 0.825439453125, 0.8662109375, 0.906982421875, 0.94775390625, 0.988525390625, 1.029296875, 1.070068359375, 1.11083984375, 1.151611328125, 1.1923828125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 5.0, 11.0, 3.0, 8.0, 17.0, 20.0, 32.0, 62.0, 103.0, 139.0, 157.0, 157.0, 98.0, 62.0, 36.0, 14.0, 14.0, 8.0, 7.0, 9.0, 3.0, 7.0, 4.0, 4.0, 0.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002849578857421875, -0.002759277820587158, -0.0026689767837524414, -0.0025786757469177246, -0.002488374710083008, -0.002398073673248291, -0.0023077726364135742, -0.0022174715995788574, -0.0021271705627441406, -0.002036869525909424, -0.001946568489074707, -0.0018562674522399902, -0.0017659664154052734, -0.0016756653785705566, -0.0015853643417358398, -0.001495063304901123, -0.0014047622680664062, -0.0013144612312316895, -0.0012241601943969727, -0.0011338591575622559, -0.001043558120727539, -0.0009532570838928223, -0.0008629560470581055, -0.0007726550102233887, -0.0006823539733886719, -0.0005920529365539551, -0.0005017518997192383, -0.0004114508628845215, -0.0003211498260498047, -0.0002308487892150879, -0.0001405477523803711, -5.02467155456543e-05, 4.00543212890625e-05, 0.0001303553581237793, 0.0002206563949584961, 0.0003109574317932129, 0.0004012584686279297, 0.0004915595054626465, 0.0005818605422973633, 0.0006721615791320801, 0.0007624626159667969, 0.0008527636528015137, 0.0009430646896362305, 0.0010333657264709473, 0.001123666763305664, 0.0012139678001403809, 0.0013042688369750977, 0.0013945698738098145, 0.0014848709106445312, 0.001575171947479248, 0.0016654729843139648, 0.0017557740211486816, 0.0018460750579833984, 0.0019363760948181152, 0.002026677131652832, 0.002116978168487549, 0.0022072792053222656, 0.0022975802421569824, 0.0023878812789916992, 0.002478182315826416, 0.002568483352661133, 0.0026587843894958496, 0.0027490854263305664, 0.002839386463165283, 0.0029296875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 2.0, 7.0, 16.0, 19.0, 32.0, 60.0, 83.0, 211.0, 559.0, 3621.0, 4187649.0, 1200.0, 426.0, 190.0, 83.0, 43.0, 31.0, 14.0, 10.0, 6.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44140625, -0.42327117919921875, -0.4051361083984375, -0.38700103759765625, -0.368865966796875, -0.35073089599609375, -0.3325958251953125, -0.31446075439453125, -0.29632568359375, -0.27819061279296875, -0.2600555419921875, -0.24192047119140625, -0.223785400390625, -0.20565032958984375, -0.1875152587890625, -0.16938018798828125, -0.1512451171875, -0.13311004638671875, -0.1149749755859375, -0.09683990478515625, -0.078704833984375, -0.06056976318359375, -0.0424346923828125, -0.02429962158203125, -0.00616455078125, 0.01197052001953125, 0.0301055908203125, 0.04824066162109375, 0.066375732421875, 0.08451080322265625, 0.1026458740234375, 0.12078094482421875, 0.138916015625, 0.15705108642578125, 0.1751861572265625, 0.19332122802734375, 0.211456298828125, 0.22959136962890625, 0.2477264404296875, 0.26586151123046875, 0.28399658203125, 0.30213165283203125, 0.3202667236328125, 0.33840179443359375, 0.356536865234375, 0.37467193603515625, 0.3928070068359375, 0.41094207763671875, 0.4290771484375, 0.44721221923828125, 0.4653472900390625, 0.48348236083984375, 0.501617431640625, 0.5197525024414062, 0.5378875732421875, 0.5560226440429688, 0.57415771484375, 0.5922927856445312, 0.6104278564453125, 0.6285629272460938, 0.646697998046875, 0.6648330688476562, 0.6829681396484375, 0.7011032104492188, 0.71923828125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 12.0, 7.0, 13.0, 13.0, 17.0, 50.0, 63.0, 93.0, 164.0, 428.0, 663.0, 962.0, 714.0, 352.0, 211.0, 113.0, 67.0, 46.0, 24.0, 19.0, 14.0, 10.0, 7.0, 3.0, 7.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.004322052001953125, -0.004110991954803467, -0.0038999319076538086, -0.0036888718605041504, -0.003477811813354492, -0.003266751766204834, -0.0030556917190551758, -0.0028446316719055176, -0.0026335716247558594, -0.002422511577606201, -0.002211451530456543, -0.0020003914833068848, -0.0017893314361572266, -0.0015782713890075684, -0.0013672113418579102, -0.001156151294708252, -0.0009450912475585938, -0.0007340312004089355, -0.0005229711532592773, -0.00031191110610961914, -0.00010085105895996094, 0.00011020898818969727, 0.00032126903533935547, 0.0005323290824890137, 0.0007433891296386719, 0.0009544491767883301, 0.0011655092239379883, 0.0013765692710876465, 0.0015876293182373047, 0.0017986893653869629, 0.002009749412536621, 0.0022208094596862793, 0.0024318695068359375, 0.0026429295539855957, 0.002853989601135254, 0.003065049648284912, 0.0032761096954345703, 0.0034871697425842285, 0.0036982297897338867, 0.003909289836883545, 0.004120349884033203, 0.004331409931182861, 0.0045424699783325195, 0.004753530025482178, 0.004964590072631836, 0.005175650119781494, 0.005386710166931152, 0.0055977702140808105, 0.005808830261230469, 0.006019890308380127, 0.006230950355529785, 0.006442010402679443, 0.0066530704498291016, 0.00686413049697876, 0.007075190544128418, 0.007286250591278076, 0.007497310638427734, 0.007708370685577393, 0.00791943073272705, 0.008130490779876709, 0.008341550827026367, 0.008552610874176025, 0.008763670921325684, 0.008974730968475342, 0.009185791015625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 26.0, 152.0, 721.0, 91.0, 14.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9166123867034912, -0.8994352221488953, -0.8822580575942993, -0.8650809526443481, -0.8479037880897522, -0.8307266235351562, -0.8135495185852051, -0.7963723540306091, -0.7791951894760132, -0.7620180249214172, -0.7448408603668213, -0.7276637554168701, -0.7104865908622742, -0.6933094263076782, -0.676132321357727, -0.6589551568031311, -0.6417779922485352, -0.6246008276939392, -0.6074236631393433, -0.5902465581893921, -0.5730693936347961, -0.5558922290802002, -0.538715124130249, -0.5215379595756531, -0.5043607950210571, -0.4871836304664612, -0.4700064957141876, -0.45282936096191406, -0.4356521964073181, -0.41847503185272217, -0.4012978971004486, -0.38412076234817505, -0.3669436573982239, -0.34976649284362793, -0.33258935809135437, -0.3154122233390808, -0.29823505878448486, -0.2810578942298889, -0.26388075947761536, -0.2467036098241806, -0.22952646017074585, -0.2123493105173111, -0.19517216086387634, -0.1779950112104416, -0.16081786155700684, -0.14364071190357208, -0.12646356225013733, -0.10928641259670258, -0.09210926294326782, -0.07493211328983307, -0.057754963636398315, -0.04057781398296356, -0.02340066432952881, -0.006223514676094055, 0.010953634977340698, 0.02813078463077545, 0.045307934284210205, 0.06248508393764496, 0.07966223359107971, 0.09683938324451447, 0.11401653289794922, 0.13119368255138397, 0.14837083220481873, 0.16554798185825348, 0.18272513151168823]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 2.0, 12.0, 15.0, 37.0, 51.0, 90.0, 100.0, 145.0, 169.0, 138.0, 111.0, 69.0, 30.0, 22.0, 9.0, 9.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03453254699707031, -0.03178812190890312, -0.02904369682073593, -0.02629927173256874, -0.02355484664440155, -0.02081042155623436, -0.01806599646806717, -0.015321571379899979, -0.012577146291732788, -0.009832721203565598, -0.007088296115398407, -0.004343871027231216, -0.0015994459390640259, 0.0011449791491031647, 0.0038894042372703552, 0.006633829325437546, 0.009378254413604736, 0.012122679501771927, 0.014867104589939117, 0.017611529678106308, 0.0203559547662735, 0.02310037985444069, 0.02584480494260788, 0.02858923003077507, 0.03133365511894226, 0.03407808020710945, 0.03682250529527664, 0.03956693038344383, 0.04231135547161102, 0.045055780559778214, 0.047800205647945404, 0.050544630736112595, 0.053289055824279785, 0.056033480912446976, 0.058777906000614166, 0.06152233108878136, 0.06426675617694855, 0.06701117753982544, 0.06975560635328293, 0.07250003516674042, 0.07524445652961731, 0.0779888778924942, 0.08073330670595169, 0.08347773551940918, 0.08622215688228607, 0.08896657824516296, 0.09171100705862045, 0.09445543587207794, 0.09719985723495483, 0.09994427859783173, 0.10268870741128922, 0.1054331362247467, 0.1081775575876236, 0.11092197895050049, 0.11366640776395798, 0.11641083657741547, 0.11915525794029236, 0.12189967930316925, 0.12464410811662674, 0.12738853693008423, 0.13013295829296112, 0.132877379655838, 0.1356218159198761, 0.138366237282753, 0.14111065864562988]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 7.0, 5.0, 4.0, 3.0, 8.0, 8.0, 11.0, 11.0, 20.0, 24.0, 27.0, 29.0, 46.0, 45.0, 58.0, 49.0, 56.0, 95.0, 1046961.0, 679.0, 60.0, 67.0, 50.0, 44.0, 48.0, 34.0, 38.0, 18.0, 13.0, 12.0, 7.0, 6.0, 7.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0517578125, -1.0214004516601562, -0.9910430908203125, -0.9606857299804688, -0.930328369140625, -0.8999710083007812, -0.8696136474609375, -0.8392562866210938, -0.80889892578125, -0.7785415649414062, -0.7481842041015625, -0.7178268432617188, -0.687469482421875, -0.6571121215820312, -0.6267547607421875, -0.5963973999023438, -0.5660400390625, -0.5356826782226562, -0.5053253173828125, -0.47496795654296875, -0.444610595703125, -0.41425323486328125, -0.3838958740234375, -0.35353851318359375, -0.32318115234375, -0.29282379150390625, -0.2624664306640625, -0.23210906982421875, -0.201751708984375, -0.17139434814453125, -0.1410369873046875, -0.11067962646484375, -0.080322265625, -0.04996490478515625, -0.0196075439453125, 0.01074981689453125, 0.041107177734375, 0.07146453857421875, 0.1018218994140625, 0.13217926025390625, 0.16253662109375, 0.19289398193359375, 0.2232513427734375, 0.25360870361328125, 0.283966064453125, 0.31432342529296875, 0.3446807861328125, 0.37503814697265625, 0.4053955078125, 0.43575286865234375, 0.4661102294921875, 0.49646759033203125, 0.526824951171875, 0.5571823120117188, 0.5875396728515625, 0.6178970336914062, 0.64825439453125, 0.6786117553710938, 0.7089691162109375, 0.7393264770507812, 0.769683837890625, 0.8000411987304688, 0.8303985595703125, 0.8607559204101562, 0.89111328125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 9.0, 30.0, 207.0, 543.0, 196.0, 27.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00435638427734375, -0.0037761926651000977, -0.0031960010528564453, -0.002615809440612793, -0.0020356178283691406, -0.0014554262161254883, -0.0008752346038818359, -0.0002950429916381836, 0.00028514862060546875, 0.0008653402328491211, 0.0014455318450927734, 0.0020257234573364258, 0.002605915069580078, 0.0031861066818237305, 0.003766298294067383, 0.004346489906311035, 0.0049266815185546875, 0.00550687313079834, 0.006087064743041992, 0.0066672563552856445, 0.007247447967529297, 0.00782763957977295, 0.008407831192016602, 0.008988022804260254, 0.009568214416503906, 0.010148406028747559, 0.010728597640991211, 0.011308789253234863, 0.011888980865478516, 0.012469172477722168, 0.01304936408996582, 0.013629555702209473, 0.014209747314453125, 0.014789938926696777, 0.01537013053894043, 0.015950322151184082, 0.016530513763427734, 0.017110705375671387, 0.01769089698791504, 0.01827108860015869, 0.018851280212402344, 0.019431471824645996, 0.02001166343688965, 0.0205918550491333, 0.021172046661376953, 0.021752238273620605, 0.022332429885864258, 0.02291262149810791, 0.023492813110351562, 0.024073004722595215, 0.024653196334838867, 0.02523338794708252, 0.025813579559326172, 0.026393771171569824, 0.026973962783813477, 0.02755415439605713, 0.02813434600830078, 0.028714537620544434, 0.029294729232788086, 0.02987492084503174, 0.03045511245727539, 0.031035304069519043, 0.031615495681762695, 0.03219568729400635, 0.03277587890625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 4.0, 7.0, 11.0, 12.0, 20.0, 29.0, 61.0, 93.0, 166.0, 301.0, 677.0, 1895.0, 6938.0, 45489.0, 811255.0, 161659.0, 14820.0, 3111.0, 1064.0, 396.0, 215.0, 131.0, 59.0, 49.0, 26.0, 17.0, 14.0, 8.0, 10.0, 4.0, 0.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2244873046875, -0.2166728973388672, -0.20885848999023438, -0.20104408264160156, -0.19322967529296875, -0.18541526794433594, -0.17760086059570312, -0.1697864532470703, -0.1619720458984375, -0.1541576385498047, -0.14634323120117188, -0.13852882385253906, -0.13071441650390625, -0.12290000915527344, -0.11508560180664062, -0.10727119445800781, -0.099456787109375, -0.09164237976074219, -0.08382797241210938, -0.07601356506347656, -0.06819915771484375, -0.06038475036621094, -0.052570343017578125, -0.04475593566894531, -0.0369415283203125, -0.029127120971679688, -0.021312713623046875, -0.013498306274414062, -0.00568389892578125, 0.0021305084228515625, 0.009944915771484375, 0.017759323120117188, 0.02557373046875, 0.03338813781738281, 0.041202545166015625, 0.04901695251464844, 0.05683135986328125, 0.06464576721191406, 0.07246017456054688, 0.08027458190917969, 0.0880889892578125, 0.09590339660644531, 0.10371780395507812, 0.11153221130371094, 0.11934661865234375, 0.12716102600097656, 0.13497543334960938, 0.1427898406982422, 0.150604248046875, 0.1584186553955078, 0.16623306274414062, 0.17404747009277344, 0.18186187744140625, 0.18967628479003906, 0.19749069213867188, 0.2053050994873047, 0.2131195068359375, 0.2209339141845703, 0.22874832153320312, 0.23656272888183594, 0.24437713623046875, 0.25219154357910156, 0.2600059509277344, 0.2678203582763672, 0.275634765625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 1.0, 7.0, 6.0, 14.0, 7.0, 17.0, 28.0, 28.0, 43.0, 45.0, 31.0, 66.0, 67.0, 79.0, 62.0, 80.0, 58.0, 73.0, 57.0, 49.0, 39.0, 34.0, 21.0, 23.0, 18.0, 14.0, 6.0, 4.0, 10.0, 6.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.039031982421875, -0.03793978691101074, -0.036847591400146484, -0.03575539588928223, -0.03466320037841797, -0.03357100486755371, -0.03247880935668945, -0.031386613845825195, -0.030294418334960938, -0.02920222282409668, -0.028110027313232422, -0.027017831802368164, -0.025925636291503906, -0.02483344078063965, -0.02374124526977539, -0.022649049758911133, -0.021556854248046875, -0.020464658737182617, -0.01937246322631836, -0.0182802677154541, -0.017188072204589844, -0.016095876693725586, -0.015003681182861328, -0.01391148567199707, -0.012819290161132812, -0.011727094650268555, -0.010634899139404297, -0.009542703628540039, -0.008450508117675781, -0.0073583126068115234, -0.006266117095947266, -0.005173921585083008, -0.00408172607421875, -0.002989530563354492, -0.0018973350524902344, -0.0008051395416259766, 0.00028705596923828125, 0.001379251480102539, 0.002471446990966797, 0.0035636425018310547, 0.0046558380126953125, 0.00574803352355957, 0.006840229034423828, 0.007932424545288086, 0.009024620056152344, 0.010116815567016602, 0.01120901107788086, 0.012301206588745117, 0.013393402099609375, 0.014485597610473633, 0.01557779312133789, 0.01666998863220215, 0.017762184143066406, 0.018854379653930664, 0.019946575164794922, 0.02103877067565918, 0.022130966186523438, 0.023223161697387695, 0.024315357208251953, 0.02540755271911621, 0.02649974822998047, 0.027591943740844727, 0.028684139251708984, 0.029776334762573242, 0.0308685302734375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 3.0, 9.0, 10.0, 15.0, 24.0, 34.0, 37.0, 47.0, 75.0, 129.0, 215.0, 410.0, 873.0, 2357.0, 7612.0, 38147.0, 604759.0, 357876.0, 26308.0, 6001.0, 1923.0, 780.0, 371.0, 192.0, 115.0, 75.0, 46.0, 27.0, 15.0, 16.0, 8.0, 11.0, 3.0, 4.0, 7.0, 6.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.336669921875, -0.3277873992919922, -0.3189048767089844, -0.31002235412597656, -0.30113983154296875, -0.29225730895996094, -0.2833747863769531, -0.2744922637939453, -0.2656097412109375, -0.2567272186279297, -0.24784469604492188, -0.23896217346191406, -0.23007965087890625, -0.22119712829589844, -0.21231460571289062, -0.2034320831298828, -0.194549560546875, -0.1856670379638672, -0.17678451538085938, -0.16790199279785156, -0.15901947021484375, -0.15013694763183594, -0.14125442504882812, -0.1323719024658203, -0.1234893798828125, -0.11460685729980469, -0.10572433471679688, -0.09684181213378906, -0.08795928955078125, -0.07907676696777344, -0.07019424438476562, -0.06131172180175781, -0.05242919921875, -0.04354667663574219, -0.034664154052734375, -0.025781631469726562, -0.01689910888671875, -0.008016586303710938, 0.000865936279296875, 0.009748458862304688, 0.0186309814453125, 0.027513504028320312, 0.036396026611328125, 0.04527854919433594, 0.05416107177734375, 0.06304359436035156, 0.07192611694335938, 0.08080863952636719, 0.089691162109375, 0.09857368469238281, 0.10745620727539062, 0.11633872985839844, 0.12522125244140625, 0.13410377502441406, 0.14298629760742188, 0.1518688201904297, 0.1607513427734375, 0.1696338653564453, 0.17851638793945312, 0.18739891052246094, 0.19628143310546875, 0.20516395568847656, 0.21404647827148438, 0.2229290008544922, 0.2318115234375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 3.0, 3.0, 6.0, 11.0, 6.0, 9.0, 14.0, 19.0, 28.0, 35.0, 49.0, 70.0, 104.0, 164.0, 130.0, 84.0, 66.0, 57.0, 32.0, 19.0, 13.0, 10.0, 11.0, 6.0, 8.0, 8.0, 6.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002256631851196289, -0.0002185683697462082, -0.00021147355437278748, -0.00020437873899936676, -0.00019728392362594604, -0.00019018910825252533, -0.00018309429287910461, -0.0001759994775056839, -0.00016890466213226318, -0.00016180984675884247, -0.00015471503138542175, -0.00014762021601200104, -0.00014052540063858032, -0.0001334305852651596, -0.0001263357698917389, -0.00011924095451831818, -0.00011214613914489746, -0.00010505132377147675, -9.795650839805603e-05, -9.086169302463531e-05, -8.37668776512146e-05, -7.667206227779388e-05, -6.957724690437317e-05, -6.248243153095245e-05, -5.538761615753174e-05, -4.829280078411102e-05, -4.119798541069031e-05, -3.410317003726959e-05, -2.7008354663848877e-05, -1.991353929042816e-05, -1.2818723917007446e-05, -5.723908543586731e-06, 1.3709068298339844e-06, 8.4657222032547e-06, 1.5560537576675415e-05, 2.265535295009613e-05, 2.9750168323516846e-05, 3.684498369693756e-05, 4.3939799070358276e-05, 5.103461444377899e-05, 5.812942981719971e-05, 6.522424519062042e-05, 7.231906056404114e-05, 7.941387593746185e-05, 8.650869131088257e-05, 9.360350668430328e-05, 0.000100698322057724, 0.00010779313743114471, 0.00011488795280456543, 0.00012198276817798615, 0.00012907758355140686, 0.00013617239892482758, 0.0001432672142982483, 0.000150362029671669, 0.00015745684504508972, 0.00016455166041851044, 0.00017164647579193115, 0.00017874129116535187, 0.00018583610653877258, 0.0001929309219121933, 0.00020002573728561401, 0.00020712055265903473, 0.00021421536803245544, 0.00022131018340587616, 0.00022840499877929688]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 0.0, 3.0, 5.0, 7.0, 2.0, 4.0, 8.0, 14.0, 6.0, 16.0, 30.0, 56.0, 86.0, 151.0, 342.0, 876.0, 2486.0, 10215.0, 401465.0, 616336.0, 11729.0, 2881.0, 995.0, 390.0, 196.0, 87.0, 62.0, 29.0, 21.0, 14.0, 9.0, 7.0, 5.0, 4.0, 10.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61669921875, -0.595458984375, -0.57421875, -0.552978515625, -0.53173828125, -0.510498046875, -0.4892578125, -0.468017578125, -0.44677734375, -0.425537109375, -0.404296875, -0.383056640625, -0.36181640625, -0.340576171875, -0.3193359375, -0.298095703125, -0.27685546875, -0.255615234375, -0.234375, -0.213134765625, -0.19189453125, -0.170654296875, -0.1494140625, -0.128173828125, -0.10693359375, -0.085693359375, -0.064453125, -0.043212890625, -0.02197265625, -0.000732421875, 0.0205078125, 0.041748046875, 0.06298828125, 0.084228515625, 0.10546875, 0.126708984375, 0.14794921875, 0.169189453125, 0.1904296875, 0.211669921875, 0.23291015625, 0.254150390625, 0.275390625, 0.296630859375, 0.31787109375, 0.339111328125, 0.3603515625, 0.381591796875, 0.40283203125, 0.424072265625, 0.4453125, 0.466552734375, 0.48779296875, 0.509033203125, 0.5302734375, 0.551513671875, 0.57275390625, 0.593994140625, 0.615234375, 0.636474609375, 0.65771484375, 0.678955078125, 0.7001953125, 0.721435546875, 0.74267578125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 13.0, 15.0, 12.0, 25.0, 39.0, 65.0, 110.0, 136.0, 183.0, 139.0, 85.0, 62.0, 27.0, 22.0, 10.0, 9.0, 12.0, 8.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07952880859375, -0.0753946304321289, -0.07126045227050781, -0.06712627410888672, -0.06299209594726562, -0.05885791778564453, -0.05472373962402344, -0.050589561462402344, -0.04645538330078125, -0.042321205139160156, -0.03818702697753906, -0.03405284881591797, -0.029918670654296875, -0.02578449249267578, -0.021650314331054688, -0.017516136169433594, -0.0133819580078125, -0.009247779846191406, -0.0051136016845703125, -0.0009794235229492188, 0.003154754638671875, 0.007288932800292969, 0.011423110961914062, 0.015557289123535156, 0.01969146728515625, 0.023825645446777344, 0.027959823608398438, 0.03209400177001953, 0.036228179931640625, 0.04036235809326172, 0.04449653625488281, 0.048630714416503906, 0.052764892578125, 0.056899070739746094, 0.06103324890136719, 0.06516742706298828, 0.06930160522460938, 0.07343578338623047, 0.07756996154785156, 0.08170413970947266, 0.08583831787109375, 0.08997249603271484, 0.09410667419433594, 0.09824085235595703, 0.10237503051757812, 0.10650920867919922, 0.11064338684082031, 0.1147775650024414, 0.1189117431640625, 0.1230459213256836, 0.1271800994873047, 0.13131427764892578, 0.13544845581054688, 0.13958263397216797, 0.14371681213378906, 0.14785099029541016, 0.15198516845703125, 0.15611934661865234, 0.16025352478027344, 0.16438770294189453, 0.16852188110351562, 0.17265605926513672, 0.1767902374267578, 0.1809244155883789, 0.18505859375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 10.0, 20.0, 60.0, 253.0, 410.0, 190.0, 34.0, 12.0, 5.0, 8.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4380416870117188, -2.3689815998077393, -2.2999215126037598, -2.2308614253997803, -2.161801338195801, -2.0927412509918213, -2.023681163787842, -1.9546210765838623, -1.8855609893798828, -1.8165009021759033, -1.7474408149719238, -1.6783807277679443, -1.6093206405639648, -1.5402605533599854, -1.4712004661560059, -1.4021403789520264, -1.3330804109573364, -1.264020323753357, -1.1949602365493774, -1.125900149345398, -1.0568400621414185, -0.987779974937439, -0.9187199473381042, -0.8496598601341248, -0.7805997729301453, -0.7115396857261658, -0.6424795985221863, -0.5734195709228516, -0.5043594837188721, -0.4352993667125702, -0.3662393093109131, -0.2971792221069336, -0.22811925411224365, -0.15905916690826416, -0.08999909460544586, -0.020939022302627563, 0.04812106490135193, 0.11718115210533142, 0.18624120950698853, 0.255301296710968, 0.3243613839149475, 0.393421471118927, 0.4624815583229065, 0.5315415859222412, 0.6006016731262207, 0.6696617603302002, 0.7387218475341797, 0.8077819347381592, 0.8768420219421387, 0.9459021091461182, 1.0149621963500977, 1.0840222835540771, 1.1530823707580566, 1.2221424579620361, 1.2912025451660156, 1.3602626323699951, 1.4293227195739746, 1.498382806777954, 1.5674428939819336, 1.636502981185913, 1.7055630683898926, 1.774623155593872, 1.8436832427978516, 1.912743330001831, 1.981803297996521]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 10.0, 9.0, 11.0, 19.0, 20.0, 32.0, 30.0, 47.0, 53.0, 57.0, 81.0, 77.0, 67.0, 62.0, 73.0, 76.0, 57.0, 47.0, 45.0, 35.0, 24.0, 24.0, 19.0, 12.0, 9.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2689148783683777, -0.2575604021549225, -0.24620594084262848, -0.23485146462917328, -0.22349700331687927, -0.21214252710342407, -0.20078805088996887, -0.18943358957767487, -0.17807912826538086, -0.16672465205192566, -0.15537019073963165, -0.14401571452617645, -0.13266125321388245, -0.12130677700042725, -0.10995230823755264, -0.09859783947467804, -0.08724336326122284, -0.07588889449834824, -0.06453442573547363, -0.05317995324730873, -0.04182548448443413, -0.030471015721559525, -0.019116543233394623, -0.0077620744705200195, 0.0035923942923545837, 0.014946863986551762, 0.02630133368074894, 0.03765580430626869, 0.049010273069143295, 0.0603647418320179, 0.0717192143201828, 0.0830736830830574, 0.094428151845932, 0.10578262060880661, 0.11713708937168121, 0.1284915655851364, 0.13984602689743042, 0.15120050311088562, 0.16255497932434082, 0.17390944063663483, 0.18526390194892883, 0.19661837816238403, 0.20797283947467804, 0.21932731568813324, 0.23068177700042725, 0.24203625321388245, 0.25339072942733765, 0.26474517583847046, 0.27609968185424805, 0.28745415806770325, 0.29880863428115845, 0.31016308069229126, 0.32151755690574646, 0.33287203311920166, 0.34422650933265686, 0.35558098554611206, 0.3669354319572449, 0.3782899081707001, 0.3896443843841553, 0.4009988307952881, 0.4123533070087433, 0.4237077832221985, 0.4350622594356537, 0.4464167356491089, 0.4577711820602417]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 1.0, 8.0, 11.0, 15.0, 16.0, 29.0, 69.0, 67.0, 164.0, 291.0, 1209.0, 4184518.0, 6755.0, 424.0, 196.0, 118.0, 104.0, 78.0, 52.0, 43.0, 42.0, 21.0, 12.0, 8.0, 8.0, 10.0, 5.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76611328125, -0.7172470092773438, -0.6683807373046875, -0.6195144653320312, -0.570648193359375, -0.5217819213867188, -0.4729156494140625, -0.42404937744140625, -0.37518310546875, -0.32631683349609375, -0.2774505615234375, -0.22858428955078125, -0.179718017578125, -0.13085174560546875, -0.0819854736328125, -0.03311920166015625, 0.0157470703125, 0.06461334228515625, 0.1134796142578125, 0.16234588623046875, 0.211212158203125, 0.26007843017578125, 0.3089447021484375, 0.35781097412109375, 0.40667724609375, 0.45554351806640625, 0.5044097900390625, 0.5532760620117188, 0.602142333984375, 0.6510086059570312, 0.6998748779296875, 0.7487411499023438, 0.797607421875, 0.8464736938476562, 0.8953399658203125, 0.9442062377929688, 0.993072509765625, 1.0419387817382812, 1.0908050537109375, 1.1396713256835938, 1.18853759765625, 1.2374038696289062, 1.2862701416015625, 1.3351364135742188, 1.384002685546875, 1.4328689575195312, 1.4817352294921875, 1.5306015014648438, 1.5794677734375, 1.6283340454101562, 1.6772003173828125, 1.7260665893554688, 1.774932861328125, 1.8237991333007812, 1.8726654052734375, 1.9215316772460938, 1.97039794921875, 2.0192642211914062, 2.0681304931640625, 2.1169967651367188, 2.165863037109375, 2.2147293090820312, 2.2635955810546875, 2.3124618530273438, 2.361328125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 13.0, 35.0, 86.0, 168.0, 199.0, 232.0, 141.0, 92.0, 30.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006855010986328125, -0.006230056285858154, -0.005605101585388184, -0.004980146884918213, -0.004355192184448242, -0.0037302374839782715, -0.0031052827835083008, -0.00248032808303833, -0.0018553733825683594, -0.0012304186820983887, -0.000605463981628418, 1.9490718841552734e-05, 0.0006444454193115234, 0.0012694001197814941, 0.0018943548202514648, 0.0025193095207214355, 0.0031442642211914062, 0.003769218921661377, 0.004394173622131348, 0.005019128322601318, 0.005644083023071289, 0.00626903772354126, 0.0068939924240112305, 0.007518947124481201, 0.008143901824951172, 0.008768856525421143, 0.009393811225891113, 0.010018765926361084, 0.010643720626831055, 0.011268675327301025, 0.011893630027770996, 0.012518584728240967, 0.013143539428710938, 0.013768494129180908, 0.014393448829650879, 0.01501840353012085, 0.01564335823059082, 0.01626831293106079, 0.01689326763153076, 0.017518222332000732, 0.018143177032470703, 0.018768131732940674, 0.019393086433410645, 0.020018041133880615, 0.020642995834350586, 0.021267950534820557, 0.021892905235290527, 0.022517859935760498, 0.02314281463623047, 0.02376776933670044, 0.02439272403717041, 0.02501767873764038, 0.02564263343811035, 0.026267588138580322, 0.026892542839050293, 0.027517497539520264, 0.028142452239990234, 0.028767406940460205, 0.029392361640930176, 0.030017316341400146, 0.030642271041870117, 0.03126722574234009, 0.03189218044281006, 0.03251713514328003, 0.03314208984375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 12.0, 20.0, 52.0, 126.0, 279.0, 936.0, 5795.0, 3976822.0, 206688.0, 2647.0, 552.0, 198.0, 87.0, 33.0, 20.0, 9.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.345703125, -1.30474853515625, -1.2637939453125, -1.22283935546875, -1.181884765625, -1.14093017578125, -1.0999755859375, -1.05902099609375, -1.01806640625, -0.97711181640625, -0.9361572265625, -0.89520263671875, -0.854248046875, -0.81329345703125, -0.7723388671875, -0.73138427734375, -0.6904296875, -0.64947509765625, -0.6085205078125, -0.56756591796875, -0.526611328125, -0.48565673828125, -0.4447021484375, -0.40374755859375, -0.36279296875, -0.32183837890625, -0.2808837890625, -0.23992919921875, -0.198974609375, -0.15802001953125, -0.1170654296875, -0.07611083984375, -0.03515625, 0.00579833984375, 0.0467529296875, 0.08770751953125, 0.128662109375, 0.16961669921875, 0.2105712890625, 0.25152587890625, 0.29248046875, 0.33343505859375, 0.3743896484375, 0.41534423828125, 0.456298828125, 0.49725341796875, 0.5382080078125, 0.57916259765625, 0.6201171875, 0.66107177734375, 0.7020263671875, 0.74298095703125, 0.783935546875, 0.82489013671875, 0.8658447265625, 0.90679931640625, 0.94775390625, 0.98870849609375, 1.0296630859375, 1.07061767578125, 1.111572265625, 1.15252685546875, 1.1934814453125, 1.23443603515625, 1.275390625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 7.0, 12.0, 23.0, 55.0, 120.0, 375.0, 1794.0, 1145.0, 303.0, 122.0, 68.0, 20.0, 9.0, 6.0, 5.0, 4.0, 1.0, 1.0], "bins": [-0.1353759765625, -0.13281464576721191, -0.13025331497192383, -0.12769198417663574, -0.12513065338134766, -0.12256932258605957, -0.12000799179077148, -0.1174466609954834, -0.11488533020019531, -0.11232399940490723, -0.10976266860961914, -0.10720133781433105, -0.10464000701904297, -0.10207867622375488, -0.0995173454284668, -0.09695601463317871, -0.09439468383789062, -0.09183335304260254, -0.08927202224731445, -0.08671069145202637, -0.08414936065673828, -0.0815880298614502, -0.07902669906616211, -0.07646536827087402, -0.07390403747558594, -0.07134270668029785, -0.06878137588500977, -0.06622004508972168, -0.0636587142944336, -0.06109738349914551, -0.05853605270385742, -0.055974721908569336, -0.05341339111328125, -0.050852060317993164, -0.04829072952270508, -0.04572939872741699, -0.043168067932128906, -0.04060673713684082, -0.038045406341552734, -0.03548407554626465, -0.03292274475097656, -0.030361413955688477, -0.02780008316040039, -0.025238752365112305, -0.02267742156982422, -0.020116090774536133, -0.017554759979248047, -0.014993429183959961, -0.012432098388671875, -0.009870767593383789, -0.007309436798095703, -0.004748106002807617, -0.0021867752075195312, 0.0003745555877685547, 0.0029358863830566406, 0.0054972171783447266, 0.008058547973632812, 0.010619878768920898, 0.013181209564208984, 0.01574254035949707, 0.018303871154785156, 0.020865201950073242, 0.023426532745361328, 0.025987863540649414, 0.0285491943359375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 6.0, 20.0, 88.0, 306.0, 363.0, 141.0, 46.0, 21.0, 6.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6346023082733154, -1.599168062210083, -1.5637339353561401, -1.5282996892929077, -1.4928655624389648, -1.4574313163757324, -1.4219971895217896, -1.3865629434585571, -1.3511288166046143, -1.3156945705413818, -1.280260443687439, -1.2448261976242065, -1.2093920707702637, -1.1739578247070312, -1.1385236978530884, -1.103089451789856, -1.067655324935913, -1.0322210788726807, -0.9967869520187378, -0.9613527655601501, -0.9259185791015625, -0.8904843926429749, -0.8550502061843872, -0.8196159601211548, -0.7841817140579224, -0.7487475275993347, -0.7133133411407471, -0.6778791546821594, -0.6424449682235718, -0.6070107817649841, -0.5715765953063965, -0.5361423492431641, -0.5007082223892212, -0.46527403593063354, -0.4298398494720459, -0.39440566301345825, -0.3589714765548706, -0.32353729009628296, -0.2881030738353729, -0.2526688873767853, -0.21723470091819763, -0.18180051445960999, -0.14636632800102234, -0.1109321266412735, -0.07549794018268585, -0.040063753724098206, -0.004629552364349365, 0.03080463409423828, 0.06623882055282593, 0.10167300701141357, 0.13710719347000122, 0.17254139482975006, 0.2079755812883377, 0.24340976774692535, 0.2788439691066742, 0.31427815556526184, 0.3497123420238495, 0.38514652848243713, 0.4205807149410248, 0.4560149312019348, 0.49144911766052246, 0.5268833041191101, 0.5623174905776978, 0.5977516770362854, 0.633185863494873]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 8.0, 15.0, 12.0, 35.0, 45.0, 66.0, 77.0, 84.0, 94.0, 90.0, 82.0, 67.0, 75.0, 67.0, 54.0, 30.0, 41.0, 24.0, 13.0, 11.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3203514814376831, -0.30962052941322327, -0.2988895773887634, -0.288158655166626, -0.27742770314216614, -0.2666967511177063, -0.25596579909324646, -0.24523484706878662, -0.23450389504432678, -0.22377294301986694, -0.2130420058965683, -0.20231105387210846, -0.19158010184764862, -0.18084916472434998, -0.17011821269989014, -0.1593872606754303, -0.14865632355213165, -0.13792537152767181, -0.12719443440437317, -0.11646348237991333, -0.10573253035545349, -0.09500158578157425, -0.08427064120769501, -0.07353968918323517, -0.06280874460935593, -0.052077796310186386, -0.041346848011016846, -0.030615903437137604, -0.019884955137968063, -0.009154006838798523, 0.001576937735080719, 0.012307889759540558, 0.0230388343334198, 0.03376978263258934, 0.04450073093175888, 0.05523167550563812, 0.06596262753009796, 0.0766935721039772, 0.08742451667785645, 0.09815546870231628, 0.10888641327619553, 0.11961735785007477, 0.1303483098745346, 0.14107924699783325, 0.1518101990222931, 0.16254115104675293, 0.17327210307121277, 0.1840030550956726, 0.19473399221897125, 0.2054649442434311, 0.21619588136672974, 0.22692683339118958, 0.23765778541564941, 0.24838873744010925, 0.2591196894645691, 0.26985061168670654, 0.2805815637111664, 0.2913125157356262, 0.30204346776008606, 0.3127744197845459, 0.32350534200668335, 0.3342362940311432, 0.344967246055603, 0.35569819808006287, 0.3664291501045227]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 3.0, 9.0, 5.0, 9.0, 11.0, 11.0, 7.0, 11.0, 13.0, 26.0, 41.0, 30.0, 28.0, 25.0, 34.0, 77.0, 161.0, 547.0, 5340.0, 369783.0, 662576.0, 8580.0, 653.0, 180.0, 69.0, 47.0, 39.0, 27.0, 33.0, 23.0, 16.0, 28.0, 19.0, 12.0, 13.0, 9.0, 13.0, 8.0, 5.0, 3.0, 3.0, 1.0, 6.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.5263671875, -0.5082626342773438, -0.4901580810546875, -0.47205352783203125, -0.453948974609375, -0.43584442138671875, -0.4177398681640625, -0.39963531494140625, -0.38153076171875, -0.36342620849609375, -0.3453216552734375, -0.32721710205078125, -0.309112548828125, -0.29100799560546875, -0.2729034423828125, -0.25479888916015625, -0.2366943359375, -0.21858978271484375, -0.2004852294921875, -0.18238067626953125, -0.164276123046875, -0.14617156982421875, -0.1280670166015625, -0.10996246337890625, -0.09185791015625, -0.07375335693359375, -0.0556488037109375, -0.03754425048828125, -0.019439697265625, -0.00133514404296875, 0.0167694091796875, 0.03487396240234375, 0.052978515625, 0.07108306884765625, 0.0891876220703125, 0.10729217529296875, 0.125396728515625, 0.14350128173828125, 0.1616058349609375, 0.17971038818359375, 0.19781494140625, 0.21591949462890625, 0.2340240478515625, 0.25212860107421875, 0.270233154296875, 0.28833770751953125, 0.3064422607421875, 0.32454681396484375, 0.3426513671875, 0.36075592041015625, 0.3788604736328125, 0.39696502685546875, 0.415069580078125, 0.43317413330078125, 0.4512786865234375, 0.46938323974609375, 0.48748779296875, 0.5055923461914062, 0.5236968994140625, 0.5418014526367188, 0.559906005859375, 0.5780105590820312, 0.5961151123046875, 0.6142196655273438, 0.63232421875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 6.0, 16.0, 24.0, 25.0, 47.0, 62.0, 68.0, 86.0, 88.0, 103.0, 102.0, 66.0, 78.0, 53.0, 48.0, 32.0, 31.0, 26.0, 10.0, 17.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01837158203125, -0.017791032791137695, -0.01721048355102539, -0.016629934310913086, -0.01604938507080078, -0.015468835830688477, -0.014888286590576172, -0.014307737350463867, -0.013727188110351562, -0.013146638870239258, -0.012566089630126953, -0.011985540390014648, -0.011404991149902344, -0.010824441909790039, -0.010243892669677734, -0.00966334342956543, -0.009082794189453125, -0.00850224494934082, -0.007921695709228516, -0.007341146469116211, -0.006760597229003906, -0.0061800479888916016, -0.005599498748779297, -0.005018949508666992, -0.0044384002685546875, -0.003857851028442383, -0.003277301788330078, -0.0026967525482177734, -0.0021162033081054688, -0.001535654067993164, -0.0009551048278808594, -0.0003745555877685547, 0.00020599365234375, 0.0007865428924560547, 0.0013670921325683594, 0.001947641372680664, 0.0025281906127929688, 0.0031087398529052734, 0.003689289093017578, 0.004269838333129883, 0.0048503875732421875, 0.005430936813354492, 0.006011486053466797, 0.0065920352935791016, 0.007172584533691406, 0.007753133773803711, 0.008333683013916016, 0.00891423225402832, 0.009494781494140625, 0.01007533073425293, 0.010655879974365234, 0.011236429214477539, 0.011816978454589844, 0.012397527694702148, 0.012978076934814453, 0.013558626174926758, 0.014139175415039062, 0.014719724655151367, 0.015300273895263672, 0.015880823135375977, 0.01646137237548828, 0.017041921615600586, 0.01762247085571289, 0.018203020095825195, 0.0187835693359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 4.0, 7.0, 11.0, 13.0, 13.0, 21.0, 41.0, 63.0, 62.0, 104.0, 159.0, 244.0, 390.0, 679.0, 1226.0, 2671.0, 7509.0, 31225.0, 203289.0, 602482.0, 160443.0, 26033.0, 6575.0, 2428.0, 1155.0, 595.0, 365.0, 245.0, 163.0, 110.0, 60.0, 52.0, 32.0, 26.0, 20.0, 7.0, 12.0, 2.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.1798095703125, -0.17487525939941406, -0.16994094848632812, -0.1650066375732422, -0.16007232666015625, -0.1551380157470703, -0.15020370483398438, -0.14526939392089844, -0.1403350830078125, -0.13540077209472656, -0.13046646118164062, -0.1255321502685547, -0.12059783935546875, -0.11566352844238281, -0.11072921752929688, -0.10579490661621094, -0.100860595703125, -0.09592628479003906, -0.09099197387695312, -0.08605766296386719, -0.08112335205078125, -0.07618904113769531, -0.07125473022460938, -0.06632041931152344, -0.0613861083984375, -0.05645179748535156, -0.051517486572265625, -0.04658317565917969, -0.04164886474609375, -0.03671455383300781, -0.031780242919921875, -0.026845932006835938, -0.02191162109375, -0.016977310180664062, -0.012042999267578125, -0.0071086883544921875, -0.00217437744140625, 0.0027599334716796875, 0.007694244384765625, 0.012628555297851562, 0.0175628662109375, 0.022497177124023438, 0.027431488037109375, 0.03236579895019531, 0.03730010986328125, 0.04223442077636719, 0.047168731689453125, 0.05210304260253906, 0.057037353515625, 0.06197166442871094, 0.06690597534179688, 0.07184028625488281, 0.07677459716796875, 0.08170890808105469, 0.08664321899414062, 0.09157752990722656, 0.0965118408203125, 0.10144615173339844, 0.10638046264648438, 0.11131477355957031, 0.11624908447265625, 0.12118339538574219, 0.12611770629882812, 0.13105201721191406, 0.135986328125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 3.0, 9.0, 9.0, 14.0, 17.0, 18.0, 18.0, 30.0, 27.0, 21.0, 34.0, 42.0, 52.0, 36.0, 29.0, 42.0, 36.0, 50.0, 31.0, 34.0, 64.0, 43.0, 31.0, 37.0, 30.0, 38.0, 29.0, 25.0, 20.0, 27.0, 15.0, 14.0, 12.0, 14.0, 7.0, 4.0, 6.0, 7.0, 8.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043731689453125, -0.042237281799316406, -0.04074287414550781, -0.03924846649169922, -0.037754058837890625, -0.03625965118408203, -0.03476524353027344, -0.033270835876464844, -0.03177642822265625, -0.030282020568847656, -0.028787612915039062, -0.02729320526123047, -0.025798797607421875, -0.02430438995361328, -0.022809982299804688, -0.021315574645996094, -0.0198211669921875, -0.018326759338378906, -0.016832351684570312, -0.015337944030761719, -0.013843536376953125, -0.012349128723144531, -0.010854721069335938, -0.009360313415527344, -0.00786590576171875, -0.006371498107910156, -0.0048770904541015625, -0.0033826828002929688, -0.001888275146484375, -0.00039386749267578125, 0.0011005401611328125, 0.0025949478149414062, 0.00408935546875, 0.005583763122558594, 0.0070781707763671875, 0.008572578430175781, 0.010066986083984375, 0.011561393737792969, 0.013055801391601562, 0.014550209045410156, 0.01604461669921875, 0.017539024353027344, 0.019033432006835938, 0.02052783966064453, 0.022022247314453125, 0.02351665496826172, 0.025011062622070312, 0.026505470275878906, 0.0279998779296875, 0.029494285583496094, 0.030988693237304688, 0.03248310089111328, 0.033977508544921875, 0.03547191619873047, 0.03696632385253906, 0.038460731506347656, 0.03995513916015625, 0.041449546813964844, 0.04294395446777344, 0.04443836212158203, 0.045932769775390625, 0.04742717742919922, 0.04892158508300781, 0.050415992736816406, 0.051910400390625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 8.0, 4.0, 9.0, 14.0, 25.0, 19.0, 54.0, 75.0, 111.0, 172.0, 316.0, 573.0, 1281.0, 3004.0, 9203.0, 42011.0, 275916.0, 566008.0, 119760.0, 20431.0, 5589.0, 2050.0, 868.0, 424.0, 238.0, 150.0, 74.0, 50.0, 38.0, 22.0, 19.0, 9.0, 5.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.149169921875, -0.14505863189697266, -0.1409473419189453, -0.13683605194091797, -0.13272476196289062, -0.12861347198486328, -0.12450218200683594, -0.1203908920288086, -0.11627960205078125, -0.1121683120727539, -0.10805702209472656, -0.10394573211669922, -0.09983444213867188, -0.09572315216064453, -0.09161186218261719, -0.08750057220458984, -0.0833892822265625, -0.07927799224853516, -0.07516670227050781, -0.07105541229248047, -0.06694412231445312, -0.06283283233642578, -0.05872154235839844, -0.054610252380371094, -0.05049896240234375, -0.046387672424316406, -0.04227638244628906, -0.03816509246826172, -0.034053802490234375, -0.02994251251220703, -0.025831222534179688, -0.021719932556152344, -0.017608642578125, -0.013497352600097656, -0.009386062622070312, -0.005274772644042969, -0.001163482666015625, 0.0029478073120117188, 0.0070590972900390625, 0.011170387268066406, 0.01528167724609375, 0.019392967224121094, 0.023504257202148438, 0.02761554718017578, 0.031726837158203125, 0.03583812713623047, 0.03994941711425781, 0.044060707092285156, 0.0481719970703125, 0.052283287048339844, 0.05639457702636719, 0.06050586700439453, 0.06461715698242188, 0.06872844696044922, 0.07283973693847656, 0.0769510269165039, 0.08106231689453125, 0.0851736068725586, 0.08928489685058594, 0.09339618682861328, 0.09750747680664062, 0.10161876678466797, 0.10573005676269531, 0.10984134674072266, 0.11395263671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 10.0, 5.0, 17.0, 20.0, 23.0, 18.0, 24.0, 38.0, 56.0, 65.0, 98.0, 106.0, 114.0, 78.0, 76.0, 52.0, 32.0, 34.0, 26.0, 12.0, 26.0, 11.0, 16.0, 7.0, 6.0, 9.0, 4.0, 9.0, 3.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013518333435058594, -0.0001301392912864685, -0.00012509524822235107, -0.00012005120515823364, -0.00011500716209411621, -0.00010996311902999878, -0.00010491907596588135, -9.987503290176392e-05, -9.483098983764648e-05, -8.978694677352905e-05, -8.474290370941162e-05, -7.969886064529419e-05, -7.465481758117676e-05, -6.961077451705933e-05, -6.45667314529419e-05, -5.952268838882446e-05, -5.447864532470703e-05, -4.94346022605896e-05, -4.439055919647217e-05, -3.9346516132354736e-05, -3.4302473068237305e-05, -2.9258430004119873e-05, -2.421438694000244e-05, -1.917034387588501e-05, -1.4126300811767578e-05, -9.082257747650146e-06, -4.038214683532715e-06, 1.0058283805847168e-06, 6.0498714447021484e-06, 1.109391450881958e-05, 1.6137957572937012e-05, 2.1182000637054443e-05, 2.6226043701171875e-05, 3.127008676528931e-05, 3.631412982940674e-05, 4.135817289352417e-05, 4.64022159576416e-05, 5.144625902175903e-05, 5.6490302085876465e-05, 6.15343451499939e-05, 6.657838821411133e-05, 7.162243127822876e-05, 7.666647434234619e-05, 8.171051740646362e-05, 8.675456047058105e-05, 9.179860353469849e-05, 9.684264659881592e-05, 0.00010188668966293335, 0.00010693073272705078, 0.00011197477579116821, 0.00011701881885528564, 0.00012206286191940308, 0.0001271069049835205, 0.00013215094804763794, 0.00013719499111175537, 0.0001422390341758728, 0.00014728307723999023, 0.00015232712030410767, 0.0001573711633682251, 0.00016241520643234253, 0.00016745924949645996, 0.0001725032925605774, 0.00017754733562469482, 0.00018259137868881226, 0.0001876354217529297]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 7.0, 4.0, 10.0, 20.0, 18.0, 51.0, 58.0, 107.0, 237.0, 464.0, 1121.0, 3226.0, 16491.0, 261016.0, 701165.0, 54652.0, 6538.0, 1890.0, 740.0, 319.0, 192.0, 83.0, 39.0, 30.0, 22.0, 6.0, 8.0, 10.0, 4.0, 8.0, 4.0, 1.0, 1.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1627197265625, -0.15627288818359375, -0.1498260498046875, -0.14337921142578125, -0.136932373046875, -0.13048553466796875, -0.1240386962890625, -0.11759185791015625, -0.11114501953125, -0.10469818115234375, -0.0982513427734375, -0.09180450439453125, -0.085357666015625, -0.07891082763671875, -0.0724639892578125, -0.06601715087890625, -0.0595703125, -0.05312347412109375, -0.0466766357421875, -0.04022979736328125, -0.033782958984375, -0.02733612060546875, -0.0208892822265625, -0.01444244384765625, -0.00799560546875, -0.00154876708984375, 0.0048980712890625, 0.01134490966796875, 0.017791748046875, 0.02423858642578125, 0.0306854248046875, 0.03713226318359375, 0.0435791015625, 0.05002593994140625, 0.0564727783203125, 0.06291961669921875, 0.069366455078125, 0.07581329345703125, 0.0822601318359375, 0.08870697021484375, 0.09515380859375, 0.10160064697265625, 0.1080474853515625, 0.11449432373046875, 0.120941162109375, 0.12738800048828125, 0.1338348388671875, 0.14028167724609375, 0.146728515625, 0.15317535400390625, 0.1596221923828125, 0.16606903076171875, 0.172515869140625, 0.17896270751953125, 0.1854095458984375, 0.19185638427734375, 0.19830322265625, 0.20475006103515625, 0.2111968994140625, 0.21764373779296875, 0.224090576171875, 0.23053741455078125, 0.2369842529296875, 0.24343109130859375, 0.2498779296875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 10.0, 14.0, 15.0, 33.0, 41.0, 56.0, 55.0, 64.0, 113.0, 87.0, 103.0, 104.0, 86.0, 55.0, 53.0, 33.0, 19.0, 20.0, 14.0, 9.0, 6.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045013427734375, -0.04234170913696289, -0.03966999053955078, -0.03699827194213867, -0.03432655334472656, -0.03165483474731445, -0.028983116149902344, -0.026311397552490234, -0.023639678955078125, -0.020967960357666016, -0.018296241760253906, -0.015624523162841797, -0.012952804565429688, -0.010281085968017578, -0.007609367370605469, -0.004937648773193359, -0.00226593017578125, 0.0004057884216308594, 0.0030775070190429688, 0.005749225616455078, 0.008420944213867188, 0.011092662811279297, 0.013764381408691406, 0.016436100006103516, 0.019107818603515625, 0.021779537200927734, 0.024451255798339844, 0.027122974395751953, 0.029794692993164062, 0.03246641159057617, 0.03513813018798828, 0.03780984878540039, 0.0404815673828125, 0.04315328598022461, 0.04582500457763672, 0.04849672317504883, 0.05116844177246094, 0.05384016036987305, 0.056511878967285156, 0.059183597564697266, 0.061855316162109375, 0.06452703475952148, 0.0671987533569336, 0.0698704719543457, 0.07254219055175781, 0.07521390914916992, 0.07788562774658203, 0.08055734634399414, 0.08322906494140625, 0.08590078353881836, 0.08857250213623047, 0.09124422073364258, 0.09391593933105469, 0.0965876579284668, 0.0992593765258789, 0.10193109512329102, 0.10460281372070312, 0.10727453231811523, 0.10994625091552734, 0.11261796951293945, 0.11528968811035156, 0.11796140670776367, 0.12063312530517578, 0.12330484390258789, 0.1259765625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 11.0, 21.0, 57.0, 168.0, 315.0, 283.0, 94.0, 33.0, 11.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.343329668045044, -2.2920548915863037, -2.2407801151275635, -2.1895053386688232, -2.138230562210083, -2.0869557857513428, -2.0356810092926025, -1.9844063520431519, -1.9331315755844116, -1.8818567991256714, -1.8305820226669312, -1.779307246208191, -1.7280324697494507, -1.6767578125, -1.6254830360412598, -1.5742082595825195, -1.5229334831237793, -1.471658706665039, -1.4203839302062988, -1.3691091537475586, -1.3178343772888184, -1.2665596008300781, -1.215284824371338, -1.1640101671218872, -1.1127352714538574, -1.0614604949951172, -1.010185718536377, -0.9589109420776367, -0.9076362252235413, -0.856361448764801, -0.8050866723060608, -0.7538119554519653, -0.7025371193885803, -0.6512623429298401, -0.5999875664710999, -0.5487128496170044, -0.49743807315826416, -0.4461632966995239, -0.3948885202407837, -0.34361377358436584, -0.2923389971256256, -0.24106423556804657, -0.18978947401046753, -0.1385146975517273, -0.08723993599414825, -0.035965174436569214, 0.01530960202217102, 0.06658434867858887, 0.1178591251373291, 0.16913388669490814, 0.22040864825248718, 0.2716834247112274, 0.32295817136764526, 0.3742329478263855, 0.42550772428512573, 0.4767824709415436, 0.5280572175979614, 0.5793319940567017, 0.6306067705154419, 0.6818815469741821, 0.7331562638282776, 0.7844310402870178, 0.8357058167457581, 0.8869805335998535, 0.9382553696632385]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 6.0, 2.0, 3.0, 11.0, 6.0, 14.0, 17.0, 13.0, 26.0, 21.0, 23.0, 31.0, 33.0, 37.0, 35.0, 42.0, 32.0, 32.0, 45.0, 61.0, 53.0, 46.0, 45.0, 42.0, 37.0, 35.0, 32.0, 26.0, 37.0, 21.0, 31.0, 15.0, 14.0, 13.0, 10.0, 15.0, 6.0, 9.0, 5.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.3799285292625427, -0.3681080937385559, -0.3562876880168915, -0.34446725249290466, -0.33264681696891785, -0.32082638144493103, -0.3090059757232666, -0.2971855401992798, -0.28536510467529297, -0.27354466915130615, -0.2617242634296417, -0.2499038279056549, -0.2380833923816681, -0.22626297175884247, -0.21444255113601685, -0.20262211561203003, -0.1908016949892044, -0.17898127436637878, -0.16716083884239197, -0.15534041821956635, -0.14351998269557953, -0.1316995620727539, -0.11987913399934769, -0.10805870592594147, -0.09623827785253525, -0.08441784977912903, -0.07259742170572281, -0.06077699735760689, -0.04895656928420067, -0.03713614121079445, -0.025315716862678528, -0.013495288789272308, -0.0016748607158660889, 0.010145566426217556, 0.0219659935683012, 0.03378641977906227, 0.04560684785246849, 0.05742727592587471, 0.06924770027399063, 0.08106812834739685, 0.09288855642080307, 0.10470898449420929, 0.11652941256761551, 0.12834984064102173, 0.14017026126384735, 0.15199069678783417, 0.1638111174106598, 0.1756315529346466, 0.18745197355747223, 0.19927239418029785, 0.21109282970428467, 0.2229132503271103, 0.2347336858510971, 0.24655410647392273, 0.25837454199790955, 0.270194947719574, 0.2820153832435608, 0.2938358187675476, 0.30565622448921204, 0.31747666001319885, 0.32929709553718567, 0.3411175310611725, 0.3529379367828369, 0.36475837230682373, 0.37657880783081055]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 7.0, 6.0, 10.0, 16.0, 18.0, 17.0, 29.0, 41.0, 64.0, 79.0, 127.0, 209.0, 533.0, 2659.0, 38430.0, 3972726.0, 172666.0, 5198.0, 665.0, 191.0, 116.0, 90.0, 57.0, 44.0, 43.0, 32.0, 30.0, 19.0, 20.0, 15.0, 20.0, 14.0, 7.0, 10.0, 11.0, 10.0, 8.0, 1.0, 6.0, 3.0, 4.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.457275390625, -0.4401359558105469, -0.42299652099609375, -0.4058570861816406, -0.3887176513671875, -0.3715782165527344, -0.35443878173828125, -0.3372993469238281, -0.320159912109375, -0.3030204772949219, -0.28588104248046875, -0.2687416076660156, -0.2516021728515625, -0.23446273803710938, -0.21732330322265625, -0.20018386840820312, -0.18304443359375, -0.16590499877929688, -0.14876556396484375, -0.13162612915039062, -0.1144866943359375, -0.09734725952148438, -0.08020782470703125, -0.06306838989257812, -0.045928955078125, -0.028789520263671875, -0.01165008544921875, 0.005489349365234375, 0.0226287841796875, 0.039768218994140625, 0.05690765380859375, 0.07404708862304688, 0.0911865234375, 0.10832595825195312, 0.12546539306640625, 0.14260482788085938, 0.1597442626953125, 0.17688369750976562, 0.19402313232421875, 0.21116256713867188, 0.228302001953125, 0.24544143676757812, 0.26258087158203125, 0.2797203063964844, 0.2968597412109375, 0.3139991760253906, 0.33113861083984375, 0.3482780456542969, 0.36541748046875, 0.3825569152832031, 0.39969635009765625, 0.4168357849121094, 0.4339752197265625, 0.4511146545410156, 0.46825408935546875, 0.4853935241699219, 0.502532958984375, 0.5196723937988281, 0.5368118286132812, 0.5539512634277344, 0.5710906982421875, 0.5882301330566406, 0.6053695678710938, 0.6225090026855469, 0.6396484375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 10.0, 16.0, 13.0, 24.0, 19.0, 33.0, 38.0, 46.0, 57.0, 60.0, 57.0, 77.0, 65.0, 64.0, 69.0, 57.0, 51.0, 50.0, 42.0, 44.0, 20.0, 19.0, 21.0, 8.0, 16.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01242828369140625, -0.01196134090423584, -0.01149439811706543, -0.01102745532989502, -0.01056051254272461, -0.0100935697555542, -0.009626626968383789, -0.009159684181213379, -0.008692741394042969, -0.008225798606872559, -0.0077588558197021484, -0.007291913032531738, -0.006824970245361328, -0.006358027458190918, -0.005891084671020508, -0.005424141883850098, -0.0049571990966796875, -0.004490256309509277, -0.004023313522338867, -0.003556370735168457, -0.003089427947998047, -0.0026224851608276367, -0.0021555423736572266, -0.0016885995864868164, -0.0012216567993164062, -0.0007547140121459961, -0.00028777122497558594, 0.00017917156219482422, 0.0006461143493652344, 0.0011130571365356445, 0.0015799999237060547, 0.002046942710876465, 0.002513885498046875, 0.002980828285217285, 0.0034477710723876953, 0.0039147138595581055, 0.004381656646728516, 0.004848599433898926, 0.005315542221069336, 0.005782485008239746, 0.006249427795410156, 0.006716370582580566, 0.0071833133697509766, 0.007650256156921387, 0.008117198944091797, 0.008584141731262207, 0.009051084518432617, 0.009518027305603027, 0.009984970092773438, 0.010451912879943848, 0.010918855667114258, 0.011385798454284668, 0.011852741241455078, 0.012319684028625488, 0.012786626815795898, 0.013253569602966309, 0.013720512390136719, 0.014187455177307129, 0.014654397964477539, 0.01512134075164795, 0.01558828353881836, 0.01605522632598877, 0.01652216911315918, 0.01698911190032959, 0.0174560546875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 7.0, 10.0, 15.0, 19.0, 28.0, 33.0, 59.0, 92.0, 149.0, 339.0, 5882.0, 4181407.0, 5471.0, 335.0, 126.0, 85.0, 58.0, 52.0, 30.0, 39.0, 17.0, 6.0, 9.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.068359375, -2.0159912109375, -1.963623046875, -1.9112548828125, -1.85888671875, -1.8065185546875, -1.754150390625, -1.7017822265625, -1.6494140625, -1.5970458984375, -1.544677734375, -1.4923095703125, -1.43994140625, -1.3875732421875, -1.335205078125, -1.2828369140625, -1.23046875, -1.1781005859375, -1.125732421875, -1.0733642578125, -1.02099609375, -0.9686279296875, -0.916259765625, -0.8638916015625, -0.8115234375, -0.7591552734375, -0.706787109375, -0.6544189453125, -0.60205078125, -0.5496826171875, -0.497314453125, -0.4449462890625, -0.392578125, -0.3402099609375, -0.287841796875, -0.2354736328125, -0.18310546875, -0.1307373046875, -0.078369140625, -0.0260009765625, 0.0263671875, 0.0787353515625, 0.131103515625, 0.1834716796875, 0.23583984375, 0.2882080078125, 0.340576171875, 0.3929443359375, 0.4453125, 0.4976806640625, 0.550048828125, 0.6024169921875, 0.65478515625, 0.7071533203125, 0.759521484375, 0.8118896484375, 0.8642578125, 0.9166259765625, 0.968994140625, 1.0213623046875, 1.07373046875, 1.1260986328125, 1.178466796875, 1.2308349609375, 1.283203125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 18.0, 47.0, 220.0, 1135.0, 2136.0, 351.0, 104.0, 35.0, 16.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14453125, -0.14017677307128906, -0.13582229614257812, -0.1314678192138672, -0.12711334228515625, -0.12275886535644531, -0.11840438842773438, -0.11404991149902344, -0.1096954345703125, -0.10534095764160156, -0.10098648071289062, -0.09663200378417969, -0.09227752685546875, -0.08792304992675781, -0.08356857299804688, -0.07921409606933594, -0.074859619140625, -0.07050514221191406, -0.06615066528320312, -0.06179618835449219, -0.05744171142578125, -0.05308723449707031, -0.048732757568359375, -0.04437828063964844, -0.0400238037109375, -0.03566932678222656, -0.031314849853515625, -0.026960372924804688, -0.02260589599609375, -0.018251419067382812, -0.013896942138671875, -0.009542465209960938, -0.00518798828125, -0.0008335113525390625, 0.003520965576171875, 0.007875442504882812, 0.01222991943359375, 0.016584396362304688, 0.020938873291015625, 0.025293350219726562, 0.0296478271484375, 0.03400230407714844, 0.038356781005859375, 0.04271125793457031, 0.04706573486328125, 0.05142021179199219, 0.055774688720703125, 0.06012916564941406, 0.064483642578125, 0.06883811950683594, 0.07319259643554688, 0.07754707336425781, 0.08190155029296875, 0.08625602722167969, 0.09061050415039062, 0.09496498107910156, 0.0993194580078125, 0.10367393493652344, 0.10802841186523438, 0.11238288879394531, 0.11673736572265625, 0.12109184265136719, 0.12544631958007812, 0.12980079650878906, 0.1341552734375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 22.0, 48.0, 210.0, 366.0, 256.0, 72.0, 20.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4496011435985565, -0.41407954692840576, -0.3785579800605774, -0.343036413192749, -0.30751481652259827, -0.2719932198524475, -0.23647165298461914, -0.20095007121562958, -0.16542848944664001, -0.12990690767765045, -0.09438532590866089, -0.058863744139671326, -0.023342162370681763, 0.0121794193983078, 0.04770100116729736, 0.08322258293628693, 0.11874416470527649, 0.15426574647426605, 0.18978732824325562, 0.22530891001224518, 0.26083049178123474, 0.2963520884513855, 0.33187365531921387, 0.36739522218704224, 0.402916818857193, 0.43843841552734375, 0.4739599823951721, 0.5094815492630005, 0.5450031757354736, 0.580524742603302, 0.6160463094711304, 0.6515678763389587, 0.6870895624160767, 0.722611129283905, 0.7581326961517334, 0.7936543226242065, 0.8291758894920349, 0.8646974563598633, 0.9002190828323364, 0.9357406497001648, 0.9712622165679932, 1.0067838430404663, 1.04230535030365, 1.077826976776123, 1.1133484840393066, 1.1488701105117798, 1.184391736984253, 1.2199132442474365, 1.2554348707199097, 1.2909564971923828, 1.3264780044555664, 1.3619996309280396, 1.3975212574005127, 1.4330427646636963, 1.4685643911361694, 1.504085898399353, 1.5396075248718262, 1.5751291513442993, 1.610650658607483, 1.646172285079956, 1.6816937923431396, 1.7172154188156128, 1.752737045288086, 1.7882585525512695, 1.8237801790237427]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 9.0, 7.0, 14.0, 29.0, 41.0, 48.0, 69.0, 63.0, 78.0, 81.0, 85.0, 76.0, 93.0, 84.0, 59.0, 57.0, 32.0, 34.0, 15.0, 8.0, 6.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4573060870170593, -0.44489821791648865, -0.43249037861824036, -0.4200825095176697, -0.407674640417099, -0.3952668011188507, -0.38285893201828003, -0.37045109272003174, -0.35804322361946106, -0.3456353545188904, -0.3332275152206421, -0.3208196461200714, -0.30841177701950073, -0.29600393772125244, -0.28359606862068176, -0.2711881995201111, -0.2587803602218628, -0.2463725060224533, -0.23396463692188263, -0.22155678272247314, -0.20914892852306366, -0.19674107432365417, -0.1843332052230835, -0.171925351023674, -0.15951746702194214, -0.14710961282253265, -0.13470174372196198, -0.12229388952255249, -0.109886035323143, -0.09747817367315292, -0.08507031202316284, -0.07266245782375336, -0.06025460362434387, -0.04784674569964409, -0.035438887774944305, -0.023031026124954224, -0.01062316820025444, 0.001784689724445343, 0.014192551374435425, 0.02660040557384491, 0.03900826722383499, 0.051416125148534775, 0.06382398307323456, 0.07623184472322464, 0.08863970637321472, 0.1010475605726242, 0.11345542222261429, 0.12586328387260437, 0.13827113807201385, 0.15067899227142334, 0.16308686137199402, 0.1754947155714035, 0.187902569770813, 0.20031043887138367, 0.21271829307079315, 0.22512614727020264, 0.23753401637077332, 0.2499418705701828, 0.2623497247695923, 0.27475759387016296, 0.28716546297073364, 0.29957330226898193, 0.3119811713695526, 0.3243890404701233, 0.3367968797683716]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 5.0, 14.0, 14.0, 15.0, 18.0, 23.0, 21.0, 36.0, 38.0, 65.0, 96.0, 222.0, 564.0, 3017.0, 54375.0, 844811.0, 138423.0, 5311.0, 832.0, 249.0, 117.0, 61.0, 62.0, 28.0, 19.0, 19.0, 21.0, 17.0, 15.0, 13.0, 5.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2919921875, -0.2810249328613281, -0.27005767822265625, -0.2590904235839844, -0.2481231689453125, -0.23715591430664062, -0.22618865966796875, -0.21522140502929688, -0.204254150390625, -0.19328689575195312, -0.18231964111328125, -0.17135238647460938, -0.1603851318359375, -0.14941787719726562, -0.13845062255859375, -0.12748336791992188, -0.11651611328125, -0.10554885864257812, -0.09458160400390625, -0.08361434936523438, -0.0726470947265625, -0.061679840087890625, -0.05071258544921875, -0.039745330810546875, -0.028778076171875, -0.017810821533203125, -0.00684356689453125, 0.004123687744140625, 0.0150909423828125, 0.026058197021484375, 0.03702545166015625, 0.047992706298828125, 0.0589599609375, 0.06992721557617188, 0.08089447021484375, 0.09186172485351562, 0.1028289794921875, 0.11379623413085938, 0.12476348876953125, 0.13573074340820312, 0.146697998046875, 0.15766525268554688, 0.16863250732421875, 0.17959976196289062, 0.1905670166015625, 0.20153427124023438, 0.21250152587890625, 0.22346878051757812, 0.23443603515625, 0.24540328979492188, 0.25637054443359375, 0.2673377990722656, 0.2783050537109375, 0.2892723083496094, 0.30023956298828125, 0.3112068176269531, 0.322174072265625, 0.3331413269042969, 0.34410858154296875, 0.3550758361816406, 0.3660430908203125, 0.3770103454589844, 0.38797760009765625, 0.3989448547363281, 0.409912109375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 13.0, 14.0, 20.0, 17.0, 23.0, 36.0, 39.0, 47.0, 46.0, 71.0, 68.0, 71.0, 84.0, 60.0, 64.0, 62.0, 58.0, 48.0, 46.0, 22.0, 19.0, 16.0, 13.0, 11.0, 6.0, 8.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0260162353515625, -0.025351524353027344, -0.024686813354492188, -0.02402210235595703, -0.023357391357421875, -0.02269268035888672, -0.022027969360351562, -0.021363258361816406, -0.02069854736328125, -0.020033836364746094, -0.019369125366210938, -0.01870441436767578, -0.018039703369140625, -0.01737499237060547, -0.016710281372070312, -0.016045570373535156, -0.015380859375, -0.014716148376464844, -0.014051437377929688, -0.013386726379394531, -0.012722015380859375, -0.012057304382324219, -0.011392593383789062, -0.010727882385253906, -0.01006317138671875, -0.009398460388183594, -0.008733749389648438, -0.008069038391113281, -0.007404327392578125, -0.006739616394042969, -0.0060749053955078125, -0.005410194396972656, -0.0047454833984375, -0.004080772399902344, -0.0034160614013671875, -0.0027513504028320312, -0.002086639404296875, -0.0014219284057617188, -0.0007572174072265625, -9.250640869140625e-05, 0.00057220458984375, 0.0012369155883789062, 0.0019016265869140625, 0.0025663375854492188, 0.003231048583984375, 0.0038957595825195312, 0.0045604705810546875, 0.005225181579589844, 0.005889892578125, 0.006554603576660156, 0.0072193145751953125, 0.007884025573730469, 0.008548736572265625, 0.009213447570800781, 0.009878158569335938, 0.010542869567871094, 0.01120758056640625, 0.011872291564941406, 0.012537002563476562, 0.013201713562011719, 0.013866424560546875, 0.014531135559082031, 0.015195846557617188, 0.015860557556152344, 0.0165252685546875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 4.0, 8.0, 6.0, 18.0, 18.0, 21.0, 21.0, 35.0, 51.0, 83.0, 93.0, 151.0, 197.0, 283.0, 509.0, 874.0, 1506.0, 3139.0, 7457.0, 21353.0, 75645.0, 270407.0, 427730.0, 169087.0, 45352.0, 13909.0, 5113.0, 2278.0, 1178.0, 662.0, 447.0, 267.0, 182.0, 112.0, 107.0, 71.0, 41.0, 36.0, 30.0, 20.0, 15.0, 11.0, 5.0, 6.0, 9.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.090576171875, -0.08748531341552734, -0.08439445495605469, -0.08130359649658203, -0.07821273803710938, -0.07512187957763672, -0.07203102111816406, -0.0689401626586914, -0.06584930419921875, -0.0627584457397461, -0.05966758728027344, -0.05657672882080078, -0.053485870361328125, -0.05039501190185547, -0.04730415344238281, -0.044213294982910156, -0.0411224365234375, -0.038031578063964844, -0.03494071960449219, -0.03184986114501953, -0.028759002685546875, -0.02566814422607422, -0.022577285766601562, -0.019486427307128906, -0.01639556884765625, -0.013304710388183594, -0.010213851928710938, -0.007122993469238281, -0.004032135009765625, -0.0009412765502929688, 0.0021495819091796875, 0.005240440368652344, 0.008331298828125, 0.011422157287597656, 0.014513015747070312, 0.01760387420654297, 0.020694732666015625, 0.02378559112548828, 0.026876449584960938, 0.029967308044433594, 0.03305816650390625, 0.036149024963378906, 0.03923988342285156, 0.04233074188232422, 0.045421600341796875, 0.04851245880126953, 0.05160331726074219, 0.054694175720214844, 0.0577850341796875, 0.060875892639160156, 0.06396675109863281, 0.06705760955810547, 0.07014846801757812, 0.07323932647705078, 0.07633018493652344, 0.0794210433959961, 0.08251190185546875, 0.0856027603149414, 0.08869361877441406, 0.09178447723388672, 0.09487533569335938, 0.09796619415283203, 0.10105705261230469, 0.10414791107177734, 0.10723876953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 7.0, 9.0, 7.0, 14.0, 8.0, 8.0, 17.0, 16.0, 29.0, 20.0, 27.0, 25.0, 34.0, 32.0, 39.0, 50.0, 47.0, 45.0, 39.0, 42.0, 58.0, 42.0, 61.0, 32.0, 35.0, 43.0, 30.0, 31.0, 35.0, 17.0, 23.0, 16.0, 11.0, 13.0, 8.0, 6.0, 7.0, 7.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.074951171875, -0.07270050048828125, -0.0704498291015625, -0.06819915771484375, -0.065948486328125, -0.06369781494140625, -0.0614471435546875, -0.05919647216796875, -0.05694580078125, -0.05469512939453125, -0.0524444580078125, -0.05019378662109375, -0.047943115234375, -0.04569244384765625, -0.0434417724609375, -0.04119110107421875, -0.0389404296875, -0.03668975830078125, -0.0344390869140625, -0.03218841552734375, -0.029937744140625, -0.02768707275390625, -0.0254364013671875, -0.02318572998046875, -0.02093505859375, -0.01868438720703125, -0.0164337158203125, -0.01418304443359375, -0.011932373046875, -0.00968170166015625, -0.0074310302734375, -0.00518035888671875, -0.0029296875, -0.00067901611328125, 0.0015716552734375, 0.00382232666015625, 0.006072998046875, 0.00832366943359375, 0.0105743408203125, 0.01282501220703125, 0.01507568359375, 0.01732635498046875, 0.0195770263671875, 0.02182769775390625, 0.024078369140625, 0.02632904052734375, 0.0285797119140625, 0.03083038330078125, 0.0330810546875, 0.03533172607421875, 0.0375823974609375, 0.03983306884765625, 0.042083740234375, 0.04433441162109375, 0.0465850830078125, 0.04883575439453125, 0.05108642578125, 0.05333709716796875, 0.0555877685546875, 0.05783843994140625, 0.060089111328125, 0.06233978271484375, 0.0645904541015625, 0.06684112548828125, 0.069091796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 6.0, 2.0, 12.0, 13.0, 15.0, 23.0, 37.0, 56.0, 83.0, 117.0, 166.0, 301.0, 547.0, 1047.0, 2020.0, 4557.0, 11463.0, 36156.0, 146925.0, 470988.0, 277032.0, 65503.0, 18646.0, 6936.0, 2795.0, 1350.0, 687.0, 426.0, 215.0, 137.0, 84.0, 60.0, 51.0, 26.0, 20.0, 10.0, 14.0, 8.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.080322265625, -0.0777902603149414, -0.07525825500488281, -0.07272624969482422, -0.07019424438476562, -0.06766223907470703, -0.06513023376464844, -0.06259822845458984, -0.06006622314453125, -0.057534217834472656, -0.05500221252441406, -0.05247020721435547, -0.049938201904296875, -0.04740619659423828, -0.04487419128417969, -0.042342185974121094, -0.0398101806640625, -0.037278175354003906, -0.03474617004394531, -0.03221416473388672, -0.029682159423828125, -0.02715015411376953, -0.024618148803710938, -0.022086143493652344, -0.01955413818359375, -0.017022132873535156, -0.014490127563476562, -0.011958122253417969, -0.009426116943359375, -0.006894111633300781, -0.0043621063232421875, -0.0018301010131835938, 0.000701904296875, 0.0032339096069335938, 0.0057659149169921875, 0.008297920227050781, 0.010829925537109375, 0.013361930847167969, 0.015893936157226562, 0.018425941467285156, 0.02095794677734375, 0.023489952087402344, 0.026021957397460938, 0.02855396270751953, 0.031085968017578125, 0.03361797332763672, 0.03614997863769531, 0.038681983947753906, 0.0412139892578125, 0.043745994567871094, 0.04627799987792969, 0.04881000518798828, 0.051342010498046875, 0.05387401580810547, 0.05640602111816406, 0.058938026428222656, 0.06147003173828125, 0.06400203704833984, 0.06653404235839844, 0.06906604766845703, 0.07159805297851562, 0.07413005828857422, 0.07666206359863281, 0.0791940689086914, 0.08172607421875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 6.0, 4.0, 10.0, 8.0, 21.0, 40.0, 44.0, 64.0, 79.0, 122.0, 159.0, 140.0, 97.0, 63.0, 47.0, 33.0, 19.0, 11.0, 11.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014448165893554688, -0.00013943016529083252, -0.00013437867164611816, -0.0001293271780014038, -0.00012427568435668945, -0.0001192241907119751, -0.00011417269706726074, -0.00010912120342254639, -0.00010406970977783203, -9.901821613311768e-05, -9.396672248840332e-05, -8.891522884368896e-05, -8.386373519897461e-05, -7.881224155426025e-05, -7.37607479095459e-05, -6.870925426483154e-05, -6.365776062011719e-05, -5.860626697540283e-05, -5.3554773330688477e-05, -4.850327968597412e-05, -4.3451786041259766e-05, -3.840029239654541e-05, -3.3348798751831055e-05, -2.82973051071167e-05, -2.3245811462402344e-05, -1.8194317817687988e-05, -1.3142824172973633e-05, -8.091330528259277e-06, -3.039836883544922e-06, 2.0116567611694336e-06, 7.063150405883789e-06, 1.2114644050598145e-05, 1.71661376953125e-05, 2.2217631340026855e-05, 2.726912498474121e-05, 3.2320618629455566e-05, 3.737211227416992e-05, 4.242360591888428e-05, 4.747509956359863e-05, 5.252659320831299e-05, 5.7578086853027344e-05, 6.26295804977417e-05, 6.768107414245605e-05, 7.273256778717041e-05, 7.778406143188477e-05, 8.283555507659912e-05, 8.788704872131348e-05, 9.293854236602783e-05, 9.799003601074219e-05, 0.00010304152965545654, 0.0001080930233001709, 0.00011314451694488525, 0.00011819601058959961, 0.00012324750423431396, 0.00012829899787902832, 0.00013335049152374268, 0.00013840198516845703, 0.0001434534788131714, 0.00014850497245788574, 0.0001535564661026001, 0.00015860795974731445, 0.0001636594533920288, 0.00016871094703674316, 0.00017376244068145752, 0.00017881393432617188]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 9.0, 14.0, 15.0, 31.0, 32.0, 46.0, 89.0, 95.0, 131.0, 209.0, 356.0, 650.0, 1147.0, 2381.0, 5758.0, 16846.0, 62787.0, 257237.0, 478319.0, 162984.0, 39511.0, 11482.0, 4239.0, 1889.0, 911.0, 510.0, 291.0, 190.0, 114.0, 70.0, 61.0, 44.0, 27.0, 22.0, 17.0, 10.0, 7.0, 9.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.07928466796875, -0.07690620422363281, -0.07452774047851562, -0.07214927673339844, -0.06977081298828125, -0.06739234924316406, -0.06501388549804688, -0.06263542175292969, -0.0602569580078125, -0.05787849426269531, -0.055500030517578125, -0.05312156677246094, -0.05074310302734375, -0.04836463928222656, -0.045986175537109375, -0.04360771179199219, -0.041229248046875, -0.03885078430175781, -0.036472320556640625, -0.03409385681152344, -0.03171539306640625, -0.029336929321289062, -0.026958465576171875, -0.024580001831054688, -0.0222015380859375, -0.019823074340820312, -0.017444610595703125, -0.015066146850585938, -0.01268768310546875, -0.010309219360351562, -0.007930755615234375, -0.0055522918701171875, -0.003173828125, -0.0007953643798828125, 0.001583099365234375, 0.0039615631103515625, 0.00634002685546875, 0.008718490600585938, 0.011096954345703125, 0.013475418090820312, 0.0158538818359375, 0.018232345581054688, 0.020610809326171875, 0.022989273071289062, 0.02536773681640625, 0.027746200561523438, 0.030124664306640625, 0.03250312805175781, 0.034881591796875, 0.03726005554199219, 0.039638519287109375, 0.04201698303222656, 0.04439544677734375, 0.04677391052246094, 0.049152374267578125, 0.05153083801269531, 0.0539093017578125, 0.05628776550292969, 0.058666229248046875, 0.06104469299316406, 0.06342315673828125, 0.06580162048339844, 0.06818008422851562, 0.07055854797363281, 0.07293701171875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 6.0, 13.0, 9.0, 8.0, 11.0, 13.0, 17.0, 18.0, 22.0, 28.0, 29.0, 44.0, 48.0, 54.0, 67.0, 63.0, 63.0, 76.0, 62.0, 59.0, 42.0, 41.0, 36.0, 33.0, 28.0, 17.0, 19.0, 13.0, 9.0, 9.0, 12.0, 7.0, 6.0, 2.0, 1.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049652099609375, -0.04812335968017578, -0.04659461975097656, -0.045065879821777344, -0.043537139892578125, -0.042008399963378906, -0.04047966003417969, -0.03895092010498047, -0.03742218017578125, -0.03589344024658203, -0.03436470031738281, -0.032835960388183594, -0.031307220458984375, -0.029778480529785156, -0.028249740600585938, -0.02672100067138672, -0.0251922607421875, -0.02366352081298828, -0.022134780883789062, -0.020606040954589844, -0.019077301025390625, -0.017548561096191406, -0.016019821166992188, -0.014491081237792969, -0.01296234130859375, -0.011433601379394531, -0.009904861450195312, -0.008376121520996094, -0.006847381591796875, -0.005318641662597656, -0.0037899017333984375, -0.0022611618041992188, -0.000732421875, 0.0007963180541992188, 0.0023250579833984375, 0.0038537979125976562, 0.005382537841796875, 0.006911277770996094, 0.008440017700195312, 0.009968757629394531, 0.01149749755859375, 0.013026237487792969, 0.014554977416992188, 0.016083717346191406, 0.017612457275390625, 0.019141197204589844, 0.020669937133789062, 0.02219867706298828, 0.0237274169921875, 0.02525615692138672, 0.026784896850585938, 0.028313636779785156, 0.029842376708984375, 0.031371116638183594, 0.03289985656738281, 0.03442859649658203, 0.03595733642578125, 0.03748607635498047, 0.03901481628417969, 0.040543556213378906, 0.042072296142578125, 0.043601036071777344, 0.04512977600097656, 0.04665851593017578, 0.048187255859375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 4.0, 9.0, 45.0, 91.0, 214.0, 263.0, 222.0, 98.0, 41.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.1085917949676514, -2.0650222301483154, -2.0214526653289795, -1.9778831005096436, -1.9343135356903076, -1.8907438516616821, -1.8471742868423462, -1.8036047220230103, -1.7600351572036743, -1.7164655923843384, -1.6728960275650024, -1.6293264627456665, -1.585756778717041, -1.542187213897705, -1.4986176490783691, -1.4550480842590332, -1.4114785194396973, -1.3679089546203613, -1.3243393898010254, -1.2807698249816895, -1.2372002601623535, -1.193630576133728, -1.150061011314392, -1.1064914464950562, -1.0629218816757202, -1.0193523168563843, -0.9757827520370483, -0.9322131276130676, -0.8886435627937317, -0.8450739979743958, -0.801504373550415, -0.7579348087310791, -0.7143653631210327, -0.6707957983016968, -0.6272262334823608, -0.5836566090583801, -0.5400870442390442, -0.49651747941970825, -0.4529478847980499, -0.4093782901763916, -0.36580872535705566, -0.3222391605377197, -0.2786695659160614, -0.23509998619556427, -0.19153040647506714, -0.14796082675457, -0.10439124703407288, -0.06082165241241455, -0.017252087593078613, 0.026317492127418518, 0.06988707184791565, 0.11345665156841278, 0.1570262312889099, 0.20059581100940704, 0.24416539072990417, 0.2877349853515625, 0.33130455017089844, 0.3748741149902344, 0.4184437096118927, 0.462013304233551, 0.505582869052887, 0.5491524338722229, 0.5927220582962036, 0.6362916231155396, 0.6798611879348755]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 9.0, 4.0, 9.0, 11.0, 11.0, 12.0, 17.0, 23.0, 23.0, 22.0, 23.0, 31.0, 31.0, 36.0, 37.0, 39.0, 43.0, 50.0, 34.0, 44.0, 37.0, 37.0, 39.0, 47.0, 39.0, 32.0, 28.0, 29.0, 34.0, 26.0, 23.0, 21.0, 23.0, 14.0, 14.0, 7.0, 12.0, 7.0, 9.0, 2.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.39478808641433716, -0.38276591897010803, -0.3707437515258789, -0.3587215840816498, -0.34669941663742065, -0.33467721939086914, -0.32265505194664, -0.3106328845024109, -0.29861071705818176, -0.28658854961395264, -0.2745663821697235, -0.2625442147254944, -0.25052201747894287, -0.23849986493587494, -0.22647768259048462, -0.2144555151462555, -0.20243334770202637, -0.19041118025779724, -0.17838901281356812, -0.1663668304681778, -0.15434466302394867, -0.14232249557971954, -0.13030031323432922, -0.1182781457901001, -0.10625597834587097, -0.09423381090164185, -0.08221163600683212, -0.0701894611120224, -0.058167293667793274, -0.04614512249827385, -0.034122951328754425, -0.022100776433944702, -0.010078608989715576, 0.0019435621798038483, 0.013965733349323273, 0.025987904518842697, 0.03801007568836212, 0.050032246857881546, 0.06205441802740097, 0.0740765929222107, 0.08609876036643982, 0.09812092781066895, 0.11014310270547867, 0.12216527760028839, 0.13418744504451752, 0.14620961248874664, 0.15823179483413696, 0.1702539622783661, 0.18227612972259521, 0.19429829716682434, 0.20632046461105347, 0.2183426469564438, 0.2303648144006729, 0.24238698184490204, 0.25440916419029236, 0.2664313316345215, 0.2784534990787506, 0.29047566652297974, 0.30249783396720886, 0.314520001411438, 0.3265421986579895, 0.33856436610221863, 0.35058653354644775, 0.3626087009906769, 0.374630868434906]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 13.0, 7.0, 13.0, 20.0, 17.0, 31.0, 64.0, 88.0, 170.0, 373.0, 1140.0, 7134.0, 230821.0, 3915658.0, 35521.0, 2373.0, 466.0, 162.0, 68.0, 38.0, 23.0, 18.0, 13.0, 14.0, 11.0, 5.0, 5.0, 5.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.54150390625, -0.5283851623535156, -0.5152664184570312, -0.5021476745605469, -0.4890289306640625, -0.4759101867675781, -0.46279144287109375, -0.4496726989746094, -0.436553955078125, -0.4234352111816406, -0.41031646728515625, -0.3971977233886719, -0.3840789794921875, -0.3709602355957031, -0.35784149169921875, -0.3447227478027344, -0.33160400390625, -0.3184852600097656, -0.30536651611328125, -0.2922477722167969, -0.2791290283203125, -0.2660102844238281, -0.25289154052734375, -0.23977279663085938, -0.226654052734375, -0.21353530883789062, -0.20041656494140625, -0.18729782104492188, -0.1741790771484375, -0.16106033325195312, -0.14794158935546875, -0.13482284545898438, -0.1217041015625, -0.10858535766601562, -0.09546661376953125, -0.08234786987304688, -0.0692291259765625, -0.056110382080078125, -0.04299163818359375, -0.029872894287109375, -0.016754150390625, -0.003635406494140625, 0.00948333740234375, 0.022602081298828125, 0.0357208251953125, 0.048839569091796875, 0.06195831298828125, 0.07507705688476562, 0.08819580078125, 0.10131454467773438, 0.11443328857421875, 0.12755203247070312, 0.1406707763671875, 0.15378952026367188, 0.16690826416015625, 0.18002700805664062, 0.193145751953125, 0.20626449584960938, 0.21938323974609375, 0.23250198364257812, 0.2456207275390625, 0.2587394714355469, 0.27185821533203125, 0.2849769592285156, 0.298095703125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 8.0, 9.0, 7.0, 9.0, 15.0, 24.0, 28.0, 42.0, 48.0, 56.0, 66.0, 78.0, 73.0, 81.0, 64.0, 84.0, 57.0, 63.0, 56.0, 30.0, 28.0, 25.0, 13.0, 7.0, 11.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0291900634765625, -0.028463363647460938, -0.027736663818359375, -0.027009963989257812, -0.02628326416015625, -0.025556564331054688, -0.024829864501953125, -0.024103164672851562, -0.02337646484375, -0.022649765014648438, -0.021923065185546875, -0.021196365356445312, -0.02046966552734375, -0.019742965698242188, -0.019016265869140625, -0.018289566040039062, -0.0175628662109375, -0.016836166381835938, -0.016109466552734375, -0.015382766723632812, -0.01465606689453125, -0.013929367065429688, -0.013202667236328125, -0.012475967407226562, -0.011749267578125, -0.011022567749023438, -0.010295867919921875, -0.009569168090820312, -0.00884246826171875, -0.008115768432617188, -0.007389068603515625, -0.0066623687744140625, -0.0059356689453125, -0.0052089691162109375, -0.004482269287109375, -0.0037555694580078125, -0.00302886962890625, -0.0023021697998046875, -0.001575469970703125, -0.0008487701416015625, -0.0001220703125, 0.0006046295166015625, 0.001331329345703125, 0.0020580291748046875, 0.00278472900390625, 0.0035114288330078125, 0.004238128662109375, 0.0049648284912109375, 0.0056915283203125, 0.0064182281494140625, 0.007144927978515625, 0.007871627807617188, 0.00859832763671875, 0.009325027465820312, 0.010051727294921875, 0.010778427124023438, 0.011505126953125, 0.012231826782226562, 0.012958526611328125, 0.013685226440429688, 0.01441192626953125, 0.015138626098632812, 0.015865325927734375, 0.016592025756835938, 0.0173187255859375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 10.0, 10.0, 22.0, 38.0, 63.0, 170.0, 948.0, 3703934.0, 488089.0, 638.0, 145.0, 64.0, 59.0, 40.0, 29.0, 16.0, 8.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.693359375, -1.6539230346679688, -1.6144866943359375, -1.5750503540039062, -1.535614013671875, -1.4961776733398438, -1.4567413330078125, -1.4173049926757812, -1.37786865234375, -1.3384323120117188, -1.2989959716796875, -1.2595596313476562, -1.220123291015625, -1.1806869506835938, -1.1412506103515625, -1.1018142700195312, -1.0623779296875, -1.0229415893554688, -0.9835052490234375, -0.9440689086914062, -0.904632568359375, -0.8651962280273438, -0.8257598876953125, -0.7863235473632812, -0.74688720703125, -0.7074508666992188, -0.6680145263671875, -0.6285781860351562, -0.589141845703125, -0.5497055053710938, -0.5102691650390625, -0.47083282470703125, -0.431396484375, -0.39196014404296875, -0.3525238037109375, -0.31308746337890625, -0.273651123046875, -0.23421478271484375, -0.1947784423828125, -0.15534210205078125, -0.11590576171875, -0.07646942138671875, -0.0370330810546875, 0.00240325927734375, 0.041839599609375, 0.08127593994140625, 0.1207122802734375, 0.16014862060546875, 0.1995849609375, 0.23902130126953125, 0.2784576416015625, 0.31789398193359375, 0.357330322265625, 0.39676666259765625, 0.4362030029296875, 0.47563934326171875, 0.51507568359375, 0.5545120239257812, 0.5939483642578125, 0.6333847045898438, 0.672821044921875, 0.7122573852539062, 0.7516937255859375, 0.7911300659179688, 0.83056640625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 11.0, 26.0, 92.0, 405.0, 2130.0, 1109.0, 220.0, 59.0, 21.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048553466796875, -0.044451236724853516, -0.04034900665283203, -0.03624677658081055, -0.03214454650878906, -0.028042316436767578, -0.023940086364746094, -0.01983785629272461, -0.015735626220703125, -0.01163339614868164, -0.007531166076660156, -0.003428936004638672, 0.0006732940673828125, 0.004775524139404297, 0.008877754211425781, 0.012979984283447266, 0.01708221435546875, 0.021184444427490234, 0.02528667449951172, 0.029388904571533203, 0.03349113464355469, 0.03759336471557617, 0.041695594787597656, 0.04579782485961914, 0.049900054931640625, 0.05400228500366211, 0.058104515075683594, 0.06220674514770508, 0.06630897521972656, 0.07041120529174805, 0.07451343536376953, 0.07861566543579102, 0.0827178955078125, 0.08682012557983398, 0.09092235565185547, 0.09502458572387695, 0.09912681579589844, 0.10322904586791992, 0.1073312759399414, 0.11143350601196289, 0.11553573608398438, 0.11963796615600586, 0.12374019622802734, 0.12784242630004883, 0.1319446563720703, 0.1360468864440918, 0.14014911651611328, 0.14425134658813477, 0.14835357666015625, 0.15245580673217773, 0.15655803680419922, 0.1606602668762207, 0.1647624969482422, 0.16886472702026367, 0.17296695709228516, 0.17706918716430664, 0.18117141723632812, 0.1852736473083496, 0.1893758773803711, 0.19347810745239258, 0.19758033752441406, 0.20168256759643555, 0.20578479766845703, 0.20988702774047852, 0.2139892578125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 5.0, 6.0, 69.0, 263.0, 468.0, 161.0, 28.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6254324316978455, -0.5931128859519958, -0.5607932806015015, -0.5284737348556519, -0.49615412950515747, -0.46383458375930786, -0.43151500821113586, -0.39919543266296387, -0.36687585711479187, -0.3345562815666199, -0.3022367060184479, -0.2699171304702759, -0.23759756982326508, -0.20527799427509308, -0.17295843362808228, -0.14063885807991028, -0.10831928253173828, -0.07599970698356628, -0.043680138885974884, -0.011360570788383484, 0.020959004759788513, 0.05327858030796051, 0.08559814095497131, 0.11791771650314331, 0.1502372920513153, 0.1825568675994873, 0.2148764431476593, 0.2471960037946701, 0.2795155644416809, 0.3118351697921753, 0.3441547155380249, 0.3764742910861969, 0.4087938070297241, 0.4411133825778961, 0.4734329581260681, 0.5057525038719177, 0.5380721092224121, 0.5703916549682617, 0.6027112007141113, 0.6350308060646057, 0.6673504114151001, 0.6996699571609497, 0.7319895625114441, 0.7643091082572937, 0.7966287136077881, 0.8289482593536377, 0.8612678050994873, 0.8935874104499817, 0.9259069561958313, 0.9582265019416809, 0.9905461072921753, 1.022865653038025, 1.0551851987838745, 1.0875048637390137, 1.1198244094848633, 1.152143955230713, 1.1844635009765625, 1.216783046722412, 1.2491025924682617, 1.2814222574234009, 1.3137418031692505, 1.3460613489151, 1.3783808946609497, 1.4107005596160889, 1.4430201053619385]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 8.0, 16.0, 13.0, 27.0, 36.0, 39.0, 43.0, 63.0, 85.0, 97.0, 91.0, 74.0, 86.0, 70.0, 57.0, 57.0, 37.0, 33.0, 34.0, 8.0, 11.0, 10.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29283571243286133, -0.2841697335243225, -0.2755037248134613, -0.2668377459049225, -0.25817176699638367, -0.24950577318668365, -0.24083977937698364, -0.23217380046844482, -0.2235078066587448, -0.2148418128490448, -0.20617583394050598, -0.19750984013080597, -0.18884384632110596, -0.18017786741256714, -0.17151187360286713, -0.16284587979316711, -0.1541799008846283, -0.14551390707492828, -0.13684792816638947, -0.12818193435668945, -0.11951594799757004, -0.11084996163845062, -0.10218396782875061, -0.0935179814696312, -0.08485199511051178, -0.07618600875139236, -0.06752002239227295, -0.05885402858257294, -0.05018804222345352, -0.041522055864334106, -0.03285606577992439, -0.02419007569551468, -0.015524089336395264, -0.006858101114630699, 0.0018078871071338654, 0.01047387532889843, 0.019139863550662994, 0.02780584990978241, 0.03647183999419212, 0.04513783007860184, 0.05380381643772125, 0.06246980279684067, 0.07113578915596008, 0.0798017829656601, 0.08846776932477951, 0.09713375568389893, 0.10579974949359894, 0.11446573585271835, 0.12313172221183777, 0.13179771602153778, 0.1404636949300766, 0.1491296887397766, 0.15779566764831543, 0.16646166145801544, 0.17512765526771545, 0.18379363417625427, 0.19245962798595428, 0.2011256217956543, 0.20979160070419312, 0.21845759451389313, 0.22712358832359314, 0.23578956723213196, 0.24445556104183197, 0.253121554851532, 0.2617875337600708]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 13.0, 9.0, 23.0, 37.0, 46.0, 68.0, 111.0, 363.0, 1579.0, 18411.0, 673998.0, 343658.0, 8695.0, 1016.0, 246.0, 88.0, 55.0, 36.0, 27.0, 22.0, 16.0, 14.0, 7.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.319580078125, -0.3088836669921875, -0.298187255859375, -0.2874908447265625, -0.27679443359375, -0.2660980224609375, -0.255401611328125, -0.2447052001953125, -0.2340087890625, -0.2233123779296875, -0.212615966796875, -0.2019195556640625, -0.19122314453125, -0.1805267333984375, -0.169830322265625, -0.1591339111328125, -0.1484375, -0.1377410888671875, -0.127044677734375, -0.1163482666015625, -0.10565185546875, -0.0949554443359375, -0.084259033203125, -0.0735626220703125, -0.0628662109375, -0.0521697998046875, -0.041473388671875, -0.0307769775390625, -0.02008056640625, -0.0093841552734375, 0.001312255859375, 0.0120086669921875, 0.022705078125, 0.0334014892578125, 0.044097900390625, 0.0547943115234375, 0.06549072265625, 0.0761871337890625, 0.086883544921875, 0.0975799560546875, 0.1082763671875, 0.1189727783203125, 0.129669189453125, 0.1403656005859375, 0.15106201171875, 0.1617584228515625, 0.172454833984375, 0.1831512451171875, 0.19384765625, 0.2045440673828125, 0.215240478515625, 0.2259368896484375, 0.23663330078125, 0.2473297119140625, 0.258026123046875, 0.2687225341796875, 0.2794189453125, 0.2901153564453125, 0.300811767578125, 0.3115081787109375, 0.32220458984375, 0.3329010009765625, 0.343597412109375, 0.3542938232421875, 0.364990234375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 1.0, 6.0, 4.0, 7.0, 11.0, 12.0, 17.0, 20.0, 22.0, 21.0, 38.0, 36.0, 54.0, 61.0, 50.0, 68.0, 67.0, 58.0, 56.0, 64.0, 59.0, 63.0, 41.0, 36.0, 29.0, 30.0, 16.0, 16.0, 12.0, 8.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.022216796875, -0.021599769592285156, -0.020982742309570312, -0.02036571502685547, -0.019748687744140625, -0.01913166046142578, -0.018514633178710938, -0.017897605895996094, -0.01728057861328125, -0.016663551330566406, -0.016046524047851562, -0.015429496765136719, -0.014812469482421875, -0.014195442199707031, -0.013578414916992188, -0.012961387634277344, -0.0123443603515625, -0.011727333068847656, -0.011110305786132812, -0.010493278503417969, -0.009876251220703125, -0.009259223937988281, -0.008642196655273438, -0.008025169372558594, -0.00740814208984375, -0.006791114807128906, -0.0061740875244140625, -0.005557060241699219, -0.004940032958984375, -0.004323005676269531, -0.0037059783935546875, -0.0030889511108398438, -0.002471923828125, -0.0018548965454101562, -0.0012378692626953125, -0.0006208419799804688, -3.814697265625e-06, 0.0006132125854492188, 0.0012302398681640625, 0.0018472671508789062, 0.00246429443359375, 0.0030813217163085938, 0.0036983489990234375, 0.004315376281738281, 0.004932403564453125, 0.005549430847167969, 0.0061664581298828125, 0.006783485412597656, 0.0074005126953125, 0.008017539978027344, 0.008634567260742188, 0.009251594543457031, 0.009868621826171875, 0.010485649108886719, 0.011102676391601562, 0.011719703674316406, 0.01233673095703125, 0.012953758239746094, 0.013570785522460938, 0.014187812805175781, 0.014804840087890625, 0.015421867370605469, 0.016038894653320312, 0.016655921936035156, 0.01727294921875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 8.0, 3.0, 3.0, 4.0, 7.0, 16.0, 17.0, 29.0, 36.0, 60.0, 83.0, 119.0, 195.0, 327.0, 549.0, 1021.0, 2045.0, 4862.0, 15087.0, 65419.0, 323142.0, 474918.0, 121994.0, 25544.0, 7285.0, 2736.0, 1293.0, 694.0, 384.0, 241.0, 146.0, 89.0, 64.0, 66.0, 27.0, 18.0, 4.0, 11.0, 10.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1397705078125, -0.13601207733154297, -0.13225364685058594, -0.1284952163696289, -0.12473678588867188, -0.12097835540771484, -0.11721992492675781, -0.11346149444580078, -0.10970306396484375, -0.10594463348388672, -0.10218620300292969, -0.09842777252197266, -0.09466934204101562, -0.0909109115600586, -0.08715248107910156, -0.08339405059814453, -0.0796356201171875, -0.07587718963623047, -0.07211875915527344, -0.0683603286743164, -0.06460189819335938, -0.060843467712402344, -0.05708503723144531, -0.05332660675048828, -0.04956817626953125, -0.04580974578857422, -0.04205131530761719, -0.038292884826660156, -0.034534454345703125, -0.030776023864746094, -0.027017593383789062, -0.02325916290283203, -0.019500732421875, -0.01574230194091797, -0.011983871459960938, -0.008225440979003906, -0.004467010498046875, -0.0007085800170898438, 0.0030498504638671875, 0.006808280944824219, 0.01056671142578125, 0.014325141906738281, 0.018083572387695312, 0.021842002868652344, 0.025600433349609375, 0.029358863830566406, 0.03311729431152344, 0.03687572479248047, 0.0406341552734375, 0.04439258575439453, 0.04815101623535156, 0.051909446716308594, 0.055667877197265625, 0.059426307678222656, 0.06318473815917969, 0.06694316864013672, 0.07070159912109375, 0.07446002960205078, 0.07821846008300781, 0.08197689056396484, 0.08573532104492188, 0.0894937515258789, 0.09325218200683594, 0.09701061248779297, 0.10076904296875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 10.0, 9.0, 9.0, 15.0, 15.0, 19.0, 22.0, 37.0, 28.0, 47.0, 40.0, 65.0, 43.0, 55.0, 52.0, 75.0, 58.0, 47.0, 65.0, 44.0, 50.0, 38.0, 49.0, 24.0, 28.0, 16.0, 15.0, 6.0, 8.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1280517578125, -0.1250162124633789, -0.12198066711425781, -0.11894512176513672, -0.11590957641601562, -0.11287403106689453, -0.10983848571777344, -0.10680294036865234, -0.10376739501953125, -0.10073184967041016, -0.09769630432128906, -0.09466075897216797, -0.09162521362304688, -0.08858966827392578, -0.08555412292480469, -0.0825185775756836, -0.0794830322265625, -0.0764474868774414, -0.07341194152832031, -0.07037639617919922, -0.06734085083007812, -0.06430530548095703, -0.06126976013183594, -0.058234214782714844, -0.05519866943359375, -0.052163124084472656, -0.04912757873535156, -0.04609203338623047, -0.043056488037109375, -0.04002094268798828, -0.03698539733886719, -0.033949851989746094, -0.030914306640625, -0.027878761291503906, -0.024843215942382812, -0.02180767059326172, -0.018772125244140625, -0.01573657989501953, -0.012701034545898438, -0.009665489196777344, -0.00662994384765625, -0.0035943984985351562, -0.0005588531494140625, 0.0024766921997070312, 0.005512237548828125, 0.008547782897949219, 0.011583328247070312, 0.014618873596191406, 0.0176544189453125, 0.020689964294433594, 0.023725509643554688, 0.02676105499267578, 0.029796600341796875, 0.03283214569091797, 0.03586769104003906, 0.038903236389160156, 0.04193878173828125, 0.044974327087402344, 0.04800987243652344, 0.05104541778564453, 0.054080963134765625, 0.05711650848388672, 0.06015205383300781, 0.0631875991821289, 0.06622314453125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 7.0, 22.0, 24.0, 37.0, 61.0, 105.0, 224.0, 414.0, 985.0, 2653.0, 7951.0, 32811.0, 203707.0, 581009.0, 177414.0, 29620.0, 7261.0, 2382.0, 984.0, 405.0, 203.0, 90.0, 63.0, 37.0, 35.0, 17.0, 11.0, 6.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0841064453125, -0.0813455581665039, -0.07858467102050781, -0.07582378387451172, -0.07306289672851562, -0.07030200958251953, -0.06754112243652344, -0.06478023529052734, -0.06201934814453125, -0.059258460998535156, -0.05649757385253906, -0.05373668670654297, -0.050975799560546875, -0.04821491241455078, -0.04545402526855469, -0.042693138122558594, -0.0399322509765625, -0.037171363830566406, -0.03441047668457031, -0.03164958953857422, -0.028888702392578125, -0.02612781524658203, -0.023366928100585938, -0.020606040954589844, -0.01784515380859375, -0.015084266662597656, -0.012323379516601562, -0.009562492370605469, -0.006801605224609375, -0.004040718078613281, -0.0012798309326171875, 0.0014810562133789062, 0.004241943359375, 0.007002830505371094, 0.009763717651367188, 0.012524604797363281, 0.015285491943359375, 0.01804637908935547, 0.020807266235351562, 0.023568153381347656, 0.02632904052734375, 0.029089927673339844, 0.03185081481933594, 0.03461170196533203, 0.037372589111328125, 0.04013347625732422, 0.04289436340332031, 0.045655250549316406, 0.0484161376953125, 0.051177024841308594, 0.05393791198730469, 0.05669879913330078, 0.059459686279296875, 0.06222057342529297, 0.06498146057128906, 0.06774234771728516, 0.07050323486328125, 0.07326412200927734, 0.07602500915527344, 0.07878589630126953, 0.08154678344726562, 0.08430767059326172, 0.08706855773925781, 0.0898294448852539, 0.09259033203125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 3.0, 7.0, 10.0, 12.0, 20.0, 32.0, 31.0, 48.0, 41.0, 79.0, 72.0, 93.0, 103.0, 95.0, 76.0, 68.0, 43.0, 38.0, 30.0, 16.0, 23.0, 9.0, 16.0, 7.0, 7.0, 3.0, 3.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.079673767089844e-05, -5.809031426906586e-05, -5.5383890867233276e-05, -5.2677467465400696e-05, -4.9971044063568115e-05, -4.7264620661735535e-05, -4.4558197259902954e-05, -4.1851773858070374e-05, -3.914535045623779e-05, -3.643892705440521e-05, -3.373250365257263e-05, -3.102608025074005e-05, -2.831965684890747e-05, -2.561323344707489e-05, -2.290681004524231e-05, -2.020038664340973e-05, -1.749396324157715e-05, -1.4787539839744568e-05, -1.2081116437911987e-05, -9.374693036079407e-06, -6.668269634246826e-06, -3.961846232414246e-06, -1.255422830581665e-06, 1.4510005712509155e-06, 4.157423973083496e-06, 6.863847374916077e-06, 9.570270776748657e-06, 1.2276694178581238e-05, 1.4983117580413818e-05, 1.76895409822464e-05, 2.039596438407898e-05, 2.310238778591156e-05, 2.580881118774414e-05, 2.851523458957672e-05, 3.12216579914093e-05, 3.392808139324188e-05, 3.663450479507446e-05, 3.9340928196907043e-05, 4.2047351598739624e-05, 4.4753775000572205e-05, 4.7460198402404785e-05, 5.0166621804237366e-05, 5.2873045206069946e-05, 5.557946860790253e-05, 5.828589200973511e-05, 6.099231541156769e-05, 6.369873881340027e-05, 6.640516221523285e-05, 6.911158561706543e-05, 7.181800901889801e-05, 7.452443242073059e-05, 7.723085582256317e-05, 7.993727922439575e-05, 8.264370262622833e-05, 8.535012602806091e-05, 8.80565494298935e-05, 9.076297283172607e-05, 9.346939623355865e-05, 9.617581963539124e-05, 9.888224303722382e-05, 0.0001015886664390564, 0.00010429508984088898, 0.00010700151324272156, 0.00010970793664455414, 0.00011241436004638672]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 9.0, 13.0, 11.0, 23.0, 44.0, 62.0, 101.0, 228.0, 473.0, 915.0, 2178.0, 6023.0, 24065.0, 148016.0, 565005.0, 248675.0, 38884.0, 8732.0, 2817.0, 1123.0, 548.0, 264.0, 128.0, 85.0, 41.0, 25.0, 22.0, 12.0, 9.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.10333251953125, -0.10065841674804688, -0.09798431396484375, -0.09531021118164062, -0.0926361083984375, -0.08996200561523438, -0.08728790283203125, -0.08461380004882812, -0.081939697265625, -0.07926559448242188, -0.07659149169921875, -0.07391738891601562, -0.0712432861328125, -0.06856918334960938, -0.06589508056640625, -0.06322097778320312, -0.060546875, -0.057872772216796875, -0.05519866943359375, -0.052524566650390625, -0.0498504638671875, -0.047176361083984375, -0.04450225830078125, -0.041828155517578125, -0.039154052734375, -0.036479949951171875, -0.03380584716796875, -0.031131744384765625, -0.0284576416015625, -0.025783538818359375, -0.02310943603515625, -0.020435333251953125, -0.01776123046875, -0.015087127685546875, -0.01241302490234375, -0.009738922119140625, -0.0070648193359375, -0.004390716552734375, -0.00171661376953125, 0.000957489013671875, 0.003631591796875, 0.006305694580078125, 0.00897979736328125, 0.011653900146484375, 0.0143280029296875, 0.017002105712890625, 0.01967620849609375, 0.022350311279296875, 0.0250244140625, 0.027698516845703125, 0.03037261962890625, 0.033046722412109375, 0.0357208251953125, 0.038394927978515625, 0.04106903076171875, 0.043743133544921875, 0.046417236328125, 0.049091339111328125, 0.05176544189453125, 0.054439544677734375, 0.0571136474609375, 0.059787750244140625, 0.06246185302734375, 0.06513595581054688, 0.06781005859375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 4.0, 5.0, 10.0, 14.0, 26.0, 39.0, 35.0, 58.0, 58.0, 81.0, 94.0, 108.0, 83.0, 77.0, 84.0, 59.0, 46.0, 32.0, 20.0, 18.0, 15.0, 6.0, 9.0, 5.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08056640625, -0.07858419418334961, -0.07660198211669922, -0.07461977005004883, -0.07263755798339844, -0.07065534591674805, -0.06867313385009766, -0.06669092178344727, -0.06470870971679688, -0.06272649765014648, -0.060744285583496094, -0.0587620735168457, -0.05677986145019531, -0.05479764938354492, -0.05281543731689453, -0.05083322525024414, -0.04885101318359375, -0.04686880111694336, -0.04488658905029297, -0.04290437698364258, -0.04092216491699219, -0.0389399528503418, -0.036957740783691406, -0.034975528717041016, -0.032993316650390625, -0.031011104583740234, -0.029028892517089844, -0.027046680450439453, -0.025064468383789062, -0.023082256317138672, -0.02110004425048828, -0.01911783218383789, -0.0171356201171875, -0.01515340805053711, -0.013171195983886719, -0.011188983917236328, -0.009206771850585938, -0.007224559783935547, -0.005242347717285156, -0.0032601356506347656, -0.001277923583984375, 0.0007042884826660156, 0.0026865005493164062, 0.004668712615966797, 0.0066509246826171875, 0.008633136749267578, 0.010615348815917969, 0.01259756088256836, 0.01457977294921875, 0.01656198501586914, 0.01854419708251953, 0.020526409149169922, 0.022508621215820312, 0.024490833282470703, 0.026473045349121094, 0.028455257415771484, 0.030437469482421875, 0.032419681549072266, 0.034401893615722656, 0.03638410568237305, 0.03836631774902344, 0.04034852981567383, 0.04233074188232422, 0.04431295394897461, 0.046295166015625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 14.0, 52.0, 149.0, 316.0, 280.0, 129.0, 32.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2901668548583984, -1.2341132164001465, -1.1780595779418945, -1.1220059394836426, -1.0659524202346802, -1.0098987817764282, -0.9538451433181763, -0.8977915048599243, -0.8417378664016724, -0.7856842279434204, -0.7296306490898132, -0.6735770106315613, -0.6175233721733093, -0.5614697933197021, -0.5054161548614502, -0.44936251640319824, -0.39330893754959106, -0.3372553288936615, -0.28120169043540955, -0.22514808177947998, -0.16909445822238922, -0.11304083466529846, -0.056987226009368896, -0.0009335875511169434, 0.05512002110481262, 0.11117364466190338, 0.16722726821899414, 0.2232808768749237, 0.27933448553085327, 0.3353881239891052, 0.3914417326450348, 0.44749537110328674, 0.5035489797592163, 0.5596026182174683, 0.6156561970710754, 0.6717098355293274, 0.7277634739875793, 0.7838170528411865, 0.8398706912994385, 0.8959243297576904, 0.9519779682159424, 1.0080316066741943, 1.0640852451324463, 1.1201388835906982, 1.1761924028396606, 1.2322460412979126, 1.2882996797561646, 1.3443533182144165, 1.400406837463379, 1.4564604759216309, 1.5125141143798828, 1.5685677528381348, 1.6246212720870972, 1.6806749105453491, 1.736728549003601, 1.792782187461853, 1.848835825920105, 1.904889464378357, 1.9609431028366089, 2.0169966220855713, 2.0730502605438232, 2.129103899002075, 2.185157537460327, 2.241211175918579, 2.297264814376831]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 10.0, 5.0, 7.0, 8.0, 14.0, 16.0, 18.0, 18.0, 26.0, 22.0, 28.0, 25.0, 39.0, 38.0, 41.0, 36.0, 46.0, 39.0, 46.0, 43.0, 38.0, 36.0, 37.0, 36.0, 31.0, 39.0, 34.0, 33.0, 28.0, 12.0, 26.0, 19.0, 17.0, 15.0, 14.0, 9.0, 13.0, 11.0, 6.0, 2.0, 4.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.4393470883369446, -0.4269736409187317, -0.4146001935005188, -0.4022267460823059, -0.389853298664093, -0.3774798512458801, -0.36510640382766724, -0.35273295640945435, -0.34035950899124146, -0.32798606157302856, -0.3156126141548157, -0.3032391667366028, -0.2908657193183899, -0.278492271900177, -0.2661188244819641, -0.2537453770637512, -0.24137195944786072, -0.22899851202964783, -0.21662506461143494, -0.20425161719322205, -0.19187816977500916, -0.17950472235679626, -0.16713128983974457, -0.15475784242153168, -0.1423843950033188, -0.1300109475851059, -0.117637500166893, -0.10526406019926071, -0.09289061278104782, -0.08051716536283493, -0.06814372539520264, -0.055770277976989746, -0.043396830558776855, -0.031023385003209114, -0.018649939447641373, -0.0062764957547187805, 0.00609695166349411, 0.018470399081707, 0.030843839049339294, 0.043217286467552185, 0.055590733885765076, 0.06796418130397797, 0.08033762872219086, 0.09271106868982315, 0.10508451610803604, 0.11745796352624893, 0.12983140349388123, 0.14220485091209412, 0.154578298330307, 0.1669517457485199, 0.1793251931667328, 0.19169864058494568, 0.20407208800315857, 0.21644553542137146, 0.22881896793842316, 0.24119241535663605, 0.25356584787368774, 0.26593929529190063, 0.2783127427101135, 0.2906861901283264, 0.3030596375465393, 0.3154330849647522, 0.3278065323829651, 0.340179979801178, 0.35255342721939087]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 10.0, 16.0, 21.0, 27.0, 36.0, 65.0, 99.0, 202.0, 425.0, 1270.0, 4565.0, 31194.0, 1737772.0, 2378663.0, 33500.0, 4413.0, 1138.0, 413.0, 150.0, 77.0, 68.0, 28.0, 22.0, 19.0, 13.0, 12.0, 8.0, 3.0, 9.0, 8.0, 6.0, 3.0, 6.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2783203125, -0.2683868408203125, -0.258453369140625, -0.2485198974609375, -0.23858642578125, -0.2286529541015625, -0.218719482421875, -0.2087860107421875, -0.1988525390625, -0.1889190673828125, -0.178985595703125, -0.1690521240234375, -0.15911865234375, -0.1491851806640625, -0.139251708984375, -0.1293182373046875, -0.119384765625, -0.1094512939453125, -0.099517822265625, -0.0895843505859375, -0.07965087890625, -0.0697174072265625, -0.059783935546875, -0.0498504638671875, -0.0399169921875, -0.0299835205078125, -0.020050048828125, -0.0101165771484375, -0.00018310546875, 0.0097503662109375, 0.019683837890625, 0.0296173095703125, 0.03955078125, 0.0494842529296875, 0.059417724609375, 0.0693511962890625, 0.07928466796875, 0.0892181396484375, 0.099151611328125, 0.1090850830078125, 0.1190185546875, 0.1289520263671875, 0.138885498046875, 0.1488189697265625, 0.15875244140625, 0.1686859130859375, 0.178619384765625, 0.1885528564453125, 0.198486328125, 0.2084197998046875, 0.218353271484375, 0.2282867431640625, 0.23822021484375, 0.2481536865234375, 0.258087158203125, 0.2680206298828125, 0.2779541015625, 0.2878875732421875, 0.297821044921875, 0.3077545166015625, 0.31768798828125, 0.3276214599609375, 0.337554931640625, 0.3474884033203125, 0.357421875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 6.0, 7.0, 5.0, 7.0, 11.0, 18.0, 21.0, 24.0, 31.0, 29.0, 43.0, 51.0, 39.0, 43.0, 71.0, 87.0, 61.0, 67.0, 49.0, 51.0, 41.0, 43.0, 41.0, 31.0, 36.0, 14.0, 20.0, 14.0, 10.0, 10.0, 8.0, 5.0, 5.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0214996337890625, -0.02090597152709961, -0.02031230926513672, -0.019718647003173828, -0.019124984741210938, -0.018531322479248047, -0.017937660217285156, -0.017343997955322266, -0.016750335693359375, -0.016156673431396484, -0.015563011169433594, -0.014969348907470703, -0.014375686645507812, -0.013782024383544922, -0.013188362121582031, -0.01259469985961914, -0.01200103759765625, -0.01140737533569336, -0.010813713073730469, -0.010220050811767578, -0.009626388549804688, -0.009032726287841797, -0.008439064025878906, -0.007845401763916016, -0.007251739501953125, -0.006658077239990234, -0.006064414978027344, -0.005470752716064453, -0.0048770904541015625, -0.004283428192138672, -0.0036897659301757812, -0.0030961036682128906, -0.00250244140625, -0.0019087791442871094, -0.0013151168823242188, -0.0007214546203613281, -0.0001277923583984375, 0.0004658699035644531, 0.0010595321655273438, 0.0016531944274902344, 0.002246856689453125, 0.0028405189514160156, 0.0034341812133789062, 0.004027843475341797, 0.0046215057373046875, 0.005215167999267578, 0.005808830261230469, 0.006402492523193359, 0.00699615478515625, 0.007589817047119141, 0.008183479309082031, 0.008777141571044922, 0.009370803833007812, 0.009964466094970703, 0.010558128356933594, 0.011151790618896484, 0.011745452880859375, 0.012339115142822266, 0.012932777404785156, 0.013526439666748047, 0.014120101928710938, 0.014713764190673828, 0.015307426452636719, 0.01590108871459961, 0.0164947509765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 14.0, 19.0, 35.0, 88.0, 165.0, 507.0, 2132.0, 18714.0, 3964684.0, 200876.0, 5590.0, 976.0, 301.0, 102.0, 46.0, 18.0, 12.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46875, -0.4498138427734375, -0.430877685546875, -0.4119415283203125, -0.39300537109375, -0.3740692138671875, -0.355133056640625, -0.3361968994140625, -0.3172607421875, -0.2983245849609375, -0.279388427734375, -0.2604522705078125, -0.24151611328125, -0.2225799560546875, -0.203643798828125, -0.1847076416015625, -0.165771484375, -0.1468353271484375, -0.127899169921875, -0.1089630126953125, -0.09002685546875, -0.0710906982421875, -0.052154541015625, -0.0332183837890625, -0.0142822265625, 0.0046539306640625, 0.023590087890625, 0.0425262451171875, 0.06146240234375, 0.0803985595703125, 0.099334716796875, 0.1182708740234375, 0.13720703125, 0.1561431884765625, 0.175079345703125, 0.1940155029296875, 0.21295166015625, 0.2318878173828125, 0.250823974609375, 0.2697601318359375, 0.2886962890625, 0.3076324462890625, 0.326568603515625, 0.3455047607421875, 0.36444091796875, 0.3833770751953125, 0.402313232421875, 0.4212493896484375, 0.440185546875, 0.4591217041015625, 0.478057861328125, 0.4969940185546875, 0.51593017578125, 0.5348663330078125, 0.553802490234375, 0.5727386474609375, 0.5916748046875, 0.6106109619140625, 0.629547119140625, 0.6484832763671875, 0.66741943359375, 0.6863555908203125, 0.705291748046875, 0.7242279052734375, 0.7431640625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 12.0, 20.0, 38.0, 76.0, 175.0, 444.0, 1332.0, 1188.0, 458.0, 176.0, 67.0, 33.0, 15.0, 13.0, 3.0, 8.0, 3.0, 3.0, 0.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12548828125, -0.1217947006225586, -0.11810111999511719, -0.11440753936767578, -0.11071395874023438, -0.10702037811279297, -0.10332679748535156, -0.09963321685791016, -0.09593963623046875, -0.09224605560302734, -0.08855247497558594, -0.08485889434814453, -0.08116531372070312, -0.07747173309326172, -0.07377815246582031, -0.0700845718383789, -0.0663909912109375, -0.0626974105834961, -0.05900382995605469, -0.05531024932861328, -0.051616668701171875, -0.04792308807373047, -0.04422950744628906, -0.040535926818847656, -0.03684234619140625, -0.033148765563964844, -0.029455184936523438, -0.02576160430908203, -0.022068023681640625, -0.01837444305419922, -0.014680862426757812, -0.010987281799316406, -0.007293701171875, -0.0036001205444335938, 9.34600830078125e-05, 0.0037870407104492188, 0.007480621337890625, 0.011174201965332031, 0.014867782592773438, 0.018561363220214844, 0.02225494384765625, 0.025948524475097656, 0.029642105102539062, 0.03333568572998047, 0.037029266357421875, 0.04072284698486328, 0.04441642761230469, 0.048110008239746094, 0.0518035888671875, 0.055497169494628906, 0.05919075012207031, 0.06288433074951172, 0.06657791137695312, 0.07027149200439453, 0.07396507263183594, 0.07765865325927734, 0.08135223388671875, 0.08504581451416016, 0.08873939514160156, 0.09243297576904297, 0.09612655639648438, 0.09982013702392578, 0.10351371765136719, 0.1072072982788086, 0.11090087890625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 6.0, 33.0, 159.0, 441.0, 287.0, 64.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8203022480010986, -0.7710500359535217, -0.7217978239059448, -0.6725456714630127, -0.6232934594154358, -0.5740412473678589, -0.524789035320282, -0.47553685307502747, -0.42628464102745056, -0.37703242897987366, -0.32778024673461914, -0.27852803468704224, -0.22927583754062653, -0.18002364039421082, -0.1307714283466339, -0.0815192461013794, -0.03226703405380249, 0.01698516681790352, 0.06623736768960953, 0.11548957228660583, 0.16474176943302155, 0.21399396657943726, 0.26324617862701416, 0.3124983608722687, 0.3617505729198456, 0.4110027849674225, 0.460254967212677, 0.5095071792602539, 0.5587593913078308, 0.6080116033554077, 0.6572637557983398, 0.7065159678459167, 0.7557681798934937, 0.8050203919410706, 0.8542726039886475, 0.9035247564315796, 0.9527769684791565, 1.0020291805267334, 1.051281452178955, 1.1005336046218872, 1.1497857570648193, 1.1990379095077515, 1.2482901811599731, 1.2975423336029053, 1.346794605255127, 1.396046757698059, 1.4452989101409912, 1.494551181793213, 1.5438034534454346, 1.5930556058883667, 1.6423078775405884, 1.6915600299835205, 1.7408123016357422, 1.7900644540786743, 1.8393166065216064, 1.8885688781738281, 1.9378210306167603, 1.9870731830596924, 2.036325454711914, 2.0855777263641357, 2.1348297595977783, 2.18408203125, 2.2333343029022217, 2.2825863361358643, 2.331838607788086]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 9.0, 16.0, 15.0, 22.0, 18.0, 27.0, 33.0, 43.0, 36.0, 51.0, 47.0, 57.0, 59.0, 58.0, 65.0, 56.0, 55.0, 48.0, 49.0, 33.0, 40.0, 32.0, 25.0, 18.0, 22.0, 15.0, 8.0, 8.0, 9.0, 7.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.31586652994155884, -0.30741360783576965, -0.29896068572998047, -0.2905077636241913, -0.2820548415184021, -0.2736019194126129, -0.26514899730682373, -0.25669607520103455, -0.24824315309524536, -0.23979023098945618, -0.231337308883667, -0.2228843867778778, -0.21443146467208862, -0.20597854256629944, -0.19752562046051025, -0.18907269835472107, -0.18061977624893188, -0.1721668541431427, -0.16371393203735352, -0.15526100993156433, -0.14680808782577515, -0.13835516571998596, -0.12990224361419678, -0.12144932150840759, -0.11299639940261841, -0.10454347729682922, -0.09609055519104004, -0.08763763308525085, -0.07918471097946167, -0.07073178887367249, -0.0622788667678833, -0.053825944662094116, -0.04537302255630493, -0.03692010045051575, -0.028467178344726562, -0.020014256238937378, -0.011561334133148193, -0.003108412027359009, 0.005344510078430176, 0.01379743218421936, 0.022250354290008545, 0.03070327639579773, 0.039156198501586914, 0.0476091206073761, 0.05606204271316528, 0.06451496481895447, 0.07296788692474365, 0.08142080903053284, 0.08987373113632202, 0.0983266532421112, 0.10677957534790039, 0.11523249745368958, 0.12368541955947876, 0.13213834166526794, 0.14059126377105713, 0.1490441858768463, 0.1574971079826355, 0.16595003008842468, 0.17440295219421387, 0.18285587430000305, 0.19130879640579224, 0.19976171851158142, 0.2082146406173706, 0.2166675627231598, 0.22512048482894897]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 8.0, 16.0, 13.0, 12.0, 26.0, 29.0, 32.0, 70.0, 74.0, 98.0, 143.0, 246.0, 411.0, 739.0, 1452.0, 3394.0, 10420.0, 42204.0, 187027.0, 462636.0, 256448.0, 60528.0, 14258.0, 4309.0, 1760.0, 851.0, 497.0, 264.0, 164.0, 108.0, 78.0, 54.0, 44.0, 33.0, 31.0, 16.0, 16.0, 11.0, 5.0, 6.0, 6.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12432861328125, -0.12039661407470703, -0.11646461486816406, -0.1125326156616211, -0.10860061645507812, -0.10466861724853516, -0.10073661804199219, -0.09680461883544922, -0.09287261962890625, -0.08894062042236328, -0.08500862121582031, -0.08107662200927734, -0.07714462280273438, -0.0732126235961914, -0.06928062438964844, -0.06534862518310547, -0.0614166259765625, -0.05748462677001953, -0.05355262756347656, -0.049620628356933594, -0.045688629150390625, -0.041756629943847656, -0.03782463073730469, -0.03389263153076172, -0.02996063232421875, -0.02602863311767578, -0.022096633911132812, -0.018164634704589844, -0.014232635498046875, -0.010300636291503906, -0.0063686370849609375, -0.0024366378784179688, 0.001495361328125, 0.005427360534667969, 0.009359359741210938, 0.013291358947753906, 0.017223358154296875, 0.021155357360839844, 0.025087356567382812, 0.02901935577392578, 0.03295135498046875, 0.03688335418701172, 0.04081535339355469, 0.044747352600097656, 0.048679351806640625, 0.052611351013183594, 0.05654335021972656, 0.06047534942626953, 0.0644073486328125, 0.06833934783935547, 0.07227134704589844, 0.0762033462524414, 0.08013534545898438, 0.08406734466552734, 0.08799934387207031, 0.09193134307861328, 0.09586334228515625, 0.09979534149169922, 0.10372734069824219, 0.10765933990478516, 0.11159133911132812, 0.1155233383178711, 0.11945533752441406, 0.12338733673095703, 0.1273193359375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 4.0, 8.0, 15.0, 11.0, 18.0, 28.0, 22.0, 31.0, 34.0, 37.0, 46.0, 57.0, 50.0, 72.0, 50.0, 63.0, 65.0, 58.0, 50.0, 35.0, 51.0, 33.0, 24.0, 30.0, 33.0, 11.0, 12.0, 9.0, 10.0, 9.0, 9.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0220489501953125, -0.021437406539916992, -0.020825862884521484, -0.020214319229125977, -0.01960277557373047, -0.01899123191833496, -0.018379688262939453, -0.017768144607543945, -0.017156600952148438, -0.01654505729675293, -0.015933513641357422, -0.015321969985961914, -0.014710426330566406, -0.014098882675170898, -0.01348733901977539, -0.012875795364379883, -0.012264251708984375, -0.011652708053588867, -0.01104116439819336, -0.010429620742797852, -0.009818077087402344, -0.009206533432006836, -0.008594989776611328, -0.00798344612121582, -0.0073719024658203125, -0.006760358810424805, -0.006148815155029297, -0.005537271499633789, -0.004925727844238281, -0.0043141841888427734, -0.0037026405334472656, -0.003091096878051758, -0.00247955322265625, -0.0018680095672607422, -0.0012564659118652344, -0.0006449222564697266, -3.337860107421875e-05, 0.0005781650543212891, 0.0011897087097167969, 0.0018012523651123047, 0.0024127960205078125, 0.0030243396759033203, 0.003635883331298828, 0.004247426986694336, 0.004858970642089844, 0.0054705142974853516, 0.006082057952880859, 0.006693601608276367, 0.007305145263671875, 0.007916688919067383, 0.00852823257446289, 0.009139776229858398, 0.009751319885253906, 0.010362863540649414, 0.010974407196044922, 0.01158595085144043, 0.012197494506835938, 0.012809038162231445, 0.013420581817626953, 0.014032125473022461, 0.014643669128417969, 0.015255212783813477, 0.015866756439208984, 0.016478300094604492, 0.01708984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 7.0, 8.0, 14.0, 27.0, 29.0, 28.0, 42.0, 67.0, 94.0, 148.0, 245.0, 351.0, 704.0, 1362.0, 3147.0, 8773.0, 28225.0, 95314.0, 272773.0, 377351.0, 177430.0, 55701.0, 16706.0, 5474.0, 2143.0, 990.0, 545.0, 284.0, 180.0, 104.0, 71.0, 53.0, 41.0, 34.0, 29.0, 14.0, 18.0, 9.0, 9.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0750732421875, -0.07267284393310547, -0.07027244567871094, -0.0678720474243164, -0.06547164916992188, -0.06307125091552734, -0.06067085266113281, -0.05827045440673828, -0.05587005615234375, -0.05346965789794922, -0.05106925964355469, -0.048668861389160156, -0.046268463134765625, -0.043868064880371094, -0.04146766662597656, -0.03906726837158203, -0.0366668701171875, -0.03426647186279297, -0.03186607360839844, -0.029465675354003906, -0.027065277099609375, -0.024664878845214844, -0.022264480590820312, -0.01986408233642578, -0.01746368408203125, -0.015063285827636719, -0.012662887573242188, -0.010262489318847656, -0.007862091064453125, -0.005461692810058594, -0.0030612945556640625, -0.0006608963012695312, 0.001739501953125, 0.004139900207519531, 0.0065402984619140625, 0.008940696716308594, 0.011341094970703125, 0.013741493225097656, 0.016141891479492188, 0.01854228973388672, 0.02094268798828125, 0.02334308624267578, 0.025743484497070312, 0.028143882751464844, 0.030544281005859375, 0.032944679260253906, 0.03534507751464844, 0.03774547576904297, 0.0401458740234375, 0.04254627227783203, 0.04494667053222656, 0.047347068786621094, 0.049747467041015625, 0.052147865295410156, 0.05454826354980469, 0.05694866180419922, 0.05934906005859375, 0.06174945831298828, 0.06414985656738281, 0.06655025482177734, 0.06895065307617188, 0.0713510513305664, 0.07375144958496094, 0.07615184783935547, 0.07855224609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 0.0, 2.0, 2.0, 8.0, 11.0, 5.0, 14.0, 16.0, 10.0, 13.0, 11.0, 22.0, 24.0, 23.0, 29.0, 36.0, 31.0, 55.0, 38.0, 39.0, 40.0, 43.0, 28.0, 36.0, 40.0, 33.0, 44.0, 41.0, 42.0, 35.0, 28.0, 36.0, 34.0, 25.0, 21.0, 14.0, 10.0, 16.0, 14.0, 9.0, 12.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06756591796875, -0.06547164916992188, -0.06337738037109375, -0.061283111572265625, -0.0591888427734375, -0.057094573974609375, -0.05500030517578125, -0.052906036376953125, -0.050811767578125, -0.048717498779296875, -0.04662322998046875, -0.044528961181640625, -0.0424346923828125, -0.040340423583984375, -0.03824615478515625, -0.036151885986328125, -0.0340576171875, -0.031963348388671875, -0.02986907958984375, -0.027774810791015625, -0.0256805419921875, -0.023586273193359375, -0.02149200439453125, -0.019397735595703125, -0.017303466796875, -0.015209197998046875, -0.01311492919921875, -0.011020660400390625, -0.0089263916015625, -0.006832122802734375, -0.00473785400390625, -0.002643585205078125, -0.00054931640625, 0.001544952392578125, 0.00363922119140625, 0.005733489990234375, 0.0078277587890625, 0.009922027587890625, 0.01201629638671875, 0.014110565185546875, 0.016204833984375, 0.018299102783203125, 0.02039337158203125, 0.022487640380859375, 0.0245819091796875, 0.026676177978515625, 0.02877044677734375, 0.030864715576171875, 0.032958984375, 0.035053253173828125, 0.03714752197265625, 0.039241790771484375, 0.0413360595703125, 0.043430328369140625, 0.04552459716796875, 0.047618865966796875, 0.049713134765625, 0.051807403564453125, 0.05390167236328125, 0.055995941162109375, 0.0580902099609375, 0.060184478759765625, 0.06227874755859375, 0.06437301635742188, 0.06646728515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 7.0, 4.0, 9.0, 14.0, 24.0, 33.0, 56.0, 69.0, 132.0, 226.0, 433.0, 823.0, 1727.0, 4399.0, 13056.0, 45573.0, 173408.0, 405709.0, 283982.0, 84397.0, 22437.0, 6903.0, 2638.0, 1130.0, 625.0, 282.0, 157.0, 110.0, 65.0, 48.0, 24.0, 14.0, 15.0, 5.0, 4.0, 3.0, 2.0, 0.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06488037109375, -0.06311368942260742, -0.061347007751464844, -0.059580326080322266, -0.05781364440917969, -0.05604696273803711, -0.05428028106689453, -0.05251359939575195, -0.050746917724609375, -0.0489802360534668, -0.04721355438232422, -0.04544687271118164, -0.04368019104003906, -0.041913509368896484, -0.040146827697753906, -0.03838014602661133, -0.03661346435546875, -0.03484678268432617, -0.033080101013183594, -0.031313419342041016, -0.029546737670898438, -0.02778005599975586, -0.02601337432861328, -0.024246692657470703, -0.022480010986328125, -0.020713329315185547, -0.01894664764404297, -0.01717996597290039, -0.015413284301757812, -0.013646602630615234, -0.011879920959472656, -0.010113239288330078, -0.0083465576171875, -0.006579875946044922, -0.004813194274902344, -0.0030465126037597656, -0.0012798309326171875, 0.0004868507385253906, 0.0022535324096679688, 0.004020214080810547, 0.005786895751953125, 0.007553577423095703, 0.009320259094238281, 0.01108694076538086, 0.012853622436523438, 0.014620304107666016, 0.016386985778808594, 0.018153667449951172, 0.01992034912109375, 0.021687030792236328, 0.023453712463378906, 0.025220394134521484, 0.026987075805664062, 0.02875375747680664, 0.03052043914794922, 0.0322871208190918, 0.034053802490234375, 0.03582048416137695, 0.03758716583251953, 0.03935384750366211, 0.04112052917480469, 0.042887210845947266, 0.044653892517089844, 0.04642057418823242, 0.048187255859375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 8.0, 15.0, 22.0, 30.0, 83.0, 91.0, 143.0, 201.0, 130.0, 105.0, 76.0, 36.0, 31.0, 18.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.00019669532775878906, -0.00019279494881629944, -0.00018889456987380981, -0.0001849941909313202, -0.00018109381198883057, -0.00017719343304634094, -0.00017329305410385132, -0.0001693926751613617, -0.00016549229621887207, -0.00016159191727638245, -0.00015769153833389282, -0.0001537911593914032, -0.00014989078044891357, -0.00014599040150642395, -0.00014209002256393433, -0.0001381896436214447, -0.00013428926467895508, -0.00013038888573646545, -0.00012648850679397583, -0.0001225881278514862, -0.00011868774890899658, -0.00011478736996650696, -0.00011088699102401733, -0.00010698661208152771, -0.00010308623313903809, -9.918585419654846e-05, -9.528547525405884e-05, -9.138509631156921e-05, -8.748471736907959e-05, -8.358433842658997e-05, -7.968395948410034e-05, -7.578358054161072e-05, -7.18832015991211e-05, -6.798282265663147e-05, -6.408244371414185e-05, -6.018206477165222e-05, -5.62816858291626e-05, -5.2381306886672974e-05, -4.848092794418335e-05, -4.4580549001693726e-05, -4.06801700592041e-05, -3.677979111671448e-05, -3.2879412174224854e-05, -2.897903323173523e-05, -2.5078654289245605e-05, -2.117827534675598e-05, -1.7277896404266357e-05, -1.3377517461776733e-05, -9.47713851928711e-06, -5.576759576797485e-06, -1.6763806343078613e-06, 2.2239983081817627e-06, 6.124377250671387e-06, 1.002475619316101e-05, 1.3925135135650635e-05, 1.782551407814026e-05, 2.1725893020629883e-05, 2.5626271963119507e-05, 2.952665090560913e-05, 3.3427029848098755e-05, 3.732740879058838e-05, 4.1227787733078e-05, 4.512816667556763e-05, 4.902854561805725e-05, 5.2928924560546875e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 5.0, 2.0, 8.0, 6.0, 12.0, 14.0, 20.0, 16.0, 47.0, 45.0, 69.0, 107.0, 163.0, 237.0, 435.0, 719.0, 1371.0, 2779.0, 6271.0, 16816.0, 51176.0, 156201.0, 348834.0, 293442.0, 111697.0, 36032.0, 12161.0, 4841.0, 2307.0, 1100.0, 592.0, 358.0, 256.0, 121.0, 102.0, 65.0, 39.0, 14.0, 18.0, 15.0, 22.0, 6.0, 5.0, 3.0, 4.0, 2.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04486083984375, -0.04340648651123047, -0.04195213317871094, -0.040497779846191406, -0.039043426513671875, -0.037589073181152344, -0.03613471984863281, -0.03468036651611328, -0.03322601318359375, -0.03177165985107422, -0.030317306518554688, -0.028862953186035156, -0.027408599853515625, -0.025954246520996094, -0.024499893188476562, -0.02304553985595703, -0.0215911865234375, -0.02013683319091797, -0.018682479858398438, -0.017228126525878906, -0.015773773193359375, -0.014319419860839844, -0.012865066528320312, -0.011410713195800781, -0.00995635986328125, -0.008502006530761719, -0.0070476531982421875, -0.005593299865722656, -0.004138946533203125, -0.0026845932006835938, -0.0012302398681640625, 0.00022411346435546875, 0.001678466796875, 0.0031328201293945312, 0.0045871734619140625, 0.006041526794433594, 0.007495880126953125, 0.008950233459472656, 0.010404586791992188, 0.011858940124511719, 0.01331329345703125, 0.014767646789550781, 0.016222000122070312, 0.017676353454589844, 0.019130706787109375, 0.020585060119628906, 0.022039413452148438, 0.02349376678466797, 0.0249481201171875, 0.02640247344970703, 0.027856826782226562, 0.029311180114746094, 0.030765533447265625, 0.032219886779785156, 0.03367424011230469, 0.03512859344482422, 0.03658294677734375, 0.03803730010986328, 0.03949165344238281, 0.040946006774902344, 0.042400360107421875, 0.043854713439941406, 0.04530906677246094, 0.04676342010498047, 0.0482177734375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 3.0, 5.0, 3.0, 8.0, 8.0, 12.0, 15.0, 21.0, 24.0, 42.0, 49.0, 47.0, 41.0, 59.0, 63.0, 77.0, 69.0, 77.0, 63.0, 67.0, 54.0, 37.0, 29.0, 23.0, 26.0, 19.0, 15.0, 21.0, 8.0, 6.0, 1.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039764404296875, -0.038402557373046875, -0.03704071044921875, -0.035678863525390625, -0.0343170166015625, -0.032955169677734375, -0.03159332275390625, -0.030231475830078125, -0.02886962890625, -0.027507781982421875, -0.02614593505859375, -0.024784088134765625, -0.0234222412109375, -0.022060394287109375, -0.02069854736328125, -0.019336700439453125, -0.017974853515625, -0.016613006591796875, -0.01525115966796875, -0.013889312744140625, -0.0125274658203125, -0.011165618896484375, -0.00980377197265625, -0.008441925048828125, -0.007080078125, -0.005718231201171875, -0.00435638427734375, -0.002994537353515625, -0.0016326904296875, -0.000270843505859375, 0.00109100341796875, 0.002452850341796875, 0.003814697265625, 0.005176544189453125, 0.00653839111328125, 0.007900238037109375, 0.0092620849609375, 0.010623931884765625, 0.01198577880859375, 0.013347625732421875, 0.01470947265625, 0.016071319580078125, 0.01743316650390625, 0.018795013427734375, 0.0201568603515625, 0.021518707275390625, 0.02288055419921875, 0.024242401123046875, 0.025604248046875, 0.026966094970703125, 0.02832794189453125, 0.029689788818359375, 0.0310516357421875, 0.032413482666015625, 0.03377532958984375, 0.035137176513671875, 0.0364990234375, 0.037860870361328125, 0.03922271728515625, 0.040584564208984375, 0.0419464111328125, 0.043308258056640625, 0.04467010498046875, 0.046031951904296875, 0.047393798828125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 14.0, 33.0, 92.0, 136.0, 222.0, 221.0, 127.0, 76.0, 45.0, 14.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.4792819023132324, -1.4471585750579834, -1.4150351285934448, -1.3829118013381958, -1.3507883548736572, -1.3186650276184082, -1.2865415811538696, -1.2544182538986206, -1.222294807434082, -1.190171480178833, -1.1580480337142944, -1.1259247064590454, -1.0938012599945068, -1.0616779327392578, -1.0295544862747192, -0.9974311590194702, -0.9653078317642212, -0.9331844449043274, -0.9010610580444336, -0.8689376711845398, -0.836814284324646, -0.804690957069397, -0.7725675702095032, -0.7404441833496094, -0.7083207964897156, -0.6761974096298218, -0.644074022769928, -0.6119506359100342, -0.5798273086547852, -0.5477038621902466, -0.5155805349349976, -0.48345714807510376, -0.4513338804244995, -0.4192104935646057, -0.3870871067047119, -0.3549637496471405, -0.3228403627872467, -0.2907169759273529, -0.2585936188697815, -0.2264702320098877, -0.1943468451499939, -0.1622234582901001, -0.1301000863313675, -0.09797670692205429, -0.06585332751274109, -0.03372994065284729, -0.001606568694114685, 0.03051680326461792, 0.06264019012451172, 0.09476356953382492, 0.12688694894313812, 0.15901032090187073, 0.19113370776176453, 0.22325709462165833, 0.25538045167922974, 0.28750383853912354, 0.31962722539901733, 0.35175061225891113, 0.38387399911880493, 0.41599735617637634, 0.44812074303627014, 0.48024412989616394, 0.5123674869537354, 0.5444908738136292, 0.576614260673523]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 13.0, 7.0, 15.0, 14.0, 23.0, 15.0, 26.0, 19.0, 36.0, 34.0, 43.0, 44.0, 48.0, 59.0, 50.0, 66.0, 49.0, 49.0, 59.0, 45.0, 43.0, 34.0, 33.0, 30.0, 27.0, 25.0, 22.0, 17.0, 16.0, 10.0, 8.0, 5.0, 3.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.5736936330795288, -0.5585599541664124, -0.5434263348579407, -0.5282926559448242, -0.5131590366363525, -0.4980253577232361, -0.482891708612442, -0.46775805950164795, -0.4526243805885315, -0.4374907314777374, -0.42235708236694336, -0.4072234034538269, -0.39208975434303284, -0.37695610523223877, -0.3618224561214447, -0.34668880701065063, -0.33155515789985657, -0.3164215087890625, -0.30128785967826843, -0.28615421056747437, -0.2710205316543579, -0.25588688254356384, -0.24075323343276978, -0.2256195843219757, -0.21048592031002045, -0.19535227119922638, -0.18021860718727112, -0.16508495807647705, -0.14995130896568298, -0.13481764495372772, -0.11968399584293365, -0.10455033928155899, -0.08941668272018433, -0.07428302615880966, -0.059149373322725296, -0.04401572048664093, -0.028882063925266266, -0.013748407363891602, 0.0013852417469024658, 0.01651889830827713, 0.031652554869651794, 0.04678621143102646, 0.061919864267110825, 0.07705351710319519, 0.09218717366456985, 0.10732083022594452, 0.12245447933673859, 0.13758814334869385, 0.15272179245948792, 0.16785544157028198, 0.18298910558223724, 0.1981227546930313, 0.21325641870498657, 0.22839006781578064, 0.2435237169265747, 0.2586573660373688, 0.27379101514816284, 0.2889246642589569, 0.304058313369751, 0.31919199228286743, 0.3343256413936615, 0.34945929050445557, 0.36459293961524963, 0.3797265887260437, 0.39486026763916016]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 7.0, 4.0, 8.0, 13.0, 17.0, 32.0, 43.0, 92.0, 147.0, 329.0, 740.0, 1908.0, 7065.0, 46630.0, 2388507.0, 1696446.0, 43573.0, 6194.0, 1492.0, 534.0, 218.0, 101.0, 56.0, 25.0, 29.0, 18.0, 11.0, 9.0, 10.0, 6.0, 4.0, 6.0, 2.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1776123046875, -0.17148399353027344, -0.16535568237304688, -0.1592273712158203, -0.15309906005859375, -0.1469707489013672, -0.14084243774414062, -0.13471412658691406, -0.1285858154296875, -0.12245750427246094, -0.11632919311523438, -0.11020088195800781, -0.10407257080078125, -0.09794425964355469, -0.09181594848632812, -0.08568763732910156, -0.079559326171875, -0.07343101501464844, -0.06730270385742188, -0.06117439270019531, -0.05504608154296875, -0.04891777038574219, -0.042789459228515625, -0.03666114807128906, -0.0305328369140625, -0.024404525756835938, -0.018276214599609375, -0.012147903442382812, -0.00601959228515625, 0.0001087188720703125, 0.006237030029296875, 0.012365341186523438, 0.01849365234375, 0.024621963500976562, 0.030750274658203125, 0.03687858581542969, 0.04300689697265625, 0.04913520812988281, 0.055263519287109375, 0.06139183044433594, 0.0675201416015625, 0.07364845275878906, 0.07977676391601562, 0.08590507507324219, 0.09203338623046875, 0.09816169738769531, 0.10429000854492188, 0.11041831970214844, 0.116546630859375, 0.12267494201660156, 0.12880325317382812, 0.1349315643310547, 0.14105987548828125, 0.1471881866455078, 0.15331649780273438, 0.15944480895996094, 0.1655731201171875, 0.17170143127441406, 0.17782974243164062, 0.1839580535888672, 0.19008636474609375, 0.1962146759033203, 0.20234298706054688, 0.20847129821777344, 0.214599609375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 10.0, 9.0, 15.0, 22.0, 23.0, 36.0, 41.0, 68.0, 80.0, 71.0, 90.0, 89.0, 87.0, 82.0, 70.0, 51.0, 45.0, 37.0, 19.0, 18.0, 12.0, 8.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.041961669921875, -0.041010379791259766, -0.04005908966064453, -0.0391077995300293, -0.03815650939941406, -0.03720521926879883, -0.036253929138183594, -0.03530263900756836, -0.034351348876953125, -0.03340005874633789, -0.032448768615722656, -0.03149747848510742, -0.030546188354492188, -0.029594898223876953, -0.02864360809326172, -0.027692317962646484, -0.02674102783203125, -0.025789737701416016, -0.02483844757080078, -0.023887157440185547, -0.022935867309570312, -0.021984577178955078, -0.021033287048339844, -0.02008199691772461, -0.019130706787109375, -0.01817941665649414, -0.017228126525878906, -0.016276836395263672, -0.015325546264648438, -0.014374256134033203, -0.013422966003417969, -0.012471675872802734, -0.0115203857421875, -0.010569095611572266, -0.009617805480957031, -0.008666515350341797, -0.0077152252197265625, -0.006763935089111328, -0.005812644958496094, -0.004861354827880859, -0.003910064697265625, -0.0029587745666503906, -0.0020074844360351562, -0.0010561943054199219, -0.0001049041748046875, 0.0008463859558105469, 0.0017976760864257812, 0.0027489662170410156, 0.00370025634765625, 0.004651546478271484, 0.005602836608886719, 0.006554126739501953, 0.0075054168701171875, 0.008456707000732422, 0.009407997131347656, 0.01035928726196289, 0.011310577392578125, 0.01226186752319336, 0.013213157653808594, 0.014164447784423828, 0.015115737915039062, 0.016067028045654297, 0.01701831817626953, 0.017969608306884766, 0.0189208984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 8.0, 9.0, 19.0, 26.0, 44.0, 67.0, 116.0, 235.0, 676.0, 3223.0, 33691.0, 2656834.0, 1468403.0, 26994.0, 2757.0, 632.0, 214.0, 155.0, 72.0, 47.0, 24.0, 17.0, 15.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2410888671875, -0.23276329040527344, -0.22443771362304688, -0.2161121368408203, -0.20778656005859375, -0.1994609832763672, -0.19113540649414062, -0.18280982971191406, -0.1744842529296875, -0.16615867614746094, -0.15783309936523438, -0.1495075225830078, -0.14118194580078125, -0.1328563690185547, -0.12453079223632812, -0.11620521545410156, -0.107879638671875, -0.09955406188964844, -0.09122848510742188, -0.08290290832519531, -0.07457733154296875, -0.06625175476074219, -0.057926177978515625, -0.04960060119628906, -0.0412750244140625, -0.03294944763183594, -0.024623870849609375, -0.016298294067382812, -0.00797271728515625, 0.0003528594970703125, 0.008678436279296875, 0.017004013061523438, 0.02532958984375, 0.03365516662597656, 0.041980743408203125, 0.05030632019042969, 0.05863189697265625, 0.06695747375488281, 0.07528305053710938, 0.08360862731933594, 0.0919342041015625, 0.10025978088378906, 0.10858535766601562, 0.11691093444824219, 0.12523651123046875, 0.1335620880126953, 0.14188766479492188, 0.15021324157714844, 0.158538818359375, 0.16686439514160156, 0.17518997192382812, 0.1835155487060547, 0.19184112548828125, 0.2001667022705078, 0.20849227905273438, 0.21681785583496094, 0.2251434326171875, 0.23346900939941406, 0.24179458618164062, 0.2501201629638672, 0.25844573974609375, 0.2667713165283203, 0.2750968933105469, 0.28342247009277344, 0.291748046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 6.0, 19.0, 16.0, 35.0, 45.0, 80.0, 129.0, 210.0, 407.0, 1055.0, 992.0, 418.0, 241.0, 150.0, 95.0, 51.0, 31.0, 20.0, 20.0, 13.0, 11.0, 6.0, 10.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037261962890625, -0.035642147064208984, -0.03402233123779297, -0.03240251541137695, -0.030782699584960938, -0.029162883758544922, -0.027543067932128906, -0.02592325210571289, -0.024303436279296875, -0.02268362045288086, -0.021063804626464844, -0.019443988800048828, -0.017824172973632812, -0.016204357147216797, -0.014584541320800781, -0.012964725494384766, -0.01134490966796875, -0.009725093841552734, -0.008105278015136719, -0.006485462188720703, -0.0048656463623046875, -0.003245830535888672, -0.0016260147094726562, -6.198883056640625e-06, 0.001613616943359375, 0.0032334327697753906, 0.004853248596191406, 0.006473064422607422, 0.008092880249023438, 0.009712696075439453, 0.011332511901855469, 0.012952327728271484, 0.0145721435546875, 0.016191959381103516, 0.01781177520751953, 0.019431591033935547, 0.021051406860351562, 0.022671222686767578, 0.024291038513183594, 0.02591085433959961, 0.027530670166015625, 0.02915048599243164, 0.030770301818847656, 0.03239011764526367, 0.03400993347167969, 0.0356297492980957, 0.03724956512451172, 0.038869380950927734, 0.04048919677734375, 0.042109012603759766, 0.04372882843017578, 0.0453486442565918, 0.04696846008300781, 0.04858827590942383, 0.050208091735839844, 0.05182790756225586, 0.053447723388671875, 0.05506753921508789, 0.056687355041503906, 0.05830717086791992, 0.05992698669433594, 0.06154680252075195, 0.06316661834716797, 0.06478643417358398, 0.06640625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 10.0, 25.0, 48.0, 114.0, 154.0, 203.0, 177.0, 121.0, 71.0, 30.0, 19.0, 17.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1904492825269699, -0.17635327577590942, -0.16225726902484894, -0.14816126227378845, -0.13406524062156677, -0.11996923387050629, -0.1058732271194458, -0.09177721291780472, -0.07768120616674423, -0.06358519941568375, -0.049489185214042664, -0.03539317846298218, -0.021297167986631393, -0.007201157510280609, 0.006894849240779877, 0.02099086344242096, 0.035086870193481445, 0.04918288066983223, 0.06327889114618301, 0.0773748978972435, 0.09147091209888458, 0.10556691884994507, 0.11966292560100555, 0.13375893235206604, 0.14785495400428772, 0.1619509607553482, 0.1760469675064087, 0.19014298915863037, 0.20423899590969086, 0.21833500266075134, 0.23243100941181183, 0.24652701616287231, 0.2606230080127716, 0.2747190296649933, 0.2888150215148926, 0.30291104316711426, 0.31700703501701355, 0.33110305666923523, 0.3451990485191345, 0.3592950701713562, 0.3733910918235779, 0.38748711347579956, 0.40158310532569885, 0.41567912697792053, 0.4297751188278198, 0.4438711404800415, 0.4579671621322632, 0.4720631539821625, 0.48615914583206177, 0.5002551674842834, 0.5143511891365051, 0.528447151184082, 0.5425431728363037, 0.5566391944885254, 0.5707352161407471, 0.5848312377929688, 0.5989272594451904, 0.6130232810974121, 0.6271193027496338, 0.6412152647972107, 0.6553112864494324, 0.669407308101654, 0.6835033297538757, 0.6975993514060974, 0.7116953134536743]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 9.0, 14.0, 12.0, 23.0, 12.0, 24.0, 41.0, 38.0, 60.0, 58.0, 48.0, 64.0, 56.0, 60.0, 63.0, 51.0, 63.0, 55.0, 49.0, 27.0, 41.0, 34.0, 35.0, 17.0, 6.0, 11.0, 16.0, 7.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17899328470230103, -0.17189201712608337, -0.16479076445102692, -0.15768949687480927, -0.1505882441997528, -0.14348697662353516, -0.1363857090473175, -0.12928444147109985, -0.1221831887960434, -0.11508192867040634, -0.10798066854476929, -0.10087940096855164, -0.09377814084291458, -0.08667688071727753, -0.07957561314105988, -0.07247435301542282, -0.06537309288978577, -0.05827183276414871, -0.05117056891322136, -0.044069305062294006, -0.03696804493665695, -0.029866784811019897, -0.022765520960092545, -0.01566425710916519, -0.008562996983528137, -0.0014617349952459335, 0.00563952699303627, 0.012740788981318474, 0.019842050969600677, 0.026943311095237732, 0.034044574946165085, 0.04114583879709244, 0.04824709892272949, 0.05534835904836655, 0.0624496228992939, 0.06955088675022125, 0.0766521468758583, 0.08375340700149536, 0.09085467457771301, 0.09795593470335007, 0.10505719482898712, 0.11215845495462418, 0.11925971508026123, 0.12636098265647888, 0.13346225023269653, 0.140563502907753, 0.14766477048397064, 0.1547660231590271, 0.16186729073524475, 0.1689685583114624, 0.17606981098651886, 0.1831710785627365, 0.19027233123779297, 0.19737359881401062, 0.20447486639022827, 0.21157613396644592, 0.21867738664150238, 0.22577865421772003, 0.2328799068927765, 0.23998117446899414, 0.2470824420452118, 0.25418370962142944, 0.2612849473953247, 0.26838621497154236, 0.27548748254776]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 4.0, 6.0, 11.0, 11.0, 17.0, 13.0, 25.0, 41.0, 62.0, 109.0, 172.0, 288.0, 590.0, 1213.0, 3009.0, 9006.0, 30597.0, 112580.0, 349587.0, 368699.0, 123202.0, 33791.0, 9571.0, 3185.0, 1308.0, 625.0, 298.0, 149.0, 119.0, 88.0, 36.0, 29.0, 23.0, 22.0, 9.0, 14.0, 14.0, 6.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.107177734375, -0.10402870178222656, -0.10087966918945312, -0.09773063659667969, -0.09458160400390625, -0.09143257141113281, -0.08828353881835938, -0.08513450622558594, -0.0819854736328125, -0.07883644104003906, -0.07568740844726562, -0.07253837585449219, -0.06938934326171875, -0.06624031066894531, -0.06309127807617188, -0.05994224548339844, -0.056793212890625, -0.05364418029785156, -0.050495147705078125, -0.04734611511230469, -0.04419708251953125, -0.04104804992675781, -0.037899017333984375, -0.03474998474121094, -0.0316009521484375, -0.028451919555664062, -0.025302886962890625, -0.022153854370117188, -0.01900482177734375, -0.015855789184570312, -0.012706756591796875, -0.009557723999023438, -0.00640869140625, -0.0032596588134765625, -0.000110626220703125, 0.0030384063720703125, 0.00618743896484375, 0.009336471557617188, 0.012485504150390625, 0.015634536743164062, 0.0187835693359375, 0.021932601928710938, 0.025081634521484375, 0.028230667114257812, 0.03137969970703125, 0.03452873229980469, 0.037677764892578125, 0.04082679748535156, 0.043975830078125, 0.04712486267089844, 0.050273895263671875, 0.05342292785644531, 0.05657196044921875, 0.05972099304199219, 0.06287002563476562, 0.06601905822753906, 0.0691680908203125, 0.07231712341308594, 0.07546615600585938, 0.07861518859863281, 0.08176422119140625, 0.08491325378417969, 0.08806228637695312, 0.09121131896972656, 0.0943603515625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 6.0, 5.0, 14.0, 16.0, 22.0, 18.0, 16.0, 25.0, 28.0, 35.0, 31.0, 51.0, 43.0, 68.0, 61.0, 57.0, 69.0, 61.0, 47.0, 41.0, 35.0, 39.0, 40.0, 33.0, 23.0, 24.0, 15.0, 15.0, 13.0, 9.0, 11.0, 5.0, 1.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.02154541015625, -0.02090907096862793, -0.02027273178100586, -0.01963639259338379, -0.01900005340576172, -0.01836371421813965, -0.017727375030517578, -0.017091035842895508, -0.016454696655273438, -0.015818357467651367, -0.015182018280029297, -0.014545679092407227, -0.013909339904785156, -0.013273000717163086, -0.012636661529541016, -0.012000322341918945, -0.011363983154296875, -0.010727643966674805, -0.010091304779052734, -0.009454965591430664, -0.008818626403808594, -0.008182287216186523, -0.007545948028564453, -0.006909608840942383, -0.0062732696533203125, -0.005636930465698242, -0.005000591278076172, -0.0043642520904541016, -0.0037279129028320312, -0.003091573715209961, -0.0024552345275878906, -0.0018188953399658203, -0.00118255615234375, -0.0005462169647216797, 9.012222290039062e-05, 0.0007264614105224609, 0.0013628005981445312, 0.0019991397857666016, 0.002635478973388672, 0.003271818161010742, 0.0039081573486328125, 0.004544496536254883, 0.005180835723876953, 0.0058171749114990234, 0.006453514099121094, 0.007089853286743164, 0.007726192474365234, 0.008362531661987305, 0.008998870849609375, 0.009635210037231445, 0.010271549224853516, 0.010907888412475586, 0.011544227600097656, 0.012180566787719727, 0.012816905975341797, 0.013453245162963867, 0.014089584350585938, 0.014725923538208008, 0.015362262725830078, 0.01599860191345215, 0.01663494110107422, 0.01727128028869629, 0.01790761947631836, 0.01854395866394043, 0.0191802978515625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 9.0, 17.0, 9.0, 17.0, 29.0, 35.0, 33.0, 61.0, 99.0, 129.0, 225.0, 379.0, 656.0, 1323.0, 3282.0, 10619.0, 43078.0, 185070.0, 467900.0, 252176.0, 61081.0, 14433.0, 4168.0, 1681.0, 805.0, 439.0, 287.0, 160.0, 114.0, 73.0, 43.0, 34.0, 26.0, 19.0, 18.0, 8.0, 2.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0899658203125, -0.08702754974365234, -0.08408927917480469, -0.08115100860595703, -0.07821273803710938, -0.07527446746826172, -0.07233619689941406, -0.0693979263305664, -0.06645965576171875, -0.0635213851928711, -0.06058311462402344, -0.05764484405517578, -0.054706573486328125, -0.05176830291748047, -0.04883003234863281, -0.045891761779785156, -0.0429534912109375, -0.040015220642089844, -0.03707695007324219, -0.03413867950439453, -0.031200408935546875, -0.02826213836669922, -0.025323867797851562, -0.022385597229003906, -0.01944732666015625, -0.016509056091308594, -0.013570785522460938, -0.010632514953613281, -0.007694244384765625, -0.004755973815917969, -0.0018177032470703125, 0.0011205673217773438, 0.004058837890625, 0.006997108459472656, 0.009935379028320312, 0.012873649597167969, 0.015811920166015625, 0.01875019073486328, 0.021688461303710938, 0.024626731872558594, 0.02756500244140625, 0.030503273010253906, 0.03344154357910156, 0.03637981414794922, 0.039318084716796875, 0.04225635528564453, 0.04519462585449219, 0.048132896423339844, 0.0510711669921875, 0.054009437561035156, 0.05694770812988281, 0.05988597869873047, 0.06282424926757812, 0.06576251983642578, 0.06870079040527344, 0.0716390609741211, 0.07457733154296875, 0.0775156021118164, 0.08045387268066406, 0.08339214324951172, 0.08633041381835938, 0.08926868438720703, 0.09220695495605469, 0.09514522552490234, 0.09808349609375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 1.0, 2.0, 12.0, 13.0, 11.0, 16.0, 10.0, 19.0, 14.0, 13.0, 12.0, 27.0, 29.0, 25.0, 29.0, 27.0, 40.0, 27.0, 35.0, 36.0, 43.0, 43.0, 32.0, 25.0, 43.0, 44.0, 33.0, 28.0, 36.0, 41.0, 32.0, 30.0, 23.0, 25.0, 17.0, 23.0, 12.0, 11.0, 13.0, 10.0, 11.0, 9.0, 5.0, 2.0, 7.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.07958984375, -0.07748126983642578, -0.07537269592285156, -0.07326412200927734, -0.07115554809570312, -0.0690469741821289, -0.06693840026855469, -0.06482982635498047, -0.06272125244140625, -0.06061267852783203, -0.05850410461425781, -0.056395530700683594, -0.054286956787109375, -0.052178382873535156, -0.05006980895996094, -0.04796123504638672, -0.0458526611328125, -0.04374408721923828, -0.04163551330566406, -0.039526939392089844, -0.037418365478515625, -0.035309791564941406, -0.03320121765136719, -0.03109264373779297, -0.02898406982421875, -0.02687549591064453, -0.024766921997070312, -0.022658348083496094, -0.020549774169921875, -0.018441200256347656, -0.016332626342773438, -0.014224052429199219, -0.012115478515625, -0.010006904602050781, -0.007898330688476562, -0.005789756774902344, -0.003681182861328125, -0.0015726089477539062, 0.0005359649658203125, 0.0026445388793945312, 0.00475311279296875, 0.006861686706542969, 0.008970260620117188, 0.011078834533691406, 0.013187408447265625, 0.015295982360839844, 0.017404556274414062, 0.01951313018798828, 0.0216217041015625, 0.02373027801513672, 0.025838851928710938, 0.027947425842285156, 0.030055999755859375, 0.032164573669433594, 0.03427314758300781, 0.03638172149658203, 0.03849029541015625, 0.04059886932373047, 0.04270744323730469, 0.044816017150878906, 0.046924591064453125, 0.049033164978027344, 0.05114173889160156, 0.05325031280517578, 0.05535888671875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 11.0, 15.0, 13.0, 24.0, 44.0, 74.0, 117.0, 204.0, 418.0, 892.0, 2551.0, 9036.0, 49260.0, 325335.0, 533979.0, 103207.0, 16880.0, 4006.0, 1296.0, 554.0, 268.0, 136.0, 89.0, 42.0, 39.0, 24.0, 9.0, 9.0, 8.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0745849609375, -0.07219409942626953, -0.06980323791503906, -0.0674123764038086, -0.06502151489257812, -0.06263065338134766, -0.06023979187011719, -0.05784893035888672, -0.05545806884765625, -0.05306720733642578, -0.05067634582519531, -0.048285484313964844, -0.045894622802734375, -0.043503761291503906, -0.04111289978027344, -0.03872203826904297, -0.0363311767578125, -0.03394031524658203, -0.03154945373535156, -0.029158592224121094, -0.026767730712890625, -0.024376869201660156, -0.021986007690429688, -0.01959514617919922, -0.01720428466796875, -0.014813423156738281, -0.012422561645507812, -0.010031700134277344, -0.007640838623046875, -0.005249977111816406, -0.0028591156005859375, -0.00046825408935546875, 0.001922607421875, 0.004313468933105469, 0.0067043304443359375, 0.009095191955566406, 0.011486053466796875, 0.013876914978027344, 0.016267776489257812, 0.01865863800048828, 0.02104949951171875, 0.02344036102294922, 0.025831222534179688, 0.028222084045410156, 0.030612945556640625, 0.033003807067871094, 0.03539466857910156, 0.03778553009033203, 0.0401763916015625, 0.04256725311279297, 0.04495811462402344, 0.047348976135253906, 0.049739837646484375, 0.052130699157714844, 0.05452156066894531, 0.05691242218017578, 0.05930328369140625, 0.06169414520263672, 0.06408500671386719, 0.06647586822509766, 0.06886672973632812, 0.0712575912475586, 0.07364845275878906, 0.07603931427001953, 0.07843017578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 9.0, 7.0, 17.0, 13.0, 18.0, 29.0, 36.0, 53.0, 57.0, 73.0, 73.0, 83.0, 79.0, 81.0, 67.0, 59.0, 39.0, 40.0, 33.0, 25.0, 16.0, 25.0, 10.0, 11.0, 7.0, 6.0, 2.0, 5.0, 3.0, 0.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.35385513305664e-05, -6.173364818096161e-05, -5.992874503135681e-05, -5.8123841881752014e-05, -5.631893873214722e-05, -5.451403558254242e-05, -5.270913243293762e-05, -5.0904229283332825e-05, -4.909932613372803e-05, -4.729442298412323e-05, -4.548951983451843e-05, -4.3684616684913635e-05, -4.187971353530884e-05, -4.007481038570404e-05, -3.826990723609924e-05, -3.6465004086494446e-05, -3.466010093688965e-05, -3.285519778728485e-05, -3.1050294637680054e-05, -2.9245391488075256e-05, -2.744048833847046e-05, -2.563558518886566e-05, -2.3830682039260864e-05, -2.2025778889656067e-05, -2.022087574005127e-05, -1.8415972590446472e-05, -1.6611069440841675e-05, -1.4806166291236877e-05, -1.300126314163208e-05, -1.1196359992027283e-05, -9.391456842422485e-06, -7.586553692817688e-06, -5.781650543212891e-06, -3.976747393608093e-06, -2.171844244003296e-06, -3.6694109439849854e-07, 1.4379620552062988e-06, 3.242865204811096e-06, 5.0477683544158936e-06, 6.852671504020691e-06, 8.657574653625488e-06, 1.0462477803230286e-05, 1.2267380952835083e-05, 1.407228410243988e-05, 1.5877187252044678e-05, 1.7682090401649475e-05, 1.9486993551254272e-05, 2.129189670085907e-05, 2.3096799850463867e-05, 2.4901703000068665e-05, 2.6706606149673462e-05, 2.851150929927826e-05, 3.0316412448883057e-05, 3.2121315598487854e-05, 3.392621874809265e-05, 3.573112189769745e-05, 3.7536025047302246e-05, 3.9340928196907043e-05, 4.114583134651184e-05, 4.295073449611664e-05, 4.4755637645721436e-05, 4.656054079532623e-05, 4.836544394493103e-05, 5.017034709453583e-05, 5.1975250244140625e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 7.0, 9.0, 8.0, 4.0, 20.0, 19.0, 34.0, 46.0, 76.0, 128.0, 230.0, 413.0, 773.0, 1923.0, 5668.0, 22627.0, 125473.0, 534287.0, 290757.0, 49939.0, 10347.0, 3137.0, 1216.0, 602.0, 344.0, 193.0, 110.0, 54.0, 52.0, 23.0, 15.0, 6.0, 8.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.063232421875, -0.06103229522705078, -0.05883216857910156, -0.056632041931152344, -0.054431915283203125, -0.052231788635253906, -0.05003166198730469, -0.04783153533935547, -0.04563140869140625, -0.04343128204345703, -0.04123115539550781, -0.039031028747558594, -0.036830902099609375, -0.034630775451660156, -0.03243064880371094, -0.03023052215576172, -0.0280303955078125, -0.02583026885986328, -0.023630142211914062, -0.021430015563964844, -0.019229888916015625, -0.017029762268066406, -0.014829635620117188, -0.012629508972167969, -0.01042938232421875, -0.008229255676269531, -0.0060291290283203125, -0.0038290023803710938, -0.001628875732421875, 0.0005712509155273438, 0.0027713775634765625, 0.004971504211425781, 0.007171630859375, 0.009371757507324219, 0.011571884155273438, 0.013772010803222656, 0.015972137451171875, 0.018172264099121094, 0.020372390747070312, 0.02257251739501953, 0.02477264404296875, 0.02697277069091797, 0.029172897338867188, 0.031373023986816406, 0.033573150634765625, 0.035773277282714844, 0.03797340393066406, 0.04017353057861328, 0.0423736572265625, 0.04457378387451172, 0.04677391052246094, 0.048974037170410156, 0.051174163818359375, 0.053374290466308594, 0.05557441711425781, 0.05777454376220703, 0.05997467041015625, 0.06217479705810547, 0.06437492370605469, 0.0665750503540039, 0.06877517700195312, 0.07097530364990234, 0.07317543029785156, 0.07537555694580078, 0.07757568359375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 10.0, 11.0, 13.0, 29.0, 24.0, 41.0, 64.0, 88.0, 81.0, 102.0, 102.0, 104.0, 77.0, 66.0, 42.0, 33.0, 30.0, 26.0, 19.0, 14.0, 8.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0618896484375, -0.05997323989868164, -0.05805683135986328, -0.05614042282104492, -0.05422401428222656, -0.0523076057434082, -0.050391197204589844, -0.048474788665771484, -0.046558380126953125, -0.044641971588134766, -0.042725563049316406, -0.04080915451049805, -0.03889274597167969, -0.03697633743286133, -0.03505992889404297, -0.03314352035522461, -0.03122711181640625, -0.02931070327758789, -0.02739429473876953, -0.025477886199951172, -0.023561477661132812, -0.021645069122314453, -0.019728660583496094, -0.017812252044677734, -0.015895843505859375, -0.013979434967041016, -0.012063026428222656, -0.010146617889404297, -0.008230209350585938, -0.006313800811767578, -0.004397392272949219, -0.0024809837341308594, -0.0005645751953125, 0.0013518333435058594, 0.0032682418823242188, 0.005184650421142578, 0.0071010589599609375, 0.009017467498779297, 0.010933876037597656, 0.012850284576416016, 0.014766693115234375, 0.016683101654052734, 0.018599510192871094, 0.020515918731689453, 0.022432327270507812, 0.024348735809326172, 0.02626514434814453, 0.02818155288696289, 0.03009796142578125, 0.03201436996459961, 0.03393077850341797, 0.03584718704223633, 0.03776359558105469, 0.03968000411987305, 0.041596412658691406, 0.043512821197509766, 0.045429229736328125, 0.047345638275146484, 0.049262046813964844, 0.0511784553527832, 0.05309486389160156, 0.05501127243041992, 0.05692768096923828, 0.05884408950805664, 0.060760498046875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 34.0, 74.0, 152.0, 235.0, 235.0, 142.0, 75.0, 21.0, 12.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3923864364624023, -1.354572057723999, -1.3167575597763062, -1.2789431810379028, -1.24112868309021, -1.2033143043518066, -1.1654998064041138, -1.1276854276657104, -1.0898709297180176, -1.0520565509796143, -1.0142420530319214, -0.9764276146888733, -0.9386131763458252, -0.9007987976074219, -0.8629843592643738, -0.8251699209213257, -0.7873555421829224, -0.7495411038398743, -0.7117266654968262, -0.6739122271537781, -0.63609778881073, -0.5982834100723267, -0.5604689717292786, -0.5226545333862305, -0.4848400950431824, -0.4470256567001343, -0.4092112183570862, -0.3713968098163605, -0.3335823714733124, -0.2957679331302643, -0.2579535245895386, -0.22013908624649048, -0.18232464790344238, -0.1445102095603943, -0.10669578611850739, -0.06888135522603989, -0.031066924333572388, 0.006747514009475708, 0.04456193745136261, 0.08237636089324951, 0.12019079923629761, 0.1580052375793457, 0.1958196610212326, 0.2336340844631195, 0.2714485228061676, 0.3092629611492157, 0.3470773696899414, 0.3848918080329895, 0.4227062463760376, 0.4605206847190857, 0.4983351230621338, 0.5361495614051819, 0.57396399974823, 0.6117783784866333, 0.6495928168296814, 0.6874072551727295, 0.7252216935157776, 0.7630361318588257, 0.8008505702018738, 0.8386650085449219, 0.8764793872833252, 0.9142938852310181, 0.9521082639694214, 0.9899227023124695, 1.0277371406555176]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 6.0, 6.0, 10.0, 7.0, 11.0, 8.0, 20.0, 17.0, 25.0, 20.0, 23.0, 36.0, 40.0, 43.0, 27.0, 35.0, 51.0, 41.0, 45.0, 49.0, 48.0, 48.0, 41.0, 40.0, 31.0, 34.0, 28.0, 33.0, 24.0, 18.0, 23.0, 20.0, 20.0, 9.0, 13.0, 10.0, 9.0, 8.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.45164233446121216, -0.4382320046424866, -0.424821674823761, -0.411411315202713, -0.3980009853839874, -0.38459065556526184, -0.37118029594421387, -0.3577699661254883, -0.3443596363067627, -0.3309493064880371, -0.3175389766693115, -0.30412861704826355, -0.29071828722953796, -0.2773079574108124, -0.2638975977897644, -0.2504872679710388, -0.23707693815231323, -0.22366660833358765, -0.21025626361370087, -0.1968459188938141, -0.1834355890750885, -0.17002525925636292, -0.15661491453647614, -0.14320456981658936, -0.12979423999786377, -0.11638390272855759, -0.1029735654592514, -0.08956322818994522, -0.07615289092063904, -0.06274255365133286, -0.04933221638202667, -0.03592187911272049, -0.022511541843414307, -0.009101204574108124, 0.004309132695198059, 0.017719469964504242, 0.031129807233810425, 0.04454014450311661, 0.05795048177242279, 0.07136081904172897, 0.08477115631103516, 0.09818149358034134, 0.11159183084964752, 0.1250021755695343, 0.1384125053882599, 0.15182283520698547, 0.16523317992687225, 0.17864352464675903, 0.19205385446548462, 0.2054641842842102, 0.21887452900409698, 0.23228487372398376, 0.24569520354270935, 0.25910553336143494, 0.2725158929824829, 0.2859262228012085, 0.2993365526199341, 0.31274688243865967, 0.32615721225738525, 0.3395675718784332, 0.3529779016971588, 0.3663882315158844, 0.3797985911369324, 0.39320892095565796, 0.40661925077438354]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 1.0, 6.0, 7.0, 3.0, 10.0, 18.0, 13.0, 22.0, 42.0, 53.0, 89.0, 128.0, 220.0, 344.0, 586.0, 1260.0, 2902.0, 7616.0, 26966.0, 162959.0, 3276754.0, 629935.0, 62247.0, 13952.0, 4405.0, 1808.0, 799.0, 454.0, 225.0, 146.0, 85.0, 58.0, 34.0, 35.0, 24.0, 16.0, 13.0, 7.0, 7.0, 11.0, 4.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.1375732421875, -0.1334972381591797, -0.12942123413085938, -0.12534523010253906, -0.12126922607421875, -0.11719322204589844, -0.11311721801757812, -0.10904121398925781, -0.1049652099609375, -0.10088920593261719, -0.09681320190429688, -0.09273719787597656, -0.08866119384765625, -0.08458518981933594, -0.08050918579101562, -0.07643318176269531, -0.072357177734375, -0.06828117370605469, -0.06420516967773438, -0.06012916564941406, -0.05605316162109375, -0.05197715759277344, -0.047901153564453125, -0.04382514953613281, -0.0397491455078125, -0.03567314147949219, -0.031597137451171875, -0.027521133422851562, -0.02344512939453125, -0.019369125366210938, -0.015293121337890625, -0.011217117309570312, -0.00714111328125, -0.0030651092529296875, 0.001010894775390625, 0.0050868988037109375, 0.00916290283203125, 0.013238906860351562, 0.017314910888671875, 0.021390914916992188, 0.0254669189453125, 0.029542922973632812, 0.033618927001953125, 0.03769493103027344, 0.04177093505859375, 0.04584693908691406, 0.049922943115234375, 0.05399894714355469, 0.058074951171875, 0.06215095520019531, 0.06622695922851562, 0.07030296325683594, 0.07437896728515625, 0.07845497131347656, 0.08253097534179688, 0.08660697937011719, 0.0906829833984375, 0.09475898742675781, 0.09883499145507812, 0.10291099548339844, 0.10698699951171875, 0.11106300354003906, 0.11513900756835938, 0.11921501159667969, 0.123291015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 4.0, 11.0, 20.0, 15.0, 23.0, 30.0, 37.0, 40.0, 46.0, 49.0, 43.0, 60.0, 61.0, 62.0, 58.0, 65.0, 58.0, 58.0, 47.0, 44.0, 33.0, 26.0, 15.0, 15.0, 18.0, 18.0, 6.0, 10.0, 7.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022491455078125, -0.021729707717895508, -0.020967960357666016, -0.020206212997436523, -0.01944446563720703, -0.01868271827697754, -0.017920970916748047, -0.017159223556518555, -0.016397476196289062, -0.01563572883605957, -0.014873981475830078, -0.014112234115600586, -0.013350486755371094, -0.012588739395141602, -0.01182699203491211, -0.011065244674682617, -0.010303497314453125, -0.009541749954223633, -0.00878000259399414, -0.008018255233764648, -0.007256507873535156, -0.006494760513305664, -0.005733013153076172, -0.00497126579284668, -0.0042095184326171875, -0.0034477710723876953, -0.002686023712158203, -0.001924276351928711, -0.0011625289916992188, -0.00040078163146972656, 0.0003609657287597656, 0.0011227130889892578, 0.00188446044921875, 0.002646207809448242, 0.0034079551696777344, 0.0041697025299072266, 0.004931449890136719, 0.005693197250366211, 0.006454944610595703, 0.007216691970825195, 0.007978439331054688, 0.00874018669128418, 0.009501934051513672, 0.010263681411743164, 0.011025428771972656, 0.011787176132202148, 0.01254892349243164, 0.013310670852661133, 0.014072418212890625, 0.014834165573120117, 0.01559591293334961, 0.0163576602935791, 0.017119407653808594, 0.017881155014038086, 0.018642902374267578, 0.01940464973449707, 0.020166397094726562, 0.020928144454956055, 0.021689891815185547, 0.02245163917541504, 0.02321338653564453, 0.023975133895874023, 0.024736881256103516, 0.025498628616333008, 0.0262603759765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 6.0, 5.0, 6.0, 12.0, 23.0, 43.0, 89.0, 159.0, 346.0, 1070.0, 3867.0, 20495.0, 184121.0, 3381098.0, 550405.0, 43173.0, 6813.0, 1628.0, 484.0, 222.0, 108.0, 41.0, 26.0, 14.0, 9.0, 7.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1402587890625, -0.13519287109375, -0.130126953125, -0.12506103515625, -0.1199951171875, -0.11492919921875, -0.10986328125, -0.10479736328125, -0.0997314453125, -0.09466552734375, -0.089599609375, -0.08453369140625, -0.0794677734375, -0.07440185546875, -0.0693359375, -0.06427001953125, -0.0592041015625, -0.05413818359375, -0.049072265625, -0.04400634765625, -0.0389404296875, -0.03387451171875, -0.02880859375, -0.02374267578125, -0.0186767578125, -0.01361083984375, -0.008544921875, -0.00347900390625, 0.0015869140625, 0.00665283203125, 0.01171875, 0.01678466796875, 0.0218505859375, 0.02691650390625, 0.031982421875, 0.03704833984375, 0.0421142578125, 0.04718017578125, 0.05224609375, 0.05731201171875, 0.0623779296875, 0.06744384765625, 0.072509765625, 0.07757568359375, 0.0826416015625, 0.08770751953125, 0.0927734375, 0.09783935546875, 0.1029052734375, 0.10797119140625, 0.113037109375, 0.11810302734375, 0.1231689453125, 0.12823486328125, 0.13330078125, 0.13836669921875, 0.1434326171875, 0.14849853515625, 0.153564453125, 0.15863037109375, 0.1636962890625, 0.16876220703125, 0.173828125, 0.17889404296875, 0.1839599609375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 7.0, 4.0, 7.0, 20.0, 14.0, 20.0, 37.0, 50.0, 77.0, 88.0, 145.0, 271.0, 429.0, 951.0, 847.0, 407.0, 230.0, 147.0, 105.0, 74.0, 37.0, 37.0, 20.0, 17.0, 12.0, 9.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.06939697265625, -0.0677785873413086, -0.06616020202636719, -0.06454181671142578, -0.06292343139648438, -0.06130504608154297, -0.05968666076660156, -0.058068275451660156, -0.05644989013671875, -0.054831504821777344, -0.05321311950683594, -0.05159473419189453, -0.049976348876953125, -0.04835796356201172, -0.04673957824707031, -0.045121192932128906, -0.0435028076171875, -0.041884422302246094, -0.04026603698730469, -0.03864765167236328, -0.037029266357421875, -0.03541088104248047, -0.03379249572753906, -0.032174110412597656, -0.03055572509765625, -0.028937339782714844, -0.027318954467773438, -0.02570056915283203, -0.024082183837890625, -0.02246379852294922, -0.020845413208007812, -0.019227027893066406, -0.017608642578125, -0.015990257263183594, -0.014371871948242188, -0.012753486633300781, -0.011135101318359375, -0.009516716003417969, -0.007898330688476562, -0.006279945373535156, -0.00466156005859375, -0.0030431747436523438, -0.0014247894287109375, 0.00019359588623046875, 0.001811981201171875, 0.0034303665161132812, 0.0050487518310546875, 0.006667137145996094, 0.0082855224609375, 0.009903907775878906, 0.011522293090820312, 0.013140678405761719, 0.014759063720703125, 0.01637744903564453, 0.017995834350585938, 0.019614219665527344, 0.02123260498046875, 0.022850990295410156, 0.024469375610351562, 0.02608776092529297, 0.027706146240234375, 0.02932453155517578, 0.030942916870117188, 0.032561302185058594, 0.0341796875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 10.0, 59.0, 336.0, 467.0, 115.0, 12.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5065604448318481, -0.46088355779647827, -0.4152066707611084, -0.3695297837257385, -0.32385289669036865, -0.2781760096549988, -0.2324991226196289, -0.18682223558425903, -0.14114534854888916, -0.09546846151351929, -0.049791574478149414, -0.004114687442779541, 0.04156219959259033, 0.0872390866279602, 0.13291597366333008, 0.17859286069869995, 0.22426974773406982, 0.2699466347694397, 0.31562352180480957, 0.36130040884017944, 0.4069772958755493, 0.4526541829109192, 0.49833106994628906, 0.5440079569816589, 0.5896848440170288, 0.6353617310523987, 0.6810386180877686, 0.7267155051231384, 0.7723923921585083, 0.8180692791938782, 0.863746166229248, 0.9094230532646179, 0.9551000595092773, 1.000777006149292, 1.046453833580017, 1.0921306610107422, 1.1378076076507568, 1.1834845542907715, 1.2291613817214966, 1.2748382091522217, 1.3205151557922363, 1.366192102432251, 1.411868929862976, 1.4575457572937012, 1.5032227039337158, 1.5488996505737305, 1.5945764780044556, 1.6402533054351807, 1.6859302520751953, 1.73160719871521, 1.777284026145935, 1.8229608535766602, 1.8686378002166748, 1.9143147468566895, 1.9599915742874146, 2.0056684017181396, 2.0513453483581543, 2.097022294998169, 2.1426992416381836, 2.188375949859619, 2.234052896499634, 2.2797298431396484, 2.325406551361084, 2.3710834980010986, 2.4167604446411133]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 9.0, 5.0, 5.0, 9.0, 12.0, 20.0, 17.0, 33.0, 18.0, 25.0, 23.0, 28.0, 45.0, 45.0, 47.0, 41.0, 54.0, 48.0, 51.0, 51.0, 39.0, 39.0, 43.0, 38.0, 50.0, 33.0, 23.0, 25.0, 20.0, 21.0, 13.0, 10.0, 17.0, 14.0, 6.0, 9.0, 5.0, 3.0, 6.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.16080904006958008, -0.15483719110488892, -0.14886535704135895, -0.14289352297782898, -0.13692167401313782, -0.13094982504844666, -0.12497799098491669, -0.11900614947080612, -0.11303430795669556, -0.10706246644258499, -0.10109062492847443, -0.09511878341436386, -0.0891469419002533, -0.08317510038614273, -0.07720325887203217, -0.0712314173579216, -0.06525957584381104, -0.05928773432970047, -0.053315892815589905, -0.04734405130147934, -0.041372209787368774, -0.03540036827325821, -0.029428526759147644, -0.02345668524503708, -0.017484843730926514, -0.011513002216815948, -0.005541160702705383, 0.0004306808114051819, 0.006402522325515747, 0.012374363839626312, 0.018346205353736877, 0.024318046867847443, 0.030289888381958008, 0.03626172989606857, 0.04223357141017914, 0.0482054129242897, 0.05417725443840027, 0.060149095952510834, 0.0661209374666214, 0.07209277898073196, 0.07806462049484253, 0.0840364620089531, 0.09000830352306366, 0.09598014503717422, 0.10195198655128479, 0.10792382806539536, 0.11389566957950592, 0.11986751109361649, 0.12583935260772705, 0.1318112015724182, 0.13778303563594818, 0.14375486969947815, 0.1497267186641693, 0.15569856762886047, 0.16167040169239044, 0.1676422357559204, 0.17361408472061157, 0.17958593368530273, 0.1855577677488327, 0.19152960181236267, 0.19750145077705383, 0.203473299741745, 0.20944513380527496, 0.21541696786880493, 0.2213888168334961]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 11.0, 15.0, 21.0, 53.0, 98.0, 174.0, 397.0, 871.0, 2455.0, 8646.0, 44917.0, 313202.0, 557746.0, 97414.0, 16252.0, 3891.0, 1334.0, 525.0, 233.0, 121.0, 78.0, 32.0, 18.0, 21.0, 8.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16162109375, -0.1567535400390625, -0.151885986328125, -0.1470184326171875, -0.14215087890625, -0.1372833251953125, -0.132415771484375, -0.1275482177734375, -0.1226806640625, -0.1178131103515625, -0.112945556640625, -0.1080780029296875, -0.10321044921875, -0.0983428955078125, -0.093475341796875, -0.0886077880859375, -0.083740234375, -0.0788726806640625, -0.074005126953125, -0.0691375732421875, -0.06427001953125, -0.0594024658203125, -0.054534912109375, -0.0496673583984375, -0.0447998046875, -0.0399322509765625, -0.035064697265625, -0.0301971435546875, -0.02532958984375, -0.0204620361328125, -0.015594482421875, -0.0107269287109375, -0.005859375, -0.0009918212890625, 0.003875732421875, 0.0087432861328125, 0.01361083984375, 0.0184783935546875, 0.023345947265625, 0.0282135009765625, 0.0330810546875, 0.0379486083984375, 0.042816162109375, 0.0476837158203125, 0.05255126953125, 0.0574188232421875, 0.062286376953125, 0.0671539306640625, 0.072021484375, 0.0768890380859375, 0.081756591796875, 0.0866241455078125, 0.09149169921875, 0.0963592529296875, 0.101226806640625, 0.1060943603515625, 0.1109619140625, 0.1158294677734375, 0.120697021484375, 0.1255645751953125, 0.13043212890625, 0.1352996826171875, 0.140167236328125, 0.1450347900390625, 0.14990234375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 4.0, 13.0, 7.0, 7.0, 8.0, 23.0, 23.0, 25.0, 29.0, 43.0, 37.0, 34.0, 51.0, 44.0, 60.0, 46.0, 55.0, 59.0, 54.0, 44.0, 53.0, 45.0, 44.0, 32.0, 38.0, 22.0, 20.0, 14.0, 13.0, 11.0, 7.0, 11.0, 7.0, 3.0, 0.0, 4.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0263824462890625, -0.02563643455505371, -0.024890422821044922, -0.024144411087036133, -0.023398399353027344, -0.022652387619018555, -0.021906375885009766, -0.021160364151000977, -0.020414352416992188, -0.0196683406829834, -0.01892232894897461, -0.01817631721496582, -0.01743030548095703, -0.016684293746948242, -0.015938282012939453, -0.015192270278930664, -0.014446258544921875, -0.013700246810913086, -0.012954235076904297, -0.012208223342895508, -0.011462211608886719, -0.01071619987487793, -0.00997018814086914, -0.009224176406860352, -0.008478164672851562, -0.0077321529388427734, -0.006986141204833984, -0.006240129470825195, -0.005494117736816406, -0.004748106002807617, -0.004002094268798828, -0.003256082534790039, -0.00251007080078125, -0.001764059066772461, -0.0010180473327636719, -0.0002720355987548828, 0.00047397613525390625, 0.0012199878692626953, 0.0019659996032714844, 0.0027120113372802734, 0.0034580230712890625, 0.0042040348052978516, 0.004950046539306641, 0.00569605827331543, 0.006442070007324219, 0.007188081741333008, 0.007934093475341797, 0.008680105209350586, 0.009426116943359375, 0.010172128677368164, 0.010918140411376953, 0.011664152145385742, 0.012410163879394531, 0.01315617561340332, 0.01390218734741211, 0.014648199081420898, 0.015394210815429688, 0.016140222549438477, 0.016886234283447266, 0.017632246017456055, 0.018378257751464844, 0.019124269485473633, 0.019870281219482422, 0.02061629295349121, 0.0213623046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 2.0, 6.0, 10.0, 10.0, 15.0, 20.0, 35.0, 41.0, 67.0, 118.0, 152.0, 242.0, 409.0, 767.0, 1508.0, 3871.0, 13797.0, 65268.0, 339233.0, 481257.0, 110125.0, 21760.0, 5545.0, 2010.0, 898.0, 523.0, 284.0, 197.0, 121.0, 83.0, 46.0, 43.0, 23.0, 19.0, 16.0, 9.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11260986328125, -0.1093130111694336, -0.10601615905761719, -0.10271930694580078, -0.09942245483398438, -0.09612560272216797, -0.09282875061035156, -0.08953189849853516, -0.08623504638671875, -0.08293819427490234, -0.07964134216308594, -0.07634449005126953, -0.07304763793945312, -0.06975078582763672, -0.06645393371582031, -0.0631570816040039, -0.0598602294921875, -0.056563377380371094, -0.05326652526855469, -0.04996967315673828, -0.046672821044921875, -0.04337596893310547, -0.04007911682128906, -0.036782264709472656, -0.03348541259765625, -0.030188560485839844, -0.026891708374023438, -0.02359485626220703, -0.020298004150390625, -0.01700115203857422, -0.013704299926757812, -0.010407447814941406, -0.007110595703125, -0.0038137435913085938, -0.0005168914794921875, 0.0027799606323242188, 0.006076812744140625, 0.009373664855957031, 0.012670516967773438, 0.015967369079589844, 0.01926422119140625, 0.022561073303222656, 0.025857925415039062, 0.02915477752685547, 0.032451629638671875, 0.03574848175048828, 0.03904533386230469, 0.042342185974121094, 0.0456390380859375, 0.048935890197753906, 0.05223274230957031, 0.05552959442138672, 0.058826446533203125, 0.06212329864501953, 0.06542015075683594, 0.06871700286865234, 0.07201385498046875, 0.07531070709228516, 0.07860755920410156, 0.08190441131591797, 0.08520126342773438, 0.08849811553955078, 0.09179496765136719, 0.0950918197631836, 0.098388671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 9.0, 4.0, 9.0, 12.0, 15.0, 18.0, 19.0, 20.0, 26.0, 30.0, 37.0, 41.0, 34.0, 42.0, 42.0, 45.0, 43.0, 36.0, 45.0, 51.0, 37.0, 40.0, 41.0, 46.0, 34.0, 44.0, 22.0, 20.0, 22.0, 14.0, 18.0, 16.0, 11.0, 8.0, 5.0, 7.0, 10.0, 4.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.081298828125, -0.07851314544677734, -0.07572746276855469, -0.07294178009033203, -0.07015609741210938, -0.06737041473388672, -0.06458473205566406, -0.061799049377441406, -0.05901336669921875, -0.056227684020996094, -0.05344200134277344, -0.05065631866455078, -0.047870635986328125, -0.04508495330810547, -0.04229927062988281, -0.039513587951660156, -0.0367279052734375, -0.033942222595214844, -0.031156539916992188, -0.02837085723876953, -0.025585174560546875, -0.02279949188232422, -0.020013809204101562, -0.017228126525878906, -0.01444244384765625, -0.011656761169433594, -0.008871078491210938, -0.006085395812988281, -0.003299713134765625, -0.0005140304565429688, 0.0022716522216796875, 0.005057334899902344, 0.007843017578125, 0.010628700256347656, 0.013414382934570312, 0.01620006561279297, 0.018985748291015625, 0.02177143096923828, 0.024557113647460938, 0.027342796325683594, 0.03012847900390625, 0.032914161682128906, 0.03569984436035156, 0.03848552703857422, 0.041271209716796875, 0.04405689239501953, 0.04684257507324219, 0.049628257751464844, 0.0524139404296875, 0.055199623107910156, 0.05798530578613281, 0.06077098846435547, 0.06355667114257812, 0.06634235382080078, 0.06912803649902344, 0.0719137191772461, 0.07469940185546875, 0.0774850845336914, 0.08027076721191406, 0.08305644989013672, 0.08584213256835938, 0.08862781524658203, 0.09141349792480469, 0.09419918060302734, 0.09698486328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 7.0, 14.0, 30.0, 43.0, 96.0, 175.0, 287.0, 715.0, 2057.0, 7978.0, 49793.0, 508465.0, 427803.0, 41154.0, 6835.0, 1788.0, 679.0, 300.0, 130.0, 72.0, 51.0, 20.0, 15.0, 9.0, 8.0, 6.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.09698486328125, -0.09412860870361328, -0.09127235412597656, -0.08841609954833984, -0.08555984497070312, -0.0827035903930664, -0.07984733581542969, -0.07699108123779297, -0.07413482666015625, -0.07127857208251953, -0.06842231750488281, -0.0655660629272461, -0.06270980834960938, -0.059853553771972656, -0.05699729919433594, -0.05414104461669922, -0.0512847900390625, -0.04842853546142578, -0.04557228088378906, -0.042716026306152344, -0.039859771728515625, -0.037003517150878906, -0.03414726257324219, -0.03129100799560547, -0.02843475341796875, -0.02557849884033203, -0.022722244262695312, -0.019865989685058594, -0.017009735107421875, -0.014153480529785156, -0.011297225952148438, -0.008440971374511719, -0.005584716796875, -0.0027284622192382812, 0.0001277923583984375, 0.0029840469360351562, 0.005840301513671875, 0.008696556091308594, 0.011552810668945312, 0.014409065246582031, 0.01726531982421875, 0.02012157440185547, 0.022977828979492188, 0.025834083557128906, 0.028690338134765625, 0.031546592712402344, 0.03440284729003906, 0.03725910186767578, 0.0401153564453125, 0.04297161102294922, 0.04582786560058594, 0.048684120178222656, 0.051540374755859375, 0.054396629333496094, 0.05725288391113281, 0.06010913848876953, 0.06296539306640625, 0.06582164764404297, 0.06867790222167969, 0.0715341567993164, 0.07439041137695312, 0.07724666595458984, 0.08010292053222656, 0.08295917510986328, 0.0858154296875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 7.0, 5.0, 13.0, 28.0, 49.0, 95.0, 122.0, 171.0, 188.0, 145.0, 74.0, 47.0, 24.0, 22.0, 8.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00022351741790771484, -0.00021895859390497208, -0.0002143997699022293, -0.00020984094589948654, -0.00020528212189674377, -0.000200723297894001, -0.00019616447389125824, -0.00019160564988851547, -0.0001870468258857727, -0.00018248800188302994, -0.00017792917788028717, -0.0001733703538775444, -0.00016881152987480164, -0.00016425270587205887, -0.0001596938818693161, -0.00015513505786657333, -0.00015057623386383057, -0.0001460174098610878, -0.00014145858585834503, -0.00013689976185560226, -0.0001323409378528595, -0.00012778211385011673, -0.00012322328984737396, -0.0001186644658446312, -0.00011410564184188843, -0.00010954681783914566, -0.00010498799383640289, -0.00010042916983366013, -9.587034583091736e-05, -9.131152182817459e-05, -8.675269782543182e-05, -8.219387382268906e-05, -7.763504981994629e-05, -7.307622581720352e-05, -6.851740181446075e-05, -6.395857781171799e-05, -5.939975380897522e-05, -5.484092980623245e-05, -5.0282105803489685e-05, -4.572328180074692e-05, -4.116445779800415e-05, -3.660563379526138e-05, -3.2046809792518616e-05, -2.748798578977585e-05, -2.292916178703308e-05, -1.8370337784290314e-05, -1.3811513781547546e-05, -9.252689778804779e-06, -4.693865776062012e-06, -1.3504177331924438e-07, 4.423782229423523e-06, 8.98260623216629e-06, 1.3541430234909058e-05, 1.8100254237651825e-05, 2.2659078240394592e-05, 2.721790224313736e-05, 3.177672624588013e-05, 3.6335550248622894e-05, 4.089437425136566e-05, 4.545319825410843e-05, 5.0012022256851196e-05, 5.4570846259593964e-05, 5.912967026233673e-05, 6.36884942650795e-05, 6.824731826782227e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 7.0, 13.0, 24.0, 26.0, 41.0, 79.0, 148.0, 321.0, 638.0, 1620.0, 5941.0, 42005.0, 669126.0, 300446.0, 22090.0, 3811.0, 1172.0, 483.0, 261.0, 142.0, 57.0, 44.0, 19.0, 17.0, 6.0, 9.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.125244140625, -0.12165069580078125, -0.1180572509765625, -0.11446380615234375, -0.110870361328125, -0.10727691650390625, -0.1036834716796875, -0.10009002685546875, -0.09649658203125, -0.09290313720703125, -0.0893096923828125, -0.08571624755859375, -0.082122802734375, -0.07852935791015625, -0.0749359130859375, -0.07134246826171875, -0.0677490234375, -0.06415557861328125, -0.0605621337890625, -0.05696868896484375, -0.053375244140625, -0.04978179931640625, -0.0461883544921875, -0.04259490966796875, -0.03900146484375, -0.03540802001953125, -0.0318145751953125, -0.02822113037109375, -0.024627685546875, -0.02103424072265625, -0.0174407958984375, -0.01384735107421875, -0.01025390625, -0.00666046142578125, -0.0030670166015625, 0.00052642822265625, 0.004119873046875, 0.00771331787109375, 0.0113067626953125, 0.01490020751953125, 0.01849365234375, 0.02208709716796875, 0.0256805419921875, 0.02927398681640625, 0.032867431640625, 0.03646087646484375, 0.0400543212890625, 0.04364776611328125, 0.0472412109375, 0.05083465576171875, 0.0544281005859375, 0.05802154541015625, 0.061614990234375, 0.06520843505859375, 0.0688018798828125, 0.07239532470703125, 0.07598876953125, 0.07958221435546875, 0.0831756591796875, 0.08676910400390625, 0.090362548828125, 0.09395599365234375, 0.0975494384765625, 0.10114288330078125, 0.104736328125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 3.0, 4.0, 10.0, 11.0, 16.0, 33.0, 42.0, 60.0, 74.0, 108.0, 127.0, 119.0, 119.0, 72.0, 49.0, 39.0, 24.0, 26.0, 21.0, 15.0, 2.0, 4.0, 8.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0836181640625, -0.08142280578613281, -0.07922744750976562, -0.07703208923339844, -0.07483673095703125, -0.07264137268066406, -0.07044601440429688, -0.06825065612792969, -0.0660552978515625, -0.06385993957519531, -0.061664581298828125, -0.05946922302246094, -0.05727386474609375, -0.05507850646972656, -0.052883148193359375, -0.05068778991699219, -0.048492431640625, -0.04629707336425781, -0.044101715087890625, -0.04190635681152344, -0.03971099853515625, -0.03751564025878906, -0.035320281982421875, -0.03312492370605469, -0.0309295654296875, -0.028734207153320312, -0.026538848876953125, -0.024343490600585938, -0.02214813232421875, -0.019952774047851562, -0.017757415771484375, -0.015562057495117188, -0.01336669921875, -0.011171340942382812, -0.008975982666015625, -0.0067806243896484375, -0.00458526611328125, -0.0023899078369140625, -0.000194549560546875, 0.0020008087158203125, 0.0041961669921875, 0.0063915252685546875, 0.008586883544921875, 0.010782241821289062, 0.01297760009765625, 0.015172958374023438, 0.017368316650390625, 0.019563674926757812, 0.021759033203125, 0.023954391479492188, 0.026149749755859375, 0.028345108032226562, 0.03054046630859375, 0.03273582458496094, 0.034931182861328125, 0.03712654113769531, 0.0393218994140625, 0.04151725769042969, 0.043712615966796875, 0.04590797424316406, 0.04810333251953125, 0.05029869079589844, 0.052494049072265625, 0.05468940734863281, 0.056884765625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 11.0, 8.0, 69.0, 297.0, 470.0, 122.0, 16.0, 12.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07457971572876, -3.990049123764038, -3.9055185317993164, -3.8209877014160156, -3.736457109451294, -3.6519265174865723, -3.5673956871032715, -3.48286509513855, -3.398334503173828, -3.3138039112091064, -3.2292733192443848, -3.144742488861084, -3.0602118968963623, -2.9756813049316406, -2.89115047454834, -2.806619882583618, -2.7220892906188965, -2.637558698654175, -2.553028106689453, -2.4684972763061523, -2.3839666843414307, -2.299436092376709, -2.214905261993408, -2.1303746700286865, -2.045844078063965, -1.9613134860992432, -1.876782774925232, -1.7922520637512207, -1.707721471786499, -1.6231908798217773, -1.5386601686477661, -1.4541294574737549, -1.3695991039276123, -1.2850685119628906, -1.2005378007888794, -1.1160070896148682, -1.0314764976501465, -0.94694584608078, -0.8624151945114136, -0.7778845429420471, -0.6933538913726807, -0.6088232398033142, -0.5242925882339478, -0.4397619366645813, -0.35523128509521484, -0.2707006335258484, -0.18616998195648193, -0.10163933038711548, -0.017108678817749023, 0.06742197275161743, 0.1519526243209839, 0.23648327589035034, 0.3210139274597168, 0.40554457902908325, 0.4900752305984497, 0.5746058821678162, 0.6591365337371826, 0.7436671853065491, 0.8281978368759155, 0.912728488445282, 0.9972591400146484, 1.0817897319793701, 1.1663204431533813, 1.2508511543273926, 1.3353817462921143]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 6.0, 10.0, 13.0, 6.0, 9.0, 7.0, 17.0, 15.0, 17.0, 21.0, 24.0, 16.0, 34.0, 35.0, 36.0, 31.0, 32.0, 38.0, 38.0, 45.0, 41.0, 45.0, 43.0, 32.0, 38.0, 34.0, 43.0, 19.0, 32.0, 27.0, 26.0, 24.0, 31.0, 21.0, 16.0, 19.0, 11.0, 6.0, 8.0, 9.0, 4.0, 7.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.42437469959259033, -0.4111730456352234, -0.39797139167785645, -0.3847697079181671, -0.37156805396080017, -0.3583664000034332, -0.3451647460460663, -0.33196306228637695, -0.31876140832901, -0.30555975437164307, -0.2923581004142761, -0.2791564166545868, -0.26595476269721985, -0.2527531087398529, -0.23955145478248596, -0.22634978592395782, -0.21314813196659088, -0.19994647800922394, -0.1867448091506958, -0.17354315519332886, -0.16034148633480072, -0.14713983237743378, -0.13393816351890564, -0.1207365095615387, -0.10753484815359116, -0.09433318674564362, -0.08113152533769608, -0.06792986392974854, -0.05472820624709129, -0.04152654856443405, -0.02832488715648651, -0.015123225748538971, -0.0019215643405914307, 0.011280096136033535, 0.0244817566126585, 0.03768341615796089, 0.05088507756590843, 0.06408673524856567, 0.07728839665651321, 0.09049005806446075, 0.1036917194724083, 0.11689338088035583, 0.13009503483772278, 0.14329670369625092, 0.15649835765361786, 0.169700026512146, 0.18290168046951294, 0.19610333442687988, 0.20930500328540802, 0.22250665724277496, 0.2357083261013031, 0.24890998005867004, 0.262111634016037, 0.2753133177757263, 0.28851497173309326, 0.3017166256904602, 0.31491827964782715, 0.3281199336051941, 0.34132158756256104, 0.35452327132225037, 0.3677249252796173, 0.38092657923698425, 0.3941282331943512, 0.4073299169540405, 0.42053157091140747]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 11.0, 15.0, 13.0, 35.0, 69.0, 83.0, 144.0, 275.0, 611.0, 1454.0, 4430.0, 18493.0, 135049.0, 3621952.0, 367029.0, 34397.0, 6862.0, 1924.0, 717.0, 300.0, 175.0, 99.0, 45.0, 36.0, 15.0, 14.0, 15.0, 7.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.159912109375, -0.15530014038085938, -0.15068817138671875, -0.14607620239257812, -0.1414642333984375, -0.13685226440429688, -0.13224029541015625, -0.12762832641601562, -0.123016357421875, -0.11840438842773438, -0.11379241943359375, -0.10918045043945312, -0.1045684814453125, -0.09995651245117188, -0.09534454345703125, -0.09073257446289062, -0.08612060546875, -0.08150863647460938, -0.07689666748046875, -0.07228469848632812, -0.0676727294921875, -0.06306076049804688, -0.05844879150390625, -0.053836822509765625, -0.049224853515625, -0.044612884521484375, -0.04000091552734375, -0.035388946533203125, -0.0307769775390625, -0.026165008544921875, -0.02155303955078125, -0.016941070556640625, -0.0123291015625, -0.007717132568359375, -0.00310516357421875, 0.001506805419921875, 0.0061187744140625, 0.010730743408203125, 0.01534271240234375, 0.019954681396484375, 0.024566650390625, 0.029178619384765625, 0.03379058837890625, 0.038402557373046875, 0.0430145263671875, 0.047626495361328125, 0.05223846435546875, 0.056850433349609375, 0.06146240234375, 0.06607437133789062, 0.07068634033203125, 0.07529830932617188, 0.0799102783203125, 0.08452224731445312, 0.08913421630859375, 0.09374618530273438, 0.098358154296875, 0.10297012329101562, 0.10758209228515625, 0.11219406127929688, 0.1168060302734375, 0.12141799926757812, 0.12602996826171875, 0.13064193725585938, 0.13525390625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 8.0, 4.0, 12.0, 14.0, 13.0, 19.0, 20.0, 25.0, 26.0, 24.0, 27.0, 40.0, 50.0, 52.0, 53.0, 53.0, 46.0, 49.0, 45.0, 63.0, 49.0, 52.0, 50.0, 42.0, 31.0, 36.0, 23.0, 21.0, 12.0, 12.0, 13.0, 8.0, 7.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.027923583984375, -0.027126312255859375, -0.02632904052734375, -0.025531768798828125, -0.0247344970703125, -0.023937225341796875, -0.02313995361328125, -0.022342681884765625, -0.02154541015625, -0.020748138427734375, -0.01995086669921875, -0.019153594970703125, -0.0183563232421875, -0.017559051513671875, -0.01676177978515625, -0.015964508056640625, -0.015167236328125, -0.014369964599609375, -0.01357269287109375, -0.012775421142578125, -0.0119781494140625, -0.011180877685546875, -0.01038360595703125, -0.009586334228515625, -0.0087890625, -0.007991790771484375, -0.00719451904296875, -0.006397247314453125, -0.0055999755859375, -0.004802703857421875, -0.00400543212890625, -0.003208160400390625, -0.002410888671875, -0.001613616943359375, -0.00081634521484375, -1.9073486328125e-05, 0.0007781982421875, 0.001575469970703125, 0.00237274169921875, 0.003170013427734375, 0.00396728515625, 0.004764556884765625, 0.00556182861328125, 0.006359100341796875, 0.0071563720703125, 0.007953643798828125, 0.00875091552734375, 0.009548187255859375, 0.010345458984375, 0.011142730712890625, 0.01194000244140625, 0.012737274169921875, 0.0135345458984375, 0.014331817626953125, 0.01512908935546875, 0.015926361083984375, 0.0167236328125, 0.017520904541015625, 0.01831817626953125, 0.019115447998046875, 0.0199127197265625, 0.020709991455078125, 0.02150726318359375, 0.022304534912109375, 0.023101806640625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 5.0, 13.0, 33.0, 62.0, 143.0, 411.0, 1202.0, 4790.0, 28719.0, 560602.0, 3500818.0, 84611.0, 9675.0, 2181.0, 621.0, 226.0, 87.0, 31.0, 27.0, 12.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18017578125, -0.1740093231201172, -0.16784286499023438, -0.16167640686035156, -0.15550994873046875, -0.14934349060058594, -0.14317703247070312, -0.1370105743408203, -0.1308441162109375, -0.12467765808105469, -0.11851119995117188, -0.11234474182128906, -0.10617828369140625, -0.10001182556152344, -0.09384536743164062, -0.08767890930175781, -0.081512451171875, -0.07534599304199219, -0.06917953491210938, -0.06301307678222656, -0.05684661865234375, -0.05068016052246094, -0.044513702392578125, -0.03834724426269531, -0.0321807861328125, -0.026014328002929688, -0.019847869873046875, -0.013681411743164062, -0.00751495361328125, -0.0013484954833984375, 0.004817962646484375, 0.010984420776367188, 0.01715087890625, 0.023317337036132812, 0.029483795166015625, 0.03565025329589844, 0.04181671142578125, 0.04798316955566406, 0.054149627685546875, 0.06031608581542969, 0.0664825439453125, 0.07264900207519531, 0.07881546020507812, 0.08498191833496094, 0.09114837646484375, 0.09731483459472656, 0.10348129272460938, 0.10964775085449219, 0.115814208984375, 0.12198066711425781, 0.12814712524414062, 0.13431358337402344, 0.14048004150390625, 0.14664649963378906, 0.15281295776367188, 0.1589794158935547, 0.1651458740234375, 0.1713123321533203, 0.17747879028320312, 0.18364524841308594, 0.18981170654296875, 0.19597816467285156, 0.20214462280273438, 0.2083110809326172, 0.2144775390625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 1.0, 4.0, 4.0, 11.0, 10.0, 13.0, 22.0, 31.0, 38.0, 56.0, 76.0, 114.0, 156.0, 276.0, 474.0, 1183.0, 697.0, 316.0, 168.0, 125.0, 73.0, 55.0, 54.0, 29.0, 13.0, 15.0, 9.0, 7.0, 3.0, 5.0, 4.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04022216796875, -0.03899049758911133, -0.037758827209472656, -0.036527156829833984, -0.03529548645019531, -0.03406381607055664, -0.03283214569091797, -0.0316004753112793, -0.030368804931640625, -0.029137134552001953, -0.02790546417236328, -0.02667379379272461, -0.025442123413085938, -0.024210453033447266, -0.022978782653808594, -0.021747112274169922, -0.02051544189453125, -0.019283771514892578, -0.018052101135253906, -0.016820430755615234, -0.015588760375976562, -0.01435708999633789, -0.013125419616699219, -0.011893749237060547, -0.010662078857421875, -0.009430408477783203, -0.008198738098144531, -0.006967067718505859, -0.0057353973388671875, -0.004503726959228516, -0.0032720565795898438, -0.002040386199951172, -0.0008087158203125, 0.0004229545593261719, 0.0016546249389648438, 0.0028862953186035156, 0.0041179656982421875, 0.005349636077880859, 0.006581306457519531, 0.007812976837158203, 0.009044647216796875, 0.010276317596435547, 0.011507987976074219, 0.01273965835571289, 0.013971328735351562, 0.015202999114990234, 0.016434669494628906, 0.017666339874267578, 0.01889801025390625, 0.020129680633544922, 0.021361351013183594, 0.022593021392822266, 0.023824691772460938, 0.02505636215209961, 0.02628803253173828, 0.027519702911376953, 0.028751373291015625, 0.029983043670654297, 0.03121471405029297, 0.03244638442993164, 0.03367805480957031, 0.034909725189208984, 0.036141395568847656, 0.03737306594848633, 0.038604736328125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 10.0, 36.0, 93.0, 231.0, 325.0, 205.0, 62.0, 19.0, 10.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0939297676086426, -1.0722848176956177, -1.0506398677825928, -1.0289949178695679, -1.007349967956543, -0.9857049584388733, -0.9640600085258484, -0.9424150586128235, -0.9207701086997986, -0.8991251587867737, -0.8774802088737488, -0.8558351993560791, -0.8341902494430542, -0.8125452995300293, -0.7909003496170044, -0.7692553997039795, -0.7476104497909546, -0.7259654998779297, -0.7043205499649048, -0.6826756000518799, -0.6610305905342102, -0.6393856406211853, -0.6177406907081604, -0.5960957407951355, -0.5744507312774658, -0.5528057813644409, -0.531160831451416, -0.5095158815383911, -0.4878709018230438, -0.46622592210769653, -0.44458097219467163, -0.42293602228164673, -0.4012910723686218, -0.3796461224555969, -0.35800114274024963, -0.33635619282722473, -0.31471124291419983, -0.29306626319885254, -0.27142131328582764, -0.24977636337280273, -0.22813139855861664, -0.20648643374443054, -0.18484148383140564, -0.16319651901721954, -0.14155155420303345, -0.11990660429000854, -0.09826163947582245, -0.07661668956279755, -0.05497172474861145, -0.03332676738500595, -0.011681806296110153, 0.009963154792785645, 0.031608112156391144, 0.05325306951999664, 0.07489803433418274, 0.09654298424720764, 0.11818794906139374, 0.13983291387557983, 0.16147786378860474, 0.18312282860279083, 0.20476779341697693, 0.22641274333000183, 0.24805770814418793, 0.269702672958374, 0.2913476228713989]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 6.0, 9.0, 6.0, 17.0, 17.0, 23.0, 20.0, 31.0, 31.0, 43.0, 39.0, 43.0, 46.0, 49.0, 61.0, 56.0, 52.0, 44.0, 63.0, 43.0, 34.0, 42.0, 30.0, 40.0, 24.0, 22.0, 22.0, 14.0, 19.0, 15.0, 14.0, 6.0, 9.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1718946099281311, -0.16655950248241425, -0.1612243950366974, -0.15588930249214172, -0.15055419504642487, -0.145219087600708, -0.13988398015499115, -0.1345488727092743, -0.12921378016471863, -0.12387867271900177, -0.11854357272386551, -0.11320846527814865, -0.10787336528301239, -0.10253825783729553, -0.09720315039157867, -0.09186804294586182, -0.08653293550014496, -0.0811978280544281, -0.07586272805929184, -0.07052762061357498, -0.06519252061843872, -0.05985741317272186, -0.054522305727005005, -0.049187202006578445, -0.043852098286151886, -0.03851699456572533, -0.03318189084529877, -0.02784678339958191, -0.02251167967915535, -0.01717657595872879, -0.011841468513011932, -0.006506364792585373, -0.0011712610721588135, 0.004163843579590321, 0.009498948231339455, 0.014834053814411163, 0.020169157534837723, 0.025504261255264282, 0.03083936870098114, 0.0361744724214077, 0.04150957614183426, 0.04684467986226082, 0.05217978358268738, 0.057514891028404236, 0.0628499984741211, 0.06818509846925735, 0.07352020591497421, 0.07885530591011047, 0.08419041335582733, 0.08952552080154419, 0.09486062079668045, 0.10019572824239731, 0.10553082823753357, 0.11086593568325043, 0.11620104312896729, 0.12153615057468414, 0.126871258020401, 0.13220636546611786, 0.13754147291183472, 0.14287656545639038, 0.14821167290210724, 0.1535467803478241, 0.15888188779354095, 0.1642169952392578, 0.16955208778381348]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 2.0, 10.0, 12.0, 21.0, 26.0, 39.0, 74.0, 107.0, 156.0, 321.0, 558.0, 1230.0, 2817.0, 7558.0, 23268.0, 83287.0, 313171.0, 428646.0, 133593.0, 35601.0, 10870.0, 3976.0, 1601.0, 685.0, 372.0, 199.0, 123.0, 70.0, 58.0, 29.0, 22.0, 18.0, 11.0, 4.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10015869140625, -0.09713935852050781, -0.09412002563476562, -0.09110069274902344, -0.08808135986328125, -0.08506202697753906, -0.08204269409179688, -0.07902336120605469, -0.0760040283203125, -0.07298469543457031, -0.06996536254882812, -0.06694602966308594, -0.06392669677734375, -0.06090736389160156, -0.057888031005859375, -0.05486869812011719, -0.051849365234375, -0.04883003234863281, -0.045810699462890625, -0.04279136657714844, -0.03977203369140625, -0.03675270080566406, -0.033733367919921875, -0.030714035034179688, -0.0276947021484375, -0.024675369262695312, -0.021656036376953125, -0.018636703491210938, -0.01561737060546875, -0.012598037719726562, -0.009578704833984375, -0.0065593719482421875, -0.0035400390625, -0.0005207061767578125, 0.002498626708984375, 0.0055179595947265625, 0.00853729248046875, 0.011556625366210938, 0.014575958251953125, 0.017595291137695312, 0.0206146240234375, 0.023633956909179688, 0.026653289794921875, 0.029672622680664062, 0.03269195556640625, 0.03571128845214844, 0.038730621337890625, 0.04174995422363281, 0.044769287109375, 0.04778861999511719, 0.050807952880859375, 0.05382728576660156, 0.05684661865234375, 0.05986595153808594, 0.06288528442382812, 0.06590461730957031, 0.0689239501953125, 0.07194328308105469, 0.07496261596679688, 0.07798194885253906, 0.08100128173828125, 0.08402061462402344, 0.08703994750976562, 0.09005928039550781, 0.09307861328125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 9.0, 8.0, 15.0, 12.0, 16.0, 26.0, 17.0, 30.0, 35.0, 28.0, 35.0, 53.0, 52.0, 50.0, 59.0, 59.0, 45.0, 44.0, 64.0, 54.0, 44.0, 27.0, 36.0, 40.0, 38.0, 19.0, 26.0, 19.0, 10.0, 13.0, 1.0, 9.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025299072265625, -0.02445673942565918, -0.02361440658569336, -0.02277207374572754, -0.02192974090576172, -0.0210874080657959, -0.020245075225830078, -0.019402742385864258, -0.018560409545898438, -0.017718076705932617, -0.016875743865966797, -0.016033411026000977, -0.015191078186035156, -0.014348745346069336, -0.013506412506103516, -0.012664079666137695, -0.011821746826171875, -0.010979413986206055, -0.010137081146240234, -0.009294748306274414, -0.008452415466308594, -0.0076100826263427734, -0.006767749786376953, -0.005925416946411133, -0.0050830841064453125, -0.004240751266479492, -0.003398418426513672, -0.0025560855865478516, -0.0017137527465820312, -0.0008714199066162109, -2.9087066650390625e-05, 0.0008132457733154297, 0.00165557861328125, 0.0024979114532470703, 0.0033402442932128906, 0.004182577133178711, 0.005024909973144531, 0.0058672428131103516, 0.006709575653076172, 0.007551908493041992, 0.008394241333007812, 0.009236574172973633, 0.010078907012939453, 0.010921239852905273, 0.011763572692871094, 0.012605905532836914, 0.013448238372802734, 0.014290571212768555, 0.015132904052734375, 0.015975236892700195, 0.016817569732666016, 0.017659902572631836, 0.018502235412597656, 0.019344568252563477, 0.020186901092529297, 0.021029233932495117, 0.021871566772460938, 0.022713899612426758, 0.023556232452392578, 0.0243985652923584, 0.02524089813232422, 0.02608323097229004, 0.02692556381225586, 0.02776789665222168, 0.0286102294921875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 2.0, 8.0, 10.0, 8.0, 19.0, 12.0, 28.0, 36.0, 45.0, 57.0, 77.0, 94.0, 127.0, 190.0, 324.0, 516.0, 981.0, 2190.0, 6269.0, 20525.0, 77273.0, 302088.0, 444890.0, 140929.0, 35298.0, 10001.0, 3417.0, 1331.0, 627.0, 386.0, 201.0, 157.0, 99.0, 74.0, 49.0, 40.0, 29.0, 39.0, 29.0, 10.0, 19.0, 11.0, 5.0, 6.0, 5.0, 5.0, 0.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.07098388671875, -0.06855392456054688, -0.06612396240234375, -0.06369400024414062, -0.0612640380859375, -0.058834075927734375, -0.05640411376953125, -0.053974151611328125, -0.051544189453125, -0.049114227294921875, -0.04668426513671875, -0.044254302978515625, -0.0418243408203125, -0.039394378662109375, -0.03696441650390625, -0.034534454345703125, -0.0321044921875, -0.029674530029296875, -0.02724456787109375, -0.024814605712890625, -0.0223846435546875, -0.019954681396484375, -0.01752471923828125, -0.015094757080078125, -0.012664794921875, -0.010234832763671875, -0.00780487060546875, -0.005374908447265625, -0.0029449462890625, -0.000514984130859375, 0.00191497802734375, 0.004344940185546875, 0.00677490234375, 0.009204864501953125, 0.01163482666015625, 0.014064788818359375, 0.0164947509765625, 0.018924713134765625, 0.02135467529296875, 0.023784637451171875, 0.026214599609375, 0.028644561767578125, 0.03107452392578125, 0.033504486083984375, 0.0359344482421875, 0.038364410400390625, 0.04079437255859375, 0.043224334716796875, 0.045654296875, 0.048084259033203125, 0.05051422119140625, 0.052944183349609375, 0.0553741455078125, 0.057804107666015625, 0.06023406982421875, 0.06266403198242188, 0.065093994140625, 0.06752395629882812, 0.06995391845703125, 0.07238388061523438, 0.0748138427734375, 0.07724380493164062, 0.07967376708984375, 0.08210372924804688, 0.08453369140625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 4.0, 8.0, 10.0, 9.0, 6.0, 10.0, 10.0, 20.0, 18.0, 26.0, 25.0, 21.0, 34.0, 33.0, 39.0, 49.0, 41.0, 44.0, 46.0, 44.0, 60.0, 54.0, 39.0, 37.0, 41.0, 41.0, 49.0, 30.0, 28.0, 32.0, 16.0, 17.0, 11.0, 6.0, 17.0, 6.0, 7.0, 7.0, 3.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.10821533203125, -0.10500144958496094, -0.10178756713867188, -0.09857368469238281, -0.09535980224609375, -0.09214591979980469, -0.08893203735351562, -0.08571815490722656, -0.0825042724609375, -0.07929039001464844, -0.07607650756835938, -0.07286262512207031, -0.06964874267578125, -0.06643486022949219, -0.06322097778320312, -0.06000709533691406, -0.056793212890625, -0.05357933044433594, -0.050365447998046875, -0.04715156555175781, -0.04393768310546875, -0.04072380065917969, -0.037509918212890625, -0.03429603576660156, -0.0310821533203125, -0.027868270874023438, -0.024654388427734375, -0.021440505981445312, -0.01822662353515625, -0.015012741088867188, -0.011798858642578125, -0.008584976196289062, -0.00537109375, -0.0021572113037109375, 0.001056671142578125, 0.0042705535888671875, 0.00748443603515625, 0.010698318481445312, 0.013912200927734375, 0.017126083374023438, 0.0203399658203125, 0.023553848266601562, 0.026767730712890625, 0.029981613159179688, 0.03319549560546875, 0.03640937805175781, 0.039623260498046875, 0.04283714294433594, 0.046051025390625, 0.04926490783691406, 0.052478790283203125, 0.05569267272949219, 0.05890655517578125, 0.06212043762207031, 0.06533432006835938, 0.06854820251464844, 0.0717620849609375, 0.07497596740722656, 0.07818984985351562, 0.08140373229980469, 0.08461761474609375, 0.08783149719238281, 0.09104537963867188, 0.09425926208496094, 0.09747314453125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 10.0, 14.0, 17.0, 29.0, 32.0, 52.0, 103.0, 188.0, 370.0, 733.0, 1809.0, 5469.0, 20191.0, 86652.0, 424549.0, 401093.0, 80014.0, 18780.0, 5138.0, 1806.0, 691.0, 376.0, 172.0, 105.0, 53.0, 36.0, 19.0, 13.0, 10.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056243896484375, -0.05472278594970703, -0.05320167541503906, -0.051680564880371094, -0.050159454345703125, -0.048638343811035156, -0.04711723327636719, -0.04559612274169922, -0.04407501220703125, -0.04255390167236328, -0.04103279113769531, -0.039511680603027344, -0.037990570068359375, -0.036469459533691406, -0.03494834899902344, -0.03342723846435547, -0.0319061279296875, -0.03038501739501953, -0.028863906860351562, -0.027342796325683594, -0.025821685791015625, -0.024300575256347656, -0.022779464721679688, -0.02125835418701172, -0.01973724365234375, -0.01821613311767578, -0.016695022583007812, -0.015173912048339844, -0.013652801513671875, -0.012131690979003906, -0.010610580444335938, -0.009089469909667969, -0.007568359375, -0.006047248840332031, -0.0045261383056640625, -0.0030050277709960938, -0.001483917236328125, 3.719329833984375e-05, 0.0015583038330078125, 0.0030794143676757812, 0.00460052490234375, 0.006121635437011719, 0.0076427459716796875, 0.009163856506347656, 0.010684967041015625, 0.012206077575683594, 0.013727188110351562, 0.015248298645019531, 0.0167694091796875, 0.01829051971435547, 0.019811630249023438, 0.021332740783691406, 0.022853851318359375, 0.024374961853027344, 0.025896072387695312, 0.02741718292236328, 0.02893829345703125, 0.03045940399169922, 0.03198051452636719, 0.033501625061035156, 0.035022735595703125, 0.036543846130371094, 0.03806495666503906, 0.03958606719970703, 0.041107177734375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 3.0, 9.0, 10.0, 13.0, 20.0, 28.0, 38.0, 53.0, 70.0, 105.0, 134.0, 107.0, 116.0, 94.0, 60.0, 44.0, 37.0, 17.0, 12.0, 12.0, 10.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.164478302001953e-05, -6.892159581184387e-05, -6.619840860366821e-05, -6.347522139549255e-05, -6.0752034187316895e-05, -5.8028846979141235e-05, -5.5305659770965576e-05, -5.258247256278992e-05, -4.985928535461426e-05, -4.71360981464386e-05, -4.441291093826294e-05, -4.168972373008728e-05, -3.896653652191162e-05, -3.624334931373596e-05, -3.35201621055603e-05, -3.0796974897384644e-05, -2.8073787689208984e-05, -2.5350600481033325e-05, -2.2627413272857666e-05, -1.9904226064682007e-05, -1.7181038856506348e-05, -1.4457851648330688e-05, -1.173466444015503e-05, -9.01147723197937e-06, -6.288290023803711e-06, -3.5651028156280518e-06, -8.419156074523926e-07, 1.8812716007232666e-06, 4.604458808898926e-06, 7.327646017074585e-06, 1.0050833225250244e-05, 1.2774020433425903e-05, 1.5497207641601562e-05, 1.822039484977722e-05, 2.094358205795288e-05, 2.366676926612854e-05, 2.63899564743042e-05, 2.911314368247986e-05, 3.183633089065552e-05, 3.455951809883118e-05, 3.7282705307006836e-05, 4.0005892515182495e-05, 4.2729079723358154e-05, 4.5452266931533813e-05, 4.817545413970947e-05, 5.089864134788513e-05, 5.362182855606079e-05, 5.634501576423645e-05, 5.906820297241211e-05, 6.179139018058777e-05, 6.451457738876343e-05, 6.723776459693909e-05, 6.996095180511475e-05, 7.26841390132904e-05, 7.540732622146606e-05, 7.813051342964172e-05, 8.085370063781738e-05, 8.357688784599304e-05, 8.63000750541687e-05, 8.902326226234436e-05, 9.174644947052002e-05, 9.446963667869568e-05, 9.719282388687134e-05, 9.9916011095047e-05, 0.00010263919830322266]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 8.0, 10.0, 12.0, 31.0, 39.0, 47.0, 82.0, 133.0, 237.0, 421.0, 875.0, 1897.0, 5319.0, 18862.0, 94707.0, 577044.0, 289684.0, 42879.0, 10253.0, 3170.0, 1361.0, 641.0, 329.0, 203.0, 117.0, 60.0, 42.0, 24.0, 22.0, 8.0, 9.0, 9.0, 6.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.060791015625, -0.058936119079589844, -0.05708122253417969, -0.05522632598876953, -0.053371429443359375, -0.05151653289794922, -0.04966163635253906, -0.047806739807128906, -0.04595184326171875, -0.044096946716308594, -0.04224205017089844, -0.04038715362548828, -0.038532257080078125, -0.03667736053466797, -0.03482246398925781, -0.032967567443847656, -0.0311126708984375, -0.029257774353027344, -0.027402877807617188, -0.02554798126220703, -0.023693084716796875, -0.02183818817138672, -0.019983291625976562, -0.018128395080566406, -0.01627349853515625, -0.014418601989746094, -0.012563705444335938, -0.010708808898925781, -0.008853912353515625, -0.006999015808105469, -0.0051441192626953125, -0.0032892227172851562, -0.001434326171875, 0.00042057037353515625, 0.0022754669189453125, 0.004130363464355469, 0.005985260009765625, 0.007840156555175781, 0.009695053100585938, 0.011549949645996094, 0.01340484619140625, 0.015259742736816406, 0.017114639282226562, 0.01896953582763672, 0.020824432373046875, 0.02267932891845703, 0.024534225463867188, 0.026389122009277344, 0.0282440185546875, 0.030098915100097656, 0.03195381164550781, 0.03380870819091797, 0.035663604736328125, 0.03751850128173828, 0.03937339782714844, 0.041228294372558594, 0.04308319091796875, 0.044938087463378906, 0.04679298400878906, 0.04864788055419922, 0.050502777099609375, 0.05235767364501953, 0.05421257019042969, 0.056067466735839844, 0.05792236328125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 8.0, 15.0, 26.0, 19.0, 41.0, 58.0, 105.0, 144.0, 161.0, 139.0, 92.0, 56.0, 38.0, 30.0, 18.0, 14.0, 9.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.060638427734375, -0.05850553512573242, -0.056372642517089844, -0.054239749908447266, -0.05210685729980469, -0.04997396469116211, -0.04784107208251953, -0.04570817947387695, -0.043575286865234375, -0.0414423942565918, -0.03930950164794922, -0.03717660903930664, -0.03504371643066406, -0.032910823822021484, -0.030777931213378906, -0.028645038604736328, -0.02651214599609375, -0.024379253387451172, -0.022246360778808594, -0.020113468170166016, -0.017980575561523438, -0.01584768295288086, -0.013714790344238281, -0.011581897735595703, -0.009449005126953125, -0.007316112518310547, -0.005183219909667969, -0.0030503273010253906, -0.0009174346923828125, 0.0012154579162597656, 0.0033483505249023438, 0.005481243133544922, 0.0076141357421875, 0.009747028350830078, 0.011879920959472656, 0.014012813568115234, 0.016145706176757812, 0.01827859878540039, 0.02041149139404297, 0.022544384002685547, 0.024677276611328125, 0.026810169219970703, 0.02894306182861328, 0.03107595443725586, 0.03320884704589844, 0.035341739654541016, 0.037474632263183594, 0.03960752487182617, 0.04174041748046875, 0.04387331008911133, 0.046006202697753906, 0.048139095306396484, 0.05027198791503906, 0.05240488052368164, 0.05453777313232422, 0.0566706657409668, 0.058803558349609375, 0.06093645095825195, 0.06306934356689453, 0.06520223617553711, 0.06733512878417969, 0.06946802139282227, 0.07160091400146484, 0.07373380661010742, 0.07586669921875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 12.0, 4.0, 20.0, 58.0, 147.0, 272.0, 228.0, 167.0, 60.0, 21.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6740647554397583, -0.6344435811042786, -0.5948224663734436, -0.5552012920379639, -0.5155801773071289, -0.47595900297164917, -0.43633782863616943, -0.3967166841030121, -0.35709553956985474, -0.3174743950366974, -0.27785325050354004, -0.2382320761680603, -0.19861093163490295, -0.1589897871017456, -0.11936862766742706, -0.07974746823310852, -0.04012632369995117, -0.0005051717162132263, 0.03911598026752472, 0.07873713225126266, 0.11835828423500061, 0.15797942876815796, 0.1976005882024765, 0.23722174763679504, 0.2768428921699524, 0.31646403670310974, 0.3560851812362671, 0.3957063555717468, 0.4353275001049042, 0.4749486446380615, 0.5145698189735413, 0.554190993309021, 0.5938122272491455, 0.6334334015846252, 0.6730545163154602, 0.7126756906509399, 0.7522968053817749, 0.7919179797172546, 0.8315391540527344, 0.8711602687835693, 0.9107814431190491, 0.9504026174545288, 0.9900237321853638, 1.0296448469161987, 1.0692660808563232, 1.1088871955871582, 1.1485083103179932, 1.1881295442581177, 1.2277506589889526, 1.2673717737197876, 1.306993007659912, 1.346614122390747, 1.386235237121582, 1.425856351852417, 1.4654775857925415, 1.5050987005233765, 1.544719934463501, 1.584341049194336, 1.6239622831344604, 1.6635833978652954, 1.7032045125961304, 1.7428257465362549, 1.7824468612670898, 1.8220679759979248, 1.8616890907287598]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 4.0, 2.0, 5.0, 8.0, 6.0, 4.0, 11.0, 14.0, 17.0, 12.0, 13.0, 19.0, 22.0, 22.0, 19.0, 25.0, 24.0, 18.0, 33.0, 27.0, 30.0, 46.0, 31.0, 36.0, 39.0, 27.0, 37.0, 37.0, 35.0, 38.0, 34.0, 35.0, 27.0, 32.0, 32.0, 27.0, 22.0, 17.0, 25.0, 9.0, 20.0, 13.0, 12.0, 8.0, 5.0, 9.0, 6.0, 5.0, 0.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.41575491428375244, -0.4035694897174835, -0.3913840353488922, -0.3791986107826233, -0.36701318621635437, -0.35482773184776306, -0.34264230728149414, -0.33045685291290283, -0.3182714283466339, -0.306086003780365, -0.2939005494117737, -0.28171512484550476, -0.26952970027923584, -0.25734424591064453, -0.2451588213443756, -0.2329733818769455, -0.22078795731067657, -0.20860251784324646, -0.19641709327697754, -0.18423165380954742, -0.1720462143421173, -0.1598607897758484, -0.14767535030841827, -0.13548991084098816, -0.12330447882413864, -0.11111904680728912, -0.09893360733985901, -0.08674817532300949, -0.07456274330615997, -0.06237730383872986, -0.05019187182188034, -0.038006432354450226, -0.025821000337600708, -0.013635565526783466, -0.0014501307159662247, 0.010735303163528442, 0.02292073890566826, 0.035106174647808075, 0.04729160666465759, 0.05947704613208771, 0.07166247814893723, 0.08384791016578674, 0.09603334963321686, 0.10821878165006638, 0.1204042136669159, 0.132589653134346, 0.14477509260177612, 0.15696051716804504, 0.16914595663547516, 0.18133139610290527, 0.1935168206691742, 0.2057022601366043, 0.21788769960403442, 0.23007312417030334, 0.24225856363773346, 0.2544440031051636, 0.2666294276714325, 0.2788148522377014, 0.2910003066062927, 0.30318573117256165, 0.31537115573883057, 0.3275566101074219, 0.3397420346736908, 0.3519274592399597, 0.364112913608551]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 2.0, 10.0, 15.0, 31.0, 41.0, 111.0, 163.0, 295.0, 583.0, 1616.0, 5062.0, 19039.0, 122796.0, 3766803.0, 239882.0, 27667.0, 6754.0, 1970.0, 763.0, 292.0, 171.0, 79.0, 55.0, 30.0, 20.0, 11.0, 8.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1685791015625, -0.1628875732421875, -0.157196044921875, -0.1515045166015625, -0.14581298828125, -0.1401214599609375, -0.134429931640625, -0.1287384033203125, -0.123046875, -0.1173553466796875, -0.111663818359375, -0.1059722900390625, -0.10028076171875, -0.0945892333984375, -0.088897705078125, -0.0832061767578125, -0.0775146484375, -0.0718231201171875, -0.066131591796875, -0.0604400634765625, -0.05474853515625, -0.0490570068359375, -0.043365478515625, -0.0376739501953125, -0.031982421875, -0.0262908935546875, -0.020599365234375, -0.0149078369140625, -0.00921630859375, -0.0035247802734375, 0.002166748046875, 0.0078582763671875, 0.0135498046875, 0.0192413330078125, 0.024932861328125, 0.0306243896484375, 0.03631591796875, 0.0420074462890625, 0.047698974609375, 0.0533905029296875, 0.05908203125, 0.0647735595703125, 0.070465087890625, 0.0761566162109375, 0.08184814453125, 0.0875396728515625, 0.093231201171875, 0.0989227294921875, 0.1046142578125, 0.1103057861328125, 0.115997314453125, 0.1216888427734375, 0.12738037109375, 0.1330718994140625, 0.138763427734375, 0.1444549560546875, 0.150146484375, 0.1558380126953125, 0.161529541015625, 0.1672210693359375, 0.17291259765625, 0.1786041259765625, 0.184295654296875, 0.1899871826171875, 0.1956787109375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 9.0, 17.0, 10.0, 15.0, 11.0, 19.0, 21.0, 22.0, 36.0, 25.0, 28.0, 32.0, 47.0, 32.0, 30.0, 46.0, 43.0, 52.0, 49.0, 52.0, 40.0, 46.0, 45.0, 31.0, 25.0, 24.0, 27.0, 27.0, 19.0, 21.0, 20.0, 20.0, 12.0, 11.0, 11.0, 3.0, 5.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0241241455078125, -0.02338409423828125, -0.02264404296875, -0.02190399169921875, -0.0211639404296875, -0.02042388916015625, -0.019683837890625, -0.01894378662109375, -0.0182037353515625, -0.01746368408203125, -0.0167236328125, -0.01598358154296875, -0.0152435302734375, -0.01450347900390625, -0.013763427734375, -0.01302337646484375, -0.0122833251953125, -0.01154327392578125, -0.01080322265625, -0.01006317138671875, -0.0093231201171875, -0.00858306884765625, -0.007843017578125, -0.00710296630859375, -0.0063629150390625, -0.00562286376953125, -0.0048828125, -0.00414276123046875, -0.0034027099609375, -0.00266265869140625, -0.001922607421875, -0.00118255615234375, -0.0004425048828125, 0.00029754638671875, 0.00103759765625, 0.00177764892578125, 0.0025177001953125, 0.00325775146484375, 0.003997802734375, 0.00473785400390625, 0.0054779052734375, 0.00621795654296875, 0.0069580078125, 0.00769805908203125, 0.0084381103515625, 0.00917816162109375, 0.009918212890625, 0.01065826416015625, 0.0113983154296875, 0.01213836669921875, 0.01287841796875, 0.01361846923828125, 0.0143585205078125, 0.01509857177734375, 0.015838623046875, 0.01657867431640625, 0.0173187255859375, 0.01805877685546875, 0.018798828125, 0.01953887939453125, 0.0202789306640625, 0.02101898193359375, 0.021759033203125, 0.02249908447265625, 0.0232391357421875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 10.0, 17.0, 21.0, 41.0, 107.0, 194.0, 406.0, 1041.0, 3284.0, 16201.0, 150519.0, 3735747.0, 257496.0, 22871.0, 4249.0, 1175.0, 474.0, 213.0, 108.0, 41.0, 26.0, 18.0, 6.0, 8.0, 4.0, 2.0, 4.0, 1.0, 1.0], "bins": [-0.2958984375, -0.2895469665527344, -0.28319549560546875, -0.2768440246582031, -0.2704925537109375, -0.2641410827636719, -0.25778961181640625, -0.2514381408691406, -0.245086669921875, -0.23873519897460938, -0.23238372802734375, -0.22603225708007812, -0.2196807861328125, -0.21332931518554688, -0.20697784423828125, -0.20062637329101562, -0.19427490234375, -0.18792343139648438, -0.18157196044921875, -0.17522048950195312, -0.1688690185546875, -0.16251754760742188, -0.15616607666015625, -0.14981460571289062, -0.143463134765625, -0.13711166381835938, -0.13076019287109375, -0.12440872192382812, -0.1180572509765625, -0.11170578002929688, -0.10535430908203125, -0.09900283813476562, -0.0926513671875, -0.08629989624023438, -0.07994842529296875, -0.07359695434570312, -0.0672454833984375, -0.060894012451171875, -0.05454254150390625, -0.048191070556640625, -0.041839599609375, -0.035488128662109375, -0.02913665771484375, -0.022785186767578125, -0.0164337158203125, -0.010082244873046875, -0.00373077392578125, 0.002620697021484375, 0.00897216796875, 0.015323638916015625, 0.02167510986328125, 0.028026580810546875, 0.0343780517578125, 0.040729522705078125, 0.04708099365234375, 0.053432464599609375, 0.059783935546875, 0.06613540649414062, 0.07248687744140625, 0.07883834838867188, 0.0851898193359375, 0.09154129028320312, 0.09789276123046875, 0.10424423217773438, 0.110595703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 8.0, 3.0, 10.0, 15.0, 17.0, 24.0, 36.0, 60.0, 126.0, 260.0, 1056.0, 1620.0, 412.0, 191.0, 99.0, 54.0, 34.0, 20.0, 14.0, 7.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0833740234375, -0.08112812042236328, -0.07888221740722656, -0.07663631439208984, -0.07439041137695312, -0.0721445083618164, -0.06989860534667969, -0.06765270233154297, -0.06540679931640625, -0.06316089630126953, -0.06091499328613281, -0.058669090270996094, -0.056423187255859375, -0.054177284240722656, -0.05193138122558594, -0.04968547821044922, -0.0474395751953125, -0.04519367218017578, -0.04294776916503906, -0.040701866149902344, -0.038455963134765625, -0.036210060119628906, -0.03396415710449219, -0.03171825408935547, -0.02947235107421875, -0.02722644805908203, -0.024980545043945312, -0.022734642028808594, -0.020488739013671875, -0.018242835998535156, -0.015996932983398438, -0.013751029968261719, -0.011505126953125, -0.009259223937988281, -0.0070133209228515625, -0.004767417907714844, -0.002521514892578125, -0.00027561187744140625, 0.0019702911376953125, 0.004216194152832031, 0.00646209716796875, 0.008708000183105469, 0.010953903198242188, 0.013199806213378906, 0.015445709228515625, 0.017691612243652344, 0.019937515258789062, 0.02218341827392578, 0.0244293212890625, 0.02667522430419922, 0.028921127319335938, 0.031167030334472656, 0.033412933349609375, 0.035658836364746094, 0.03790473937988281, 0.04015064239501953, 0.04239654541015625, 0.04464244842529297, 0.04688835144042969, 0.049134254455566406, 0.051380157470703125, 0.053626060485839844, 0.05587196350097656, 0.05811786651611328, 0.06036376953125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 9.0, 17.0, 39.0, 138.0, 331.0, 302.0, 112.0, 31.0, 12.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8705629110336304, -0.8469116687774658, -0.8232604265213013, -0.7996092438697815, -0.7759580016136169, -0.7523067593574524, -0.7286555171012878, -0.7050043344497681, -0.6813530921936035, -0.657701849937439, -0.6340506076812744, -0.6103994250297546, -0.5867481827735901, -0.5630969405174255, -0.539445698261261, -0.5157945156097412, -0.4921432435512543, -0.4684920012950897, -0.44484078884124756, -0.421189546585083, -0.39753833413124084, -0.3738870918750763, -0.35023587942123413, -0.3265846371650696, -0.30293339490890503, -0.2792821526527405, -0.2556309401988983, -0.23197969794273376, -0.2083284854888916, -0.18467724323272705, -0.1610260158777237, -0.13737478852272034, -0.11372357606887817, -0.09007234871387482, -0.06642112135887146, -0.042769886553287506, -0.01911865919828415, 0.004532568156719208, 0.02818380296230316, 0.05183503031730652, 0.07548625767230988, 0.09913748502731323, 0.12278871238231659, 0.14643993973731995, 0.1700911819934845, 0.19374239444732666, 0.2173936367034912, 0.24104486405849457, 0.2646960914134979, 0.2883473336696625, 0.31199854612350464, 0.3356497883796692, 0.35930100083351135, 0.3829522430896759, 0.40660345554351807, 0.4302546977996826, 0.45390594005584717, 0.4775571823120117, 0.5012084245681763, 0.524859607219696, 0.5485108494758606, 0.5721620917320251, 0.5958133339881897, 0.6194645166397095, 0.643115758895874]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 5.0, 8.0, 13.0, 6.0, 7.0, 11.0, 9.0, 25.0, 15.0, 14.0, 25.0, 29.0, 19.0, 25.0, 25.0, 33.0, 27.0, 39.0, 36.0, 34.0, 33.0, 35.0, 43.0, 34.0, 32.0, 37.0, 37.0, 34.0, 27.0, 39.0, 28.0, 24.0, 33.0, 18.0, 25.0, 16.0, 20.0, 20.0, 7.0, 11.0, 4.0, 6.0, 4.0, 4.0, 6.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.12422674894332886, -0.12009643018245697, -0.11596611142158508, -0.1118357926607132, -0.10770547389984131, -0.10357515513896942, -0.09944483637809753, -0.09531451761722565, -0.09118419885635376, -0.08705388009548187, -0.08292356133460999, -0.0787932425737381, -0.07466292381286621, -0.07053260505199432, -0.06640228629112244, -0.06227196753025055, -0.05814164876937866, -0.054011330008506775, -0.04988101124763489, -0.045750692486763, -0.04162037372589111, -0.037490054965019226, -0.03335973620414734, -0.02922941744327545, -0.025099098682403564, -0.020968779921531677, -0.01683846116065979, -0.012708142399787903, -0.008577823638916016, -0.004447504878044128, -0.0003171861171722412, 0.003813132643699646, 0.007943451404571533, 0.01207377016544342, 0.016204088926315308, 0.020334407687187195, 0.024464726448059082, 0.02859504520893097, 0.032725363969802856, 0.036855682730674744, 0.04098600149154663, 0.04511632025241852, 0.049246639013290405, 0.05337695777416229, 0.05750727653503418, 0.06163759529590607, 0.06576791405677795, 0.06989823281764984, 0.07402855157852173, 0.07815887033939362, 0.0822891891002655, 0.08641950786113739, 0.09054982662200928, 0.09468014538288116, 0.09881046414375305, 0.10294078290462494, 0.10707110166549683, 0.11120142042636871, 0.1153317391872406, 0.11946205794811249, 0.12359237670898438, 0.12772269546985626, 0.13185301423072815, 0.13598333299160004, 0.14011365175247192]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 6.0, 1.0, 4.0, 10.0, 9.0, 21.0, 29.0, 40.0, 77.0, 87.0, 151.0, 206.0, 388.0, 666.0, 1171.0, 2166.0, 4249.0, 9259.0, 22372.0, 55717.0, 131679.0, 258616.0, 283728.0, 158676.0, 68871.0, 28015.0, 11600.0, 5152.0, 2473.0, 1327.0, 692.0, 413.0, 245.0, 146.0, 92.0, 70.0, 37.0, 33.0, 17.0, 10.0, 5.0, 14.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.07733154296875, -0.07512950897216797, -0.07292747497558594, -0.0707254409790039, -0.06852340698242188, -0.06632137298583984, -0.06411933898925781, -0.06191730499267578, -0.05971527099609375, -0.05751323699951172, -0.05531120300292969, -0.053109169006347656, -0.050907135009765625, -0.048705101013183594, -0.04650306701660156, -0.04430103302001953, -0.0420989990234375, -0.03989696502685547, -0.03769493103027344, -0.035492897033691406, -0.033290863037109375, -0.031088829040527344, -0.028886795043945312, -0.02668476104736328, -0.02448272705078125, -0.02228069305419922, -0.020078659057617188, -0.017876625061035156, -0.015674591064453125, -0.013472557067871094, -0.011270523071289062, -0.009068489074707031, -0.006866455078125, -0.004664421081542969, -0.0024623870849609375, -0.00026035308837890625, 0.001941680908203125, 0.004143714904785156, 0.0063457489013671875, 0.008547782897949219, 0.01074981689453125, 0.012951850891113281, 0.015153884887695312, 0.017355918884277344, 0.019557952880859375, 0.021759986877441406, 0.023962020874023438, 0.02616405487060547, 0.0283660888671875, 0.03056812286376953, 0.03277015686035156, 0.034972190856933594, 0.037174224853515625, 0.039376258850097656, 0.04157829284667969, 0.04378032684326172, 0.04598236083984375, 0.04818439483642578, 0.05038642883300781, 0.052588462829589844, 0.054790496826171875, 0.056992530822753906, 0.05919456481933594, 0.06139659881591797, 0.0635986328125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 10.0, 12.0, 3.0, 7.0, 12.0, 21.0, 22.0, 22.0, 18.0, 36.0, 27.0, 31.0, 39.0, 34.0, 42.0, 28.0, 50.0, 33.0, 59.0, 30.0, 57.0, 40.0, 40.0, 34.0, 40.0, 32.0, 30.0, 31.0, 28.0, 31.0, 13.0, 17.0, 16.0, 11.0, 16.0, 8.0, 4.0, 1.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0275726318359375, -0.02677464485168457, -0.02597665786743164, -0.02517867088317871, -0.02438068389892578, -0.02358269691467285, -0.022784709930419922, -0.021986722946166992, -0.021188735961914062, -0.020390748977661133, -0.019592761993408203, -0.018794775009155273, -0.017996788024902344, -0.017198801040649414, -0.016400814056396484, -0.015602827072143555, -0.014804840087890625, -0.014006853103637695, -0.013208866119384766, -0.012410879135131836, -0.011612892150878906, -0.010814905166625977, -0.010016918182373047, -0.009218931198120117, -0.008420944213867188, -0.007622957229614258, -0.006824970245361328, -0.0060269832611083984, -0.005228996276855469, -0.004431009292602539, -0.0036330223083496094, -0.0028350353240966797, -0.00203704833984375, -0.0012390613555908203, -0.0004410743713378906, 0.00035691261291503906, 0.0011548995971679688, 0.0019528865814208984, 0.002750873565673828, 0.003548860549926758, 0.0043468475341796875, 0.005144834518432617, 0.005942821502685547, 0.0067408084869384766, 0.007538795471191406, 0.008336782455444336, 0.009134769439697266, 0.009932756423950195, 0.010730743408203125, 0.011528730392456055, 0.012326717376708984, 0.013124704360961914, 0.013922691345214844, 0.014720678329467773, 0.015518665313720703, 0.016316652297973633, 0.017114639282226562, 0.017912626266479492, 0.018710613250732422, 0.01950860023498535, 0.02030658721923828, 0.02110457420349121, 0.02190256118774414, 0.02270054817199707, 0.02349853515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 0.0, 4.0, 7.0, 7.0, 13.0, 22.0, 26.0, 43.0, 61.0, 107.0, 158.0, 289.0, 424.0, 865.0, 2203.0, 9172.0, 90068.0, 640942.0, 273567.0, 24074.0, 3717.0, 1290.0, 615.0, 358.0, 197.0, 133.0, 72.0, 41.0, 27.0, 20.0, 7.0, 11.0, 7.0, 8.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.183349609375, -0.17848968505859375, -0.1736297607421875, -0.16876983642578125, -0.163909912109375, -0.15904998779296875, -0.1541900634765625, -0.14933013916015625, -0.14447021484375, -0.13961029052734375, -0.1347503662109375, -0.12989044189453125, -0.125030517578125, -0.12017059326171875, -0.1153106689453125, -0.11045074462890625, -0.1055908203125, -0.10073089599609375, -0.0958709716796875, -0.09101104736328125, -0.086151123046875, -0.08129119873046875, -0.0764312744140625, -0.07157135009765625, -0.06671142578125, -0.06185150146484375, -0.0569915771484375, -0.05213165283203125, -0.047271728515625, -0.04241180419921875, -0.0375518798828125, -0.03269195556640625, -0.02783203125, -0.02297210693359375, -0.0181121826171875, -0.01325225830078125, -0.008392333984375, -0.00353240966796875, 0.0013275146484375, 0.00618743896484375, 0.01104736328125, 0.01590728759765625, 0.0207672119140625, 0.02562713623046875, 0.030487060546875, 0.03534698486328125, 0.0402069091796875, 0.04506683349609375, 0.0499267578125, 0.05478668212890625, 0.0596466064453125, 0.06450653076171875, 0.069366455078125, 0.07422637939453125, 0.0790863037109375, 0.08394622802734375, 0.08880615234375, 0.09366607666015625, 0.0985260009765625, 0.10338592529296875, 0.108245849609375, 0.11310577392578125, 0.1179656982421875, 0.12282562255859375, 0.127685546875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 2.0, 6.0, 2.0, 7.0, 6.0, 8.0, 8.0, 10.0, 10.0, 18.0, 17.0, 17.0, 17.0, 34.0, 19.0, 18.0, 31.0, 32.0, 44.0, 28.0, 40.0, 46.0, 53.0, 45.0, 35.0, 41.0, 35.0, 38.0, 35.0, 30.0, 38.0, 26.0, 28.0, 26.0, 19.0, 20.0, 15.0, 13.0, 16.0, 11.0, 8.0, 11.0, 11.0, 5.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.10247802734375, -0.09924030303955078, -0.09600257873535156, -0.09276485443115234, -0.08952713012695312, -0.0862894058227539, -0.08305168151855469, -0.07981395721435547, -0.07657623291015625, -0.07333850860595703, -0.07010078430175781, -0.0668630599975586, -0.06362533569335938, -0.060387611389160156, -0.05714988708496094, -0.05391216278076172, -0.0506744384765625, -0.04743671417236328, -0.04419898986816406, -0.040961265563964844, -0.037723541259765625, -0.034485816955566406, -0.031248092651367188, -0.02801036834716797, -0.02477264404296875, -0.02153491973876953, -0.018297195434570312, -0.015059471130371094, -0.011821746826171875, -0.008584022521972656, -0.0053462982177734375, -0.0021085739135742188, 0.001129150390625, 0.004366874694824219, 0.0076045989990234375, 0.010842323303222656, 0.014080047607421875, 0.017317771911621094, 0.020555496215820312, 0.02379322052001953, 0.02703094482421875, 0.03026866912841797, 0.03350639343261719, 0.036744117736816406, 0.039981842041015625, 0.043219566345214844, 0.04645729064941406, 0.04969501495361328, 0.0529327392578125, 0.05617046356201172, 0.05940818786621094, 0.06264591217041016, 0.06588363647460938, 0.0691213607788086, 0.07235908508300781, 0.07559680938720703, 0.07883453369140625, 0.08207225799560547, 0.08530998229980469, 0.0885477066040039, 0.09178543090820312, 0.09502315521240234, 0.09826087951660156, 0.10149860382080078, 0.104736328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 20.0, 44.0, 123.0, 426.0, 2132.0, 31809.0, 884395.0, 124573.0, 4077.0, 658.0, 179.0, 47.0, 31.0, 17.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1778564453125, -0.17313385009765625, -0.1684112548828125, -0.16368865966796875, -0.158966064453125, -0.15424346923828125, -0.1495208740234375, -0.14479827880859375, -0.14007568359375, -0.13535308837890625, -0.1306304931640625, -0.12590789794921875, -0.121185302734375, -0.11646270751953125, -0.1117401123046875, -0.10701751708984375, -0.102294921875, -0.09757232666015625, -0.0928497314453125, -0.08812713623046875, -0.083404541015625, -0.07868194580078125, -0.0739593505859375, -0.06923675537109375, -0.06451416015625, -0.05979156494140625, -0.0550689697265625, -0.05034637451171875, -0.045623779296875, -0.04090118408203125, -0.0361785888671875, -0.03145599365234375, -0.0267333984375, -0.02201080322265625, -0.0172882080078125, -0.01256561279296875, -0.007843017578125, -0.00312042236328125, 0.0016021728515625, 0.00632476806640625, 0.01104736328125, 0.01576995849609375, 0.0204925537109375, 0.02521514892578125, 0.029937744140625, 0.03466033935546875, 0.0393829345703125, 0.04410552978515625, 0.048828125, 0.05355072021484375, 0.0582733154296875, 0.06299591064453125, 0.067718505859375, 0.07244110107421875, 0.0771636962890625, 0.08188629150390625, 0.08660888671875, 0.09133148193359375, 0.0960540771484375, 0.10077667236328125, 0.105499267578125, 0.11022186279296875, 0.1149444580078125, 0.11966705322265625, 0.1243896484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 10.0, 7.0, 18.0, 6.0, 15.0, 14.0, 26.0, 49.0, 60.0, 78.0, 110.0, 110.0, 120.0, 103.0, 87.0, 49.0, 34.0, 33.0, 28.0, 18.0, 17.0, 4.0, 1.0, 11.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.00011104345321655273, -0.00010872632265090942, -0.00010640919208526611, -0.0001040920615196228, -0.00010177493095397949, -9.945780038833618e-05, -9.714066982269287e-05, -9.482353925704956e-05, -9.250640869140625e-05, -9.018927812576294e-05, -8.787214756011963e-05, -8.555501699447632e-05, -8.323788642883301e-05, -8.09207558631897e-05, -7.860362529754639e-05, -7.628649473190308e-05, -7.396936416625977e-05, -7.165223360061646e-05, -6.933510303497314e-05, -6.701797246932983e-05, -6.470084190368652e-05, -6.238371133804321e-05, -6.00665807723999e-05, -5.774945020675659e-05, -5.543231964111328e-05, -5.311518907546997e-05, -5.079805850982666e-05, -4.848092794418335e-05, -4.616379737854004e-05, -4.384666681289673e-05, -4.152953624725342e-05, -3.921240568161011e-05, -3.68952751159668e-05, -3.4578144550323486e-05, -3.2261013984680176e-05, -2.9943883419036865e-05, -2.7626752853393555e-05, -2.5309622287750244e-05, -2.2992491722106934e-05, -2.0675361156463623e-05, -1.8358230590820312e-05, -1.6041100025177002e-05, -1.3723969459533691e-05, -1.1406838893890381e-05, -9.08970832824707e-06, -6.77257776260376e-06, -4.455447196960449e-06, -2.1383166313171387e-06, 1.7881393432617188e-07, 2.4959444999694824e-06, 4.813075065612793e-06, 7.1302056312561035e-06, 9.447336196899414e-06, 1.1764466762542725e-05, 1.4081597328186035e-05, 1.6398727893829346e-05, 1.8715858459472656e-05, 2.1032989025115967e-05, 2.3350119590759277e-05, 2.5667250156402588e-05, 2.79843807220459e-05, 3.030151128768921e-05, 3.261864185333252e-05, 3.493577241897583e-05, 3.725290298461914e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 6.0, 20.0, 11.0, 28.0, 37.0, 53.0, 114.0, 244.0, 399.0, 946.0, 2801.0, 14646.0, 205252.0, 727293.0, 85405.0, 7927.0, 1887.0, 696.0, 351.0, 169.0, 106.0, 69.0, 26.0, 28.0, 11.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0799560546875, -0.07667160034179688, -0.07338714599609375, -0.07010269165039062, -0.0668182373046875, -0.06353378295898438, -0.06024932861328125, -0.056964874267578125, -0.053680419921875, -0.050395965576171875, -0.04711151123046875, -0.043827056884765625, -0.0405426025390625, -0.037258148193359375, -0.03397369384765625, -0.030689239501953125, -0.02740478515625, -0.024120330810546875, -0.02083587646484375, -0.017551422119140625, -0.0142669677734375, -0.010982513427734375, -0.00769805908203125, -0.004413604736328125, -0.001129150390625, 0.002155303955078125, 0.00543975830078125, 0.008724212646484375, 0.0120086669921875, 0.015293121337890625, 0.01857757568359375, 0.021862030029296875, 0.025146484375, 0.028430938720703125, 0.03171539306640625, 0.034999847412109375, 0.0382843017578125, 0.041568756103515625, 0.04485321044921875, 0.048137664794921875, 0.051422119140625, 0.054706573486328125, 0.05799102783203125, 0.061275482177734375, 0.0645599365234375, 0.06784439086914062, 0.07112884521484375, 0.07441329956054688, 0.07769775390625, 0.08098220825195312, 0.08426666259765625, 0.08755111694335938, 0.0908355712890625, 0.09412002563476562, 0.09740447998046875, 0.10068893432617188, 0.103973388671875, 0.10725784301757812, 0.11054229736328125, 0.11382675170898438, 0.1171112060546875, 0.12039566040039062, 0.12368011474609375, 0.12696456909179688, 0.1302490234375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 15.0, 19.0, 23.0, 51.0, 78.0, 126.0, 154.0, 145.0, 120.0, 108.0, 53.0, 45.0, 24.0, 12.0, 9.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1328125, -0.12950992584228516, -0.1262073516845703, -0.12290477752685547, -0.11960220336914062, -0.11629962921142578, -0.11299705505371094, -0.1096944808959961, -0.10639190673828125, -0.1030893325805664, -0.09978675842285156, -0.09648418426513672, -0.09318161010742188, -0.08987903594970703, -0.08657646179199219, -0.08327388763427734, -0.0799713134765625, -0.07666873931884766, -0.07336616516113281, -0.07006359100341797, -0.06676101684570312, -0.06345844268798828, -0.06015586853027344, -0.056853294372558594, -0.05355072021484375, -0.050248146057128906, -0.04694557189941406, -0.04364299774169922, -0.040340423583984375, -0.03703784942626953, -0.03373527526855469, -0.030432701110839844, -0.027130126953125, -0.023827552795410156, -0.020524978637695312, -0.01722240447998047, -0.013919830322265625, -0.010617256164550781, -0.0073146820068359375, -0.004012107849121094, -0.00070953369140625, 0.0025930404663085938, 0.0058956146240234375, 0.009198188781738281, 0.012500762939453125, 0.01580333709716797, 0.019105911254882812, 0.022408485412597656, 0.0257110595703125, 0.029013633728027344, 0.03231620788574219, 0.03561878204345703, 0.038921356201171875, 0.04222393035888672, 0.04552650451660156, 0.048829078674316406, 0.05213165283203125, 0.055434226989746094, 0.05873680114746094, 0.06203937530517578, 0.06534194946289062, 0.06864452362060547, 0.07194709777832031, 0.07524967193603516, 0.07855224609375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 10.0, 45.0, 177.0, 402.0, 285.0, 62.0, 20.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.800501823425293, -3.7226123809814453, -3.6447229385375977, -3.566833734512329, -3.4889442920684814, -3.411054849624634, -3.333165407180786, -3.2552762031555176, -3.17738676071167, -3.0994973182678223, -3.0216078758239746, -2.943718671798706, -2.8658292293548584, -2.7879397869110107, -2.710050344467163, -2.6321611404418945, -2.554271697998047, -2.476382255554199, -2.3984928131103516, -2.320603609085083, -2.2427141666412354, -2.1648247241973877, -2.08693528175354, -2.0090460777282715, -1.9311563968658447, -1.853266954421997, -1.775377631187439, -1.6974881887435913, -1.6195988655090332, -1.5417094230651855, -1.463819980621338, -1.3859306573867798, -1.3080413341522217, -1.230151891708374, -1.152262568473816, -1.0743731260299683, -0.9964838027954102, -0.9185943603515625, -0.8407049775123596, -0.7628155946731567, -0.6849262118339539, -0.607036828994751, -0.5291474461555481, -0.4512580335140228, -0.37336865067481995, -0.29547926783561707, -0.2175898551940918, -0.13970047235488892, -0.061811089515686035, 0.016078300774097443, 0.09396769106388092, 0.171857088804245, 0.24974647164344788, 0.32763585448265076, 0.405525267124176, 0.4834146499633789, 0.5613040328025818, 0.6391934156417847, 0.7170827984809875, 0.7949721813201904, 0.8728616237640381, 0.9507509469985962, 1.0286403894424438, 1.106529712677002, 1.1844191551208496]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 4.0, 7.0, 6.0, 10.0, 18.0, 10.0, 13.0, 27.0, 26.0, 20.0, 29.0, 29.0, 43.0, 33.0, 35.0, 43.0, 36.0, 45.0, 38.0, 45.0, 40.0, 53.0, 41.0, 50.0, 34.0, 36.0, 27.0, 33.0, 31.0, 24.0, 24.0, 17.0, 13.0, 12.0, 10.0, 9.0, 5.0, 9.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6177189350128174, -0.5986857414245605, -0.5796524882316589, -0.5606192946434021, -0.5415860414505005, -0.5225528478622437, -0.5035196542739868, -0.4844864308834076, -0.46545320749282837, -0.44641998410224915, -0.4273867607116699, -0.4083535671234131, -0.38932034373283386, -0.37028712034225464, -0.3512539267539978, -0.3322207033634186, -0.31318747997283936, -0.29415425658226013, -0.2751210331916809, -0.2560878396034241, -0.23705461621284485, -0.21802139282226562, -0.1989881843328476, -0.17995497584342957, -0.16092175245285034, -0.14188852906227112, -0.12285532057285309, -0.10382210463285446, -0.08478888869285583, -0.06575567275285721, -0.04672245681285858, -0.027689248323440552, -0.008655965328216553, 0.010377250611782074, 0.0294104665517807, 0.04844368249177933, 0.06747689843177795, 0.08651011437177658, 0.10554333031177521, 0.12457653880119324, 0.14360976219177246, 0.16264298558235168, 0.18167619407176971, 0.20070940256118774, 0.21974262595176697, 0.2387758493423462, 0.257809042930603, 0.27684226632118225, 0.2958754897117615, 0.3149087131023407, 0.3339419364929199, 0.35297513008117676, 0.372008353471756, 0.3910415768623352, 0.41007477045059204, 0.42910799384117126, 0.4481412172317505, 0.4671744406223297, 0.48620766401290894, 0.5052408576011658, 0.5242741107940674, 0.5433073043823242, 0.562340497970581, 0.5813736915588379, 0.6004069447517395]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 11.0, 15.0, 26.0, 37.0, 57.0, 101.0, 207.0, 401.0, 735.0, 1591.0, 3641.0, 10547.0, 41241.0, 309035.0, 3596327.0, 185611.0, 30401.0, 8511.0, 3036.0, 1296.0, 661.0, 338.0, 180.0, 88.0, 66.0, 43.0, 22.0, 20.0, 9.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10552978515625, -0.1015329360961914, -0.09753608703613281, -0.09353923797607422, -0.08954238891601562, -0.08554553985595703, -0.08154869079589844, -0.07755184173583984, -0.07355499267578125, -0.06955814361572266, -0.06556129455566406, -0.06156444549560547, -0.057567596435546875, -0.05357074737548828, -0.04957389831542969, -0.045577049255371094, -0.0415802001953125, -0.037583351135253906, -0.03358650207519531, -0.02958965301513672, -0.025592803955078125, -0.02159595489501953, -0.017599105834960938, -0.013602256774902344, -0.00960540771484375, -0.005608558654785156, -0.0016117095947265625, 0.0023851394653320312, 0.006381988525390625, 0.010378837585449219, 0.014375686645507812, 0.018372535705566406, 0.022369384765625, 0.026366233825683594, 0.030363082885742188, 0.03435993194580078, 0.038356781005859375, 0.04235363006591797, 0.04635047912597656, 0.050347328186035156, 0.05434417724609375, 0.058341026306152344, 0.06233787536621094, 0.06633472442626953, 0.07033157348632812, 0.07432842254638672, 0.07832527160644531, 0.0823221206665039, 0.0863189697265625, 0.0903158187866211, 0.09431266784667969, 0.09830951690673828, 0.10230636596679688, 0.10630321502685547, 0.11030006408691406, 0.11429691314697266, 0.11829376220703125, 0.12229061126708984, 0.12628746032714844, 0.13028430938720703, 0.13428115844726562, 0.13827800750732422, 0.1422748565673828, 0.1462717056274414, 0.1502685546875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 5.0, 5.0, 12.0, 8.0, 10.0, 18.0, 21.0, 21.0, 21.0, 23.0, 30.0, 47.0, 30.0, 47.0, 41.0, 44.0, 51.0, 59.0, 43.0, 54.0, 62.0, 47.0, 43.0, 38.0, 29.0, 27.0, 21.0, 30.0, 26.0, 27.0, 12.0, 9.0, 9.0, 5.0, 10.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02630615234375, -0.02536773681640625, -0.0244293212890625, -0.02349090576171875, -0.022552490234375, -0.02161407470703125, -0.0206756591796875, -0.01973724365234375, -0.018798828125, -0.01786041259765625, -0.0169219970703125, -0.01598358154296875, -0.015045166015625, -0.01410675048828125, -0.0131683349609375, -0.01222991943359375, -0.01129150390625, -0.01035308837890625, -0.0094146728515625, -0.00847625732421875, -0.007537841796875, -0.00659942626953125, -0.0056610107421875, -0.00472259521484375, -0.0037841796875, -0.00284576416015625, -0.0019073486328125, -0.00096893310546875, -3.0517578125e-05, 0.00090789794921875, 0.0018463134765625, 0.00278472900390625, 0.00372314453125, 0.00466156005859375, 0.0055999755859375, 0.00653839111328125, 0.007476806640625, 0.00841522216796875, 0.0093536376953125, 0.01029205322265625, 0.01123046875, 0.01216888427734375, 0.0131072998046875, 0.01404571533203125, 0.014984130859375, 0.01592254638671875, 0.0168609619140625, 0.01779937744140625, 0.01873779296875, 0.01967620849609375, 0.0206146240234375, 0.02155303955078125, 0.022491455078125, 0.02342987060546875, 0.0243682861328125, 0.02530670166015625, 0.0262451171875, 0.02718353271484375, 0.0281219482421875, 0.02906036376953125, 0.029998779296875, 0.03093719482421875, 0.0318756103515625, 0.03281402587890625, 0.03375244140625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 6.0, 13.0, 14.0, 21.0, 47.0, 78.0, 151.0, 363.0, 784.0, 2049.0, 5709.0, 19384.0, 92791.0, 1434972.0, 2486413.0, 117832.0, 23064.0, 6569.0, 2364.0, 912.0, 382.0, 185.0, 81.0, 41.0, 17.0, 15.0, 10.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1453857421875, -0.14123916625976562, -0.13709259033203125, -0.13294601440429688, -0.1287994384765625, -0.12465286254882812, -0.12050628662109375, -0.11635971069335938, -0.112213134765625, -0.10806655883789062, -0.10391998291015625, -0.09977340698242188, -0.0956268310546875, -0.09148025512695312, -0.08733367919921875, -0.08318710327148438, -0.07904052734375, -0.07489395141601562, -0.07074737548828125, -0.06660079956054688, -0.0624542236328125, -0.058307647705078125, -0.05416107177734375, -0.050014495849609375, -0.045867919921875, -0.041721343994140625, -0.03757476806640625, -0.033428192138671875, -0.0292816162109375, -0.025135040283203125, -0.02098846435546875, -0.016841888427734375, -0.0126953125, -0.008548736572265625, -0.00440216064453125, -0.000255584716796875, 0.0038909912109375, 0.008037567138671875, 0.01218414306640625, 0.016330718994140625, 0.020477294921875, 0.024623870849609375, 0.02877044677734375, 0.032917022705078125, 0.0370635986328125, 0.041210174560546875, 0.04535675048828125, 0.049503326416015625, 0.05364990234375, 0.057796478271484375, 0.06194305419921875, 0.06608963012695312, 0.0702362060546875, 0.07438278198242188, 0.07852935791015625, 0.08267593383789062, 0.086822509765625, 0.09096908569335938, 0.09511566162109375, 0.09926223754882812, 0.1034088134765625, 0.10755538940429688, 0.11170196533203125, 0.11584854125976562, 0.1199951171875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 9.0, 12.0, 12.0, 21.0, 27.0, 41.0, 36.0, 67.0, 95.0, 180.0, 311.0, 713.0, 1284.0, 551.0, 240.0, 130.0, 75.0, 76.0, 41.0, 33.0, 30.0, 18.0, 7.0, 17.0, 10.0, 6.0, 5.0, 8.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054412841796875, -0.05267524719238281, -0.050937652587890625, -0.04920005798339844, -0.04746246337890625, -0.04572486877441406, -0.043987274169921875, -0.04224967956542969, -0.0405120849609375, -0.03877449035644531, -0.037036895751953125, -0.03529930114746094, -0.03356170654296875, -0.03182411193847656, -0.030086517333984375, -0.028348922729492188, -0.026611328125, -0.024873733520507812, -0.023136138916015625, -0.021398544311523438, -0.01966094970703125, -0.017923355102539062, -0.016185760498046875, -0.014448165893554688, -0.0127105712890625, -0.010972976684570312, -0.009235382080078125, -0.0074977874755859375, -0.00576019287109375, -0.0040225982666015625, -0.002285003662109375, -0.0005474090576171875, 0.001190185546875, 0.0029277801513671875, 0.004665374755859375, 0.0064029693603515625, 0.00814056396484375, 0.009878158569335938, 0.011615753173828125, 0.013353347778320312, 0.0150909423828125, 0.016828536987304688, 0.018566131591796875, 0.020303726196289062, 0.02204132080078125, 0.023778915405273438, 0.025516510009765625, 0.027254104614257812, 0.02899169921875, 0.030729293823242188, 0.032466888427734375, 0.03420448303222656, 0.03594207763671875, 0.03767967224121094, 0.039417266845703125, 0.04115486145019531, 0.0428924560546875, 0.04463005065917969, 0.046367645263671875, 0.04810523986816406, 0.04984283447265625, 0.05158042907714844, 0.053318023681640625, 0.05505561828613281, 0.056793212890625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 7.0, 7.0, 7.0, 69.0, 144.0, 231.0, 244.0, 161.0, 72.0, 34.0, 10.0, 3.0, 5.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3769323527812958, -0.3549281358718872, -0.33292391896247864, -0.31091970205307007, -0.2889154851436615, -0.26691126823425293, -0.24490706622600555, -0.22290284931659698, -0.20089863240718842, -0.17889441549777985, -0.15689019858837128, -0.1348859965801239, -0.11288177222013474, -0.09087755531072617, -0.0688733458518982, -0.046869128942489624, -0.024864912033081055, -0.0028606969863176346, 0.019143518060445786, 0.041147731244564056, 0.06315194815397263, 0.0851561650633812, 0.10716037452220917, 0.12916459143161774, 0.1511688083410263, 0.17317302525043488, 0.19517724215984344, 0.21718144416809082, 0.2391856610774994, 0.26118987798690796, 0.28319409489631653, 0.3051983118057251, 0.3272024989128113, 0.34920671582221985, 0.3712109327316284, 0.393215149641037, 0.41521936655044556, 0.4372235834598541, 0.4592278003692627, 0.4812319874763489, 0.5032362341880798, 0.525240421295166, 0.547244668006897, 0.5692488551139832, 0.5912531018257141, 0.6132572889328003, 0.6352615356445312, 0.6572657227516174, 0.6792699098587036, 0.7012740969657898, 0.7232783436775208, 0.7452825307846069, 0.7672867774963379, 0.7892909646034241, 0.811295211315155, 0.8332993984222412, 0.8553036451339722, 0.8773078322410583, 0.8993120789527893, 0.9213162660598755, 0.9433205127716064, 0.9653246998786926, 0.9873289465904236, 1.0093331336975098, 1.0313373804092407]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 9.0, 3.0, 12.0, 9.0, 15.0, 17.0, 13.0, 31.0, 23.0, 28.0, 30.0, 39.0, 37.0, 32.0, 43.0, 31.0, 47.0, 61.0, 39.0, 47.0, 34.0, 49.0, 47.0, 32.0, 35.0, 33.0, 40.0, 28.0, 25.0, 27.0, 15.0, 12.0, 13.0, 7.0, 13.0, 7.0, 6.0, 1.0, 5.0, 2.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.20056742429733276, -0.194375678896904, -0.18818391859531403, -0.18199217319488525, -0.17580042779445648, -0.1696086823940277, -0.16341692209243774, -0.15722517669200897, -0.1510334312915802, -0.14484168589115143, -0.13864992558956146, -0.1324581801891327, -0.12626643478870392, -0.12007468193769455, -0.11388292908668518, -0.10769118368625641, -0.10149942338466644, -0.09530767053365707, -0.0891159251332283, -0.08292417228221893, -0.07673242688179016, -0.07054067403078079, -0.06434892117977142, -0.05815717205405235, -0.05196542292833328, -0.04577367380261421, -0.03958192467689514, -0.03339017182588577, -0.027198422700166702, -0.021006673574447632, -0.014814920723438263, -0.008623171597719193, -0.002431422472000122, 0.003760327585041523, 0.009952077642083168, 0.016143828630447388, 0.022335577756166458, 0.02852732688188553, 0.0347190797328949, 0.04091082885861397, 0.04710257798433304, 0.05329432711005211, 0.05948607623577118, 0.06567782908678055, 0.07186958193778992, 0.07806132733821869, 0.08425308018922806, 0.09044483304023743, 0.0966365784406662, 0.10282833129167557, 0.10902007669210434, 0.11521182954311371, 0.12140357494354248, 0.12759533524513245, 0.13378708064556122, 0.13997882604599, 0.14617058634757996, 0.15236233174800873, 0.1585540920495987, 0.16474583745002747, 0.17093758285045624, 0.177129328250885, 0.18332108855247498, 0.18951283395290375, 0.19570457935333252]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 7.0, 9.0, 7.0, 11.0, 15.0, 28.0, 41.0, 68.0, 110.0, 186.0, 300.0, 599.0, 1054.0, 2413.0, 5822.0, 15253.0, 44353.0, 131955.0, 308788.0, 320161.0, 141564.0, 47844.0, 16624.0, 6139.0, 2564.0, 1136.0, 615.0, 336.0, 207.0, 119.0, 85.0, 48.0, 31.0, 18.0, 11.0, 11.0, 9.0, 8.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07183837890625, -0.06944656372070312, -0.06705474853515625, -0.06466293334960938, -0.0622711181640625, -0.059879302978515625, -0.05748748779296875, -0.055095672607421875, -0.052703857421875, -0.050312042236328125, -0.04792022705078125, -0.045528411865234375, -0.0431365966796875, -0.040744781494140625, -0.03835296630859375, -0.035961151123046875, -0.0335693359375, -0.031177520751953125, -0.02878570556640625, -0.026393890380859375, -0.0240020751953125, -0.021610260009765625, -0.01921844482421875, -0.016826629638671875, -0.014434814453125, -0.012042999267578125, -0.00965118408203125, -0.007259368896484375, -0.0048675537109375, -0.002475738525390625, -8.392333984375e-05, 0.002307891845703125, 0.00469970703125, 0.007091522216796875, 0.00948333740234375, 0.011875152587890625, 0.0142669677734375, 0.016658782958984375, 0.01905059814453125, 0.021442413330078125, 0.023834228515625, 0.026226043701171875, 0.02861785888671875, 0.031009674072265625, 0.0334014892578125, 0.035793304443359375, 0.03818511962890625, 0.040576934814453125, 0.04296875, 0.045360565185546875, 0.04775238037109375, 0.050144195556640625, 0.0525360107421875, 0.054927825927734375, 0.05731964111328125, 0.059711456298828125, 0.062103271484375, 0.06449508666992188, 0.06688690185546875, 0.06927871704101562, 0.0716705322265625, 0.07406234741210938, 0.07645416259765625, 0.07884597778320312, 0.08123779296875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 6.0, 2.0, 8.0, 6.0, 8.0, 10.0, 13.0, 27.0, 22.0, 25.0, 41.0, 37.0, 30.0, 40.0, 46.0, 52.0, 46.0, 50.0, 40.0, 59.0, 57.0, 54.0, 49.0, 40.0, 36.0, 27.0, 35.0, 36.0, 20.0, 22.0, 17.0, 16.0, 14.0, 1.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034515380859375, -0.03345537185668945, -0.032395362854003906, -0.03133535385131836, -0.030275344848632812, -0.029215335845947266, -0.02815532684326172, -0.027095317840576172, -0.026035308837890625, -0.024975299835205078, -0.02391529083251953, -0.022855281829833984, -0.021795272827148438, -0.02073526382446289, -0.019675254821777344, -0.018615245819091797, -0.01755523681640625, -0.016495227813720703, -0.015435218811035156, -0.01437520980834961, -0.013315200805664062, -0.012255191802978516, -0.011195182800292969, -0.010135173797607422, -0.009075164794921875, -0.008015155792236328, -0.006955146789550781, -0.005895137786865234, -0.0048351287841796875, -0.0037751197814941406, -0.0027151107788085938, -0.0016551017761230469, -0.0005950927734375, 0.0004649162292480469, 0.0015249252319335938, 0.0025849342346191406, 0.0036449432373046875, 0.004704952239990234, 0.005764961242675781, 0.006824970245361328, 0.007884979248046875, 0.008944988250732422, 0.010004997253417969, 0.011065006256103516, 0.012125015258789062, 0.01318502426147461, 0.014245033264160156, 0.015305042266845703, 0.01636505126953125, 0.017425060272216797, 0.018485069274902344, 0.01954507827758789, 0.020605087280273438, 0.021665096282958984, 0.02272510528564453, 0.023785114288330078, 0.024845123291015625, 0.025905132293701172, 0.02696514129638672, 0.028025150299072266, 0.029085159301757812, 0.03014516830444336, 0.031205177307128906, 0.03226518630981445, 0.0333251953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 5.0, 7.0, 3.0, 6.0, 15.0, 15.0, 21.0, 28.0, 44.0, 51.0, 70.0, 113.0, 139.0, 225.0, 306.0, 506.0, 848.0, 1932.0, 5856.0, 29975.0, 215317.0, 607500.0, 154472.0, 22560.0, 4794.0, 1575.0, 729.0, 470.0, 310.0, 201.0, 115.0, 95.0, 59.0, 57.0, 28.0, 25.0, 24.0, 15.0, 10.0, 12.0, 8.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1280517578125, -0.12421989440917969, -0.12038803100585938, -0.11655616760253906, -0.11272430419921875, -0.10889244079589844, -0.10506057739257812, -0.10122871398925781, -0.0973968505859375, -0.09356498718261719, -0.08973312377929688, -0.08590126037597656, -0.08206939697265625, -0.07823753356933594, -0.07440567016601562, -0.07057380676269531, -0.066741943359375, -0.06291007995605469, -0.059078216552734375, -0.05524635314941406, -0.05141448974609375, -0.04758262634277344, -0.043750762939453125, -0.03991889953613281, -0.0360870361328125, -0.03225517272949219, -0.028423309326171875, -0.024591445922851562, -0.02075958251953125, -0.016927719116210938, -0.013095855712890625, -0.009263992309570312, -0.00543212890625, -0.0016002655029296875, 0.002231597900390625, 0.0060634613037109375, 0.00989532470703125, 0.013727188110351562, 0.017559051513671875, 0.021390914916992188, 0.0252227783203125, 0.029054641723632812, 0.032886505126953125, 0.03671836853027344, 0.04055023193359375, 0.04438209533691406, 0.048213958740234375, 0.05204582214355469, 0.055877685546875, 0.05970954895019531, 0.06354141235351562, 0.06737327575683594, 0.07120513916015625, 0.07503700256347656, 0.07886886596679688, 0.08270072937011719, 0.0865325927734375, 0.09036445617675781, 0.09419631958007812, 0.09802818298339844, 0.10186004638671875, 0.10569190979003906, 0.10952377319335938, 0.11335563659667969, 0.1171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 7.0, 7.0, 6.0, 15.0, 21.0, 18.0, 20.0, 19.0, 34.0, 33.0, 34.0, 44.0, 42.0, 45.0, 47.0, 63.0, 46.0, 47.0, 51.0, 57.0, 50.0, 39.0, 33.0, 36.0, 32.0, 31.0, 20.0, 25.0, 12.0, 17.0, 11.0, 11.0, 4.0, 3.0, 2.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1732177734375, -0.16808319091796875, -0.1629486083984375, -0.15781402587890625, -0.152679443359375, -0.14754486083984375, -0.1424102783203125, -0.13727569580078125, -0.13214111328125, -0.12700653076171875, -0.1218719482421875, -0.11673736572265625, -0.111602783203125, -0.10646820068359375, -0.1013336181640625, -0.09619903564453125, -0.091064453125, -0.08592987060546875, -0.0807952880859375, -0.07566070556640625, -0.070526123046875, -0.06539154052734375, -0.0602569580078125, -0.05512237548828125, -0.04998779296875, -0.04485321044921875, -0.0397186279296875, -0.03458404541015625, -0.029449462890625, -0.02431488037109375, -0.0191802978515625, -0.01404571533203125, -0.0089111328125, -0.00377655029296875, 0.0013580322265625, 0.00649261474609375, 0.011627197265625, 0.01676177978515625, 0.0218963623046875, 0.02703094482421875, 0.03216552734375, 0.03730010986328125, 0.0424346923828125, 0.04756927490234375, 0.052703857421875, 0.05783843994140625, 0.0629730224609375, 0.06810760498046875, 0.0732421875, 0.07837677001953125, 0.0835113525390625, 0.08864593505859375, 0.093780517578125, 0.09891510009765625, 0.1040496826171875, 0.10918426513671875, 0.11431884765625, 0.11945343017578125, 0.1245880126953125, 0.12972259521484375, 0.134857177734375, 0.13999176025390625, 0.1451263427734375, 0.15026092529296875, 0.1553955078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 6.0, 9.0, 6.0, 17.0, 17.0, 30.0, 56.0, 63.0, 113.0, 188.0, 389.0, 824.0, 1918.0, 5904.0, 24619.0, 150480.0, 549527.0, 259417.0, 41461.0, 8754.0, 2557.0, 1075.0, 508.0, 265.0, 140.0, 75.0, 30.0, 31.0, 23.0, 20.0, 5.0, 7.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0609130859375, -0.05885887145996094, -0.056804656982421875, -0.05475044250488281, -0.05269622802734375, -0.05064201354980469, -0.048587799072265625, -0.04653358459472656, -0.0444793701171875, -0.04242515563964844, -0.040370941162109375, -0.03831672668457031, -0.03626251220703125, -0.03420829772949219, -0.032154083251953125, -0.030099868774414062, -0.028045654296875, -0.025991439819335938, -0.023937225341796875, -0.021883010864257812, -0.01982879638671875, -0.017774581909179688, -0.015720367431640625, -0.013666152954101562, -0.0116119384765625, -0.009557723999023438, -0.007503509521484375, -0.0054492950439453125, -0.00339508056640625, -0.0013408660888671875, 0.000713348388671875, 0.0027675628662109375, 0.00482177734375, 0.0068759918212890625, 0.008930206298828125, 0.010984420776367188, 0.01303863525390625, 0.015092849731445312, 0.017147064208984375, 0.019201278686523438, 0.0212554931640625, 0.023309707641601562, 0.025363922119140625, 0.027418136596679688, 0.02947235107421875, 0.03152656555175781, 0.033580780029296875, 0.03563499450683594, 0.037689208984375, 0.03974342346191406, 0.041797637939453125, 0.04385185241699219, 0.04590606689453125, 0.04796028137207031, 0.050014495849609375, 0.05206871032714844, 0.0541229248046875, 0.05617713928222656, 0.058231353759765625, 0.06028556823730469, 0.06233978271484375, 0.06439399719238281, 0.06644821166992188, 0.06850242614746094, 0.070556640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 7.0, 10.0, 9.0, 12.0, 17.0, 13.0, 34.0, 23.0, 44.0, 47.0, 62.0, 75.0, 87.0, 80.0, 93.0, 67.0, 66.0, 60.0, 35.0, 30.0, 27.0, 17.0, 19.0, 11.0, 9.0, 9.0, 6.0, 3.0, 5.0, 8.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.186962127685547e-05, -6.013549864292145e-05, -5.840137600898743e-05, -5.6667253375053406e-05, -5.4933130741119385e-05, -5.3199008107185364e-05, -5.146488547325134e-05, -4.973076283931732e-05, -4.79966402053833e-05, -4.626251757144928e-05, -4.452839493751526e-05, -4.279427230358124e-05, -4.106014966964722e-05, -3.9326027035713196e-05, -3.7591904401779175e-05, -3.5857781767845154e-05, -3.412365913391113e-05, -3.238953649997711e-05, -3.065541386604309e-05, -2.892129123210907e-05, -2.718716859817505e-05, -2.5453045964241028e-05, -2.3718923330307007e-05, -2.1984800696372986e-05, -2.0250678062438965e-05, -1.8516555428504944e-05, -1.6782432794570923e-05, -1.5048310160636902e-05, -1.3314187526702881e-05, -1.158006489276886e-05, -9.845942258834839e-06, -8.111819624900818e-06, -6.377696990966797e-06, -4.643574357032776e-06, -2.909451723098755e-06, -1.1753290891647339e-06, 5.587935447692871e-07, 2.292916178703308e-06, 4.027038812637329e-06, 5.76116144657135e-06, 7.495284080505371e-06, 9.229406714439392e-06, 1.0963529348373413e-05, 1.2697651982307434e-05, 1.4431774616241455e-05, 1.6165897250175476e-05, 1.7900019884109497e-05, 1.9634142518043518e-05, 2.136826515197754e-05, 2.310238778591156e-05, 2.483651041984558e-05, 2.6570633053779602e-05, 2.8304755687713623e-05, 3.0038878321647644e-05, 3.1773000955581665e-05, 3.3507123589515686e-05, 3.524124622344971e-05, 3.697536885738373e-05, 3.870949149131775e-05, 4.044361412525177e-05, 4.217773675918579e-05, 4.391185939311981e-05, 4.564598202705383e-05, 4.7380104660987854e-05, 4.9114227294921875e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 7.0, 18.0, 13.0, 12.0, 21.0, 27.0, 41.0, 65.0, 97.0, 159.0, 211.0, 400.0, 808.0, 1590.0, 3727.0, 10863.0, 42091.0, 213196.0, 508950.0, 207777.0, 40950.0, 10511.0, 3598.0, 1572.0, 734.0, 420.0, 212.0, 144.0, 81.0, 67.0, 55.0, 35.0, 24.0, 17.0, 15.0, 11.0, 8.0, 4.0, 6.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.06378173828125, -0.06187725067138672, -0.05997276306152344, -0.058068275451660156, -0.056163787841796875, -0.054259300231933594, -0.05235481262207031, -0.05045032501220703, -0.04854583740234375, -0.04664134979248047, -0.04473686218261719, -0.042832374572753906, -0.040927886962890625, -0.039023399353027344, -0.03711891174316406, -0.03521442413330078, -0.0333099365234375, -0.03140544891357422, -0.029500961303710938, -0.027596473693847656, -0.025691986083984375, -0.023787498474121094, -0.021883010864257812, -0.01997852325439453, -0.01807403564453125, -0.01616954803466797, -0.014265060424804688, -0.012360572814941406, -0.010456085205078125, -0.008551597595214844, -0.0066471099853515625, -0.004742622375488281, -0.002838134765625, -0.0009336471557617188, 0.0009708404541015625, 0.0028753280639648438, 0.004779815673828125, 0.006684303283691406, 0.008588790893554688, 0.010493278503417969, 0.01239776611328125, 0.014302253723144531, 0.016206741333007812, 0.018111228942871094, 0.020015716552734375, 0.021920204162597656, 0.023824691772460938, 0.02572917938232422, 0.0276336669921875, 0.02953815460205078, 0.03144264221191406, 0.033347129821777344, 0.035251617431640625, 0.037156105041503906, 0.03906059265136719, 0.04096508026123047, 0.04286956787109375, 0.04477405548095703, 0.04667854309082031, 0.048583030700683594, 0.050487518310546875, 0.052392005920410156, 0.05429649353027344, 0.05620098114013672, 0.05810546875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 13.0, 11.0, 9.0, 10.0, 33.0, 43.0, 48.0, 57.0, 76.0, 81.0, 90.0, 86.0, 82.0, 69.0, 71.0, 44.0, 45.0, 35.0, 21.0, 28.0, 22.0, 7.0, 3.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07427978515625, -0.07223701477050781, -0.07019424438476562, -0.06815147399902344, -0.06610870361328125, -0.06406593322753906, -0.062023162841796875, -0.05998039245605469, -0.0579376220703125, -0.05589485168457031, -0.053852081298828125, -0.05180931091308594, -0.04976654052734375, -0.04772377014160156, -0.045680999755859375, -0.04363822937011719, -0.041595458984375, -0.03955268859863281, -0.037509918212890625, -0.03546714782714844, -0.03342437744140625, -0.03138160705566406, -0.029338836669921875, -0.027296066284179688, -0.0252532958984375, -0.023210525512695312, -0.021167755126953125, -0.019124984741210938, -0.01708221435546875, -0.015039443969726562, -0.012996673583984375, -0.010953903198242188, -0.0089111328125, -0.0068683624267578125, -0.004825592041015625, -0.0027828216552734375, -0.00074005126953125, 0.0013027191162109375, 0.003345489501953125, 0.0053882598876953125, 0.0074310302734375, 0.009473800659179688, 0.011516571044921875, 0.013559341430664062, 0.01560211181640625, 0.017644882202148438, 0.019687652587890625, 0.021730422973632812, 0.023773193359375, 0.025815963745117188, 0.027858734130859375, 0.029901504516601562, 0.03194427490234375, 0.03398704528808594, 0.036029815673828125, 0.03807258605957031, 0.0401153564453125, 0.04215812683105469, 0.044200897216796875, 0.04624366760253906, 0.04828643798828125, 0.05032920837402344, 0.052371978759765625, 0.05441474914550781, 0.05645751953125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 7.0, 7.0, 16.0, 53.0, 239.0, 368.0, 222.0, 68.0, 14.0, 8.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.0850982666015625, -3.0128817558288574, -2.9406652450561523, -2.8684487342834473, -2.796232223510742, -2.724015474319458, -2.651798963546753, -2.579582452774048, -2.5073659420013428, -2.4351494312286377, -2.3629329204559326, -2.2907164096832275, -2.2184996604919434, -2.1462831497192383, -2.074066638946533, -2.001850128173828, -1.929633617401123, -1.857417106628418, -1.785200595855713, -1.7129839658737183, -1.6407674551010132, -1.568550944328308, -1.4963343143463135, -1.4241178035736084, -1.3519012928009033, -1.2796847820281982, -1.2074682712554932, -1.1352516412734985, -1.0630351305007935, -0.9908186197280884, -0.9186020493507385, -0.8463854789733887, -0.7741690874099731, -0.7019525766372681, -0.6297360062599182, -0.5575194358825684, -0.4853029251098633, -0.4130863845348358, -0.34086984395980835, -0.2686532735824585, -0.19643676280975342, -0.12422022223472595, -0.052003681659698486, 0.02021285891532898, 0.09242939949035645, 0.1646459400653839, 0.23686248064041138, 0.30907905101776123, 0.3812955617904663, 0.4535121023654938, 0.5257286429405212, 0.5979452133178711, 0.6701617240905762, 0.7423782348632812, 0.8145948052406311, 0.886811375617981, 0.959027886390686, 1.0312443971633911, 1.1034610271453857, 1.1756775379180908, 1.247894048690796, 1.320110559463501, 1.392327070236206, 1.4645437002182007, 1.5367602109909058]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 9.0, 9.0, 13.0, 9.0, 19.0, 14.0, 19.0, 20.0, 22.0, 25.0, 26.0, 28.0, 40.0, 32.0, 40.0, 42.0, 44.0, 49.0, 40.0, 57.0, 35.0, 47.0, 51.0, 37.0, 25.0, 39.0, 38.0, 26.0, 23.0, 21.0, 18.0, 16.0, 18.0, 17.0, 11.0, 4.0, 4.0, 3.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7265070676803589, -0.7030975818634033, -0.6796880960464478, -0.6562786102294922, -0.6328690648078918, -0.6094595789909363, -0.5860500931739807, -0.5626406073570251, -0.5392311215400696, -0.515821635723114, -0.49241212010383606, -0.4690026342868805, -0.4455931484699249, -0.422183632850647, -0.3987741470336914, -0.37536466121673584, -0.3519551455974579, -0.3285456597805023, -0.30513614416122437, -0.2817266583442688, -0.25831717252731323, -0.23490767180919647, -0.2114981710910797, -0.18808868527412415, -0.16467918455600739, -0.14126968383789062, -0.11786019802093506, -0.0944506973028183, -0.07104120403528214, -0.04763171076774597, -0.02422221004962921, -0.000812724232673645, 0.022596776485443115, 0.04600626975297928, 0.06941576302051544, 0.0928252637386322, 0.11623475700616837, 0.13964425027370453, 0.1630537509918213, 0.18646323680877686, 0.20987273752689362, 0.23328223824501038, 0.25669172406196594, 0.2801012396812439, 0.30351072549819946, 0.32692021131515503, 0.3503296971321106, 0.37373918294906616, 0.3971486985683441, 0.4205581843852997, 0.44396770000457764, 0.4673771858215332, 0.49078667163848877, 0.5141961574554443, 0.5376056432723999, 0.5610151290893555, 0.5844246745109558, 0.6078341603279114, 0.6312436461448669, 0.6546531915664673, 0.6780626773834229, 0.7014721632003784, 0.724881649017334, 0.7482911348342896, 0.7717006206512451]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 10.0, 13.0, 24.0, 21.0, 40.0, 94.0, 110.0, 163.0, 301.0, 474.0, 916.0, 1807.0, 4407.0, 13956.0, 118274.0, 3985485.0, 51958.0, 9428.0, 3342.0, 1515.0, 777.0, 458.0, 266.0, 162.0, 86.0, 73.0, 38.0, 32.0, 19.0, 8.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11993408203125, -0.1159830093383789, -0.11203193664550781, -0.10808086395263672, -0.10412979125976562, -0.10017871856689453, -0.09622764587402344, -0.09227657318115234, -0.08832550048828125, -0.08437442779541016, -0.08042335510253906, -0.07647228240966797, -0.07252120971679688, -0.06857013702392578, -0.06461906433105469, -0.060667991638183594, -0.0567169189453125, -0.052765846252441406, -0.04881477355957031, -0.04486370086669922, -0.040912628173828125, -0.03696155548095703, -0.03301048278808594, -0.029059410095214844, -0.02510833740234375, -0.021157264709472656, -0.017206192016601562, -0.013255119323730469, -0.009304046630859375, -0.005352973937988281, -0.0014019012451171875, 0.0025491714477539062, 0.006500244140625, 0.010451316833496094, 0.014402389526367188, 0.01835346221923828, 0.022304534912109375, 0.02625560760498047, 0.030206680297851562, 0.034157752990722656, 0.03810882568359375, 0.042059898376464844, 0.04601097106933594, 0.04996204376220703, 0.053913116455078125, 0.05786418914794922, 0.06181526184082031, 0.0657663345336914, 0.0697174072265625, 0.0736684799194336, 0.07761955261230469, 0.08157062530517578, 0.08552169799804688, 0.08947277069091797, 0.09342384338378906, 0.09737491607666016, 0.10132598876953125, 0.10527706146240234, 0.10922813415527344, 0.11317920684814453, 0.11713027954101562, 0.12108135223388672, 0.1250324249267578, 0.1289834976196289, 0.1329345703125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 7.0, 4.0, 12.0, 11.0, 21.0, 19.0, 30.0, 28.0, 35.0, 32.0, 43.0, 46.0, 30.0, 55.0, 52.0, 47.0, 44.0, 61.0, 45.0, 53.0, 40.0, 37.0, 45.0, 32.0, 30.0, 28.0, 26.0, 13.0, 18.0, 16.0, 10.0, 8.0, 11.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03515625, -0.03396129608154297, -0.03276634216308594, -0.031571388244628906, -0.030376434326171875, -0.029181480407714844, -0.027986526489257812, -0.02679157257080078, -0.02559661865234375, -0.02440166473388672, -0.023206710815429688, -0.022011756896972656, -0.020816802978515625, -0.019621849060058594, -0.018426895141601562, -0.01723194122314453, -0.0160369873046875, -0.014842033386230469, -0.013647079467773438, -0.012452125549316406, -0.011257171630859375, -0.010062217712402344, -0.008867263793945312, -0.007672309875488281, -0.00647735595703125, -0.005282402038574219, -0.0040874481201171875, -0.0028924942016601562, -0.001697540283203125, -0.0005025863647460938, 0.0006923675537109375, 0.0018873214721679688, 0.003082275390625, 0.004277229309082031, 0.0054721832275390625, 0.006667137145996094, 0.007862091064453125, 0.009057044982910156, 0.010251998901367188, 0.011446952819824219, 0.01264190673828125, 0.013836860656738281, 0.015031814575195312, 0.016226768493652344, 0.017421722412109375, 0.018616676330566406, 0.019811630249023438, 0.02100658416748047, 0.0222015380859375, 0.02339649200439453, 0.024591445922851562, 0.025786399841308594, 0.026981353759765625, 0.028176307678222656, 0.029371261596679688, 0.03056621551513672, 0.03176116943359375, 0.03295612335205078, 0.03415107727050781, 0.035346031188964844, 0.036540985107421875, 0.037735939025878906, 0.03893089294433594, 0.04012584686279297, 0.04132080078125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 4.0, 6.0, 7.0, 18.0, 27.0, 24.0, 43.0, 83.0, 129.0, 189.0, 314.0, 462.0, 844.0, 1630.0, 3128.0, 6792.0, 17638.0, 64816.0, 2893388.0, 1114091.0, 60534.0, 16797.0, 6596.0, 3095.0, 1624.0, 800.0, 474.0, 270.0, 161.0, 119.0, 64.0, 47.0, 24.0, 15.0, 7.0, 3.0, 10.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.11334228515625, -0.11019229888916016, -0.10704231262207031, -0.10389232635498047, -0.10074234008789062, -0.09759235382080078, -0.09444236755371094, -0.0912923812866211, -0.08814239501953125, -0.0849924087524414, -0.08184242248535156, -0.07869243621826172, -0.07554244995117188, -0.07239246368408203, -0.06924247741699219, -0.06609249114990234, -0.0629425048828125, -0.059792518615722656, -0.05664253234863281, -0.05349254608154297, -0.050342559814453125, -0.04719257354736328, -0.04404258728027344, -0.040892601013183594, -0.03774261474609375, -0.034592628479003906, -0.03144264221191406, -0.02829265594482422, -0.025142669677734375, -0.02199268341064453, -0.018842697143554688, -0.015692710876464844, -0.012542724609375, -0.009392738342285156, -0.0062427520751953125, -0.0030927658081054688, 5.7220458984375e-05, 0.0032072067260742188, 0.0063571929931640625, 0.009507179260253906, 0.01265716552734375, 0.015807151794433594, 0.018957138061523438, 0.02210712432861328, 0.025257110595703125, 0.02840709686279297, 0.03155708312988281, 0.034707069396972656, 0.0378570556640625, 0.041007041931152344, 0.04415702819824219, 0.04730701446533203, 0.050457000732421875, 0.05360698699951172, 0.05675697326660156, 0.059906959533691406, 0.06305694580078125, 0.0662069320678711, 0.06935691833496094, 0.07250690460205078, 0.07565689086914062, 0.07880687713623047, 0.08195686340332031, 0.08510684967041016, 0.0882568359375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 6.0, 5.0, 8.0, 14.0, 32.0, 33.0, 69.0, 85.0, 210.0, 2430.0, 811.0, 163.0, 71.0, 47.0, 18.0, 14.0, 13.0, 9.0, 8.0, 8.0, 2.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03179931640625, -0.031022071838378906, -0.030244827270507812, -0.02946758270263672, -0.028690338134765625, -0.02791309356689453, -0.027135848999023438, -0.026358604431152344, -0.02558135986328125, -0.024804115295410156, -0.024026870727539062, -0.02324962615966797, -0.022472381591796875, -0.02169513702392578, -0.020917892456054688, -0.020140647888183594, -0.0193634033203125, -0.018586158752441406, -0.017808914184570312, -0.01703166961669922, -0.016254425048828125, -0.015477180480957031, -0.014699935913085938, -0.013922691345214844, -0.01314544677734375, -0.012368202209472656, -0.011590957641601562, -0.010813713073730469, -0.010036468505859375, -0.009259223937988281, -0.008481979370117188, -0.007704734802246094, -0.006927490234375, -0.006150245666503906, -0.0053730010986328125, -0.004595756530761719, -0.003818511962890625, -0.0030412673950195312, -0.0022640228271484375, -0.0014867782592773438, -0.00070953369140625, 6.771087646484375e-05, 0.0008449554443359375, 0.0016222000122070312, 0.002399444580078125, 0.0031766891479492188, 0.0039539337158203125, 0.004731178283691406, 0.0055084228515625, 0.006285667419433594, 0.0070629119873046875, 0.007840156555175781, 0.008617401123046875, 0.009394645690917969, 0.010171890258789062, 0.010949134826660156, 0.01172637939453125, 0.012503623962402344, 0.013280868530273438, 0.014058113098144531, 0.014835357666015625, 0.015612602233886719, 0.016389846801757812, 0.017167091369628906, 0.0179443359375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 6.0, 24.0, 134.0, 326.0, 355.0, 123.0, 24.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5581967830657959, -0.5466429591178894, -0.5350891947746277, -0.5235353708267212, -0.5119816064834595, -0.500427782535553, -0.48887398838996887, -0.47732019424438477, -0.46576637029647827, -0.45421257615089417, -0.44265878200531006, -0.43110495805740356, -0.41955116391181946, -0.40799736976623535, -0.39644357562065125, -0.38488978147506714, -0.37333595752716064, -0.36178216338157654, -0.35022836923599243, -0.33867454528808594, -0.32712075114250183, -0.3155669569969177, -0.3040131628513336, -0.2924593687057495, -0.2809055745601654, -0.2693517804145813, -0.2577979862689972, -0.2462441772222519, -0.2346903681755066, -0.22313657402992249, -0.21158277988433838, -0.20002897083759308, -0.18847517669200897, -0.17692138254642487, -0.16536757349967957, -0.15381377935409546, -0.14225997030735016, -0.13070617616176605, -0.11915237456560135, -0.10759857296943665, -0.09604477137327194, -0.08449096977710724, -0.07293716818094254, -0.06138337031006813, -0.04982956871390343, -0.038275767117738724, -0.02672196924686432, -0.015168167650699615, -0.003614366054534912, 0.007939434610307217, 0.019493235275149345, 0.0310470350086689, 0.0426008366048336, 0.054154638200998306, 0.06570843607187271, 0.07726223766803741, 0.08881603926420212, 0.10036984086036682, 0.11192364245653152, 0.12347744405269623, 0.13503123819828033, 0.14658504724502563, 0.15813884139060974, 0.16969263553619385, 0.18124644458293915]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 4.0, 3.0, 8.0, 11.0, 6.0, 12.0, 15.0, 21.0, 18.0, 20.0, 17.0, 30.0, 23.0, 31.0, 22.0, 45.0, 44.0, 34.0, 43.0, 34.0, 38.0, 37.0, 30.0, 48.0, 37.0, 27.0, 36.0, 35.0, 32.0, 40.0, 28.0, 41.0, 26.0, 29.0, 12.0, 16.0, 12.0, 9.0, 4.0, 4.0, 7.0, 5.0, 4.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06199377775192261, -0.059915244579315186, -0.057836711406707764, -0.05575817450881004, -0.05367964133620262, -0.0516011081635952, -0.04952257126569748, -0.04744403809309006, -0.045365504920482635, -0.043286971747875214, -0.04120843857526779, -0.03912990167737007, -0.03705136850476265, -0.03497283533215523, -0.03289429843425751, -0.030815765261650085, -0.028737232089042664, -0.02665869891643524, -0.02458016388118267, -0.0225016288459301, -0.020423095673322678, -0.018344562500715256, -0.016266027465462685, -0.014187493361532688, -0.012108959257602692, -0.010030425153672695, -0.007951891049742699, -0.005873356945812702, -0.0037948228418827057, -0.0017162887379527092, 0.0003622453659772873, 0.0024407794699072838, 0.00451931357383728, 0.006597847677767277, 0.008676381781697273, 0.01075491588562727, 0.012833449989557266, 0.014911984093487263, 0.01699051819741726, 0.01906905323266983, 0.021147586405277252, 0.023226119577884674, 0.025304654613137245, 0.027383189648389816, 0.029461722820997238, 0.03154025599360466, 0.03361879289150238, 0.0356973260641098, 0.037775859236717224, 0.039854392409324646, 0.04193292558193207, 0.04401146247982979, 0.04608999565243721, 0.04816852882504463, 0.05024706572294235, 0.052325598895549774, 0.054404132068157196, 0.05648266524076462, 0.05856119841337204, 0.06063973531126976, 0.06271827220916748, 0.0647968053817749, 0.06687533855438232, 0.06895387172698975, 0.07103240489959717]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 13.0, 11.0, 22.0, 39.0, 49.0, 93.0, 190.0, 276.0, 687.0, 1599.0, 4651.0, 14706.0, 51351.0, 181579.0, 389652.0, 278013.0, 88907.0, 24812.0, 7414.0, 2564.0, 962.0, 448.0, 209.0, 115.0, 72.0, 38.0, 20.0, 14.0, 14.0, 8.0, 7.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.063720703125, -0.06103324890136719, -0.058345794677734375, -0.05565834045410156, -0.05297088623046875, -0.05028343200683594, -0.047595977783203125, -0.04490852355957031, -0.0422210693359375, -0.03953361511230469, -0.036846160888671875, -0.03415870666503906, -0.03147125244140625, -0.028783798217773438, -0.026096343994140625, -0.023408889770507812, -0.020721435546875, -0.018033981323242188, -0.015346527099609375, -0.012659072875976562, -0.00997161865234375, -0.0072841644287109375, -0.004596710205078125, -0.0019092559814453125, 0.0007781982421875, 0.0034656524658203125, 0.006153106689453125, 0.008840560913085938, 0.01152801513671875, 0.014215469360351562, 0.016902923583984375, 0.019590377807617188, 0.02227783203125, 0.024965286254882812, 0.027652740478515625, 0.030340194702148438, 0.03302764892578125, 0.03571510314941406, 0.038402557373046875, 0.04109001159667969, 0.0437774658203125, 0.04646492004394531, 0.049152374267578125, 0.05183982849121094, 0.05452728271484375, 0.05721473693847656, 0.059902191162109375, 0.06258964538574219, 0.065277099609375, 0.06796455383300781, 0.07065200805664062, 0.07333946228027344, 0.07602691650390625, 0.07871437072753906, 0.08140182495117188, 0.08408927917480469, 0.0867767333984375, 0.08946418762207031, 0.09215164184570312, 0.09483909606933594, 0.09752655029296875, 0.10021400451660156, 0.10290145874023438, 0.10558891296386719, 0.1082763671875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 10.0, 9.0, 9.0, 12.0, 12.0, 10.0, 19.0, 25.0, 31.0, 28.0, 35.0, 38.0, 45.0, 49.0, 54.0, 36.0, 45.0, 47.0, 32.0, 46.0, 44.0, 49.0, 43.0, 44.0, 34.0, 24.0, 28.0, 23.0, 14.0, 19.0, 22.0, 14.0, 16.0, 7.0, 10.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.034210205078125, -0.03306007385253906, -0.031909942626953125, -0.030759811401367188, -0.02960968017578125, -0.028459548950195312, -0.027309417724609375, -0.026159286499023438, -0.0250091552734375, -0.023859024047851562, -0.022708892822265625, -0.021558761596679688, -0.02040863037109375, -0.019258499145507812, -0.018108367919921875, -0.016958236694335938, -0.01580810546875, -0.014657974243164062, -0.013507843017578125, -0.012357711791992188, -0.01120758056640625, -0.010057449340820312, -0.008907318115234375, -0.0077571868896484375, -0.0066070556640625, -0.0054569244384765625, -0.004306793212890625, -0.0031566619873046875, -0.00200653076171875, -0.0008563995361328125, 0.000293731689453125, 0.0014438629150390625, 0.002593994140625, 0.0037441253662109375, 0.004894256591796875, 0.0060443878173828125, 0.00719451904296875, 0.008344650268554688, 0.009494781494140625, 0.010644912719726562, 0.0117950439453125, 0.012945175170898438, 0.014095306396484375, 0.015245437622070312, 0.01639556884765625, 0.017545700073242188, 0.018695831298828125, 0.019845962524414062, 0.02099609375, 0.022146224975585938, 0.023296356201171875, 0.024446487426757812, 0.02559661865234375, 0.026746749877929688, 0.027896881103515625, 0.029047012329101562, 0.0301971435546875, 0.03134727478027344, 0.032497406005859375, 0.03364753723144531, 0.03479766845703125, 0.03594779968261719, 0.037097930908203125, 0.03824806213378906, 0.039398193359375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 8.0, 11.0, 14.0, 14.0, 38.0, 31.0, 48.0, 80.0, 119.0, 160.0, 208.0, 343.0, 540.0, 985.0, 2068.0, 6702.0, 36147.0, 253280.0, 588102.0, 131963.0, 19658.0, 4411.0, 1472.0, 707.0, 456.0, 275.0, 211.0, 135.0, 109.0, 70.0, 53.0, 36.0, 26.0, 20.0, 13.0, 5.0, 4.0, 8.0, 8.0, 3.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1026611328125, -0.09916114807128906, -0.09566116333007812, -0.09216117858886719, -0.08866119384765625, -0.08516120910644531, -0.08166122436523438, -0.07816123962402344, -0.0746612548828125, -0.07116127014160156, -0.06766128540039062, -0.06416130065917969, -0.06066131591796875, -0.05716133117675781, -0.053661346435546875, -0.05016136169433594, -0.046661376953125, -0.04316139221191406, -0.039661407470703125, -0.03616142272949219, -0.03266143798828125, -0.029161453247070312, -0.025661468505859375, -0.022161483764648438, -0.0186614990234375, -0.015161514282226562, -0.011661529541015625, -0.008161544799804688, -0.00466156005859375, -0.0011615753173828125, 0.002338409423828125, 0.0058383941650390625, 0.00933837890625, 0.012838363647460938, 0.016338348388671875, 0.019838333129882812, 0.02333831787109375, 0.026838302612304688, 0.030338287353515625, 0.03383827209472656, 0.0373382568359375, 0.04083824157714844, 0.044338226318359375, 0.04783821105957031, 0.05133819580078125, 0.05483818054199219, 0.058338165283203125, 0.06183815002441406, 0.065338134765625, 0.06883811950683594, 0.07233810424804688, 0.07583808898925781, 0.07933807373046875, 0.08283805847167969, 0.08633804321289062, 0.08983802795410156, 0.0933380126953125, 0.09683799743652344, 0.10033798217773438, 0.10383796691894531, 0.10733795166015625, 0.11083793640136719, 0.11433792114257812, 0.11783790588378906, 0.121337890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 10.0, 10.0, 17.0, 13.0, 22.0, 29.0, 29.0, 35.0, 35.0, 28.0, 42.0, 62.0, 34.0, 56.0, 49.0, 44.0, 44.0, 46.0, 63.0, 46.0, 34.0, 29.0, 33.0, 26.0, 34.0, 24.0, 22.0, 11.0, 15.0, 10.0, 5.0, 9.0, 3.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1785888671875, -0.17324066162109375, -0.1678924560546875, -0.16254425048828125, -0.157196044921875, -0.15184783935546875, -0.1464996337890625, -0.14115142822265625, -0.13580322265625, -0.13045501708984375, -0.1251068115234375, -0.11975860595703125, -0.114410400390625, -0.10906219482421875, -0.1037139892578125, -0.09836578369140625, -0.093017578125, -0.08766937255859375, -0.0823211669921875, -0.07697296142578125, -0.071624755859375, -0.06627655029296875, -0.0609283447265625, -0.05558013916015625, -0.05023193359375, -0.04488372802734375, -0.0395355224609375, -0.03418731689453125, -0.028839111328125, -0.02349090576171875, -0.0181427001953125, -0.01279449462890625, -0.0074462890625, -0.00209808349609375, 0.0032501220703125, 0.00859832763671875, 0.013946533203125, 0.01929473876953125, 0.0246429443359375, 0.02999114990234375, 0.03533935546875, 0.04068756103515625, 0.0460357666015625, 0.05138397216796875, 0.056732177734375, 0.06208038330078125, 0.0674285888671875, 0.07277679443359375, 0.078125, 0.08347320556640625, 0.0888214111328125, 0.09416961669921875, 0.099517822265625, 0.10486602783203125, 0.1102142333984375, 0.11556243896484375, 0.12091064453125, 0.12625885009765625, 0.1316070556640625, 0.13695526123046875, 0.142303466796875, 0.14765167236328125, 0.1529998779296875, 0.15834808349609375, 0.1636962890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 0.0, 11.0, 11.0, 18.0, 27.0, 36.0, 68.0, 106.0, 193.0, 396.0, 808.0, 1896.0, 6270.0, 30427.0, 219475.0, 618031.0, 141838.0, 21103.0, 4859.0, 1503.0, 687.0, 346.0, 165.0, 106.0, 70.0, 26.0, 20.0, 27.0, 12.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0694580078125, -0.06764888763427734, -0.06583976745605469, -0.06403064727783203, -0.062221527099609375, -0.06041240692138672, -0.05860328674316406, -0.056794166564941406, -0.05498504638671875, -0.053175926208496094, -0.05136680603027344, -0.04955768585205078, -0.047748565673828125, -0.04593944549560547, -0.04413032531738281, -0.042321205139160156, -0.0405120849609375, -0.038702964782714844, -0.03689384460449219, -0.03508472442626953, -0.033275604248046875, -0.03146648406982422, -0.029657363891601562, -0.027848243713378906, -0.02603912353515625, -0.024230003356933594, -0.022420883178710938, -0.02061176300048828, -0.018802642822265625, -0.01699352264404297, -0.015184402465820312, -0.013375282287597656, -0.011566162109375, -0.009757041931152344, -0.007947921752929688, -0.006138801574707031, -0.004329681396484375, -0.0025205612182617188, -0.0007114410400390625, 0.0010976791381835938, 0.00290679931640625, 0.004715919494628906, 0.0065250396728515625, 0.008334159851074219, 0.010143280029296875, 0.011952400207519531, 0.013761520385742188, 0.015570640563964844, 0.0173797607421875, 0.019188880920410156, 0.020998001098632812, 0.02280712127685547, 0.024616241455078125, 0.02642536163330078, 0.028234481811523438, 0.030043601989746094, 0.03185272216796875, 0.033661842346191406, 0.03547096252441406, 0.03728008270263672, 0.039089202880859375, 0.04089832305908203, 0.04270744323730469, 0.044516563415527344, 0.04632568359375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 2.0, 9.0, 6.0, 13.0, 12.0, 15.0, 16.0, 15.0, 31.0, 42.0, 61.0, 48.0, 86.0, 75.0, 103.0, 95.0, 94.0, 59.0, 54.0, 48.0, 33.0, 15.0, 17.0, 9.0, 9.0, 6.0, 11.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.439188003540039e-05, -3.293342888355255e-05, -3.147497773170471e-05, -3.0016526579856873e-05, -2.8558075428009033e-05, -2.7099624276161194e-05, -2.5641173124313354e-05, -2.4182721972465515e-05, -2.2724270820617676e-05, -2.1265819668769836e-05, -1.9807368516921997e-05, -1.8348917365074158e-05, -1.689046621322632e-05, -1.543201506137848e-05, -1.397356390953064e-05, -1.25151127576828e-05, -1.1056661605834961e-05, -9.598210453987122e-06, -8.139759302139282e-06, -6.681308150291443e-06, -5.2228569984436035e-06, -3.764405846595764e-06, -2.305954694747925e-06, -8.475035429000854e-07, 6.109476089477539e-07, 2.0693987607955933e-06, 3.5278499126434326e-06, 4.986301064491272e-06, 6.444752216339111e-06, 7.90320336818695e-06, 9.36165452003479e-06, 1.082010567188263e-05, 1.2278556823730469e-05, 1.3737007975578308e-05, 1.5195459127426147e-05, 1.6653910279273987e-05, 1.8112361431121826e-05, 1.9570812582969666e-05, 2.1029263734817505e-05, 2.2487714886665344e-05, 2.3946166038513184e-05, 2.5404617190361023e-05, 2.6863068342208862e-05, 2.83215194940567e-05, 2.977997064590454e-05, 3.123842179775238e-05, 3.269687294960022e-05, 3.415532410144806e-05, 3.56137752532959e-05, 3.707222640514374e-05, 3.853067755699158e-05, 3.9989128708839417e-05, 4.1447579860687256e-05, 4.2906031012535095e-05, 4.4364482164382935e-05, 4.5822933316230774e-05, 4.728138446807861e-05, 4.873983561992645e-05, 5.019828677177429e-05, 5.165673792362213e-05, 5.311518907546997e-05, 5.457364022731781e-05, 5.603209137916565e-05, 5.749054253101349e-05, 5.894899368286133e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 9.0, 5.0, 7.0, 9.0, 13.0, 18.0, 39.0, 44.0, 77.0, 134.0, 181.0, 352.0, 737.0, 1420.0, 3930.0, 15139.0, 89802.0, 505107.0, 360328.0, 55221.0, 10337.0, 3043.0, 1186.0, 610.0, 298.0, 183.0, 103.0, 74.0, 54.0, 22.0, 21.0, 14.0, 11.0, 9.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0645751953125, -0.0627751350402832, -0.060975074768066406, -0.05917501449584961, -0.05737495422363281, -0.055574893951416016, -0.05377483367919922, -0.05197477340698242, -0.050174713134765625, -0.04837465286254883, -0.04657459259033203, -0.044774532318115234, -0.04297447204589844, -0.04117441177368164, -0.039374351501464844, -0.03757429122924805, -0.03577423095703125, -0.03397417068481445, -0.032174110412597656, -0.03037405014038086, -0.028573989868164062, -0.026773929595947266, -0.02497386932373047, -0.023173809051513672, -0.021373748779296875, -0.019573688507080078, -0.01777362823486328, -0.015973567962646484, -0.014173507690429688, -0.01237344741821289, -0.010573387145996094, -0.008773326873779297, -0.0069732666015625, -0.005173206329345703, -0.0033731460571289062, -0.0015730857849121094, 0.0002269744873046875, 0.0020270347595214844, 0.0038270950317382812, 0.005627155303955078, 0.007427215576171875, 0.009227275848388672, 0.011027336120605469, 0.012827396392822266, 0.014627456665039062, 0.01642751693725586, 0.018227577209472656, 0.020027637481689453, 0.02182769775390625, 0.023627758026123047, 0.025427818298339844, 0.02722787857055664, 0.029027938842773438, 0.030827999114990234, 0.03262805938720703, 0.03442811965942383, 0.036228179931640625, 0.03802824020385742, 0.03982830047607422, 0.041628360748291016, 0.04342842102050781, 0.04522848129272461, 0.047028541564941406, 0.0488286018371582, 0.050628662109375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 4.0, 4.0, 6.0, 15.0, 17.0, 26.0, 33.0, 34.0, 53.0, 54.0, 55.0, 78.0, 65.0, 63.0, 72.0, 62.0, 52.0, 57.0, 55.0, 30.0, 36.0, 38.0, 18.0, 11.0, 14.0, 10.0, 5.0, 5.0, 7.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.045623779296875, -0.044152259826660156, -0.04268074035644531, -0.04120922088623047, -0.039737701416015625, -0.03826618194580078, -0.03679466247558594, -0.035323143005371094, -0.03385162353515625, -0.032380104064941406, -0.030908584594726562, -0.02943706512451172, -0.027965545654296875, -0.02649402618408203, -0.025022506713867188, -0.023550987243652344, -0.0220794677734375, -0.020607948303222656, -0.019136428833007812, -0.01766490936279297, -0.016193389892578125, -0.014721870422363281, -0.013250350952148438, -0.011778831481933594, -0.01030731201171875, -0.008835792541503906, -0.0073642730712890625, -0.005892753601074219, -0.004421234130859375, -0.0029497146606445312, -0.0014781951904296875, -6.67572021484375e-06, 0.00146484375, 0.0029363632202148438, 0.0044078826904296875, 0.005879402160644531, 0.007350921630859375, 0.008822441101074219, 0.010293960571289062, 0.011765480041503906, 0.01323699951171875, 0.014708518981933594, 0.016180038452148438, 0.01765155792236328, 0.019123077392578125, 0.02059459686279297, 0.022066116333007812, 0.023537635803222656, 0.0250091552734375, 0.026480674743652344, 0.027952194213867188, 0.02942371368408203, 0.030895233154296875, 0.03236675262451172, 0.03383827209472656, 0.035309791564941406, 0.03678131103515625, 0.038252830505371094, 0.03972434997558594, 0.04119586944580078, 0.042667388916015625, 0.04413890838623047, 0.04561042785644531, 0.047081947326660156, 0.048553466796875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 36.0, 244.0, 504.0, 198.0, 19.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.765563011169434, -5.6595306396484375, -5.553498268127441, -5.447465419769287, -5.341433048248291, -5.235400676727295, -5.129367828369141, -5.0233354568481445, -4.917303085327148, -4.811270713806152, -4.705238342285156, -4.599205493927002, -4.493173122406006, -4.38714075088501, -4.2811079025268555, -4.175075531005859, -4.069043159484863, -3.963010787963867, -3.856978178024292, -3.750945568084717, -3.6449131965637207, -3.5388808250427246, -3.4328482151031494, -3.326815605163574, -3.220783233642578, -3.114750862121582, -3.008718252182007, -2.9026856422424316, -2.7966532707214355, -2.6906208992004395, -2.5845882892608643, -2.478555679321289, -2.372523307800293, -2.266490936279297, -2.1604583263397217, -2.0544257164001465, -1.9483933448791504, -1.8423608541488647, -1.736328363418579, -1.6302958726882935, -1.5242633819580078, -1.4182308912277222, -1.3121984004974365, -1.2061659097671509, -1.1001334190368652, -0.9941009283065796, -0.888068437576294, -0.7820359468460083, -0.6760034561157227, -0.569970965385437, -0.46393847465515137, -0.3579059839248657, -0.2518734931945801, -0.14584100246429443, -0.03980851173400879, 0.06622397899627686, 0.1722564697265625, 0.27828896045684814, 0.3843214511871338, 0.49035394191741943, 0.5963864326477051, 0.7024189233779907, 0.8084514141082764, 0.914483904838562, 1.0205163955688477]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 7.0, 4.0, 9.0, 13.0, 20.0, 20.0, 17.0, 20.0, 24.0, 33.0, 31.0, 36.0, 36.0, 34.0, 50.0, 40.0, 61.0, 59.0, 49.0, 46.0, 55.0, 35.0, 49.0, 42.0, 31.0, 28.0, 30.0, 23.0, 15.0, 18.0, 14.0, 9.0, 9.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.8531871438026428, -0.8289320468902588, -0.80467689037323, -0.780421793460846, -0.7561666965484619, -0.7319115996360779, -0.7076565027236938, -0.683401346206665, -0.659146249294281, -0.634891152381897, -0.6106359958648682, -0.5863808989524841, -0.5621258020401001, -0.5378707051277161, -0.513615608215332, -0.4893604516983032, -0.4651053547859192, -0.44085025787353516, -0.41659513115882874, -0.3923400044441223, -0.3680849075317383, -0.34382981061935425, -0.3195746839046478, -0.2953195571899414, -0.2710644602775574, -0.24680934846401215, -0.22255423665046692, -0.1982991248369217, -0.17404401302337646, -0.14978890120983124, -0.125533789396286, -0.10127867758274078, -0.07702362537384033, -0.052768513560295105, -0.028513401746749878, -0.004258289933204651, 0.019996821880340576, 0.0442519336938858, 0.06850704550743103, 0.09276215732097626, 0.11701726913452148, 0.1412723809480667, 0.16552749276161194, 0.18978260457515717, 0.2140377163887024, 0.23829282820224762, 0.26254794001579285, 0.28680306673049927, 0.3110581636428833, 0.33531326055526733, 0.35956838726997375, 0.3838235139846802, 0.4080786108970642, 0.43233370780944824, 0.45658883452415466, 0.4808439612388611, 0.5050990581512451, 0.5293541550636292, 0.5536092519760132, 0.577864408493042, 0.602119505405426, 0.6263746023178101, 0.6506297588348389, 0.6748848557472229, 0.6991399526596069]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 7.0, 10.0, 8.0, 15.0, 28.0, 50.0, 74.0, 113.0, 204.0, 314.0, 544.0, 1071.0, 2449.0, 7327.0, 38236.0, 3967897.0, 153413.0, 15059.0, 4102.0, 1565.0, 712.0, 413.0, 225.0, 156.0, 113.0, 65.0, 38.0, 27.0, 12.0, 10.0, 5.0, 6.0, 6.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1702880859375, -0.16565322875976562, -0.16101837158203125, -0.15638351440429688, -0.1517486572265625, -0.14711380004882812, -0.14247894287109375, -0.13784408569335938, -0.133209228515625, -0.12857437133789062, -0.12393951416015625, -0.11930465698242188, -0.1146697998046875, -0.11003494262695312, -0.10540008544921875, -0.10076522827148438, -0.09613037109375, -0.09149551391601562, -0.08686065673828125, -0.08222579956054688, -0.0775909423828125, -0.07295608520507812, -0.06832122802734375, -0.06368637084960938, -0.059051513671875, -0.054416656494140625, -0.04978179931640625, -0.045146942138671875, -0.0405120849609375, -0.035877227783203125, -0.03124237060546875, -0.026607513427734375, -0.02197265625, -0.017337799072265625, -0.01270294189453125, -0.008068084716796875, -0.0034332275390625, 0.001201629638671875, 0.00583648681640625, 0.010471343994140625, 0.015106201171875, 0.019741058349609375, 0.02437591552734375, 0.029010772705078125, 0.0336456298828125, 0.038280487060546875, 0.04291534423828125, 0.047550201416015625, 0.05218505859375, 0.056819915771484375, 0.06145477294921875, 0.06608963012695312, 0.0707244873046875, 0.07535934448242188, 0.07999420166015625, 0.08462905883789062, 0.089263916015625, 0.09389877319335938, 0.09853363037109375, 0.10316848754882812, 0.1078033447265625, 0.11243820190429688, 0.11707305908203125, 0.12170791625976562, 0.1263427734375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 6.0, 5.0, 9.0, 12.0, 20.0, 22.0, 13.0, 31.0, 35.0, 28.0, 37.0, 54.0, 48.0, 49.0, 52.0, 47.0, 55.0, 44.0, 47.0, 53.0, 55.0, 43.0, 39.0, 39.0, 38.0, 22.0, 27.0, 19.0, 15.0, 8.0, 9.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04351806640625, -0.042212486267089844, -0.04090690612792969, -0.03960132598876953, -0.038295745849609375, -0.03699016571044922, -0.03568458557128906, -0.034379005432128906, -0.03307342529296875, -0.031767845153808594, -0.030462265014648438, -0.02915668487548828, -0.027851104736328125, -0.02654552459716797, -0.025239944458007812, -0.023934364318847656, -0.0226287841796875, -0.021323204040527344, -0.020017623901367188, -0.01871204376220703, -0.017406463623046875, -0.01610088348388672, -0.014795303344726562, -0.013489723205566406, -0.01218414306640625, -0.010878562927246094, -0.009572982788085938, -0.008267402648925781, -0.006961822509765625, -0.005656242370605469, -0.0043506622314453125, -0.0030450820922851562, -0.001739501953125, -0.00043392181396484375, 0.0008716583251953125, 0.0021772384643554688, 0.003482818603515625, 0.004788398742675781, 0.0060939788818359375, 0.007399559020996094, 0.00870513916015625, 0.010010719299316406, 0.011316299438476562, 0.012621879577636719, 0.013927459716796875, 0.015233039855957031, 0.016538619995117188, 0.017844200134277344, 0.0191497802734375, 0.020455360412597656, 0.021760940551757812, 0.02306652069091797, 0.024372100830078125, 0.02567768096923828, 0.026983261108398438, 0.028288841247558594, 0.02959442138671875, 0.030900001525878906, 0.03220558166503906, 0.03351116180419922, 0.034816741943359375, 0.03612232208251953, 0.03742790222167969, 0.038733482360839844, 0.0400390625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 10.0, 12.0, 18.0, 24.0, 43.0, 66.0, 68.0, 135.0, 211.0, 357.0, 543.0, 924.0, 1706.0, 3352.0, 7119.0, 16868.0, 57624.0, 653161.0, 3334053.0, 80090.0, 21146.0, 8183.0, 3876.0, 1983.0, 1108.0, 614.0, 346.0, 225.0, 135.0, 86.0, 57.0, 42.0, 28.0, 16.0, 9.0, 17.0, 6.0, 6.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.10687255859375, -0.10406780242919922, -0.10126304626464844, -0.09845829010009766, -0.09565353393554688, -0.0928487777709961, -0.09004402160644531, -0.08723926544189453, -0.08443450927734375, -0.08162975311279297, -0.07882499694824219, -0.0760202407836914, -0.07321548461914062, -0.07041072845458984, -0.06760597229003906, -0.06480121612548828, -0.0619964599609375, -0.05919170379638672, -0.05638694763183594, -0.053582191467285156, -0.050777435302734375, -0.047972679138183594, -0.04516792297363281, -0.04236316680908203, -0.03955841064453125, -0.03675365447998047, -0.03394889831542969, -0.031144142150878906, -0.028339385986328125, -0.025534629821777344, -0.022729873657226562, -0.01992511749267578, -0.017120361328125, -0.014315605163574219, -0.011510848999023438, -0.008706092834472656, -0.005901336669921875, -0.0030965805053710938, -0.0002918243408203125, 0.0025129318237304688, 0.00531768798828125, 0.008122444152832031, 0.010927200317382812, 0.013731956481933594, 0.016536712646484375, 0.019341468811035156, 0.022146224975585938, 0.02495098114013672, 0.0277557373046875, 0.03056049346923828, 0.03336524963378906, 0.036170005798339844, 0.038974761962890625, 0.041779518127441406, 0.04458427429199219, 0.04738903045654297, 0.05019378662109375, 0.05299854278564453, 0.05580329895019531, 0.058608055114746094, 0.061412811279296875, 0.06421756744384766, 0.06702232360839844, 0.06982707977294922, 0.0726318359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 0.0, 3.0, 5.0, 14.0, 8.0, 12.0, 23.0, 28.0, 38.0, 100.0, 264.0, 2530.0, 673.0, 176.0, 74.0, 42.0, 25.0, 19.0, 9.0, 4.0, 8.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0328369140625, -0.03192019462585449, -0.031003475189208984, -0.030086755752563477, -0.02917003631591797, -0.02825331687927246, -0.027336597442626953, -0.026419878005981445, -0.025503158569335938, -0.02458643913269043, -0.023669719696044922, -0.022753000259399414, -0.021836280822753906, -0.0209195613861084, -0.02000284194946289, -0.019086122512817383, -0.018169403076171875, -0.017252683639526367, -0.01633596420288086, -0.015419244766235352, -0.014502525329589844, -0.013585805892944336, -0.012669086456298828, -0.01175236701965332, -0.010835647583007812, -0.009918928146362305, -0.009002208709716797, -0.008085489273071289, -0.007168769836425781, -0.0062520503997802734, -0.005335330963134766, -0.004418611526489258, -0.00350189208984375, -0.002585172653198242, -0.0016684532165527344, -0.0007517337799072266, 0.00016498565673828125, 0.001081705093383789, 0.001998424530029297, 0.0029151439666748047, 0.0038318634033203125, 0.00474858283996582, 0.005665302276611328, 0.006582021713256836, 0.007498741149902344, 0.008415460586547852, 0.00933218002319336, 0.010248899459838867, 0.011165618896484375, 0.012082338333129883, 0.01299905776977539, 0.013915777206420898, 0.014832496643066406, 0.015749216079711914, 0.016665935516357422, 0.01758265495300293, 0.018499374389648438, 0.019416093826293945, 0.020332813262939453, 0.02124953269958496, 0.02216625213623047, 0.023082971572875977, 0.023999691009521484, 0.024916410446166992, 0.0258331298828125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 7.0, 16.0, 61.0, 163.0, 287.0, 256.0, 162.0, 32.0, 12.0, 6.0, 4.0, 2.0, 1.0], "bins": [-0.5583873987197876, -0.5484293699264526, -0.5384712815284729, -0.5285131931304932, -0.5185551643371582, -0.5085971355438232, -0.4986390471458435, -0.48868098855018616, -0.4787229299545288, -0.46876487135887146, -0.4588068127632141, -0.44884875416755676, -0.4388906955718994, -0.42893263697624207, -0.4189745783805847, -0.40901651978492737, -0.39905846118927, -0.38910040259361267, -0.3791423439979553, -0.369184285402298, -0.3592262268066406, -0.3492681682109833, -0.3393101096153259, -0.3293520510196686, -0.31939399242401123, -0.3094359338283539, -0.29947787523269653, -0.2895198166370392, -0.27956175804138184, -0.2696036994457245, -0.25964564085006714, -0.2496875822544098, -0.23972955346107483, -0.22977149486541748, -0.21981343626976013, -0.20985537767410278, -0.19989731907844543, -0.18993926048278809, -0.17998120188713074, -0.1700231432914734, -0.16006508469581604, -0.1501070261001587, -0.14014896750450134, -0.130190908908844, -0.12023285031318665, -0.1102747917175293, -0.10031673312187195, -0.0903586745262146, -0.08040060847997665, -0.0704425498843193, -0.06048449128866196, -0.05052643269300461, -0.04056837409734726, -0.03061031550168991, -0.020652256906032562, -0.010694198310375214, -0.000736139714717865, 0.009221918880939484, 0.019179977476596832, 0.02913803607225418, 0.03909609466791153, 0.04905415326356888, 0.05901221185922623, 0.06897027045488358, 0.07892832905054092]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 9.0, 12.0, 15.0, 22.0, 21.0, 23.0, 32.0, 35.0, 46.0, 37.0, 46.0, 53.0, 62.0, 53.0, 50.0, 46.0, 45.0, 45.0, 49.0, 37.0, 39.0, 34.0, 22.0, 33.0, 29.0, 19.0, 22.0, 20.0, 4.0, 6.0, 6.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08511948585510254, -0.08261630684137344, -0.08011312782764435, -0.07760994881391525, -0.07510676980018616, -0.07260359078645706, -0.07010041177272797, -0.06759723275899887, -0.06509405374526978, -0.06259087473154068, -0.060087695717811584, -0.05758451670408249, -0.055081337690353394, -0.0525781586766243, -0.0500749796628952, -0.04757180064916611, -0.04506862163543701, -0.042565442621707916, -0.04006226360797882, -0.037559084594249725, -0.03505590558052063, -0.032552726566791534, -0.03004954755306244, -0.027546368539333344, -0.025043189525604248, -0.022540010511875153, -0.020036831498146057, -0.01753365248441696, -0.015030473470687866, -0.01252729445695877, -0.010024115443229675, -0.00752093642950058, -0.005017757415771484, -0.002514578402042389, -1.1399388313293457e-05, 0.002491779625415802, 0.0049949586391448975, 0.007498137652873993, 0.010001316666603088, 0.012504495680332184, 0.01500767469406128, 0.017510853707790375, 0.02001403272151947, 0.022517211735248566, 0.02502039074897766, 0.027523569762706757, 0.030026748776435852, 0.03252992779016495, 0.03503310680389404, 0.03753628581762314, 0.040039464831352234, 0.04254264384508133, 0.045045822858810425, 0.04754900187253952, 0.050052180886268616, 0.05255535989999771, 0.05505853891372681, 0.0575617179274559, 0.060064896941185, 0.06256807595491409, 0.06507125496864319, 0.06757443398237228, 0.07007761299610138, 0.07258079200983047, 0.07508397102355957]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 9.0, 8.0, 20.0, 13.0, 28.0, 50.0, 68.0, 105.0, 184.0, 301.0, 555.0, 898.0, 1812.0, 3544.0, 7215.0, 16016.0, 38332.0, 92363.0, 195771.0, 277121.0, 220339.0, 111004.0, 46370.0, 19322.0, 8394.0, 4049.0, 2030.0, 1074.0, 604.0, 363.0, 206.0, 133.0, 81.0, 54.0, 44.0, 29.0, 11.0, 7.0, 8.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05047607421875, -0.048879146575927734, -0.04728221893310547, -0.0456852912902832, -0.04408836364746094, -0.04249143600463867, -0.040894508361816406, -0.03929758071899414, -0.037700653076171875, -0.03610372543334961, -0.034506797790527344, -0.03290987014770508, -0.03131294250488281, -0.029716014862060547, -0.02811908721923828, -0.026522159576416016, -0.02492523193359375, -0.023328304290771484, -0.02173137664794922, -0.020134449005126953, -0.018537521362304688, -0.016940593719482422, -0.015343666076660156, -0.01374673843383789, -0.012149810791015625, -0.01055288314819336, -0.008955955505371094, -0.007359027862548828, -0.0057621002197265625, -0.004165172576904297, -0.0025682449340820312, -0.0009713172912597656, 0.0006256103515625, 0.0022225379943847656, 0.0038194656372070312, 0.005416393280029297, 0.0070133209228515625, 0.008610248565673828, 0.010207176208496094, 0.01180410385131836, 0.013401031494140625, 0.01499795913696289, 0.016594886779785156, 0.018191814422607422, 0.019788742065429688, 0.021385669708251953, 0.02298259735107422, 0.024579524993896484, 0.02617645263671875, 0.027773380279541016, 0.02937030792236328, 0.030967235565185547, 0.03256416320800781, 0.03416109085083008, 0.035758018493652344, 0.03735494613647461, 0.038951873779296875, 0.04054880142211914, 0.042145729064941406, 0.04374265670776367, 0.04533958435058594, 0.0469365119934082, 0.04853343963623047, 0.050130367279052734, 0.051727294921875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 9.0, 5.0, 14.0, 13.0, 15.0, 18.0, 23.0, 29.0, 28.0, 46.0, 44.0, 41.0, 50.0, 48.0, 54.0, 45.0, 51.0, 63.0, 49.0, 46.0, 46.0, 42.0, 38.0, 32.0, 29.0, 30.0, 26.0, 17.0, 14.0, 11.0, 4.0, 11.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045013427734375, -0.04360628128051758, -0.042199134826660156, -0.040791988372802734, -0.03938484191894531, -0.03797769546508789, -0.03657054901123047, -0.03516340255737305, -0.033756256103515625, -0.0323491096496582, -0.03094196319580078, -0.02953481674194336, -0.028127670288085938, -0.026720523834228516, -0.025313377380371094, -0.023906230926513672, -0.02249908447265625, -0.021091938018798828, -0.019684791564941406, -0.018277645111083984, -0.016870498657226562, -0.01546335220336914, -0.014056205749511719, -0.012649059295654297, -0.011241912841796875, -0.009834766387939453, -0.008427619934082031, -0.007020473480224609, -0.0056133270263671875, -0.004206180572509766, -0.0027990341186523438, -0.0013918876647949219, 1.52587890625e-05, 0.0014224052429199219, 0.0028295516967773438, 0.004236698150634766, 0.0056438446044921875, 0.007050991058349609, 0.008458137512207031, 0.009865283966064453, 0.011272430419921875, 0.012679576873779297, 0.014086723327636719, 0.01549386978149414, 0.016901016235351562, 0.018308162689208984, 0.019715309143066406, 0.021122455596923828, 0.02252960205078125, 0.023936748504638672, 0.025343894958496094, 0.026751041412353516, 0.028158187866210938, 0.02956533432006836, 0.03097248077392578, 0.0323796272277832, 0.033786773681640625, 0.03519392013549805, 0.03660106658935547, 0.03800821304321289, 0.03941535949707031, 0.040822505950927734, 0.042229652404785156, 0.04363679885864258, 0.0450439453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 6.0, 11.0, 8.0, 13.0, 19.0, 36.0, 61.0, 87.0, 166.0, 269.0, 563.0, 1460.0, 6129.0, 96138.0, 866155.0, 69543.0, 5307.0, 1307.0, 551.0, 272.0, 179.0, 101.0, 74.0, 35.0, 33.0, 17.0, 10.0, 3.0, 8.0, 3.0], "bins": [-0.294189453125, -0.2881183624267578, -0.2820472717285156, -0.27597618103027344, -0.26990509033203125, -0.26383399963378906, -0.2577629089355469, -0.2516918182373047, -0.2456207275390625, -0.2395496368408203, -0.23347854614257812, -0.22740745544433594, -0.22133636474609375, -0.21526527404785156, -0.20919418334960938, -0.2031230926513672, -0.197052001953125, -0.1909809112548828, -0.18490982055664062, -0.17883872985839844, -0.17276763916015625, -0.16669654846191406, -0.16062545776367188, -0.1545543670654297, -0.1484832763671875, -0.1424121856689453, -0.13634109497070312, -0.13027000427246094, -0.12419891357421875, -0.11812782287597656, -0.11205673217773438, -0.10598564147949219, -0.09991455078125, -0.09384346008300781, -0.08777236938476562, -0.08170127868652344, -0.07563018798828125, -0.06955909729003906, -0.06348800659179688, -0.05741691589355469, -0.0513458251953125, -0.04527473449707031, -0.039203643798828125, -0.03313255310058594, -0.02706146240234375, -0.020990371704101562, -0.014919281005859375, -0.008848190307617188, -0.002777099609375, 0.0032939910888671875, 0.009365081787109375, 0.015436172485351562, 0.02150726318359375, 0.027578353881835938, 0.033649444580078125, 0.03972053527832031, 0.0457916259765625, 0.05186271667480469, 0.057933807373046875, 0.06400489807128906, 0.07007598876953125, 0.07614707946777344, 0.08221817016601562, 0.08828926086425781, 0.0943603515625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 7.0, 1.0, 7.0, 3.0, 5.0, 14.0, 6.0, 10.0, 8.0, 5.0, 20.0, 17.0, 18.0, 18.0, 22.0, 24.0, 30.0, 33.0, 29.0, 36.0, 38.0, 40.0, 46.0, 35.0, 46.0, 42.0, 51.0, 53.0, 31.0, 33.0, 38.0, 38.0, 27.0, 34.0, 25.0, 19.0, 14.0, 16.0, 13.0, 11.0, 8.0, 9.0, 8.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.171142578125, -0.16641807556152344, -0.16169357299804688, -0.1569690704345703, -0.15224456787109375, -0.1475200653076172, -0.14279556274414062, -0.13807106018066406, -0.1333465576171875, -0.12862205505371094, -0.12389755249023438, -0.11917304992675781, -0.11444854736328125, -0.10972404479980469, -0.10499954223632812, -0.10027503967285156, -0.095550537109375, -0.09082603454589844, -0.08610153198242188, -0.08137702941894531, -0.07665252685546875, -0.07192802429199219, -0.06720352172851562, -0.06247901916503906, -0.0577545166015625, -0.05303001403808594, -0.048305511474609375, -0.04358100891113281, -0.03885650634765625, -0.03413200378417969, -0.029407501220703125, -0.024682998657226562, -0.01995849609375, -0.015233993530273438, -0.010509490966796875, -0.0057849884033203125, -0.00106048583984375, 0.0036640167236328125, 0.008388519287109375, 0.013113021850585938, 0.0178375244140625, 0.022562026977539062, 0.027286529541015625, 0.03201103210449219, 0.03673553466796875, 0.04146003723144531, 0.046184539794921875, 0.05090904235839844, 0.055633544921875, 0.06035804748535156, 0.06508255004882812, 0.06980705261230469, 0.07453155517578125, 0.07925605773925781, 0.08398056030273438, 0.08870506286621094, 0.0934295654296875, 0.09815406799316406, 0.10287857055664062, 0.10760307312011719, 0.11232757568359375, 0.11705207824707031, 0.12177658081054688, 0.12650108337402344, 0.1312255859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 5.0, 6.0, 8.0, 17.0, 22.0, 42.0, 112.0, 349.0, 1806.0, 47899.0, 981832.0, 14918.0, 1137.0, 223.0, 86.0, 37.0, 19.0, 13.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.262451171875, -0.25640010833740234, -0.2503490447998047, -0.24429798126220703, -0.23824691772460938, -0.23219585418701172, -0.22614479064941406, -0.2200937271118164, -0.21404266357421875, -0.2079916000366211, -0.20194053649902344, -0.19588947296142578, -0.18983840942382812, -0.18378734588623047, -0.1777362823486328, -0.17168521881103516, -0.1656341552734375, -0.15958309173583984, -0.1535320281982422, -0.14748096466064453, -0.14142990112304688, -0.13537883758544922, -0.12932777404785156, -0.1232767105102539, -0.11722564697265625, -0.1111745834350586, -0.10512351989746094, -0.09907245635986328, -0.09302139282226562, -0.08697032928466797, -0.08091926574707031, -0.07486820220947266, -0.068817138671875, -0.06276607513427734, -0.05671501159667969, -0.05066394805908203, -0.044612884521484375, -0.03856182098388672, -0.03251075744628906, -0.026459693908691406, -0.02040863037109375, -0.014357566833496094, -0.008306503295898438, -0.0022554397583007812, 0.003795623779296875, 0.009846687316894531, 0.015897750854492188, 0.021948814392089844, 0.0279998779296875, 0.034050941467285156, 0.04010200500488281, 0.04615306854248047, 0.052204132080078125, 0.05825519561767578, 0.06430625915527344, 0.0703573226928711, 0.07640838623046875, 0.0824594497680664, 0.08851051330566406, 0.09456157684326172, 0.10061264038085938, 0.10666370391845703, 0.11271476745605469, 0.11876583099365234, 0.12481689453125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 7.0, 8.0, 9.0, 11.0, 12.0, 16.0, 19.0, 32.0, 60.0, 57.0, 76.0, 47.0, 91.0, 83.0, 95.0, 84.0, 66.0, 48.0, 43.0, 40.0, 31.0, 22.0, 13.0, 12.0, 7.0, 0.0, 8.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.553794860839844e-05, -4.435330629348755e-05, -4.316866397857666e-05, -4.198402166366577e-05, -4.079937934875488e-05, -3.9614737033843994e-05, -3.8430094718933105e-05, -3.724545240402222e-05, -3.606081008911133e-05, -3.487616777420044e-05, -3.369152545928955e-05, -3.250688314437866e-05, -3.1322240829467773e-05, -3.0137598514556885e-05, -2.8952956199645996e-05, -2.7768313884735107e-05, -2.658367156982422e-05, -2.539902925491333e-05, -2.421438694000244e-05, -2.3029744625091553e-05, -2.1845102310180664e-05, -2.0660459995269775e-05, -1.9475817680358887e-05, -1.8291175365447998e-05, -1.710653305053711e-05, -1.592189073562622e-05, -1.4737248420715332e-05, -1.3552606105804443e-05, -1.2367963790893555e-05, -1.1183321475982666e-05, -9.998679161071777e-06, -8.814036846160889e-06, -7.62939453125e-06, -6.444752216339111e-06, -5.260109901428223e-06, -4.075467586517334e-06, -2.8908252716064453e-06, -1.7061829566955566e-06, -5.21540641784668e-07, 6.631016731262207e-07, 1.8477439880371094e-06, 3.032386302947998e-06, 4.217028617858887e-06, 5.401670932769775e-06, 6.586313247680664e-06, 7.770955562591553e-06, 8.955597877502441e-06, 1.014024019241333e-05, 1.1324882507324219e-05, 1.2509524822235107e-05, 1.3694167137145996e-05, 1.4878809452056885e-05, 1.6063451766967773e-05, 1.7248094081878662e-05, 1.843273639678955e-05, 1.961737871170044e-05, 2.0802021026611328e-05, 2.1986663341522217e-05, 2.3171305656433105e-05, 2.4355947971343994e-05, 2.5540590286254883e-05, 2.672523260116577e-05, 2.790987491607666e-05, 2.909451723098755e-05, 3.0279159545898438e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 12.0, 19.0, 39.0, 93.0, 197.0, 808.0, 7033.0, 921083.0, 116250.0, 2288.0, 469.0, 144.0, 64.0, 26.0, 21.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1727294921875, -0.16576194763183594, -0.15879440307617188, -0.1518268585205078, -0.14485931396484375, -0.1378917694091797, -0.13092422485351562, -0.12395668029785156, -0.1169891357421875, -0.11002159118652344, -0.10305404663085938, -0.09608650207519531, -0.08911895751953125, -0.08215141296386719, -0.07518386840820312, -0.06821632385253906, -0.061248779296875, -0.05428123474121094, -0.047313690185546875, -0.04034614562988281, -0.03337860107421875, -0.026411056518554688, -0.019443511962890625, -0.012475967407226562, -0.0055084228515625, 0.0014591217041015625, 0.008426666259765625, 0.015394210815429688, 0.02236175537109375, 0.029329299926757812, 0.036296844482421875, 0.04326438903808594, 0.05023193359375, 0.05719947814941406, 0.06416702270507812, 0.07113456726074219, 0.07810211181640625, 0.08506965637207031, 0.09203720092773438, 0.09900474548339844, 0.1059722900390625, 0.11293983459472656, 0.11990737915039062, 0.1268749237060547, 0.13384246826171875, 0.1408100128173828, 0.14777755737304688, 0.15474510192871094, 0.161712646484375, 0.16868019104003906, 0.17564773559570312, 0.1826152801513672, 0.18958282470703125, 0.1965503692626953, 0.20351791381835938, 0.21048545837402344, 0.2174530029296875, 0.22442054748535156, 0.23138809204101562, 0.2383556365966797, 0.24532318115234375, 0.2522907257080078, 0.2592582702636719, 0.26622581481933594, 0.273193359375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 19.0, 40.0, 126.0, 313.0, 271.0, 145.0, 62.0, 25.0, 6.0, 4.0, 0.0, 1.0], "bins": [-0.374755859375, -0.3680744171142578, -0.3613929748535156, -0.35471153259277344, -0.34803009033203125, -0.34134864807128906, -0.3346672058105469, -0.3279857635498047, -0.3213043212890625, -0.3146228790283203, -0.3079414367675781, -0.30125999450683594, -0.29457855224609375, -0.28789710998535156, -0.2812156677246094, -0.2745342254638672, -0.267852783203125, -0.2611713409423828, -0.2544898986816406, -0.24780845642089844, -0.24112701416015625, -0.23444557189941406, -0.22776412963867188, -0.2210826873779297, -0.2144012451171875, -0.2077198028564453, -0.20103836059570312, -0.19435691833496094, -0.18767547607421875, -0.18099403381347656, -0.17431259155273438, -0.1676311492919922, -0.16094970703125, -0.1542682647705078, -0.14758682250976562, -0.14090538024902344, -0.13422393798828125, -0.12754249572753906, -0.12086105346679688, -0.11417961120605469, -0.1074981689453125, -0.10081672668457031, -0.09413528442382812, -0.08745384216308594, -0.08077239990234375, -0.07409095764160156, -0.06740951538085938, -0.06072807312011719, -0.054046630859375, -0.04736518859863281, -0.040683746337890625, -0.03400230407714844, -0.02732086181640625, -0.020639419555664062, -0.013957977294921875, -0.0072765350341796875, -0.0005950927734375, 0.0060863494873046875, 0.012767791748046875, 0.019449234008789062, 0.02613067626953125, 0.03281211853027344, 0.039493560791015625, 0.04617500305175781, 0.0528564453125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 11.0, 34.0, 79.0, 172.0, 201.0, 224.0, 148.0, 61.0, 29.0, 17.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3085153102874756, -1.2630460262298584, -1.2175768613815308, -1.1721075773239136, -1.1266382932662964, -1.0811691284179688, -1.0356998443603516, -0.9902305603027344, -0.944761335849762, -0.8992921113967896, -0.8538228273391724, -0.8083536028862, -0.7628843784332275, -0.7174150943756104, -0.6719458699226379, -0.6264766454696655, -0.5810073614120483, -0.5355381369590759, -0.49006885290145874, -0.44459962844848633, -0.39913037419319153, -0.35366111993789673, -0.3081918954849243, -0.2627226412296295, -0.21725338697433472, -0.17178413271903992, -0.1263148933649063, -0.0808456540107727, -0.035376399755477905, 0.010092854499816895, 0.05556207895278931, 0.1010313332080841, 0.1465005874633789, 0.1919698417186737, 0.2374390810728073, 0.2829083204269409, 0.3283775746822357, 0.3738468289375305, 0.41931605339050293, 0.46478530764579773, 0.5102545619010925, 0.5557237863540649, 0.6011930704116821, 0.6466622948646545, 0.692131519317627, 0.7376008033752441, 0.7830700278282166, 0.828539252281189, 0.8740085363388062, 0.9194777607917786, 0.9649470448493958, 1.0104162693023682, 1.0558855533599854, 1.1013548374176025, 1.1468240022659302, 1.1922932863235474, 1.237762451171875, 1.2832317352294922, 1.3287009000778198, 1.374170184135437, 1.4196394681930542, 1.4651086330413818, 1.510577917098999, 1.5560472011566162, 1.6015164852142334]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 0.0, 4.0, 2.0, 2.0, 4.0, 8.0, 7.0, 10.0, 5.0, 11.0, 18.0, 19.0, 10.0, 28.0, 25.0, 26.0, 40.0, 37.0, 37.0, 46.0, 32.0, 35.0, 40.0, 49.0, 50.0, 36.0, 46.0, 45.0, 45.0, 36.0, 22.0, 29.0, 30.0, 23.0, 27.0, 16.0, 29.0, 16.0, 11.0, 12.0, 9.0, 10.0, 3.0, 3.0, 1.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6497471332550049, -0.6263760328292847, -0.6030049324035645, -0.5796338319778442, -0.556262731552124, -0.5328916311264038, -0.5095205307006836, -0.48614946007728577, -0.46277835965156555, -0.43940725922584534, -0.4160361588001251, -0.3926650881767273, -0.3692939877510071, -0.34592288732528687, -0.32255178689956665, -0.29918068647384644, -0.2758095860481262, -0.252438485622406, -0.2290673851966858, -0.20569629967212677, -0.18232519924640656, -0.15895409882068634, -0.13558301329612732, -0.1122119128704071, -0.08884081244468689, -0.06546971201896667, -0.04209861904382706, -0.01872752606868744, 0.004643574357032776, 0.02801467478275299, 0.05138576030731201, 0.07475686073303223, 0.09812802076339722, 0.12149912118911743, 0.14487022161483765, 0.16824130713939667, 0.19161240756511688, 0.2149835079908371, 0.23835459351539612, 0.26172569394111633, 0.28509679436683655, 0.30846789479255676, 0.331838995218277, 0.3552100658416748, 0.378581166267395, 0.40195226669311523, 0.42532336711883545, 0.44869446754455566, 0.4720655679702759, 0.4954366683959961, 0.5188077688217163, 0.5421788692474365, 0.5655499696731567, 0.588921070098877, 0.6122921705245972, 0.6356632709503174, 0.6590343713760376, 0.6824054718017578, 0.705776572227478, 0.7291476726531982, 0.7525187730789185, 0.7758898735046387, 0.7992609739303589, 0.8226320743560791, 0.8460031151771545]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 8.0, 7.0, 12.0, 26.0, 23.0, 30.0, 50.0, 60.0, 78.0, 118.0, 177.0, 248.0, 453.0, 784.0, 1535.0, 3341.0, 9422.0, 48346.0, 4004058.0, 103423.0, 13314.0, 4313.0, 1969.0, 997.0, 480.0, 325.0, 216.0, 117.0, 88.0, 70.0, 52.0, 37.0, 23.0, 24.0, 10.0, 12.0, 4.0, 5.0, 4.0, 3.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10223388671875, -0.09853458404541016, -0.09483528137207031, -0.09113597869873047, -0.08743667602539062, -0.08373737335205078, -0.08003807067871094, -0.0763387680053711, -0.07263946533203125, -0.0689401626586914, -0.06524085998535156, -0.06154155731201172, -0.057842254638671875, -0.05414295196533203, -0.05044364929199219, -0.046744346618652344, -0.0430450439453125, -0.039345741271972656, -0.03564643859863281, -0.03194713592529297, -0.028247833251953125, -0.02454853057861328, -0.020849227905273438, -0.017149925231933594, -0.01345062255859375, -0.009751319885253906, -0.0060520172119140625, -0.0023527145385742188, 0.001346588134765625, 0.005045890808105469, 0.008745193481445312, 0.012444496154785156, 0.016143798828125, 0.019843101501464844, 0.023542404174804688, 0.02724170684814453, 0.030941009521484375, 0.03464031219482422, 0.03833961486816406, 0.042038917541503906, 0.04573822021484375, 0.049437522888183594, 0.05313682556152344, 0.05683612823486328, 0.060535430908203125, 0.06423473358154297, 0.06793403625488281, 0.07163333892822266, 0.0753326416015625, 0.07903194427490234, 0.08273124694824219, 0.08643054962158203, 0.09012985229492188, 0.09382915496826172, 0.09752845764160156, 0.1012277603149414, 0.10492706298828125, 0.1086263656616211, 0.11232566833496094, 0.11602497100830078, 0.11972427368164062, 0.12342357635498047, 0.1271228790283203, 0.13082218170166016, 0.134521484375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 8.0, 12.0, 8.0, 13.0, 20.0, 29.0, 12.0, 30.0, 27.0, 34.0, 38.0, 45.0, 47.0, 40.0, 37.0, 42.0, 35.0, 37.0, 38.0, 40.0, 39.0, 37.0, 38.0, 30.0, 25.0, 34.0, 26.0, 20.0, 23.0, 17.0, 18.0, 16.0, 18.0, 8.0, 9.0, 6.0, 4.0, 6.0, 5.0, 4.0, 2.0, 2.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.034332275390625, -0.033249855041503906, -0.03216743469238281, -0.03108501434326172, -0.030002593994140625, -0.02892017364501953, -0.027837753295898438, -0.026755332946777344, -0.02567291259765625, -0.024590492248535156, -0.023508071899414062, -0.02242565155029297, -0.021343231201171875, -0.02026081085205078, -0.019178390502929688, -0.018095970153808594, -0.0170135498046875, -0.015931129455566406, -0.014848709106445312, -0.013766288757324219, -0.012683868408203125, -0.011601448059082031, -0.010519027709960938, -0.009436607360839844, -0.00835418701171875, -0.007271766662597656, -0.0061893463134765625, -0.005106925964355469, -0.004024505615234375, -0.0029420852661132812, -0.0018596649169921875, -0.0007772445678710938, 0.00030517578125, 0.0013875961303710938, 0.0024700164794921875, 0.0035524368286132812, 0.004634857177734375, 0.005717277526855469, 0.0067996978759765625, 0.007882118225097656, 0.00896453857421875, 0.010046958923339844, 0.011129379272460938, 0.012211799621582031, 0.013294219970703125, 0.014376640319824219, 0.015459060668945312, 0.016541481018066406, 0.0176239013671875, 0.018706321716308594, 0.019788742065429688, 0.02087116241455078, 0.021953582763671875, 0.02303600311279297, 0.024118423461914062, 0.025200843811035156, 0.02628326416015625, 0.027365684509277344, 0.028448104858398438, 0.02953052520751953, 0.030612945556640625, 0.03169536590576172, 0.03277778625488281, 0.033860206604003906, 0.034942626953125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 8.0, 24.0, 23.0, 29.0, 55.0, 111.0, 127.0, 187.0, 325.0, 578.0, 1124.0, 2390.0, 6258.0, 22331.0, 205346.0, 3872585.0, 62938.0, 12080.0, 3978.0, 1664.0, 853.0, 521.0, 280.0, 155.0, 97.0, 65.0, 45.0, 32.0, 22.0, 12.0, 16.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10650634765625, -0.10245418548583984, -0.09840202331542969, -0.09434986114501953, -0.09029769897460938, -0.08624553680419922, -0.08219337463378906, -0.0781412124633789, -0.07408905029296875, -0.0700368881225586, -0.06598472595214844, -0.06193256378173828, -0.057880401611328125, -0.05382823944091797, -0.04977607727050781, -0.045723915100097656, -0.0416717529296875, -0.037619590759277344, -0.03356742858886719, -0.02951526641845703, -0.025463104248046875, -0.02141094207763672, -0.017358779907226562, -0.013306617736816406, -0.00925445556640625, -0.005202293395996094, -0.0011501312255859375, 0.0029020309448242188, 0.006954193115234375, 0.011006355285644531, 0.015058517456054688, 0.019110679626464844, 0.023162841796875, 0.027215003967285156, 0.03126716613769531, 0.03531932830810547, 0.039371490478515625, 0.04342365264892578, 0.04747581481933594, 0.051527976989746094, 0.05558013916015625, 0.059632301330566406, 0.06368446350097656, 0.06773662567138672, 0.07178878784179688, 0.07584095001220703, 0.07989311218261719, 0.08394527435302734, 0.0879974365234375, 0.09204959869384766, 0.09610176086425781, 0.10015392303466797, 0.10420608520507812, 0.10825824737548828, 0.11231040954589844, 0.1163625717163086, 0.12041473388671875, 0.1244668960571289, 0.12851905822753906, 0.13257122039794922, 0.13662338256835938, 0.14067554473876953, 0.1447277069091797, 0.14877986907958984, 0.15283203125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 7.0, 4.0, 7.0, 17.0, 20.0, 21.0, 56.0, 174.0, 2417.0, 1041.0, 142.0, 64.0, 46.0, 19.0, 7.0, 7.0, 10.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0226898193359375, -0.021553754806518555, -0.02041769027709961, -0.019281625747680664, -0.01814556121826172, -0.017009496688842773, -0.015873432159423828, -0.014737367630004883, -0.013601303100585938, -0.012465238571166992, -0.011329174041748047, -0.010193109512329102, -0.009057044982910156, -0.007920980453491211, -0.006784915924072266, -0.00564885139465332, -0.004512786865234375, -0.0033767223358154297, -0.0022406578063964844, -0.001104593276977539, 3.147125244140625e-05, 0.0011675357818603516, 0.002303600311279297, 0.003439664840698242, 0.0045757293701171875, 0.005711793899536133, 0.006847858428955078, 0.007983922958374023, 0.009119987487792969, 0.010256052017211914, 0.01139211654663086, 0.012528181076049805, 0.01366424560546875, 0.014800310134887695, 0.01593637466430664, 0.017072439193725586, 0.01820850372314453, 0.019344568252563477, 0.020480632781982422, 0.021616697311401367, 0.022752761840820312, 0.023888826370239258, 0.025024890899658203, 0.02616095542907715, 0.027297019958496094, 0.02843308448791504, 0.029569149017333984, 0.03070521354675293, 0.031841278076171875, 0.03297734260559082, 0.034113407135009766, 0.03524947166442871, 0.036385536193847656, 0.0375216007232666, 0.03865766525268555, 0.03979372978210449, 0.04092979431152344, 0.04206585884094238, 0.04320192337036133, 0.04433798789978027, 0.04547405242919922, 0.046610116958618164, 0.04774618148803711, 0.048882246017456055, 0.050018310546875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 10.0, 17.0, 32.0, 55.0, 86.0, 138.0, 154.0, 172.0, 118.0, 80.0, 58.0, 29.0, 13.0, 10.0, 7.0, 6.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.12451092153787613, -0.11970972269773483, -0.11490852385759354, -0.11010732501745224, -0.10530612617731094, -0.10050492733716965, -0.09570373594760895, -0.09090253710746765, -0.08610133826732635, -0.08130013942718506, -0.07649894058704376, -0.07169774174690247, -0.06689654290676117, -0.06209534406661987, -0.057294148951768875, -0.05249295011162758, -0.047691747546195984, -0.04289054870605469, -0.03808934986591339, -0.033288151025772095, -0.028486954048275948, -0.02368575520813465, -0.018884558230638504, -0.014083359390497208, -0.009282160550355911, -0.004480962175875902, 0.0003202361986041069, 0.005121434107422829, 0.009922632947564125, 0.014723831787705421, 0.01952502876520157, 0.024326227605342865, 0.02912743389606476, 0.033928632736206055, 0.03872983157634735, 0.04353103041648865, 0.048332229256629944, 0.05313342809677124, 0.05793462321162224, 0.06273582577705383, 0.06753702461719513, 0.07233822345733643, 0.07713942229747772, 0.08194062113761902, 0.08674181997776031, 0.09154301881790161, 0.09634421765804291, 0.1011454164981842, 0.1059466078877449, 0.1107478067278862, 0.1155490055680275, 0.12035020440816879, 0.1251513957977295, 0.1299525946378708, 0.13475379347801208, 0.13955499231815338, 0.14435619115829468, 0.14915738999843597, 0.15395858883857727, 0.15875978767871857, 0.16356098651885986, 0.16836218535900116, 0.17316338419914246, 0.17796458303928375, 0.18276578187942505]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 5.0, 7.0, 5.0, 4.0, 9.0, 10.0, 9.0, 13.0, 14.0, 13.0, 21.0, 28.0, 23.0, 29.0, 20.0, 26.0, 29.0, 35.0, 39.0, 49.0, 53.0, 44.0, 45.0, 40.0, 44.0, 55.0, 38.0, 36.0, 26.0, 40.0, 29.0, 30.0, 22.0, 20.0, 12.0, 16.0, 14.0, 10.0, 12.0, 9.0, 4.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06451869010925293, -0.06243486702442169, -0.060351043939590454, -0.058267224580049515, -0.05618340149521828, -0.05409957841038704, -0.0520157590508461, -0.04993193596601486, -0.047848112881183624, -0.045764289796352386, -0.04368046671152115, -0.04159664735198021, -0.03951282426714897, -0.037429001182317734, -0.035345181822776794, -0.03326135873794556, -0.03117753565311432, -0.02909371256828308, -0.027009891346096992, -0.024926070123910904, -0.022842247039079666, -0.02075842395424843, -0.01867460273206234, -0.01659078150987625, -0.014506958425045013, -0.01242313627153635, -0.010339314118027687, -0.008255491964519024, -0.006171669811010361, -0.0040878476575016975, -0.0020040255039930344, 7.979664951562881e-05, 0.002163618803024292, 0.004247440956532955, 0.006331263110041618, 0.008415085263550282, 0.010498907417058945, 0.012582729570567608, 0.014666551724076271, 0.01675037294626236, 0.018834196031093597, 0.020918019115924835, 0.023001840338110924, 0.025085661560297012, 0.02716948464512825, 0.029253307729959488, 0.03133712708950043, 0.033420950174331665, 0.0355047732591629, 0.03758859634399414, 0.03967241942882538, 0.04175623878836632, 0.043840061873197556, 0.04592388495802879, 0.04800770431756973, 0.05009152740240097, 0.05217535048723221, 0.054259173572063446, 0.056342996656894684, 0.05842681601643562, 0.06051063910126686, 0.0625944584608078, 0.06467828154563904, 0.06676210463047028, 0.06884592771530151]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 5.0, 14.0, 7.0, 19.0, 19.0, 22.0, 29.0, 35.0, 50.0, 78.0, 136.0, 203.0, 431.0, 908.0, 2185.0, 5293.0, 13165.0, 35037.0, 87209.0, 189773.0, 284950.0, 231236.0, 117442.0, 48406.0, 18950.0, 7457.0, 3009.0, 1209.0, 516.0, 291.0, 163.0, 83.0, 60.0, 42.0, 29.0, 24.0, 11.0, 15.0, 10.0, 3.0, 2.0, 4.0, 3.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.046600341796875, -0.04521656036376953, -0.04383277893066406, -0.042448997497558594, -0.041065216064453125, -0.039681434631347656, -0.03829765319824219, -0.03691387176513672, -0.03553009033203125, -0.03414630889892578, -0.03276252746582031, -0.031378746032714844, -0.029994964599609375, -0.028611183166503906, -0.027227401733398438, -0.02584362030029297, -0.0244598388671875, -0.02307605743408203, -0.021692276000976562, -0.020308494567871094, -0.018924713134765625, -0.017540931701660156, -0.016157150268554688, -0.014773368835449219, -0.01338958740234375, -0.012005805969238281, -0.010622024536132812, -0.009238243103027344, -0.007854461669921875, -0.006470680236816406, -0.0050868988037109375, -0.0037031173706054688, -0.0023193359375, -0.0009355545043945312, 0.0004482269287109375, 0.0018320083618164062, 0.003215789794921875, 0.004599571228027344, 0.0059833526611328125, 0.007367134094238281, 0.00875091552734375, 0.010134696960449219, 0.011518478393554688, 0.012902259826660156, 0.014286041259765625, 0.015669822692871094, 0.017053604125976562, 0.01843738555908203, 0.0198211669921875, 0.02120494842529297, 0.022588729858398438, 0.023972511291503906, 0.025356292724609375, 0.026740074157714844, 0.028123855590820312, 0.02950763702392578, 0.03089141845703125, 0.03227519989013672, 0.03365898132324219, 0.035042762756347656, 0.036426544189453125, 0.037810325622558594, 0.03919410705566406, 0.04057788848876953, 0.041961669921875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 8.0, 6.0, 9.0, 4.0, 7.0, 20.0, 18.0, 10.0, 15.0, 25.0, 17.0, 26.0, 27.0, 29.0, 39.0, 38.0, 37.0, 43.0, 36.0, 39.0, 48.0, 33.0, 44.0, 44.0, 33.0, 36.0, 41.0, 24.0, 33.0, 26.0, 24.0, 28.0, 30.0, 13.0, 15.0, 24.0, 9.0, 8.0, 8.0, 6.0, 9.0, 5.0, 1.0, 2.0, 0.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.033203125, -0.03207111358642578, -0.030939102172851562, -0.029807090759277344, -0.028675079345703125, -0.027543067932128906, -0.026411056518554688, -0.02527904510498047, -0.02414703369140625, -0.02301502227783203, -0.021883010864257812, -0.020750999450683594, -0.019618988037109375, -0.018486976623535156, -0.017354965209960938, -0.01622295379638672, -0.0150909423828125, -0.013958930969238281, -0.012826919555664062, -0.011694908142089844, -0.010562896728515625, -0.009430885314941406, -0.008298873901367188, -0.007166862487792969, -0.00603485107421875, -0.004902839660644531, -0.0037708282470703125, -0.0026388168334960938, -0.001506805419921875, -0.00037479400634765625, 0.0007572174072265625, 0.0018892288208007812, 0.003021240234375, 0.004153251647949219, 0.0052852630615234375, 0.006417274475097656, 0.007549285888671875, 0.008681297302246094, 0.009813308715820312, 0.010945320129394531, 0.01207733154296875, 0.013209342956542969, 0.014341354370117188, 0.015473365783691406, 0.016605377197265625, 0.017737388610839844, 0.018869400024414062, 0.02000141143798828, 0.0211334228515625, 0.02226543426513672, 0.023397445678710938, 0.024529457092285156, 0.025661468505859375, 0.026793479919433594, 0.027925491333007812, 0.02905750274658203, 0.03018951416015625, 0.03132152557373047, 0.03245353698730469, 0.033585548400878906, 0.034717559814453125, 0.035849571228027344, 0.03698158264160156, 0.03811359405517578, 0.03924560546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 9.0, 10.0, 18.0, 14.0, 36.0, 35.0, 51.0, 74.0, 113.0, 174.0, 249.0, 486.0, 930.0, 2472.0, 14962.0, 301810.0, 680886.0, 39309.0, 4132.0, 1287.0, 579.0, 382.0, 166.0, 117.0, 79.0, 54.0, 38.0, 23.0, 18.0, 14.0, 4.0, 4.0, 6.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.1461181640625, -0.14171409606933594, -0.13731002807617188, -0.1329059600830078, -0.12850189208984375, -0.12409782409667969, -0.11969375610351562, -0.11528968811035156, -0.1108856201171875, -0.10648155212402344, -0.10207748413085938, -0.09767341613769531, -0.09326934814453125, -0.08886528015136719, -0.08446121215820312, -0.08005714416503906, -0.075653076171875, -0.07124900817871094, -0.06684494018554688, -0.06244087219238281, -0.05803680419921875, -0.05363273620605469, -0.049228668212890625, -0.04482460021972656, -0.0404205322265625, -0.03601646423339844, -0.031612396240234375, -0.027208328247070312, -0.02280426025390625, -0.018400192260742188, -0.013996124267578125, -0.009592056274414062, -0.00518798828125, -0.0007839202880859375, 0.003620147705078125, 0.008024215698242188, 0.01242828369140625, 0.016832351684570312, 0.021236419677734375, 0.025640487670898438, 0.0300445556640625, 0.03444862365722656, 0.038852691650390625, 0.04325675964355469, 0.04766082763671875, 0.05206489562988281, 0.056468963623046875, 0.06087303161621094, 0.065277099609375, 0.06968116760253906, 0.07408523559570312, 0.07848930358886719, 0.08289337158203125, 0.08729743957519531, 0.09170150756835938, 0.09610557556152344, 0.1005096435546875, 0.10491371154785156, 0.10931777954101562, 0.11372184753417969, 0.11812591552734375, 0.12252998352050781, 0.12693405151367188, 0.13133811950683594, 0.1357421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 7.0, 3.0, 5.0, 6.0, 9.0, 9.0, 18.0, 16.0, 22.0, 15.0, 19.0, 35.0, 32.0, 40.0, 49.0, 45.0, 44.0, 44.0, 56.0, 54.0, 60.0, 49.0, 37.0, 56.0, 41.0, 35.0, 23.0, 35.0, 19.0, 27.0, 22.0, 15.0, 8.0, 14.0, 7.0, 8.0, 8.0, 3.0, 3.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1845703125, -0.17830848693847656, -0.17204666137695312, -0.1657848358154297, -0.15952301025390625, -0.1532611846923828, -0.14699935913085938, -0.14073753356933594, -0.1344757080078125, -0.12821388244628906, -0.12195205688476562, -0.11569023132324219, -0.10942840576171875, -0.10316658020019531, -0.09690475463867188, -0.09064292907714844, -0.084381103515625, -0.07811927795410156, -0.07185745239257812, -0.06559562683105469, -0.05933380126953125, -0.05307197570800781, -0.046810150146484375, -0.04054832458496094, -0.0342864990234375, -0.028024673461914062, -0.021762847900390625, -0.015501022338867188, -0.00923919677734375, -0.0029773712158203125, 0.003284454345703125, 0.009546279907226562, 0.01580810546875, 0.022069931030273438, 0.028331756591796875, 0.03459358215332031, 0.04085540771484375, 0.04711723327636719, 0.053379058837890625, 0.05964088439941406, 0.0659027099609375, 0.07216453552246094, 0.07842636108398438, 0.08468818664550781, 0.09095001220703125, 0.09721183776855469, 0.10347366333007812, 0.10973548889160156, 0.115997314453125, 0.12225914001464844, 0.12852096557617188, 0.1347827911376953, 0.14104461669921875, 0.1473064422607422, 0.15356826782226562, 0.15983009338378906, 0.1660919189453125, 0.17235374450683594, 0.17861557006835938, 0.1848773956298828, 0.19113922119140625, 0.1974010467529297, 0.20366287231445312, 0.20992469787597656, 0.2161865234375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 4.0, 3.0, 8.0, 13.0, 17.0, 35.0, 48.0, 66.0, 116.0, 177.0, 417.0, 1023.0, 3806.0, 40568.0, 899519.0, 94644.0, 5695.0, 1329.0, 503.0, 217.0, 124.0, 53.0, 46.0, 30.0, 28.0, 14.0, 10.0, 11.0, 7.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0953369140625, -0.09232139587402344, -0.08930587768554688, -0.08629035949707031, -0.08327484130859375, -0.08025932312011719, -0.07724380493164062, -0.07422828674316406, -0.0712127685546875, -0.06819725036621094, -0.06518173217773438, -0.06216621398925781, -0.05915069580078125, -0.05613517761230469, -0.053119659423828125, -0.05010414123535156, -0.047088623046875, -0.04407310485839844, -0.041057586669921875, -0.03804206848144531, -0.03502655029296875, -0.03201103210449219, -0.028995513916015625, -0.025979995727539062, -0.0229644775390625, -0.019948959350585938, -0.016933441162109375, -0.013917922973632812, -0.01090240478515625, -0.007886886596679688, -0.004871368408203125, -0.0018558502197265625, 0.00115966796875, 0.0041751861572265625, 0.007190704345703125, 0.010206222534179688, 0.01322174072265625, 0.016237258911132812, 0.019252777099609375, 0.022268295288085938, 0.0252838134765625, 0.028299331665039062, 0.031314849853515625, 0.03433036804199219, 0.03734588623046875, 0.04036140441894531, 0.043376922607421875, 0.04639244079589844, 0.049407958984375, 0.05242347717285156, 0.055438995361328125, 0.05845451354980469, 0.06147003173828125, 0.06448554992675781, 0.06750106811523438, 0.07051658630371094, 0.0735321044921875, 0.07654762268066406, 0.07956314086914062, 0.08257865905761719, 0.08559417724609375, 0.08860969543457031, 0.09162521362304688, 0.09464073181152344, 0.09765625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 10.0, 8.0, 9.0, 9.0, 17.0, 31.0, 26.0, 53.0, 74.0, 94.0, 106.0, 117.0, 105.0, 75.0, 68.0, 55.0, 29.0, 27.0, 15.0, 14.0, 10.0, 4.0, 10.0, 4.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.695487976074219e-05, -3.569945693016052e-05, -3.444403409957886e-05, -3.318861126899719e-05, -3.193318843841553e-05, -3.067776560783386e-05, -2.9422342777252197e-05, -2.8166919946670532e-05, -2.6911497116088867e-05, -2.5656074285507202e-05, -2.4400651454925537e-05, -2.3145228624343872e-05, -2.1889805793762207e-05, -2.0634382963180542e-05, -1.9378960132598877e-05, -1.8123537302017212e-05, -1.6868114471435547e-05, -1.5612691640853882e-05, -1.4357268810272217e-05, -1.3101845979690552e-05, -1.1846423149108887e-05, -1.0591000318527222e-05, -9.335577487945557e-06, -8.080154657363892e-06, -6.8247318267822266e-06, -5.5693089962005615e-06, -4.3138861656188965e-06, -3.0584633350372314e-06, -1.8030405044555664e-06, -5.476176738739014e-07, 7.078051567077637e-07, 1.9632279872894287e-06, 3.2186508178710938e-06, 4.474073648452759e-06, 5.729496479034424e-06, 6.984919309616089e-06, 8.240342140197754e-06, 9.495764970779419e-06, 1.0751187801361084e-05, 1.2006610631942749e-05, 1.3262033462524414e-05, 1.4517456293106079e-05, 1.5772879123687744e-05, 1.702830195426941e-05, 1.8283724784851074e-05, 1.953914761543274e-05, 2.0794570446014404e-05, 2.204999327659607e-05, 2.3305416107177734e-05, 2.45608389377594e-05, 2.5816261768341064e-05, 2.707168459892273e-05, 2.8327107429504395e-05, 2.958253026008606e-05, 3.0837953090667725e-05, 3.209337592124939e-05, 3.3348798751831055e-05, 3.460422158241272e-05, 3.5859644412994385e-05, 3.711506724357605e-05, 3.8370490074157715e-05, 3.962591290473938e-05, 4.0881335735321045e-05, 4.213675856590271e-05, 4.3392181396484375e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 5.0, 6.0, 8.0, 17.0, 15.0, 21.0, 29.0, 62.0, 90.0, 140.0, 259.0, 492.0, 1077.0, 2688.0, 9075.0, 68040.0, 695148.0, 242656.0, 21081.0, 4455.0, 1578.0, 706.0, 376.0, 196.0, 120.0, 71.0, 43.0, 23.0, 15.0, 14.0, 9.0, 11.0, 2.0, 1.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.06329345703125, -0.06129932403564453, -0.05930519104003906, -0.057311058044433594, -0.055316925048828125, -0.053322792053222656, -0.05132865905761719, -0.04933452606201172, -0.04734039306640625, -0.04534626007080078, -0.04335212707519531, -0.041357994079589844, -0.039363861083984375, -0.037369728088378906, -0.03537559509277344, -0.03338146209716797, -0.0313873291015625, -0.02939319610595703, -0.027399063110351562, -0.025404930114746094, -0.023410797119140625, -0.021416664123535156, -0.019422531127929688, -0.01742839813232422, -0.01543426513671875, -0.013440132141113281, -0.011445999145507812, -0.009451866149902344, -0.007457733154296875, -0.005463600158691406, -0.0034694671630859375, -0.0014753341674804688, 0.000518798828125, 0.0025129318237304688, 0.0045070648193359375, 0.006501197814941406, 0.008495330810546875, 0.010489463806152344, 0.012483596801757812, 0.014477729797363281, 0.01647186279296875, 0.01846599578857422, 0.020460128784179688, 0.022454261779785156, 0.024448394775390625, 0.026442527770996094, 0.028436660766601562, 0.03043079376220703, 0.0324249267578125, 0.03441905975341797, 0.03641319274902344, 0.038407325744628906, 0.040401458740234375, 0.042395591735839844, 0.04438972473144531, 0.04638385772705078, 0.04837799072265625, 0.05037212371826172, 0.05236625671386719, 0.054360389709472656, 0.056354522705078125, 0.058348655700683594, 0.06034278869628906, 0.06233692169189453, 0.0643310546875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 7.0, 11.0, 13.0, 31.0, 56.0, 70.0, 96.0, 135.0, 128.0, 128.0, 105.0, 58.0, 44.0, 27.0, 28.0, 17.0, 10.0, 9.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.093505859375, -0.09053707122802734, -0.08756828308105469, -0.08459949493408203, -0.08163070678710938, -0.07866191864013672, -0.07569313049316406, -0.0727243423461914, -0.06975555419921875, -0.0667867660522461, -0.06381797790527344, -0.06084918975830078, -0.057880401611328125, -0.05491161346435547, -0.05194282531738281, -0.048974037170410156, -0.0460052490234375, -0.043036460876464844, -0.04006767272949219, -0.03709888458251953, -0.034130096435546875, -0.03116130828857422, -0.028192520141601562, -0.025223731994628906, -0.02225494384765625, -0.019286155700683594, -0.016317367553710938, -0.013348579406738281, -0.010379791259765625, -0.007411003112792969, -0.0044422149658203125, -0.0014734268188476562, 0.001495361328125, 0.004464149475097656, 0.0074329376220703125, 0.010401725769042969, 0.013370513916015625, 0.01633930206298828, 0.019308090209960938, 0.022276878356933594, 0.02524566650390625, 0.028214454650878906, 0.031183242797851562, 0.03415203094482422, 0.037120819091796875, 0.04008960723876953, 0.04305839538574219, 0.046027183532714844, 0.0489959716796875, 0.051964759826660156, 0.05493354797363281, 0.05790233612060547, 0.060871124267578125, 0.06383991241455078, 0.06680870056152344, 0.0697774887084961, 0.07274627685546875, 0.0757150650024414, 0.07868385314941406, 0.08165264129638672, 0.08462142944335938, 0.08759021759033203, 0.09055900573730469, 0.09352779388427734, 0.09649658203125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 33.0, 253.0, 509.0, 178.0, 18.0, 9.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0131804943084717, -2.9205641746520996, -2.8279478549957275, -2.7353315353393555, -2.6427152156829834, -2.5500988960266113, -2.4574825763702393, -2.364866256713867, -2.272249937057495, -2.179633617401123, -2.087017297744751, -1.994400978088379, -1.9017846584320068, -1.8091683387756348, -1.7165520191192627, -1.6239356994628906, -1.5313193798065186, -1.4387030601501465, -1.3460867404937744, -1.2534704208374023, -1.1608541011810303, -1.0682377815246582, -0.9756214618682861, -0.8830051422119141, -0.790388822555542, -0.6977725028991699, -0.6051561832427979, -0.5125398635864258, -0.4199235439300537, -0.32730722427368164, -0.23469090461730957, -0.1420745849609375, -0.04945802688598633, 0.04315829277038574, 0.1357746124267578, 0.22839093208312988, 0.32100725173950195, 0.413623571395874, 0.5062398910522461, 0.5988562107086182, 0.6914725303649902, 0.7840888500213623, 0.8767051696777344, 0.9693214893341064, 1.0619378089904785, 1.1545541286468506, 1.2471704483032227, 1.3397867679595947, 1.4324030876159668, 1.5250194072723389, 1.617635726928711, 1.710252046585083, 1.802868366241455, 1.8954846858978271, 1.9881010055541992, 2.0807173252105713, 2.1733336448669434, 2.2659499645233154, 2.3585662841796875, 2.4511826038360596, 2.5437989234924316, 2.6364152431488037, 2.729031562805176, 2.821647882461548, 2.91426420211792]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 6.0, 2.0, 3.0, 4.0, 5.0, 8.0, 15.0, 8.0, 15.0, 16.0, 18.0, 18.0, 25.0, 24.0, 26.0, 30.0, 36.0, 31.0, 38.0, 37.0, 51.0, 40.0, 55.0, 53.0, 46.0, 36.0, 45.0, 36.0, 33.0, 34.0, 20.0, 23.0, 23.0, 23.0, 17.0, 22.0, 17.0, 15.0, 17.0, 9.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7086033225059509, -0.6850324869155884, -0.661461591720581, -0.6378907561302185, -0.614319920539856, -0.5907490253448486, -0.5671781897544861, -0.5436073541641235, -0.5200364589691162, -0.4964655935764313, -0.4728947579860687, -0.4493238925933838, -0.42575305700302124, -0.4021821916103363, -0.37861132621765137, -0.3550404906272888, -0.33146965503692627, -0.30789878964424133, -0.2843279540538788, -0.26075708866119385, -0.2371862381696701, -0.21361538767814636, -0.19004452228546143, -0.16647367179393768, -0.14290282130241394, -0.1193319708108902, -0.09576111286878586, -0.07219025492668152, -0.048619404435157776, -0.025048553943634033, -0.0014776885509490967, 0.022093161940574646, 0.04566395282745361, 0.06923480331897736, 0.0928056612610817, 0.11637651920318604, 0.13994736969470978, 0.16351822018623352, 0.18708908557891846, 0.2106599360704422, 0.23423078656196594, 0.2578016519546509, 0.2813724875450134, 0.30494335293769836, 0.3285142183303833, 0.35208505392074585, 0.3756559193134308, 0.3992267847061157, 0.42279762029647827, 0.4463684856891632, 0.46993932127952576, 0.4935101866722107, 0.5170810222625732, 0.5406519174575806, 0.5642227530479431, 0.5877935886383057, 0.611364483833313, 0.6349353194236755, 0.6585062146186829, 0.6820770502090454, 0.705647885799408, 0.7292187213897705, 0.7527896165847778, 0.7763604521751404, 0.7999312877655029]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 12.0, 16.0, 7.0, 20.0, 28.0, 49.0, 56.0, 65.0, 135.0, 151.0, 235.0, 348.0, 602.0, 1107.0, 2223.0, 4775.0, 12133.0, 41571.0, 364127.0, 3648136.0, 84742.0, 19956.0, 7127.0, 2936.0, 1496.0, 831.0, 472.0, 309.0, 188.0, 127.0, 91.0, 53.0, 44.0, 27.0, 19.0, 20.0, 12.0, 5.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.07647705078125, -0.07410335540771484, -0.07172966003417969, -0.06935596466064453, -0.06698226928710938, -0.06460857391357422, -0.06223487854003906, -0.059861183166503906, -0.05748748779296875, -0.055113792419433594, -0.05274009704589844, -0.05036640167236328, -0.047992706298828125, -0.04561901092529297, -0.04324531555175781, -0.040871620178222656, -0.0384979248046875, -0.036124229431152344, -0.03375053405761719, -0.03137683868408203, -0.029003143310546875, -0.02662944793701172, -0.024255752563476562, -0.021882057189941406, -0.01950836181640625, -0.017134666442871094, -0.014760971069335938, -0.012387275695800781, -0.010013580322265625, -0.007639884948730469, -0.0052661895751953125, -0.0028924942016601562, -0.000518798828125, 0.0018548965454101562, 0.0042285919189453125, 0.006602287292480469, 0.008975982666015625, 0.011349678039550781, 0.013723373413085938, 0.016097068786621094, 0.01847076416015625, 0.020844459533691406, 0.023218154907226562, 0.02559185028076172, 0.027965545654296875, 0.03033924102783203, 0.03271293640136719, 0.035086631774902344, 0.0374603271484375, 0.039834022521972656, 0.04220771789550781, 0.04458141326904297, 0.046955108642578125, 0.04932880401611328, 0.05170249938964844, 0.054076194763183594, 0.05644989013671875, 0.058823585510253906, 0.06119728088378906, 0.06357097625732422, 0.06594467163085938, 0.06831836700439453, 0.07069206237792969, 0.07306575775146484, 0.075439453125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 8.0, 6.0, 13.0, 15.0, 13.0, 14.0, 23.0, 24.0, 30.0, 40.0, 42.0, 53.0, 56.0, 41.0, 52.0, 59.0, 73.0, 49.0, 53.0, 51.0, 54.0, 39.0, 31.0, 39.0, 26.0, 16.0, 19.0, 24.0, 7.0, 7.0, 8.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.055084228515625, -0.05355119705200195, -0.052018165588378906, -0.05048513412475586, -0.04895210266113281, -0.047419071197509766, -0.04588603973388672, -0.04435300827026367, -0.042819976806640625, -0.04128694534301758, -0.03975391387939453, -0.038220882415771484, -0.03668785095214844, -0.03515481948852539, -0.033621788024902344, -0.0320887565612793, -0.03055572509765625, -0.029022693634033203, -0.027489662170410156, -0.02595663070678711, -0.024423599243164062, -0.022890567779541016, -0.02135753631591797, -0.019824504852294922, -0.018291473388671875, -0.016758441925048828, -0.015225410461425781, -0.013692378997802734, -0.012159347534179688, -0.01062631607055664, -0.009093284606933594, -0.007560253143310547, -0.0060272216796875, -0.004494190216064453, -0.0029611587524414062, -0.0014281272888183594, 0.0001049041748046875, 0.0016379356384277344, 0.0031709671020507812, 0.004703998565673828, 0.006237030029296875, 0.007770061492919922, 0.009303092956542969, 0.010836124420166016, 0.012369155883789062, 0.01390218734741211, 0.015435218811035156, 0.016968250274658203, 0.01850128173828125, 0.020034313201904297, 0.021567344665527344, 0.02310037612915039, 0.024633407592773438, 0.026166439056396484, 0.02769947052001953, 0.029232501983642578, 0.030765533447265625, 0.03229856491088867, 0.03383159637451172, 0.035364627838134766, 0.03689765930175781, 0.03843069076538086, 0.039963722229003906, 0.04149675369262695, 0.04302978515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 9.0, 7.0, 9.0, 8.0, 11.0, 35.0, 38.0, 40.0, 59.0, 80.0, 159.0, 213.0, 288.0, 477.0, 1241.0, 5823.0, 59354.0, 4004319.0, 110976.0, 7977.0, 1598.0, 570.0, 291.0, 194.0, 142.0, 107.0, 70.0, 48.0, 31.0, 19.0, 21.0, 17.0, 13.0, 7.0, 7.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2159423828125, -0.20987510681152344, -0.20380783081054688, -0.1977405548095703, -0.19167327880859375, -0.1856060028076172, -0.17953872680664062, -0.17347145080566406, -0.1674041748046875, -0.16133689880371094, -0.15526962280273438, -0.1492023468017578, -0.14313507080078125, -0.1370677947998047, -0.13100051879882812, -0.12493324279785156, -0.118865966796875, -0.11279869079589844, -0.10673141479492188, -0.10066413879394531, -0.09459686279296875, -0.08852958679199219, -0.08246231079101562, -0.07639503479003906, -0.0703277587890625, -0.06426048278808594, -0.058193206787109375, -0.05212593078613281, -0.04605865478515625, -0.03999137878417969, -0.033924102783203125, -0.027856826782226562, -0.02178955078125, -0.015722274780273438, -0.009654998779296875, -0.0035877227783203125, 0.00247955322265625, 0.008546829223632812, 0.014614105224609375, 0.020681381225585938, 0.0267486572265625, 0.03281593322753906, 0.038883209228515625, 0.04495048522949219, 0.05101776123046875, 0.05708503723144531, 0.06315231323242188, 0.06921958923339844, 0.075286865234375, 0.08135414123535156, 0.08742141723632812, 0.09348869323730469, 0.09955596923828125, 0.10562324523925781, 0.11169052124023438, 0.11775779724121094, 0.1238250732421875, 0.12989234924316406, 0.13595962524414062, 0.1420269012451172, 0.14809417724609375, 0.1541614532470703, 0.16022872924804688, 0.16629600524902344, 0.17236328125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 9.0, 20.0, 40.0, 78.0, 272.0, 2764.0, 670.0, 129.0, 52.0, 16.0, 11.0, 4.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10858154296875, -0.10545158386230469, -0.10232162475585938, -0.09919166564941406, -0.09606170654296875, -0.09293174743652344, -0.08980178833007812, -0.08667182922363281, -0.0835418701171875, -0.08041191101074219, -0.07728195190429688, -0.07415199279785156, -0.07102203369140625, -0.06789207458496094, -0.06476211547851562, -0.06163215637207031, -0.058502197265625, -0.05537223815917969, -0.052242279052734375, -0.04911231994628906, -0.04598236083984375, -0.04285240173339844, -0.039722442626953125, -0.03659248352050781, -0.0334625244140625, -0.030332565307617188, -0.027202606201171875, -0.024072647094726562, -0.02094268798828125, -0.017812728881835938, -0.014682769775390625, -0.011552810668945312, -0.0084228515625, -0.0052928924560546875, -0.002162933349609375, 0.0009670257568359375, 0.00409698486328125, 0.0072269439697265625, 0.010356903076171875, 0.013486862182617188, 0.0166168212890625, 0.019746780395507812, 0.022876739501953125, 0.026006698608398438, 0.02913665771484375, 0.03226661682128906, 0.035396575927734375, 0.03852653503417969, 0.041656494140625, 0.04478645324707031, 0.047916412353515625, 0.05104637145996094, 0.05417633056640625, 0.05730628967285156, 0.060436248779296875, 0.06356620788574219, 0.0666961669921875, 0.06982612609863281, 0.07295608520507812, 0.07608604431152344, 0.07921600341796875, 0.08234596252441406, 0.08547592163085938, 0.08860588073730469, 0.09173583984375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 10.0, 63.0, 95.0, 182.0, 249.0, 189.0, 97.0, 60.0, 14.0, 10.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25520849227905273, -0.2414485514163971, -0.22768861055374146, -0.21392866969108582, -0.20016872882843018, -0.18640878796577454, -0.1726488322019577, -0.15888889133930206, -0.14512895047664642, -0.13136900961399078, -0.11760906875133514, -0.10384912043809891, -0.09008917957544327, -0.07632923871278763, -0.06256929039955139, -0.04880934953689575, -0.03504940867424011, -0.021289465948939323, -0.0075295232236385345, 0.0062304213643074036, 0.019990362226963043, 0.03375030308961868, 0.04751025140285492, 0.06127019226551056, 0.0750301331281662, 0.08879007399082184, 0.10255001485347748, 0.11630996316671371, 0.13006991147994995, 0.1438298523426056, 0.15758979320526123, 0.17134973406791687, 0.1851096749305725, 0.19886961579322815, 0.2126295566558838, 0.22638949751853943, 0.24014943838119507, 0.2539093792438507, 0.26766932010650635, 0.2814292907714844, 0.2951892018318176, 0.30894914269447327, 0.3227090835571289, 0.33646902441978455, 0.3502289652824402, 0.3639889061450958, 0.37774884700775146, 0.3915088176727295, 0.40526875853538513, 0.41902869939804077, 0.4327886402606964, 0.44654858112335205, 0.4603085219860077, 0.47406846284866333, 0.48782843351364136, 0.5015883445739746, 0.5153483152389526, 0.5291082859039307, 0.5428681969642639, 0.5566281676292419, 0.5703880786895752, 0.5841480493545532, 0.5979079604148865, 0.6116679310798645, 0.6254278421401978]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 7.0, 5.0, 11.0, 11.0, 10.0, 17.0, 15.0, 16.0, 20.0, 16.0, 31.0, 23.0, 26.0, 28.0, 32.0, 31.0, 40.0, 38.0, 36.0, 38.0, 41.0, 36.0, 41.0, 33.0, 42.0, 42.0, 28.0, 35.0, 29.0, 30.0, 19.0, 18.0, 19.0, 19.0, 25.0, 15.0, 15.0, 14.0, 5.0, 10.0, 5.0, 6.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.12384110689163208, -0.11998491734266281, -0.11612872779369354, -0.11227253824472427, -0.108416348695755, -0.10456016659736633, -0.10070397704839706, -0.0968477874994278, -0.09299159795045853, -0.08913540840148926, -0.08527921885251999, -0.08142302930355072, -0.07756684720516205, -0.07371065020561218, -0.06985446810722351, -0.06599827855825424, -0.06214208900928497, -0.058285899460315704, -0.054429709911346436, -0.050573524087667465, -0.046717334538698196, -0.04286114498972893, -0.03900495916604996, -0.03514876961708069, -0.03129258006811142, -0.02743639051914215, -0.02358020283281803, -0.019724015146493912, -0.015867825597524643, -0.012011636048555374, -0.008155448362231255, -0.004299260675907135, -0.0004430711269378662, 0.003413117490708828, 0.007269306108355522, 0.011125494726002216, 0.01498168334364891, 0.01883787289261818, 0.0226940605789423, 0.02655024826526642, 0.030406437814235687, 0.034262627363204956, 0.038118816912174225, 0.041975002735853195, 0.045831192284822464, 0.04968738183379173, 0.0535435676574707, 0.05739975720643997, 0.06125594675540924, 0.06511213630437851, 0.06896832585334778, 0.07282451540231705, 0.07668070495128632, 0.08053688704967499, 0.08439307659864426, 0.08824926614761353, 0.0921054556965828, 0.09596164524555206, 0.09981783479452133, 0.1036740243434906, 0.10753020644187927, 0.11138640344142914, 0.11524258553981781, 0.11909877508878708, 0.12295496463775635]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 7.0, 5.0, 19.0, 25.0, 24.0, 40.0, 57.0, 90.0, 128.0, 228.0, 350.0, 659.0, 1277.0, 2653.0, 6154.0, 15772.0, 44119.0, 130141.0, 315543.0, 323006.0, 134331.0, 45884.0, 15934.0, 6301.0, 2740.0, 1347.0, 647.0, 401.0, 246.0, 139.0, 89.0, 57.0, 33.0, 20.0, 25.0, 17.0, 10.0, 5.0, 8.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.062347412109375, -0.06040000915527344, -0.058452606201171875, -0.05650520324707031, -0.05455780029296875, -0.05261039733886719, -0.050662994384765625, -0.04871559143066406, -0.0467681884765625, -0.04482078552246094, -0.042873382568359375, -0.04092597961425781, -0.03897857666015625, -0.03703117370605469, -0.035083770751953125, -0.03313636779785156, -0.03118896484375, -0.029241561889648438, -0.027294158935546875, -0.025346755981445312, -0.02339935302734375, -0.021451950073242188, -0.019504547119140625, -0.017557144165039062, -0.0156097412109375, -0.013662338256835938, -0.011714935302734375, -0.009767532348632812, -0.00782012939453125, -0.0058727264404296875, -0.003925323486328125, -0.0019779205322265625, -3.0517578125e-05, 0.0019168853759765625, 0.003864288330078125, 0.0058116912841796875, 0.00775909423828125, 0.009706497192382812, 0.011653900146484375, 0.013601303100585938, 0.0155487060546875, 0.017496109008789062, 0.019443511962890625, 0.021390914916992188, 0.02333831787109375, 0.025285720825195312, 0.027233123779296875, 0.029180526733398438, 0.0311279296875, 0.03307533264160156, 0.035022735595703125, 0.03697013854980469, 0.03891754150390625, 0.04086494445800781, 0.042812347412109375, 0.04475975036621094, 0.0467071533203125, 0.04865455627441406, 0.050601959228515625, 0.05254936218261719, 0.05449676513671875, 0.05644416809082031, 0.058391571044921875, 0.06033897399902344, 0.062286376953125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 9.0, 6.0, 8.0, 12.0, 13.0, 27.0, 18.0, 28.0, 29.0, 39.0, 39.0, 55.0, 47.0, 53.0, 56.0, 52.0, 61.0, 52.0, 48.0, 51.0, 38.0, 48.0, 39.0, 35.0, 30.0, 29.0, 12.0, 14.0, 12.0, 10.0, 7.0, 5.0, 6.0, 2.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0582275390625, -0.056571006774902344, -0.05491447448730469, -0.05325794219970703, -0.051601409912109375, -0.04994487762451172, -0.04828834533691406, -0.046631813049316406, -0.04497528076171875, -0.043318748474121094, -0.04166221618652344, -0.04000568389892578, -0.038349151611328125, -0.03669261932373047, -0.03503608703613281, -0.033379554748535156, -0.0317230224609375, -0.030066490173339844, -0.028409957885742188, -0.02675342559814453, -0.025096893310546875, -0.02344036102294922, -0.021783828735351562, -0.020127296447753906, -0.01847076416015625, -0.016814231872558594, -0.015157699584960938, -0.013501167297363281, -0.011844635009765625, -0.010188102722167969, -0.008531570434570312, -0.006875038146972656, -0.005218505859375, -0.0035619735717773438, -0.0019054412841796875, -0.00024890899658203125, 0.001407623291015625, 0.0030641555786132812, 0.0047206878662109375, 0.006377220153808594, 0.00803375244140625, 0.009690284729003906, 0.011346817016601562, 0.013003349304199219, 0.014659881591796875, 0.01631641387939453, 0.017972946166992188, 0.019629478454589844, 0.0212860107421875, 0.022942543029785156, 0.024599075317382812, 0.02625560760498047, 0.027912139892578125, 0.02956867218017578, 0.031225204467773438, 0.032881736755371094, 0.03453826904296875, 0.036194801330566406, 0.03785133361816406, 0.03950786590576172, 0.041164398193359375, 0.04282093048095703, 0.04447746276855469, 0.046133995056152344, 0.04779052734375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 4.0, 8.0, 7.0, 9.0, 11.0, 15.0, 35.0, 40.0, 65.0, 112.0, 211.0, 365.0, 784.0, 1837.0, 7054.0, 127671.0, 862679.0, 40382.0, 4356.0, 1441.0, 633.0, 347.0, 181.0, 101.0, 68.0, 53.0, 19.0, 22.0, 18.0, 9.0, 5.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1785888671875, -0.17205810546875, -0.16552734375, -0.15899658203125, -0.1524658203125, -0.14593505859375, -0.139404296875, -0.13287353515625, -0.1263427734375, -0.11981201171875, -0.11328125, -0.10675048828125, -0.1002197265625, -0.09368896484375, -0.087158203125, -0.08062744140625, -0.0740966796875, -0.06756591796875, -0.06103515625, -0.05450439453125, -0.0479736328125, -0.04144287109375, -0.034912109375, -0.02838134765625, -0.0218505859375, -0.01531982421875, -0.0087890625, -0.00225830078125, 0.0042724609375, 0.01080322265625, 0.017333984375, 0.02386474609375, 0.0303955078125, 0.03692626953125, 0.04345703125, 0.04998779296875, 0.0565185546875, 0.06304931640625, 0.069580078125, 0.07611083984375, 0.0826416015625, 0.08917236328125, 0.095703125, 0.10223388671875, 0.1087646484375, 0.11529541015625, 0.121826171875, 0.12835693359375, 0.1348876953125, 0.14141845703125, 0.14794921875, 0.15447998046875, 0.1610107421875, 0.16754150390625, 0.174072265625, 0.18060302734375, 0.1871337890625, 0.19366455078125, 0.2001953125, 0.20672607421875, 0.2132568359375, 0.21978759765625, 0.226318359375, 0.23284912109375, 0.2393798828125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 7.0, 4.0, 6.0, 19.0, 5.0, 15.0, 21.0, 10.0, 22.0, 24.0, 33.0, 26.0, 29.0, 51.0, 32.0, 34.0, 42.0, 47.0, 39.0, 45.0, 46.0, 51.0, 32.0, 37.0, 33.0, 36.0, 30.0, 28.0, 31.0, 17.0, 34.0, 18.0, 15.0, 8.0, 5.0, 13.0, 9.0, 8.0, 4.0, 3.0, 5.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.170166015625, -0.1646575927734375, -0.159149169921875, -0.1536407470703125, -0.14813232421875, -0.1426239013671875, -0.137115478515625, -0.1316070556640625, -0.1260986328125, -0.1205902099609375, -0.115081787109375, -0.1095733642578125, -0.10406494140625, -0.0985565185546875, -0.093048095703125, -0.0875396728515625, -0.08203125, -0.0765228271484375, -0.071014404296875, -0.0655059814453125, -0.05999755859375, -0.0544891357421875, -0.048980712890625, -0.0434722900390625, -0.0379638671875, -0.0324554443359375, -0.026947021484375, -0.0214385986328125, -0.01593017578125, -0.0104217529296875, -0.004913330078125, 0.0005950927734375, 0.006103515625, 0.0116119384765625, 0.017120361328125, 0.0226287841796875, 0.02813720703125, 0.0336456298828125, 0.039154052734375, 0.0446624755859375, 0.0501708984375, 0.0556793212890625, 0.061187744140625, 0.0666961669921875, 0.07220458984375, 0.0777130126953125, 0.083221435546875, 0.0887298583984375, 0.09423828125, 0.0997467041015625, 0.105255126953125, 0.1107635498046875, 0.11627197265625, 0.1217803955078125, 0.127288818359375, 0.1327972412109375, 0.1383056640625, 0.1438140869140625, 0.149322509765625, 0.1548309326171875, 0.16033935546875, 0.1658477783203125, 0.171356201171875, 0.1768646240234375, 0.182373046875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 5.0, 22.0, 22.0, 37.0, 75.0, 118.0, 250.0, 547.0, 1652.0, 7575.0, 104078.0, 883734.0, 43439.0, 4859.0, 1239.0, 433.0, 193.0, 94.0, 54.0, 37.0, 17.0, 14.0, 5.0, 9.0, 8.0, 5.0, 0.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.09954833984375, -0.09656524658203125, -0.0935821533203125, -0.09059906005859375, -0.087615966796875, -0.08463287353515625, -0.0816497802734375, -0.07866668701171875, -0.07568359375, -0.07270050048828125, -0.0697174072265625, -0.06673431396484375, -0.063751220703125, -0.06076812744140625, -0.0577850341796875, -0.05480194091796875, -0.05181884765625, -0.04883575439453125, -0.0458526611328125, -0.04286956787109375, -0.039886474609375, -0.03690338134765625, -0.0339202880859375, -0.03093719482421875, -0.0279541015625, -0.02497100830078125, -0.0219879150390625, -0.01900482177734375, -0.016021728515625, -0.01303863525390625, -0.0100555419921875, -0.00707244873046875, -0.00408935546875, -0.00110626220703125, 0.0018768310546875, 0.00485992431640625, 0.007843017578125, 0.01082611083984375, 0.0138092041015625, 0.01679229736328125, 0.019775390625, 0.02275848388671875, 0.0257415771484375, 0.02872467041015625, 0.031707763671875, 0.03469085693359375, 0.0376739501953125, 0.04065704345703125, 0.04364013671875, 0.04662322998046875, 0.0496063232421875, 0.05258941650390625, 0.055572509765625, 0.05855560302734375, 0.0615386962890625, 0.06452178955078125, 0.0675048828125, 0.07048797607421875, 0.0734710693359375, 0.07645416259765625, 0.079437255859375, 0.08242034912109375, 0.0854034423828125, 0.08838653564453125, 0.09136962890625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 1.0, 5.0, 3.0, 6.0, 4.0, 9.0, 11.0, 9.0, 11.0, 5.0, 18.0, 19.0, 26.0, 34.0, 55.0, 53.0, 72.0, 67.0, 79.0, 91.0, 74.0, 56.0, 43.0, 47.0, 34.0, 29.0, 17.0, 21.0, 14.0, 11.0, 9.0, 11.0, 4.0, 10.0, 4.0, 4.0, 8.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.314018249511719e-05, -3.2131560146808624e-05, -3.112293779850006e-05, -3.0114315450191498e-05, -2.9105693101882935e-05, -2.809707075357437e-05, -2.7088448405265808e-05, -2.6079826056957245e-05, -2.507120370864868e-05, -2.406258136034012e-05, -2.3053959012031555e-05, -2.2045336663722992e-05, -2.103671431541443e-05, -2.0028091967105865e-05, -1.9019469618797302e-05, -1.801084727048874e-05, -1.7002224922180176e-05, -1.5993602573871613e-05, -1.498498022556305e-05, -1.3976357877254486e-05, -1.2967735528945923e-05, -1.195911318063736e-05, -1.0950490832328796e-05, -9.941868484020233e-06, -8.93324613571167e-06, -7.924623787403107e-06, -6.9160014390945435e-06, -5.90737909078598e-06, -4.898756742477417e-06, -3.890134394168854e-06, -2.8815120458602905e-06, -1.8728896975517273e-06, -8.642673492431641e-07, 1.4435499906539917e-07, 1.1529773473739624e-06, 2.1615996956825256e-06, 3.170222043991089e-06, 4.178844392299652e-06, 5.187466740608215e-06, 6.1960890889167786e-06, 7.204711437225342e-06, 8.213333785533905e-06, 9.221956133842468e-06, 1.0230578482151031e-05, 1.1239200830459595e-05, 1.2247823178768158e-05, 1.3256445527076721e-05, 1.4265067875385284e-05, 1.5273690223693848e-05, 1.628231257200241e-05, 1.7290934920310974e-05, 1.8299557268619537e-05, 1.93081796169281e-05, 2.0316801965236664e-05, 2.1325424313545227e-05, 2.233404666185379e-05, 2.3342669010162354e-05, 2.4351291358470917e-05, 2.535991370677948e-05, 2.6368536055088043e-05, 2.7377158403396606e-05, 2.838578075170517e-05, 2.9394403100013733e-05, 3.0403025448322296e-05, 3.141164779663086e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 2.0, 17.0, 26.0, 51.0, 110.0, 268.0, 850.0, 3512.0, 61548.0, 948172.0, 30303.0, 2617.0, 640.0, 267.0, 100.0, 31.0, 23.0, 11.0, 3.0, 5.0, 3.0, 2.0, 3.0], "bins": [-0.2105712890625, -0.20639419555664062, -0.20221710205078125, -0.19804000854492188, -0.1938629150390625, -0.18968582153320312, -0.18550872802734375, -0.18133163452148438, -0.177154541015625, -0.17297744750976562, -0.16880035400390625, -0.16462326049804688, -0.1604461669921875, -0.15626907348632812, -0.15209197998046875, -0.14791488647460938, -0.14373779296875, -0.13956069946289062, -0.13538360595703125, -0.13120651245117188, -0.1270294189453125, -0.12285232543945312, -0.11867523193359375, -0.11449813842773438, -0.110321044921875, -0.10614395141601562, -0.10196685791015625, -0.09778976440429688, -0.0936126708984375, -0.08943557739257812, -0.08525848388671875, -0.08108139038085938, -0.076904296875, -0.07272720336914062, -0.06855010986328125, -0.06437301635742188, -0.0601959228515625, -0.056018829345703125, -0.05184173583984375, -0.047664642333984375, -0.043487548828125, -0.039310455322265625, -0.03513336181640625, -0.030956268310546875, -0.0267791748046875, -0.022602081298828125, -0.01842498779296875, -0.014247894287109375, -0.01007080078125, -0.005893707275390625, -0.00171661376953125, 0.002460479736328125, 0.0066375732421875, 0.010814666748046875, 0.01499176025390625, 0.019168853759765625, 0.023345947265625, 0.027523040771484375, 0.03170013427734375, 0.035877227783203125, 0.0400543212890625, 0.044231414794921875, 0.04840850830078125, 0.052585601806640625, 0.0567626953125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 12.0, 10.0, 18.0, 20.0, 29.0, 42.0, 48.0, 66.0, 78.0, 125.0, 98.0, 95.0, 83.0, 70.0, 43.0, 44.0, 32.0, 21.0, 18.0, 10.0, 5.0, 9.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058319091796875, -0.05634927749633789, -0.05437946319580078, -0.05240964889526367, -0.05043983459472656, -0.04847002029418945, -0.046500205993652344, -0.044530391693115234, -0.042560577392578125, -0.040590763092041016, -0.038620948791503906, -0.0366511344909668, -0.03468132019042969, -0.03271150588989258, -0.03074169158935547, -0.02877187728881836, -0.02680206298828125, -0.02483224868774414, -0.02286243438720703, -0.020892620086669922, -0.018922805786132812, -0.016952991485595703, -0.014983177185058594, -0.013013362884521484, -0.011043548583984375, -0.009073734283447266, -0.007103919982910156, -0.005134105682373047, -0.0031642913818359375, -0.0011944770812988281, 0.0007753372192382812, 0.0027451515197753906, 0.0047149658203125, 0.006684780120849609, 0.008654594421386719, 0.010624408721923828, 0.012594223022460938, 0.014564037322998047, 0.016533851623535156, 0.018503665924072266, 0.020473480224609375, 0.022443294525146484, 0.024413108825683594, 0.026382923126220703, 0.028352737426757812, 0.030322551727294922, 0.03229236602783203, 0.03426218032836914, 0.03623199462890625, 0.03820180892944336, 0.04017162322998047, 0.04214143753051758, 0.04411125183105469, 0.0460810661315918, 0.048050880432128906, 0.050020694732666016, 0.051990509033203125, 0.053960323333740234, 0.055930137634277344, 0.05789995193481445, 0.05986976623535156, 0.06183958053588867, 0.06380939483642578, 0.06577920913696289, 0.0677490234375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 14.0, 69.0, 258.0, 393.0, 191.0, 42.0, 14.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2288155555725098, -3.1465654373168945, -3.0643153190612793, -2.982065200805664, -2.899815082550049, -2.8175649642944336, -2.7353148460388184, -2.653064727783203, -2.570814609527588, -2.4885644912719727, -2.4063143730163574, -2.324064254760742, -2.241814136505127, -2.1595640182495117, -2.0773138999938965, -1.9950636625289917, -1.912813425064087, -1.8305633068084717, -1.7483131885528564, -1.6660630702972412, -1.583812952041626, -1.5015628337860107, -1.419312596321106, -1.3370624780654907, -1.2548123598098755, -1.1725622415542603, -1.090312123298645, -1.0080620050430298, -0.9258118271827698, -0.8435617089271545, -0.7613115310668945, -0.6790614128112793, -0.5968115329742432, -0.5145614147186279, -0.4323112666606903, -0.3500611186027527, -0.26781100034713745, -0.18556088209152222, -0.1033107340335846, -0.021060585975646973, 0.06118953227996826, 0.1434396654367447, 0.22568979859352112, 0.30793994665145874, 0.390190064907074, 0.4724401831626892, 0.5546903610229492, 0.6369404792785645, 0.7191905975341797, 0.8014407157897949, 0.8836908340454102, 0.9659410119056702, 1.0481910705566406, 1.1304411888122559, 1.2126914262771606, 1.2949415445327759, 1.3771916627883911, 1.4594417810440063, 1.5416918992996216, 1.6239420175552368, 1.7061922550201416, 1.7884423732757568, 1.870692491531372, 1.9529426097869873, 2.0351927280426025]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 9.0, 6.0, 7.0, 3.0, 19.0, 11.0, 13.0, 20.0, 30.0, 24.0, 30.0, 29.0, 41.0, 37.0, 43.0, 50.0, 72.0, 47.0, 54.0, 43.0, 60.0, 45.0, 43.0, 32.0, 46.0, 40.0, 25.0, 25.0, 19.0, 14.0, 16.0, 8.0, 9.0, 6.0, 6.0, 8.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.1144278049468994, -1.085119605064392, -1.0558112859725952, -1.026503086090088, -0.9971948266029358, -0.9678865671157837, -0.9385783672332764, -0.9092701077461243, -0.8799618482589722, -0.8506535887718201, -0.8213453888893127, -0.7920371294021606, -0.7627288699150085, -0.7334206104278564, -0.7041124105453491, -0.674804151058197, -0.6454959511756897, -0.6161876916885376, -0.5868794918060303, -0.5575712323188782, -0.5282629728317261, -0.49895474314689636, -0.46964651346206665, -0.44033825397491455, -0.41103002429008484, -0.3817217946052551, -0.352413535118103, -0.3231053054332733, -0.2937970757484436, -0.2644888162612915, -0.2351805865764618, -0.2058723419904709, -0.17656409740447998, -0.14725585281848907, -0.11794761568307877, -0.08863937854766846, -0.05933113396167755, -0.030022889375686646, -0.0007146596908569336, 0.028593584895133972, 0.05790182948112488, 0.08721007406711578, 0.11651831120252609, 0.1458265483379364, 0.1751347929239273, 0.2044430375099182, 0.23375126719474792, 0.26305949687957764, 0.29236775636672974, 0.32167598605155945, 0.35098424553871155, 0.38029247522354126, 0.40960073471069336, 0.43890896439552307, 0.4682171940803528, 0.4975254535675049, 0.5268336534500122, 0.5561419129371643, 0.5854501128196716, 0.6147583723068237, 0.6440666317939758, 0.6733748912811279, 0.7026830911636353, 0.7319913506507874, 0.7612996101379395]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 11.0, 7.0, 11.0, 19.0, 40.0, 75.0, 141.0, 296.0, 687.0, 1828.0, 5387.0, 19314.0, 109450.0, 2348624.0, 1599411.0, 84583.0, 16901.0, 4821.0, 1596.0, 586.0, 246.0, 131.0, 58.0, 24.0, 14.0, 11.0, 8.0, 6.0], "bins": [-0.154296875, -0.15120697021484375, -0.1481170654296875, -0.14502716064453125, -0.141937255859375, -0.13884735107421875, -0.1357574462890625, -0.13266754150390625, -0.12957763671875, -0.12648773193359375, -0.1233978271484375, -0.12030792236328125, -0.117218017578125, -0.11412811279296875, -0.1110382080078125, -0.10794830322265625, -0.1048583984375, -0.10176849365234375, -0.0986785888671875, -0.09558868408203125, -0.092498779296875, -0.08940887451171875, -0.0863189697265625, -0.08322906494140625, -0.08013916015625, -0.07704925537109375, -0.0739593505859375, -0.07086944580078125, -0.067779541015625, -0.06468963623046875, -0.0615997314453125, -0.05850982666015625, -0.055419921875, -0.05233001708984375, -0.0492401123046875, -0.04615020751953125, -0.043060302734375, -0.03997039794921875, -0.0368804931640625, -0.03379058837890625, -0.03070068359375, -0.02761077880859375, -0.0245208740234375, -0.02143096923828125, -0.018341064453125, -0.01525115966796875, -0.0121612548828125, -0.00907135009765625, -0.0059814453125, -0.00289154052734375, 0.0001983642578125, 0.00328826904296875, 0.006378173828125, 0.00946807861328125, 0.0125579833984375, 0.01564788818359375, 0.01873779296875, 0.02182769775390625, 0.0249176025390625, 0.02800750732421875, 0.031097412109375, 0.03418731689453125, 0.0372772216796875, 0.04036712646484375, 0.04345703125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 7.0, 10.0, 17.0, 13.0, 33.0, 38.0, 55.0, 53.0, 64.0, 78.0, 71.0, 82.0, 75.0, 86.0, 59.0, 62.0, 66.0, 35.0, 26.0, 22.0, 15.0, 14.0, 15.0, 8.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.1085205078125, -0.10619497299194336, -0.10386943817138672, -0.10154390335083008, -0.09921836853027344, -0.0968928337097168, -0.09456729888916016, -0.09224176406860352, -0.08991622924804688, -0.08759069442749023, -0.0852651596069336, -0.08293962478637695, -0.08061408996582031, -0.07828855514526367, -0.07596302032470703, -0.07363748550415039, -0.07131195068359375, -0.06898641586303711, -0.06666088104248047, -0.06433534622192383, -0.06200981140136719, -0.05968427658081055, -0.057358741760253906, -0.055033206939697266, -0.052707672119140625, -0.050382137298583984, -0.048056602478027344, -0.0457310676574707, -0.04340553283691406, -0.04107999801635742, -0.03875446319580078, -0.03642892837524414, -0.0341033935546875, -0.03177785873413086, -0.02945232391357422, -0.027126789093017578, -0.024801254272460938, -0.022475719451904297, -0.020150184631347656, -0.017824649810791016, -0.015499114990234375, -0.013173580169677734, -0.010848045349121094, -0.008522510528564453, -0.0061969757080078125, -0.003871440887451172, -0.0015459060668945312, 0.0007796287536621094, 0.00310516357421875, 0.005430698394775391, 0.007756233215332031, 0.010081768035888672, 0.012407302856445312, 0.014732837677001953, 0.017058372497558594, 0.019383907318115234, 0.021709442138671875, 0.024034976959228516, 0.026360511779785156, 0.028686046600341797, 0.031011581420898438, 0.03333711624145508, 0.03566265106201172, 0.03798818588256836, 0.040313720703125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 7.0, 3.0, 5.0, 5.0, 5.0, 16.0, 19.0, 28.0, 32.0, 64.0, 126.0, 280.0, 812.0, 3414.0, 20136.0, 274669.0, 3755645.0, 122543.0, 12888.0, 2364.0, 673.0, 240.0, 109.0, 64.0, 32.0, 24.0, 23.0, 12.0, 11.0, 4.0, 8.0, 10.0, 8.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1358642578125, -0.13071441650390625, -0.1255645751953125, -0.12041473388671875, -0.115264892578125, -0.11011505126953125, -0.1049652099609375, -0.09981536865234375, -0.09466552734375, -0.08951568603515625, -0.0843658447265625, -0.07921600341796875, -0.074066162109375, -0.06891632080078125, -0.0637664794921875, -0.05861663818359375, -0.053466796875, -0.04831695556640625, -0.0431671142578125, -0.03801727294921875, -0.032867431640625, -0.02771759033203125, -0.0225677490234375, -0.01741790771484375, -0.01226806640625, -0.00711822509765625, -0.0019683837890625, 0.00318145751953125, 0.008331298828125, 0.01348114013671875, 0.0186309814453125, 0.02378082275390625, 0.0289306640625, 0.03408050537109375, 0.0392303466796875, 0.04438018798828125, 0.049530029296875, 0.05467987060546875, 0.0598297119140625, 0.06497955322265625, 0.07012939453125, 0.07527923583984375, 0.0804290771484375, 0.08557891845703125, 0.090728759765625, 0.09587860107421875, 0.1010284423828125, 0.10617828369140625, 0.111328125, 0.11647796630859375, 0.1216278076171875, 0.12677764892578125, 0.131927490234375, 0.13707733154296875, 0.1422271728515625, 0.14737701416015625, 0.15252685546875, 0.15767669677734375, 0.1628265380859375, 0.16797637939453125, 0.173126220703125, 0.17827606201171875, 0.1834259033203125, 0.18857574462890625, 0.1937255859375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 6.0, 11.0, 9.0, 9.0, 13.0, 30.0, 28.0, 55.0, 85.0, 144.0, 270.0, 589.0, 958.0, 870.0, 427.0, 219.0, 128.0, 62.0, 37.0, 26.0, 23.0, 12.0, 10.0, 14.0, 8.0, 4.0, 5.0, 3.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1318359375, -0.12782859802246094, -0.12382125854492188, -0.11981391906738281, -0.11580657958984375, -0.11179924011230469, -0.10779190063476562, -0.10378456115722656, -0.0997772216796875, -0.09576988220214844, -0.09176254272460938, -0.08775520324707031, -0.08374786376953125, -0.07974052429199219, -0.07573318481445312, -0.07172584533691406, -0.067718505859375, -0.06371116638183594, -0.059703826904296875, -0.05569648742675781, -0.05168914794921875, -0.04768180847167969, -0.043674468994140625, -0.03966712951660156, -0.0356597900390625, -0.03165245056152344, -0.027645111083984375, -0.023637771606445312, -0.01963043212890625, -0.015623092651367188, -0.011615753173828125, -0.0076084136962890625, -0.00360107421875, 0.0004062652587890625, 0.004413604736328125, 0.008420944213867188, 0.01242828369140625, 0.016435623168945312, 0.020442962646484375, 0.024450302124023438, 0.0284576416015625, 0.03246498107910156, 0.036472320556640625, 0.04047966003417969, 0.04448699951171875, 0.04849433898925781, 0.052501678466796875, 0.05650901794433594, 0.060516357421875, 0.06452369689941406, 0.06853103637695312, 0.07253837585449219, 0.07654571533203125, 0.08055305480957031, 0.08456039428710938, 0.08856773376464844, 0.0925750732421875, 0.09658241271972656, 0.10058975219726562, 0.10459709167480469, 0.10860443115234375, 0.11261177062988281, 0.11661911010742188, 0.12062644958496094, 0.1246337890625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 1.0, 8.0, 12.0, 22.0, 27.0, 86.0, 170.0, 247.0, 188.0, 120.0, 70.0, 21.0, 6.0, 6.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6261084079742432, -1.5855979919433594, -1.545087456703186, -1.5045770406723022, -1.4640666246414185, -1.4235560894012451, -1.3830456733703613, -1.3425352573394775, -1.3020247220993042, -1.2615143060684204, -1.221003770828247, -1.1804933547973633, -1.1399829387664795, -1.0994724035263062, -1.0589619874954224, -1.018451452255249, -0.97794109582901, -0.9374306201934814, -0.8969202041625977, -0.8564097285270691, -0.8158992528915405, -0.7753888368606567, -0.7348783612251282, -0.6943678855895996, -0.6538574695587158, -0.6133469939231873, -0.5728365778923035, -0.5323261022567749, -0.49181562662124634, -0.45130518078804016, -0.410794734954834, -0.3702842593193054, -0.3297737240791321, -0.2892632782459259, -0.24875280261039734, -0.20824235677719116, -0.1677318960428238, -0.12722143530845642, -0.08671098947525024, -0.04620051383972168, -0.005690068006515503, 0.03482038900256157, 0.07533084601163864, 0.11584129929542542, 0.15635176002979279, 0.19686222076416016, 0.23737266659736633, 0.2778831422328949, 0.3183935880661011, 0.35890403389930725, 0.3994145095348358, 0.439924955368042, 0.48043543100357056, 0.5209459066390991, 0.5614563226699829, 0.6019667983055115, 0.64247727394104, 0.6829877495765686, 0.7234981656074524, 0.764008641242981, 0.8045191168785095, 0.8450295925140381, 0.8855400085449219, 0.9260504841804504, 0.9665609002113342]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 5.0, 10.0, 6.0, 20.0, 22.0, 26.0, 22.0, 36.0, 47.0, 42.0, 51.0, 41.0, 62.0, 72.0, 73.0, 65.0, 50.0, 57.0, 50.0, 37.0, 37.0, 39.0, 26.0, 25.0, 15.0, 16.0, 18.0, 14.0, 6.0, 4.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7481275200843811, -0.7273287773132324, -0.7065300345420837, -0.6857312321662903, -0.6649324893951416, -0.6441337466239929, -0.6233350038528442, -0.6025362610816956, -0.5817375183105469, -0.5609387755393982, -0.5401400327682495, -0.519341230392456, -0.4985424876213074, -0.4777437448501587, -0.45694500207901, -0.43614625930786133, -0.41534745693206787, -0.3945487141609192, -0.3737499415874481, -0.35295119881629944, -0.33215242624282837, -0.3113536834716797, -0.290554940700531, -0.2697561979293823, -0.24895742535591125, -0.22815866768360138, -0.2073599100112915, -0.18656116724014282, -0.16576240956783295, -0.14496365189552307, -0.12416490167379379, -0.10336615145206451, -0.08256733417510986, -0.061768580228090286, -0.04096982628107071, -0.020171072334051132, 0.0006276816129684448, 0.02142643928527832, 0.0422251895070076, 0.06302393972873688, 0.08382269740104675, 0.10462145507335663, 0.1254202127456665, 0.14621895551681519, 0.16701771318912506, 0.18781647086143494, 0.20861521363258362, 0.2294139713048935, 0.25021272897720337, 0.27101147174835205, 0.2918102443218231, 0.3126089870929718, 0.33340775966644287, 0.35420650243759155, 0.37500524520874023, 0.3958039879798889, 0.41660276055336, 0.43740150332450867, 0.45820027589797974, 0.4789990186691284, 0.4997977614402771, 0.5205965042114258, 0.5413953065872192, 0.5621940493583679, 0.5829927921295166]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 16.0, 21.0, 40.0, 70.0, 109.0, 189.0, 350.0, 744.0, 1551.0, 3334.0, 8277.0, 20941.0, 56492.0, 153910.0, 349550.0, 280338.0, 107178.0, 39449.0, 14942.0, 6024.0, 2575.0, 1171.0, 577.0, 304.0, 177.0, 84.0, 57.0, 40.0, 15.0, 10.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053375244140625, -0.05130815505981445, -0.049241065979003906, -0.04717397689819336, -0.04510688781738281, -0.043039798736572266, -0.04097270965576172, -0.03890562057495117, -0.036838531494140625, -0.03477144241333008, -0.03270435333251953, -0.030637264251708984, -0.028570175170898438, -0.02650308609008789, -0.024435997009277344, -0.022368907928466797, -0.02030181884765625, -0.018234729766845703, -0.016167640686035156, -0.01410055160522461, -0.012033462524414062, -0.009966373443603516, -0.007899284362792969, -0.005832195281982422, -0.003765106201171875, -0.0016980171203613281, 0.00036907196044921875, 0.0024361610412597656, 0.0045032501220703125, 0.006570339202880859, 0.008637428283691406, 0.010704517364501953, 0.0127716064453125, 0.014838695526123047, 0.016905784606933594, 0.01897287368774414, 0.021039962768554688, 0.023107051849365234, 0.02517414093017578, 0.027241230010986328, 0.029308319091796875, 0.03137540817260742, 0.03344249725341797, 0.035509586334228516, 0.03757667541503906, 0.03964376449584961, 0.041710853576660156, 0.0437779426574707, 0.04584503173828125, 0.0479121208190918, 0.049979209899902344, 0.05204629898071289, 0.05411338806152344, 0.056180477142333984, 0.05824756622314453, 0.06031465530395508, 0.062381744384765625, 0.06444883346557617, 0.06651592254638672, 0.06858301162719727, 0.07065010070800781, 0.07271718978881836, 0.0747842788696289, 0.07685136795043945, 0.07891845703125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 2.0, 1.0, 5.0, 3.0, 8.0, 12.0, 11.0, 22.0, 26.0, 27.0, 27.0, 43.0, 48.0, 46.0, 57.0, 48.0, 41.0, 62.0, 68.0, 50.0, 51.0, 45.0, 42.0, 46.0, 32.0, 38.0, 35.0, 22.0, 21.0, 20.0, 15.0, 12.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.0706787109375, -0.06903934478759766, -0.06739997863769531, -0.06576061248779297, -0.06412124633789062, -0.06248188018798828, -0.06084251403808594, -0.059203147888183594, -0.05756378173828125, -0.055924415588378906, -0.05428504943847656, -0.05264568328857422, -0.051006317138671875, -0.04936695098876953, -0.04772758483886719, -0.046088218688964844, -0.0444488525390625, -0.042809486389160156, -0.04117012023925781, -0.03953075408935547, -0.037891387939453125, -0.03625202178955078, -0.03461265563964844, -0.032973289489746094, -0.03133392333984375, -0.029694557189941406, -0.028055191040039062, -0.02641582489013672, -0.024776458740234375, -0.02313709259033203, -0.021497726440429688, -0.019858360290527344, -0.018218994140625, -0.016579627990722656, -0.014940261840820312, -0.013300895690917969, -0.011661529541015625, -0.010022163391113281, -0.008382797241210938, -0.006743431091308594, -0.00510406494140625, -0.0034646987915039062, -0.0018253326416015625, -0.00018596649169921875, 0.001453399658203125, 0.0030927658081054688, 0.0047321319580078125, 0.006371498107910156, 0.0080108642578125, 0.009650230407714844, 0.011289596557617188, 0.012928962707519531, 0.014568328857421875, 0.01620769500732422, 0.017847061157226562, 0.019486427307128906, 0.02112579345703125, 0.022765159606933594, 0.024404525756835938, 0.02604389190673828, 0.027683258056640625, 0.02932262420654297, 0.030961990356445312, 0.032601356506347656, 0.03424072265625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 5.0, 7.0, 8.0, 15.0, 28.0, 38.0, 45.0, 70.0, 114.0, 171.0, 241.0, 469.0, 925.0, 1969.0, 6159.0, 61579.0, 873042.0, 91678.0, 7490.0, 2180.0, 937.0, 551.0, 309.0, 173.0, 127.0, 72.0, 56.0, 27.0, 21.0, 16.0, 8.0, 3.0, 7.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2166748046875, -0.2102184295654297, -0.20376205444335938, -0.19730567932128906, -0.19084930419921875, -0.18439292907714844, -0.17793655395507812, -0.1714801788330078, -0.1650238037109375, -0.1585674285888672, -0.15211105346679688, -0.14565467834472656, -0.13919830322265625, -0.13274192810058594, -0.12628555297851562, -0.11982917785644531, -0.113372802734375, -0.10691642761230469, -0.10046005249023438, -0.09400367736816406, -0.08754730224609375, -0.08109092712402344, -0.07463455200195312, -0.06817817687988281, -0.0617218017578125, -0.05526542663574219, -0.048809051513671875, -0.04235267639160156, -0.03589630126953125, -0.029439926147460938, -0.022983551025390625, -0.016527175903320312, -0.01007080078125, -0.0036144256591796875, 0.002841949462890625, 0.009298324584960938, 0.01575469970703125, 0.022211074829101562, 0.028667449951171875, 0.03512382507324219, 0.0415802001953125, 0.04803657531738281, 0.054492950439453125, 0.06094932556152344, 0.06740570068359375, 0.07386207580566406, 0.08031845092773438, 0.08677482604980469, 0.093231201171875, 0.09968757629394531, 0.10614395141601562, 0.11260032653808594, 0.11905670166015625, 0.12551307678222656, 0.13196945190429688, 0.1384258270263672, 0.1448822021484375, 0.1513385772705078, 0.15779495239257812, 0.16425132751464844, 0.17070770263671875, 0.17716407775878906, 0.18362045288085938, 0.1900768280029297, 0.196533203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 4.0, 8.0, 12.0, 20.0, 15.0, 34.0, 23.0, 26.0, 22.0, 39.0, 37.0, 32.0, 46.0, 55.0, 51.0, 42.0, 57.0, 50.0, 59.0, 40.0, 51.0, 47.0, 30.0, 31.0, 28.0, 25.0, 21.0, 19.0, 11.0, 13.0, 11.0, 7.0, 5.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1732177734375, -0.16698837280273438, -0.16075897216796875, -0.15452957153320312, -0.1483001708984375, -0.14207077026367188, -0.13584136962890625, -0.12961196899414062, -0.123382568359375, -0.11715316772460938, -0.11092376708984375, -0.10469436645507812, -0.0984649658203125, -0.09223556518554688, -0.08600616455078125, -0.07977676391601562, -0.07354736328125, -0.06731796264648438, -0.06108856201171875, -0.054859161376953125, -0.0486297607421875, -0.042400360107421875, -0.03617095947265625, -0.029941558837890625, -0.023712158203125, -0.017482757568359375, -0.01125335693359375, -0.005023956298828125, 0.0012054443359375, 0.007434844970703125, 0.01366424560546875, 0.019893646240234375, 0.026123046875, 0.032352447509765625, 0.03858184814453125, 0.044811248779296875, 0.0510406494140625, 0.057270050048828125, 0.06349945068359375, 0.06972885131835938, 0.075958251953125, 0.08218765258789062, 0.08841705322265625, 0.09464645385742188, 0.1008758544921875, 0.10710525512695312, 0.11333465576171875, 0.11956405639648438, 0.12579345703125, 0.13202285766601562, 0.13825225830078125, 0.14448165893554688, 0.1507110595703125, 0.15694046020507812, 0.16316986083984375, 0.16939926147460938, 0.175628662109375, 0.18185806274414062, 0.18808746337890625, 0.19431686401367188, 0.2005462646484375, 0.20677566528320312, 0.21300506591796875, 0.21923446655273438, 0.2254638671875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 8.0, 3.0, 2.0, 7.0, 9.0, 14.0, 18.0, 28.0, 61.0, 77.0, 155.0, 291.0, 554.0, 1452.0, 4818.0, 30999.0, 740901.0, 246969.0, 16745.0, 3344.0, 1078.0, 474.0, 221.0, 114.0, 75.0, 34.0, 30.0, 24.0, 15.0, 10.0, 8.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10540771484375, -0.10219955444335938, -0.09899139404296875, -0.09578323364257812, -0.0925750732421875, -0.08936691284179688, -0.08615875244140625, -0.08295059204101562, -0.079742431640625, -0.07653427124023438, -0.07332611083984375, -0.07011795043945312, -0.0669097900390625, -0.06370162963867188, -0.06049346923828125, -0.057285308837890625, -0.0540771484375, -0.050868988037109375, -0.04766082763671875, -0.044452667236328125, -0.0412445068359375, -0.038036346435546875, -0.03482818603515625, -0.031620025634765625, -0.028411865234375, -0.025203704833984375, -0.02199554443359375, -0.018787384033203125, -0.0155792236328125, -0.012371063232421875, -0.00916290283203125, -0.005954742431640625, -0.00274658203125, 0.000461578369140625, 0.00366973876953125, 0.006877899169921875, 0.0100860595703125, 0.013294219970703125, 0.01650238037109375, 0.019710540771484375, 0.022918701171875, 0.026126861572265625, 0.02933502197265625, 0.032543182373046875, 0.0357513427734375, 0.038959503173828125, 0.04216766357421875, 0.045375823974609375, 0.048583984375, 0.051792144775390625, 0.05500030517578125, 0.058208465576171875, 0.0614166259765625, 0.06462478637695312, 0.06783294677734375, 0.07104110717773438, 0.074249267578125, 0.07745742797851562, 0.08066558837890625, 0.08387374877929688, 0.0870819091796875, 0.09029006958007812, 0.09349822998046875, 0.09670639038085938, 0.09991455078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 8.0, 7.0, 5.0, 3.0, 6.0, 8.0, 17.0, 15.0, 16.0, 16.0, 24.0, 41.0, 44.0, 62.0, 90.0, 107.0, 111.0, 85.0, 85.0, 59.0, 45.0, 32.0, 25.0, 17.0, 11.0, 8.0, 16.0, 5.0, 7.0, 7.0, 9.0, 7.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.451108932495117e-05, -3.308989107608795e-05, -3.166869282722473e-05, -3.024749457836151e-05, -2.882629632949829e-05, -2.740509808063507e-05, -2.598389983177185e-05, -2.456270158290863e-05, -2.314150333404541e-05, -2.172030508518219e-05, -2.029910683631897e-05, -1.887790858745575e-05, -1.745671033859253e-05, -1.603551208972931e-05, -1.4614313840866089e-05, -1.3193115592002869e-05, -1.1771917343139648e-05, -1.0350719094276428e-05, -8.929520845413208e-06, -7.508322596549988e-06, -6.087124347686768e-06, -4.665926098823547e-06, -3.244727849960327e-06, -1.823529601097107e-06, -4.023313522338867e-07, 1.0188668966293335e-06, 2.4400651454925537e-06, 3.861263394355774e-06, 5.282461643218994e-06, 6.703659892082214e-06, 8.124858140945435e-06, 9.546056389808655e-06, 1.0967254638671875e-05, 1.2388452887535095e-05, 1.3809651136398315e-05, 1.5230849385261536e-05, 1.6652047634124756e-05, 1.8073245882987976e-05, 1.9494444131851196e-05, 2.0915642380714417e-05, 2.2336840629577637e-05, 2.3758038878440857e-05, 2.5179237127304077e-05, 2.6600435376167297e-05, 2.8021633625030518e-05, 2.9442831873893738e-05, 3.086403012275696e-05, 3.228522837162018e-05, 3.37064266204834e-05, 3.512762486934662e-05, 3.654882311820984e-05, 3.797002136707306e-05, 3.939121961593628e-05, 4.08124178647995e-05, 4.223361611366272e-05, 4.365481436252594e-05, 4.507601261138916e-05, 4.649721086025238e-05, 4.79184091091156e-05, 4.933960735797882e-05, 5.076080560684204e-05, 5.218200385570526e-05, 5.360320210456848e-05, 5.50244003534317e-05, 5.644559860229492e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 9.0, 7.0, 14.0, 19.0, 16.0, 29.0, 39.0, 54.0, 118.0, 174.0, 294.0, 517.0, 1020.0, 2306.0, 8607.0, 65321.0, 815029.0, 135105.0, 13935.0, 3281.0, 1226.0, 635.0, 301.0, 184.0, 116.0, 61.0, 49.0, 35.0, 15.0, 10.0, 10.0, 2.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.099609375, -0.0966482162475586, -0.09368705749511719, -0.09072589874267578, -0.08776473999023438, -0.08480358123779297, -0.08184242248535156, -0.07888126373291016, -0.07592010498046875, -0.07295894622802734, -0.06999778747558594, -0.06703662872314453, -0.06407546997070312, -0.06111431121826172, -0.05815315246582031, -0.055191993713378906, -0.0522308349609375, -0.049269676208496094, -0.04630851745605469, -0.04334735870361328, -0.040386199951171875, -0.03742504119873047, -0.03446388244628906, -0.031502723693847656, -0.02854156494140625, -0.025580406188964844, -0.022619247436523438, -0.01965808868408203, -0.016696929931640625, -0.013735771179199219, -0.010774612426757812, -0.007813453674316406, -0.004852294921875, -0.0018911361694335938, 0.0010700225830078125, 0.004031181335449219, 0.006992340087890625, 0.009953498840332031, 0.012914657592773438, 0.015875816345214844, 0.01883697509765625, 0.021798133850097656, 0.024759292602539062, 0.02772045135498047, 0.030681610107421875, 0.03364276885986328, 0.03660392761230469, 0.039565086364746094, 0.0425262451171875, 0.045487403869628906, 0.04844856262207031, 0.05140972137451172, 0.054370880126953125, 0.05733203887939453, 0.06029319763183594, 0.06325435638427734, 0.06621551513671875, 0.06917667388916016, 0.07213783264160156, 0.07509899139404297, 0.07806015014648438, 0.08102130889892578, 0.08398246765136719, 0.0869436264038086, 0.08990478515625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 8.0, 8.0, 13.0, 15.0, 17.0, 24.0, 26.0, 40.0, 41.0, 61.0, 73.0, 75.0, 88.0, 110.0, 81.0, 59.0, 62.0, 44.0, 32.0, 28.0, 24.0, 24.0, 13.0, 10.0, 7.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04937744140625, -0.047245025634765625, -0.04511260986328125, -0.042980194091796875, -0.0408477783203125, -0.038715362548828125, -0.03658294677734375, -0.034450531005859375, -0.032318115234375, -0.030185699462890625, -0.02805328369140625, -0.025920867919921875, -0.0237884521484375, -0.021656036376953125, -0.01952362060546875, -0.017391204833984375, -0.0152587890625, -0.013126373291015625, -0.01099395751953125, -0.008861541748046875, -0.0067291259765625, -0.004596710205078125, -0.00246429443359375, -0.000331878662109375, 0.001800537109375, 0.003932952880859375, 0.00606536865234375, 0.008197784423828125, 0.0103302001953125, 0.012462615966796875, 0.01459503173828125, 0.016727447509765625, 0.01885986328125, 0.020992279052734375, 0.02312469482421875, 0.025257110595703125, 0.0273895263671875, 0.029521942138671875, 0.03165435791015625, 0.033786773681640625, 0.035919189453125, 0.038051605224609375, 0.04018402099609375, 0.042316436767578125, 0.0444488525390625, 0.046581268310546875, 0.04871368408203125, 0.050846099853515625, 0.052978515625, 0.055110931396484375, 0.05724334716796875, 0.059375762939453125, 0.0615081787109375, 0.06364059448242188, 0.06577301025390625, 0.06790542602539062, 0.070037841796875, 0.07217025756835938, 0.07430267333984375, 0.07643508911132812, 0.0785675048828125, 0.08069992065429688, 0.08283233642578125, 0.08496475219726562, 0.08709716796875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 9.0, 9.0, 13.0, 40.0, 87.0, 158.0, 250.0, 223.0, 117.0, 54.0, 18.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9582399129867554, -1.9145997762680054, -1.8709596395492554, -1.8273195028305054, -1.7836793661117554, -1.7400391101837158, -1.6963989734649658, -1.6527588367462158, -1.6091187000274658, -1.5654785633087158, -1.5218384265899658, -1.4781982898712158, -1.4345581531524658, -1.3909180164337158, -1.3472778797149658, -1.3036376237869263, -1.2599976062774658, -1.2163574695587158, -1.1727173328399658, -1.1290771961212158, -1.0854370594024658, -1.0417969226837158, -0.998156726360321, -0.9545165300369263, -0.9108763933181763, -0.8672362565994263, -0.8235961198806763, -0.7799559831619263, -0.7363157868385315, -0.6926756501197815, -0.6490355134010315, -0.6053953170776367, -0.5617551803588867, -0.5181150436401367, -0.47447487711906433, -0.43083474040031433, -0.38719457387924194, -0.34355443716049194, -0.29991430044174194, -0.25627413392066956, -0.21263399720191956, -0.16899384558200836, -0.12535369396209717, -0.08171355724334717, -0.038073405623435974, 0.00556674599647522, 0.04920688271522522, 0.09284704923629761, 0.1364871859550476, 0.1801273375749588, 0.22376748919487, 0.26740762591362, 0.3110477924346924, 0.3546879291534424, 0.3983280658721924, 0.44196823239326477, 0.48560836911201477, 0.5292485356330872, 0.5728886723518372, 0.6165288090705872, 0.6601689457893372, 0.7038091421127319, 0.7474492788314819, 0.7910894155502319, 0.8347295522689819]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 4.0, 1.0, 5.0, 7.0, 7.0, 7.0, 14.0, 18.0, 19.0, 19.0, 16.0, 25.0, 27.0, 42.0, 37.0, 43.0, 47.0, 47.0, 54.0, 68.0, 43.0, 46.0, 55.0, 48.0, 43.0, 38.0, 28.0, 28.0, 24.0, 28.0, 20.0, 20.0, 15.0, 12.0, 6.0, 12.0, 9.0, 8.0, 7.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5854082107543945, -0.5636565089225769, -0.541904866695404, -0.5201531648635864, -0.4984014928340912, -0.47664982080459595, -0.4548981189727783, -0.4331464469432831, -0.41139477491378784, -0.3896431028842926, -0.36789143085479736, -0.34613972902297974, -0.3243880569934845, -0.30263638496398926, -0.28088468313217163, -0.2591330111026764, -0.23738133907318115, -0.2156296670436859, -0.19387798011302948, -0.17212629318237305, -0.1503746211528778, -0.12862294912338257, -0.10687126219272614, -0.0851195752620697, -0.06336790323257446, -0.04161622375249863, -0.01986454427242279, 0.0018871352076530457, 0.023638814687728882, 0.04539049416780472, 0.06714217364788055, 0.08889386057853699, 0.11064547300338745, 0.1323971450328827, 0.15414883196353912, 0.17590051889419556, 0.1976521909236908, 0.21940386295318604, 0.24115554988384247, 0.2629072368144989, 0.28465890884399414, 0.3064105808734894, 0.3281622529029846, 0.34991395473480225, 0.3716656267642975, 0.3934172987937927, 0.41516900062561035, 0.4369206726551056, 0.45867234468460083, 0.48042401671409607, 0.5021756887435913, 0.5239273905754089, 0.5456790924072266, 0.5674307346343994, 0.589182436466217, 0.6109341382980347, 0.6326857805252075, 0.6544374823570251, 0.676189124584198, 0.6979408264160156, 0.7196924686431885, 0.7414441704750061, 0.7631958723068237, 0.7849475145339966, 0.8066992163658142]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 9.0, 8.0, 6.0, 12.0, 20.0, 20.0, 27.0, 31.0, 35.0, 65.0, 74.0, 105.0, 139.0, 264.0, 771.0, 20920.0, 4140782.0, 29391.0, 786.0, 232.0, 148.0, 95.0, 78.0, 62.0, 48.0, 32.0, 27.0, 26.0, 20.0, 6.0, 13.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.33251953125, -0.321258544921875, -0.30999755859375, -0.298736572265625, -0.2874755859375, -0.276214599609375, -0.26495361328125, -0.253692626953125, -0.242431640625, -0.231170654296875, -0.21990966796875, -0.208648681640625, -0.1973876953125, -0.186126708984375, -0.17486572265625, -0.163604736328125, -0.15234375, -0.141082763671875, -0.12982177734375, -0.118560791015625, -0.1072998046875, -0.096038818359375, -0.08477783203125, -0.073516845703125, -0.062255859375, -0.050994873046875, -0.03973388671875, -0.028472900390625, -0.0172119140625, -0.005950927734375, 0.00531005859375, 0.016571044921875, 0.02783203125, 0.039093017578125, 0.05035400390625, 0.061614990234375, 0.0728759765625, 0.084136962890625, 0.09539794921875, 0.106658935546875, 0.117919921875, 0.129180908203125, 0.14044189453125, 0.151702880859375, 0.1629638671875, 0.174224853515625, 0.18548583984375, 0.196746826171875, 0.2080078125, 0.219268798828125, 0.23052978515625, 0.241790771484375, 0.2530517578125, 0.264312744140625, 0.27557373046875, 0.286834716796875, 0.298095703125, 0.309356689453125, 0.32061767578125, 0.331878662109375, 0.3431396484375, 0.354400634765625, 0.36566162109375, 0.376922607421875, 0.38818359375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 7.0, 7.0, 7.0, 7.0, 15.0, 16.0, 25.0, 19.0, 22.0, 27.0, 31.0, 37.0, 33.0, 37.0, 40.0, 55.0, 48.0, 41.0, 54.0, 51.0, 51.0, 44.0, 60.0, 31.0, 40.0, 32.0, 25.0, 27.0, 19.0, 18.0, 17.0, 11.0, 9.0, 7.0, 10.0, 9.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0484619140625, -0.04712867736816406, -0.045795440673828125, -0.04446220397949219, -0.04312896728515625, -0.04179573059082031, -0.040462493896484375, -0.03912925720214844, -0.0377960205078125, -0.03646278381347656, -0.035129547119140625, -0.03379631042480469, -0.03246307373046875, -0.031129837036132812, -0.029796600341796875, -0.028463363647460938, -0.027130126953125, -0.025796890258789062, -0.024463653564453125, -0.023130416870117188, -0.02179718017578125, -0.020463943481445312, -0.019130706787109375, -0.017797470092773438, -0.0164642333984375, -0.015130996704101562, -0.013797760009765625, -0.012464523315429688, -0.01113128662109375, -0.009798049926757812, -0.008464813232421875, -0.0071315765380859375, -0.00579833984375, -0.0044651031494140625, -0.003131866455078125, -0.0017986297607421875, -0.00046539306640625, 0.0008678436279296875, 0.002201080322265625, 0.0035343170166015625, 0.0048675537109375, 0.0062007904052734375, 0.007534027099609375, 0.008867263793945312, 0.01020050048828125, 0.011533737182617188, 0.012866973876953125, 0.014200210571289062, 0.015533447265625, 0.016866683959960938, 0.018199920654296875, 0.019533157348632812, 0.02086639404296875, 0.022199630737304688, 0.023532867431640625, 0.024866104125976562, 0.0261993408203125, 0.027532577514648438, 0.028865814208984375, 0.030199050903320312, 0.03153228759765625, 0.03286552429199219, 0.034198760986328125, 0.03553199768066406, 0.036865234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 6.0, 7.0, 9.0, 12.0, 20.0, 39.0, 56.0, 129.0, 263.0, 602.0, 1590.0, 4647.0, 18404.0, 106749.0, 1977667.0, 1947059.0, 108867.0, 19802.0, 5377.0, 1782.0, 632.0, 280.0, 120.0, 81.0, 28.0, 21.0, 9.0, 8.0, 5.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09552001953125, -0.09222602844238281, -0.08893203735351562, -0.08563804626464844, -0.08234405517578125, -0.07905006408691406, -0.07575607299804688, -0.07246208190917969, -0.0691680908203125, -0.06587409973144531, -0.06258010864257812, -0.05928611755371094, -0.05599212646484375, -0.05269813537597656, -0.049404144287109375, -0.04611015319824219, -0.042816162109375, -0.03952217102050781, -0.036228179931640625, -0.03293418884277344, -0.02964019775390625, -0.026346206665039062, -0.023052215576171875, -0.019758224487304688, -0.0164642333984375, -0.013170242309570312, -0.009876251220703125, -0.0065822601318359375, -0.00328826904296875, 5.7220458984375e-06, 0.003299713134765625, 0.0065937042236328125, 0.0098876953125, 0.013181686401367188, 0.016475677490234375, 0.019769668579101562, 0.02306365966796875, 0.026357650756835938, 0.029651641845703125, 0.03294563293457031, 0.0362396240234375, 0.03953361511230469, 0.042827606201171875, 0.04612159729003906, 0.04941558837890625, 0.05270957946777344, 0.056003570556640625, 0.05929756164550781, 0.062591552734375, 0.06588554382324219, 0.06917953491210938, 0.07247352600097656, 0.07576751708984375, 0.07906150817871094, 0.08235549926757812, 0.08564949035644531, 0.0889434814453125, 0.09223747253417969, 0.09553146362304688, 0.09882545471191406, 0.10211944580078125, 0.10541343688964844, 0.10870742797851562, 0.11200141906738281, 0.11529541015625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 6.0, 6.0, 8.0, 16.0, 15.0, 29.0, 38.0, 52.0, 84.0, 144.0, 206.0, 330.0, 491.0, 639.0, 616.0, 472.0, 322.0, 194.0, 108.0, 69.0, 44.0, 32.0, 32.0, 27.0, 22.0, 12.0, 14.0, 8.0, 6.0, 6.0, 5.0, 4.0, 7.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.09100341796875, -0.08832454681396484, -0.08564567565917969, -0.08296680450439453, -0.08028793334960938, -0.07760906219482422, -0.07493019104003906, -0.0722513198852539, -0.06957244873046875, -0.0668935775756836, -0.06421470642089844, -0.06153583526611328, -0.058856964111328125, -0.05617809295654297, -0.05349922180175781, -0.050820350646972656, -0.0481414794921875, -0.045462608337402344, -0.04278373718261719, -0.04010486602783203, -0.037425994873046875, -0.03474712371826172, -0.03206825256347656, -0.029389381408691406, -0.02671051025390625, -0.024031639099121094, -0.021352767944335938, -0.01867389678955078, -0.015995025634765625, -0.013316154479980469, -0.010637283325195312, -0.007958412170410156, -0.005279541015625, -0.0026006698608398438, 7.82012939453125e-05, 0.0027570724487304688, 0.005435943603515625, 0.008114814758300781, 0.010793685913085938, 0.013472557067871094, 0.01615142822265625, 0.018830299377441406, 0.021509170532226562, 0.02418804168701172, 0.026866912841796875, 0.02954578399658203, 0.03222465515136719, 0.034903526306152344, 0.0375823974609375, 0.040261268615722656, 0.04294013977050781, 0.04561901092529297, 0.048297882080078125, 0.05097675323486328, 0.05365562438964844, 0.056334495544433594, 0.05901336669921875, 0.061692237854003906, 0.06437110900878906, 0.06704998016357422, 0.06972885131835938, 0.07240772247314453, 0.07508659362792969, 0.07776546478271484, 0.0804443359375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 6.0, 9.0, 9.0, 5.0, 15.0, 46.0, 163.0, 368.0, 276.0, 91.0, 9.0, 7.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9128963947296143, -1.8579959869384766, -1.8030955791473389, -1.7481952905654907, -1.693294882774353, -1.6383944749832153, -1.5834941864013672, -1.5285937786102295, -1.4736933708190918, -1.418792963027954, -1.3638925552368164, -1.3089922666549683, -1.2540918588638306, -1.1991914510726929, -1.1442911624908447, -1.089390754699707, -1.0344903469085693, -0.9795899391174316, -0.9246895909309387, -0.8697892427444458, -0.8148888349533081, -0.7599884271621704, -0.7050880789756775, -0.6501877307891846, -0.5952873229980469, -0.5403869152069092, -0.48548656702041626, -0.43058618903160095, -0.37568581104278564, -0.32078543305397034, -0.26588505506515503, -0.21098467707633972, -0.15608429908752441, -0.1011839210987091, -0.0462835431098938, 0.008616834878921509, 0.06351721286773682, 0.11841759085655212, 0.17331796884536743, 0.22821834683418274, 0.28311872482299805, 0.33801910281181335, 0.39291948080062866, 0.44781985878944397, 0.5027202367782593, 0.557620644569397, 0.6125209927558899, 0.6674213409423828, 0.7223217487335205, 0.7772221565246582, 0.8321225047111511, 0.887022852897644, 0.9419232606887817, 0.9968236684799194, 1.0517239570617676, 1.1066243648529053, 1.161524772644043, 1.2164251804351807, 1.2713255882263184, 1.3262258768081665, 1.3811262845993042, 1.436026692390442, 1.49092698097229, 1.5458273887634277, 1.6007277965545654]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 12.0, 13.0, 24.0, 23.0, 31.0, 32.0, 53.0, 54.0, 66.0, 85.0, 65.0, 81.0, 81.0, 74.0, 74.0, 52.0, 40.0, 41.0, 29.0, 22.0, 17.0, 16.0, 10.0, 6.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4439486265182495, -0.4232630431652069, -0.4025774598121643, -0.3818918764591217, -0.3612062931060791, -0.3405207395553589, -0.3198351562023163, -0.2991495728492737, -0.2784639894962311, -0.2577784061431885, -0.23709282279014587, -0.21640725433826447, -0.19572167098522186, -0.17503608763217926, -0.15435051918029785, -0.13366493582725525, -0.11297935247421265, -0.09229376912117004, -0.07160819321870804, -0.050922613590955734, -0.03023703396320343, -0.009551450610160828, 0.011134125292301178, 0.031819701194763184, 0.052505284547805786, 0.07319086790084839, 0.0938764438033104, 0.1145620197057724, 0.135247603058815, 0.1559331864118576, 0.176618754863739, 0.19730433821678162, 0.21798992156982422, 0.23867550492286682, 0.2593610882759094, 0.280046671628952, 0.30073225498199463, 0.32141780853271484, 0.34210339188575745, 0.36278897523880005, 0.38347455859184265, 0.40416014194488525, 0.42484572529792786, 0.44553130865097046, 0.4662168622016907, 0.48690247535705566, 0.5075880289077759, 0.5282735824584961, 0.5489591956138611, 0.5696447491645813, 0.5903303623199463, 0.6110159158706665, 0.6317015290260315, 0.6523870825767517, 0.6730726957321167, 0.6937582492828369, 0.7144438028335571, 0.7351293563842773, 0.7558149695396423, 0.7765005230903625, 0.7971861362457275, 0.8178716897964478, 0.8385573029518127, 0.859242856502533, 0.879928469657898]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 7.0, 11.0, 10.0, 8.0, 14.0, 15.0, 22.0, 43.0, 60.0, 112.0, 157.0, 258.0, 420.0, 767.0, 1471.0, 2904.0, 5706.0, 12177.0, 27879.0, 69168.0, 185798.0, 362175.0, 231147.0, 85740.0, 33658.0, 14767.0, 6885.0, 3340.0, 1720.0, 876.0, 479.0, 266.0, 183.0, 108.0, 54.0, 43.0, 35.0, 23.0, 16.0, 12.0, 7.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.050811767578125, -0.04897165298461914, -0.04713153839111328, -0.04529142379760742, -0.04345130920410156, -0.0416111946105957, -0.039771080017089844, -0.037930965423583984, -0.036090850830078125, -0.034250736236572266, -0.032410621643066406, -0.030570507049560547, -0.028730392456054688, -0.026890277862548828, -0.02505016326904297, -0.02321004867553711, -0.02136993408203125, -0.01952981948852539, -0.01768970489501953, -0.015849590301513672, -0.014009475708007812, -0.012169361114501953, -0.010329246520996094, -0.008489131927490234, -0.006649017333984375, -0.004808902740478516, -0.0029687881469726562, -0.0011286735534667969, 0.0007114410400390625, 0.002551555633544922, 0.004391670227050781, 0.006231784820556641, 0.0080718994140625, 0.00991201400756836, 0.011752128601074219, 0.013592243194580078, 0.015432357788085938, 0.017272472381591797, 0.019112586975097656, 0.020952701568603516, 0.022792816162109375, 0.024632930755615234, 0.026473045349121094, 0.028313159942626953, 0.030153274536132812, 0.03199338912963867, 0.03383350372314453, 0.03567361831665039, 0.03751373291015625, 0.03935384750366211, 0.04119396209716797, 0.04303407669067383, 0.04487419128417969, 0.04671430587768555, 0.048554420471191406, 0.050394535064697266, 0.052234649658203125, 0.054074764251708984, 0.055914878845214844, 0.0577549934387207, 0.05959510803222656, 0.06143522262573242, 0.06327533721923828, 0.06511545181274414, 0.06695556640625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 5.0, 9.0, 16.0, 7.0, 13.0, 16.0, 15.0, 19.0, 31.0, 27.0, 39.0, 34.0, 31.0, 34.0, 45.0, 54.0, 38.0, 50.0, 57.0, 44.0, 42.0, 41.0, 38.0, 32.0, 39.0, 36.0, 28.0, 28.0, 23.0, 13.0, 21.0, 7.0, 17.0, 10.0, 11.0, 4.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.04931640625, -0.04795074462890625, -0.0465850830078125, -0.04521942138671875, -0.043853759765625, -0.04248809814453125, -0.0411224365234375, -0.03975677490234375, -0.03839111328125, -0.03702545166015625, -0.0356597900390625, -0.03429412841796875, -0.032928466796875, -0.03156280517578125, -0.0301971435546875, -0.02883148193359375, -0.0274658203125, -0.02610015869140625, -0.0247344970703125, -0.02336883544921875, -0.022003173828125, -0.02063751220703125, -0.0192718505859375, -0.01790618896484375, -0.01654052734375, -0.01517486572265625, -0.0138092041015625, -0.01244354248046875, -0.011077880859375, -0.00971221923828125, -0.0083465576171875, -0.00698089599609375, -0.005615234375, -0.00424957275390625, -0.0028839111328125, -0.00151824951171875, -0.000152587890625, 0.00121307373046875, 0.0025787353515625, 0.00394439697265625, 0.00531005859375, 0.00667572021484375, 0.0080413818359375, 0.00940704345703125, 0.010772705078125, 0.01213836669921875, 0.0135040283203125, 0.01486968994140625, 0.0162353515625, 0.01760101318359375, 0.0189666748046875, 0.02033233642578125, 0.021697998046875, 0.02306365966796875, 0.0244293212890625, 0.02579498291015625, 0.02716064453125, 0.02852630615234375, 0.0298919677734375, 0.03125762939453125, 0.032623291015625, 0.03398895263671875, 0.0353546142578125, 0.03672027587890625, 0.0380859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 10.0, 10.0, 13.0, 14.0, 29.0, 43.0, 65.0, 106.0, 183.0, 336.0, 633.0, 1543.0, 5412.0, 38691.0, 774107.0, 208506.0, 13910.0, 2816.0, 1019.0, 474.0, 244.0, 134.0, 86.0, 47.0, 40.0, 25.0, 13.0, 5.0, 9.0, 8.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1986083984375, -0.1925487518310547, -0.18648910522460938, -0.18042945861816406, -0.17436981201171875, -0.16831016540527344, -0.16225051879882812, -0.1561908721923828, -0.1501312255859375, -0.1440715789794922, -0.13801193237304688, -0.13195228576660156, -0.12589263916015625, -0.11983299255371094, -0.11377334594726562, -0.10771369934082031, -0.101654052734375, -0.09559440612792969, -0.08953475952148438, -0.08347511291503906, -0.07741546630859375, -0.07135581970214844, -0.06529617309570312, -0.05923652648925781, -0.0531768798828125, -0.04711723327636719, -0.041057586669921875, -0.03499794006347656, -0.02893829345703125, -0.022878646850585938, -0.016819000244140625, -0.010759353637695312, -0.00469970703125, 0.0013599395751953125, 0.007419586181640625, 0.013479232788085938, 0.01953887939453125, 0.025598526000976562, 0.031658172607421875, 0.03771781921386719, 0.0437774658203125, 0.04983711242675781, 0.055896759033203125, 0.06195640563964844, 0.06801605224609375, 0.07407569885253906, 0.08013534545898438, 0.08619499206542969, 0.092254638671875, 0.09831428527832031, 0.10437393188476562, 0.11043357849121094, 0.11649322509765625, 0.12255287170410156, 0.12861251831054688, 0.1346721649169922, 0.1407318115234375, 0.1467914581298828, 0.15285110473632812, 0.15891075134277344, 0.16497039794921875, 0.17103004455566406, 0.17708969116210938, 0.1831493377685547, 0.189208984375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 9.0, 12.0, 8.0, 8.0, 10.0, 15.0, 19.0, 25.0, 17.0, 38.0, 24.0, 35.0, 21.0, 44.0, 36.0, 50.0, 38.0, 34.0, 37.0, 34.0, 48.0, 47.0, 33.0, 52.0, 41.0, 26.0, 21.0, 23.0, 19.0, 32.0, 18.0, 14.0, 11.0, 14.0, 13.0, 7.0, 7.0, 10.0, 11.0, 5.0, 5.0, 5.0, 3.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1385498046875, -0.13378524780273438, -0.12902069091796875, -0.12425613403320312, -0.1194915771484375, -0.11472702026367188, -0.10996246337890625, -0.10519790649414062, -0.100433349609375, -0.09566879272460938, -0.09090423583984375, -0.08613967895507812, -0.0813751220703125, -0.07661056518554688, -0.07184600830078125, -0.06708145141601562, -0.06231689453125, -0.057552337646484375, -0.05278778076171875, -0.048023223876953125, -0.0432586669921875, -0.038494110107421875, -0.03372955322265625, -0.028964996337890625, -0.024200439453125, -0.019435882568359375, -0.01467132568359375, -0.009906768798828125, -0.0051422119140625, -0.000377655029296875, 0.00438690185546875, 0.009151458740234375, 0.013916015625, 0.018680572509765625, 0.02344512939453125, 0.028209686279296875, 0.0329742431640625, 0.037738800048828125, 0.04250335693359375, 0.047267913818359375, 0.052032470703125, 0.056797027587890625, 0.06156158447265625, 0.06632614135742188, 0.0710906982421875, 0.07585525512695312, 0.08061981201171875, 0.08538436889648438, 0.09014892578125, 0.09491348266601562, 0.09967803955078125, 0.10444259643554688, 0.1092071533203125, 0.11397171020507812, 0.11873626708984375, 0.12350082397460938, 0.128265380859375, 0.13302993774414062, 0.13779449462890625, 0.14255905151367188, 0.1473236083984375, 0.15208816528320312, 0.15685272216796875, 0.16161727905273438, 0.1663818359375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 7.0, 14.0, 28.0, 31.0, 37.0, 84.0, 146.0, 395.0, 1209.0, 6574.0, 138431.0, 875810.0, 22184.0, 2506.0, 623.0, 224.0, 95.0, 52.0, 26.0, 18.0, 16.0, 7.0, 9.0, 8.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.145751953125, -0.14108657836914062, -0.13642120361328125, -0.13175582885742188, -0.1270904541015625, -0.12242507934570312, -0.11775970458984375, -0.11309432983398438, -0.108428955078125, -0.10376358032226562, -0.09909820556640625, -0.09443283081054688, -0.0897674560546875, -0.08510208129882812, -0.08043670654296875, -0.07577133178710938, -0.07110595703125, -0.06644058227539062, -0.06177520751953125, -0.057109832763671875, -0.0524444580078125, -0.047779083251953125, -0.04311370849609375, -0.038448333740234375, -0.033782958984375, -0.029117584228515625, -0.02445220947265625, -0.019786834716796875, -0.0151214599609375, -0.010456085205078125, -0.00579071044921875, -0.001125335693359375, 0.0035400390625, 0.008205413818359375, 0.01287078857421875, 0.017536163330078125, 0.0222015380859375, 0.026866912841796875, 0.03153228759765625, 0.036197662353515625, 0.040863037109375, 0.045528411865234375, 0.05019378662109375, 0.054859161376953125, 0.0595245361328125, 0.06418991088867188, 0.06885528564453125, 0.07352066040039062, 0.07818603515625, 0.08285140991210938, 0.08751678466796875, 0.09218215942382812, 0.0968475341796875, 0.10151290893554688, 0.10617828369140625, 0.11084365844726562, 0.115509033203125, 0.12017440795898438, 0.12483978271484375, 0.12950515747070312, 0.1341705322265625, 0.13883590698242188, 0.14350128173828125, 0.14816665649414062, 0.15283203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 2.0, 4.0, 2.0, 8.0, 1.0, 8.0, 8.0, 11.0, 8.0, 9.0, 11.0, 26.0, 29.0, 29.0, 49.0, 74.0, 82.0, 76.0, 104.0, 103.0, 83.0, 72.0, 37.0, 45.0, 33.0, 17.0, 19.0, 7.0, 12.0, 5.0, 3.0, 10.0, 3.0, 1.0, 6.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.218650817871094e-05, -3.106147050857544e-05, -2.993643283843994e-05, -2.8811395168304443e-05, -2.7686357498168945e-05, -2.6561319828033447e-05, -2.543628215789795e-05, -2.431124448776245e-05, -2.3186206817626953e-05, -2.2061169147491455e-05, -2.0936131477355957e-05, -1.981109380722046e-05, -1.868605613708496e-05, -1.7561018466949463e-05, -1.6435980796813965e-05, -1.5310943126678467e-05, -1.4185905456542969e-05, -1.306086778640747e-05, -1.1935830116271973e-05, -1.0810792446136475e-05, -9.685754776000977e-06, -8.560717105865479e-06, -7.4356794357299805e-06, -6.310641765594482e-06, -5.185604095458984e-06, -4.060566425323486e-06, -2.9355287551879883e-06, -1.8104910850524902e-06, -6.854534149169922e-07, 4.3958425521850586e-07, 1.564621925354004e-06, 2.689659595489502e-06, 3.814697265625e-06, 4.939734935760498e-06, 6.064772605895996e-06, 7.189810276031494e-06, 8.314847946166992e-06, 9.43988561630249e-06, 1.0564923286437988e-05, 1.1689960956573486e-05, 1.2814998626708984e-05, 1.3940036296844482e-05, 1.506507396697998e-05, 1.619011163711548e-05, 1.7315149307250977e-05, 1.8440186977386475e-05, 1.9565224647521973e-05, 2.069026231765747e-05, 2.181529998779297e-05, 2.2940337657928467e-05, 2.4065375328063965e-05, 2.5190412998199463e-05, 2.631545066833496e-05, 2.744048833847046e-05, 2.8565526008605957e-05, 2.9690563678741455e-05, 3.081560134887695e-05, 3.194063901901245e-05, 3.306567668914795e-05, 3.419071435928345e-05, 3.5315752029418945e-05, 3.644078969955444e-05, 3.756582736968994e-05, 3.869086503982544e-05, 3.981590270996094e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 10.0, 10.0, 13.0, 16.0, 28.0, 33.0, 41.0, 71.0, 129.0, 202.0, 383.0, 724.0, 1662.0, 4762.0, 18528.0, 141300.0, 769506.0, 90248.0, 14258.0, 3814.0, 1348.0, 680.0, 327.0, 164.0, 94.0, 63.0, 53.0, 32.0, 18.0, 8.0, 16.0, 6.0, 3.0, 3.0, 2.0, 6.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07073974609375, -0.06824970245361328, -0.06575965881347656, -0.06326961517333984, -0.060779571533203125, -0.058289527893066406, -0.05579948425292969, -0.05330944061279297, -0.05081939697265625, -0.04832935333251953, -0.04583930969238281, -0.043349266052246094, -0.040859222412109375, -0.038369178771972656, -0.03587913513183594, -0.03338909149169922, -0.0308990478515625, -0.02840900421142578, -0.025918960571289062, -0.023428916931152344, -0.020938873291015625, -0.018448829650878906, -0.015958786010742188, -0.013468742370605469, -0.01097869873046875, -0.008488655090332031, -0.0059986114501953125, -0.0035085678100585938, -0.001018524169921875, 0.0014715194702148438, 0.0039615631103515625, 0.006451606750488281, 0.008941650390625, 0.011431694030761719, 0.013921737670898438, 0.016411781311035156, 0.018901824951171875, 0.021391868591308594, 0.023881912231445312, 0.02637195587158203, 0.02886199951171875, 0.03135204315185547, 0.03384208679199219, 0.036332130432128906, 0.038822174072265625, 0.041312217712402344, 0.04380226135253906, 0.04629230499267578, 0.0487823486328125, 0.05127239227294922, 0.05376243591308594, 0.056252479553222656, 0.058742523193359375, 0.061232566833496094, 0.06372261047363281, 0.06621265411376953, 0.06870269775390625, 0.07119274139404297, 0.07368278503417969, 0.0761728286743164, 0.07866287231445312, 0.08115291595458984, 0.08364295959472656, 0.08613300323486328, 0.088623046875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 5.0, 5.0, 4.0, 8.0, 18.0, 14.0, 31.0, 32.0, 50.0, 58.0, 74.0, 93.0, 102.0, 105.0, 100.0, 74.0, 47.0, 47.0, 34.0, 17.0, 22.0, 12.0, 13.0, 10.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061187744140625, -0.059216976165771484, -0.05724620819091797, -0.05527544021606445, -0.05330467224121094, -0.05133390426635742, -0.049363136291503906, -0.04739236831665039, -0.045421600341796875, -0.04345083236694336, -0.041480064392089844, -0.03950929641723633, -0.03753852844238281, -0.0355677604675293, -0.03359699249267578, -0.031626224517822266, -0.02965545654296875, -0.027684688568115234, -0.02571392059326172, -0.023743152618408203, -0.021772384643554688, -0.019801616668701172, -0.017830848693847656, -0.01586008071899414, -0.013889312744140625, -0.01191854476928711, -0.009947776794433594, -0.007977008819580078, -0.0060062408447265625, -0.004035472869873047, -0.0020647048950195312, -9.393692016601562e-05, 0.0018768310546875, 0.0038475990295410156, 0.005818367004394531, 0.007789134979248047, 0.009759902954101562, 0.011730670928955078, 0.013701438903808594, 0.01567220687866211, 0.017642974853515625, 0.01961374282836914, 0.021584510803222656, 0.023555278778076172, 0.025526046752929688, 0.027496814727783203, 0.02946758270263672, 0.031438350677490234, 0.03340911865234375, 0.035379886627197266, 0.03735065460205078, 0.0393214225769043, 0.04129219055175781, 0.04326295852661133, 0.045233726501464844, 0.04720449447631836, 0.049175262451171875, 0.05114603042602539, 0.053116798400878906, 0.05508756637573242, 0.05705833435058594, 0.05902910232543945, 0.06099987030029297, 0.06297063827514648, 0.06494140625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 1.0, 7.0, 4.0, 10.0, 11.0, 23.0, 142.0, 526.0, 237.0, 34.0, 5.0, 3.0, 0.0, 2.0, 2.0], "bins": [-5.658314228057861, -5.558578014373779, -5.458841800689697, -5.359105587005615, -5.259368896484375, -5.159632682800293, -5.059896469116211, -4.960160255432129, -4.860424041748047, -4.760687828063965, -4.660951614379883, -4.561215400695801, -4.461479187011719, -4.3617424964904785, -4.2620062828063965, -4.1622700691223145, -4.062533855438232, -3.9627976417541504, -3.8630614280700684, -3.7633249759674072, -3.663588762283325, -3.563852548599243, -3.464116096496582, -3.3643798828125, -3.264643669128418, -3.164907455444336, -3.065171241760254, -2.9654347896575928, -2.8656985759735107, -2.7659623622894287, -2.6662259101867676, -2.5664896965026855, -2.4667534828186035, -2.3670172691345215, -2.2672810554504395, -2.1675446033477783, -2.0678083896636963, -1.9680721759796143, -1.8683358430862427, -1.768599510192871, -1.668863296508789, -1.569127082824707, -1.4693907499313354, -1.3696544170379639, -1.2699182033538818, -1.1701819896697998, -1.0704456567764282, -0.9707093834877014, -0.8709730505943298, -0.771236777305603, -0.6715005040168762, -0.5717642307281494, -0.4720279574394226, -0.3722916841506958, -0.272555410861969, -0.1728191375732422, -0.07308286428451538, 0.026653409004211426, 0.12638968229293823, 0.22612595558166504, 0.32586222887039185, 0.42559850215911865, 0.5253347754478455, 0.6250710487365723, 0.7248073220252991]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 7.0, 2.0, 3.0, 2.0, 6.0, 7.0, 11.0, 17.0, 15.0, 14.0, 22.0, 21.0, 19.0, 31.0, 27.0, 35.0, 44.0, 31.0, 40.0, 51.0, 62.0, 64.0, 47.0, 51.0, 50.0, 43.0, 34.0, 35.0, 30.0, 18.0, 29.0, 19.0, 26.0, 17.0, 10.0, 12.0, 12.0, 11.0, 6.0, 4.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5549246072769165, -0.5320776700973511, -0.5092307925224304, -0.486383855342865, -0.46353697776794434, -0.4406900405883789, -0.41784313321113586, -0.3949962258338928, -0.3721493184566498, -0.34930241107940674, -0.3264555037021637, -0.30360859632492065, -0.2807616591453552, -0.25791478157043457, -0.23506784439086914, -0.2122209370136261, -0.18937402963638306, -0.16652712225914001, -0.14368021488189697, -0.12083329260349274, -0.0979863852262497, -0.07513947784900665, -0.05229255557060242, -0.029445648193359375, -0.006598740816116333, 0.016248170286417007, 0.03909508138895035, 0.06194199621677399, 0.08478890359401703, 0.10763581097126007, 0.1304827332496643, 0.15332964062690735, 0.1761765480041504, 0.19902345538139343, 0.22187036275863647, 0.2447172850370407, 0.26756417751312256, 0.290411114692688, 0.31325802206993103, 0.3361049294471741, 0.3589518368244171, 0.38179874420166016, 0.4046456515789032, 0.42749255895614624, 0.45033949613571167, 0.4731863737106323, 0.49603331089019775, 0.5188802480697632, 0.5417271256446838, 0.5645740628242493, 0.5874209403991699, 0.6102678775787354, 0.633114755153656, 0.6559616923332214, 0.6788085699081421, 0.7016555070877075, 0.724502444267273, 0.7473493814468384, 0.770196259021759, 0.7930431962013245, 0.8158900737762451, 0.8387370109558105, 0.861583948135376, 0.8844308257102966, 0.9072777032852173]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 6.0, 14.0, 14.0, 20.0, 27.0, 39.0, 63.0, 120.0, 206.0, 318.0, 648.0, 1414.0, 2966.0, 7457.0, 23472.0, 98560.0, 668556.0, 2374472.0, 850846.0, 122048.0, 27667.0, 8745.0, 3409.0, 1561.0, 736.0, 349.0, 206.0, 134.0, 78.0, 47.0, 25.0, 18.0, 9.0, 7.0, 8.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0667724609375, -0.06465721130371094, -0.06254196166992188, -0.06042671203613281, -0.05831146240234375, -0.05619621276855469, -0.054080963134765625, -0.05196571350097656, -0.0498504638671875, -0.04773521423339844, -0.045619964599609375, -0.04350471496582031, -0.04138946533203125, -0.03927421569824219, -0.037158966064453125, -0.03504371643066406, -0.032928466796875, -0.030813217163085938, -0.028697967529296875, -0.026582717895507812, -0.02446746826171875, -0.022352218627929688, -0.020236968994140625, -0.018121719360351562, -0.0160064697265625, -0.013891220092773438, -0.011775970458984375, -0.009660720825195312, -0.00754547119140625, -0.0054302215576171875, -0.003314971923828125, -0.0011997222900390625, 0.00091552734375, 0.0030307769775390625, 0.005146026611328125, 0.0072612762451171875, 0.00937652587890625, 0.011491775512695312, 0.013607025146484375, 0.015722274780273438, 0.0178375244140625, 0.019952774047851562, 0.022068023681640625, 0.024183273315429688, 0.02629852294921875, 0.028413772583007812, 0.030529022216796875, 0.03264427185058594, 0.034759521484375, 0.03687477111816406, 0.038990020751953125, 0.04110527038574219, 0.04322052001953125, 0.04533576965332031, 0.047451019287109375, 0.04956626892089844, 0.0516815185546875, 0.05379676818847656, 0.055912017822265625, 0.05802726745605469, 0.06014251708984375, 0.06225776672363281, 0.06437301635742188, 0.06648826599121094, 0.068603515625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 12.0, 6.0, 15.0, 17.0, 18.0, 23.0, 19.0, 27.0, 33.0, 36.0, 33.0, 36.0, 50.0, 39.0, 55.0, 52.0, 36.0, 48.0, 37.0, 44.0, 38.0, 46.0, 27.0, 46.0, 36.0, 34.0, 24.0, 22.0, 18.0, 13.0, 9.0, 10.0, 9.0, 9.0, 6.0, 2.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.04693603515625, -0.04553985595703125, -0.0441436767578125, -0.04274749755859375, -0.041351318359375, -0.03995513916015625, -0.0385589599609375, -0.03716278076171875, -0.0357666015625, -0.03437042236328125, -0.0329742431640625, -0.03157806396484375, -0.030181884765625, -0.02878570556640625, -0.0273895263671875, -0.02599334716796875, -0.02459716796875, -0.02320098876953125, -0.0218048095703125, -0.02040863037109375, -0.019012451171875, -0.01761627197265625, -0.0162200927734375, -0.01482391357421875, -0.013427734375, -0.01203155517578125, -0.0106353759765625, -0.00923919677734375, -0.007843017578125, -0.00644683837890625, -0.0050506591796875, -0.00365447998046875, -0.00225830078125, -0.00086212158203125, 0.0005340576171875, 0.00193023681640625, 0.003326416015625, 0.00472259521484375, 0.0061187744140625, 0.00751495361328125, 0.0089111328125, 0.01030731201171875, 0.0117034912109375, 0.01309967041015625, 0.014495849609375, 0.01589202880859375, 0.0172882080078125, 0.01868438720703125, 0.02008056640625, 0.02147674560546875, 0.0228729248046875, 0.02426910400390625, 0.025665283203125, 0.02706146240234375, 0.0284576416015625, 0.02985382080078125, 0.03125, 0.03264617919921875, 0.0340423583984375, 0.03543853759765625, 0.036834716796875, 0.03823089599609375, 0.0396270751953125, 0.04102325439453125, 0.04241943359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 15.0, 14.0, 35.0, 55.0, 67.0, 100.0, 172.0, 334.0, 762.0, 2627.0, 14446.0, 130598.0, 3168702.0, 815495.0, 49940.0, 7772.0, 1933.0, 595.0, 256.0, 152.0, 79.0, 42.0, 22.0, 28.0, 10.0, 9.0, 8.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13427734375, -0.129913330078125, -0.12554931640625, -0.121185302734375, -0.1168212890625, -0.112457275390625, -0.10809326171875, -0.103729248046875, -0.099365234375, -0.095001220703125, -0.09063720703125, -0.086273193359375, -0.0819091796875, -0.077545166015625, -0.07318115234375, -0.068817138671875, -0.064453125, -0.060089111328125, -0.05572509765625, -0.051361083984375, -0.0469970703125, -0.042633056640625, -0.03826904296875, -0.033905029296875, -0.029541015625, -0.025177001953125, -0.02081298828125, -0.016448974609375, -0.0120849609375, -0.007720947265625, -0.00335693359375, 0.001007080078125, 0.00537109375, 0.009735107421875, 0.01409912109375, 0.018463134765625, 0.0228271484375, 0.027191162109375, 0.03155517578125, 0.035919189453125, 0.040283203125, 0.044647216796875, 0.04901123046875, 0.053375244140625, 0.0577392578125, 0.062103271484375, 0.06646728515625, 0.070831298828125, 0.0751953125, 0.079559326171875, 0.08392333984375, 0.088287353515625, 0.0926513671875, 0.097015380859375, 0.10137939453125, 0.105743408203125, 0.110107421875, 0.114471435546875, 0.11883544921875, 0.123199462890625, 0.1275634765625, 0.131927490234375, 0.13629150390625, 0.140655517578125, 0.14501953125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 4.0, 11.0, 19.0, 22.0, 26.0, 43.0, 69.0, 84.0, 154.0, 300.0, 515.0, 640.0, 645.0, 547.0, 313.0, 201.0, 135.0, 90.0, 63.0, 55.0, 32.0, 23.0, 15.0, 13.0, 17.0, 8.0, 2.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11920166015625, -0.11525440216064453, -0.11130714416503906, -0.1073598861694336, -0.10341262817382812, -0.09946537017822266, -0.09551811218261719, -0.09157085418701172, -0.08762359619140625, -0.08367633819580078, -0.07972908020019531, -0.07578182220458984, -0.07183456420898438, -0.0678873062133789, -0.06394004821777344, -0.05999279022216797, -0.0560455322265625, -0.05209827423095703, -0.04815101623535156, -0.044203758239746094, -0.040256500244140625, -0.036309242248535156, -0.03236198425292969, -0.02841472625732422, -0.02446746826171875, -0.02052021026611328, -0.016572952270507812, -0.012625694274902344, -0.008678436279296875, -0.004731178283691406, -0.0007839202880859375, 0.0031633377075195312, 0.007110595703125, 0.011057853698730469, 0.015005111694335938, 0.018952369689941406, 0.022899627685546875, 0.026846885681152344, 0.030794143676757812, 0.03474140167236328, 0.03868865966796875, 0.04263591766357422, 0.04658317565917969, 0.050530433654785156, 0.054477691650390625, 0.058424949645996094, 0.06237220764160156, 0.06631946563720703, 0.0702667236328125, 0.07421398162841797, 0.07816123962402344, 0.0821084976196289, 0.08605575561523438, 0.09000301361083984, 0.09395027160644531, 0.09789752960205078, 0.10184478759765625, 0.10579204559326172, 0.10973930358886719, 0.11368656158447266, 0.11763381958007812, 0.1215810775756836, 0.12552833557128906, 0.12947559356689453, 0.1334228515625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 9.0, 18.0, 67.0, 219.0, 392.0, 192.0, 56.0, 22.0, 12.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.244476556777954, -2.1682205200195312, -2.0919644832611084, -2.0157084465026855, -1.9394525289535522, -1.8631964921951294, -1.786940574645996, -1.7106845378875732, -1.6344285011291504, -1.5581724643707275, -1.4819164276123047, -1.4056605100631714, -1.3294044733047485, -1.2531484365463257, -1.1768925189971924, -1.1006364822387695, -1.0243804454803467, -0.9481244087219238, -0.8718684315681458, -0.7956124544143677, -0.7193564176559448, -0.643100380897522, -0.5668444037437439, -0.4905884265899658, -0.41433238983154297, -0.3380763828754425, -0.26182037591934204, -0.18556436896324158, -0.10930836200714111, -0.03305235505104065, 0.043203651905059814, 0.11945962905883789, 0.19571590423583984, 0.2719719111919403, 0.34822791814804077, 0.42448392510414124, 0.5007399320602417, 0.5769959688186646, 0.6532519459724426, 0.7295079231262207, 0.8057639598846436, 0.8820199966430664, 0.9582759737968445, 1.0345319509506226, 1.1107879877090454, 1.1870440244674683, 1.2632999420166016, 1.3395559787750244, 1.4158120155334473, 1.4920680522918701, 1.568324089050293, 1.6445800065994263, 1.7208360433578491, 1.797092080116272, 1.8733479976654053, 1.9496040344238281, 2.025860071182251, 2.102116107940674, 2.1783721446990967, 2.2546281814575195, 2.3308839797973633, 2.407140016555786, 2.483396053314209, 2.559652090072632, 2.6359081268310547]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 4.0, 13.0, 16.0, 16.0, 18.0, 24.0, 29.0, 28.0, 36.0, 26.0, 30.0, 45.0, 44.0, 59.0, 44.0, 37.0, 42.0, 49.0, 51.0, 51.0, 49.0, 35.0, 40.0, 34.0, 21.0, 21.0, 23.0, 16.0, 23.0, 12.0, 10.0, 6.0, 11.0, 6.0, 6.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.6030527949333191, -0.5853688716888428, -0.5676849484443665, -0.5500010251998901, -0.5323171019554138, -0.5146331787109375, -0.4969492554664612, -0.47926533222198486, -0.46158140897750854, -0.4438974857330322, -0.4262135624885559, -0.4085296392440796, -0.39084571599960327, -0.37316179275512695, -0.35547786951065063, -0.3377939462661743, -0.320110023021698, -0.3024260997772217, -0.28474217653274536, -0.26705825328826904, -0.24937433004379272, -0.2316904067993164, -0.2140064835548401, -0.19632256031036377, -0.17863863706588745, -0.16095471382141113, -0.14327079057693481, -0.1255868673324585, -0.10790294408798218, -0.09021902084350586, -0.07253509759902954, -0.05485117435455322, -0.03716719150543213, -0.01948326826095581, -0.0017993450164794922, 0.015884578227996826, 0.033568501472473145, 0.05125242471694946, 0.06893634796142578, 0.0866202712059021, 0.10430419445037842, 0.12198811769485474, 0.13967204093933105, 0.15735596418380737, 0.1750398874282837, 0.19272381067276, 0.21040773391723633, 0.22809165716171265, 0.24577558040618896, 0.2634595036506653, 0.2811434268951416, 0.2988273501396179, 0.31651127338409424, 0.33419519662857056, 0.3518791198730469, 0.3695630431175232, 0.3872469663619995, 0.40493088960647583, 0.42261481285095215, 0.44029873609542847, 0.4579826593399048, 0.4756665825843811, 0.4933505058288574, 0.5110344290733337, 0.5287183523178101]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 16.0, 21.0, 33.0, 56.0, 102.0, 166.0, 436.0, 1013.0, 2698.0, 8533.0, 30216.0, 114975.0, 405542.0, 354213.0, 94329.0, 24947.0, 7345.0, 2319.0, 820.0, 366.0, 154.0, 89.0, 60.0, 34.0, 25.0, 12.0, 7.0, 6.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0828857421875, -0.07991790771484375, -0.0769500732421875, -0.07398223876953125, -0.071014404296875, -0.06804656982421875, -0.0650787353515625, -0.06211090087890625, -0.05914306640625, -0.05617523193359375, -0.0532073974609375, -0.05023956298828125, -0.047271728515625, -0.04430389404296875, -0.0413360595703125, -0.03836822509765625, -0.035400390625, -0.03243255615234375, -0.0294647216796875, -0.02649688720703125, -0.023529052734375, -0.02056121826171875, -0.0175933837890625, -0.01462554931640625, -0.01165771484375, -0.00868988037109375, -0.0057220458984375, -0.00275421142578125, 0.000213623046875, 0.00318145751953125, 0.0061492919921875, 0.00911712646484375, 0.0120849609375, 0.01505279541015625, 0.0180206298828125, 0.02098846435546875, 0.023956298828125, 0.02692413330078125, 0.0298919677734375, 0.03285980224609375, 0.03582763671875, 0.03879547119140625, 0.0417633056640625, 0.04473114013671875, 0.047698974609375, 0.05066680908203125, 0.0536346435546875, 0.05660247802734375, 0.0595703125, 0.06253814697265625, 0.0655059814453125, 0.06847381591796875, 0.071441650390625, 0.07440948486328125, 0.0773773193359375, 0.08034515380859375, 0.08331298828125, 0.08628082275390625, 0.0892486572265625, 0.09221649169921875, 0.095184326171875, 0.09815216064453125, 0.1011199951171875, 0.10408782958984375, 0.1070556640625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 6.0, 10.0, 5.0, 7.0, 10.0, 14.0, 12.0, 27.0, 24.0, 26.0, 23.0, 30.0, 50.0, 43.0, 42.0, 35.0, 37.0, 51.0, 32.0, 43.0, 48.0, 51.0, 31.0, 34.0, 37.0, 49.0, 31.0, 37.0, 20.0, 21.0, 20.0, 22.0, 19.0, 13.0, 15.0, 9.0, 5.0, 4.0, 7.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0418701171875, -0.040488243103027344, -0.03910636901855469, -0.03772449493408203, -0.036342620849609375, -0.03496074676513672, -0.03357887268066406, -0.032196998596191406, -0.03081512451171875, -0.029433250427246094, -0.028051376342773438, -0.02666950225830078, -0.025287628173828125, -0.02390575408935547, -0.022523880004882812, -0.021142005920410156, -0.0197601318359375, -0.018378257751464844, -0.016996383666992188, -0.015614509582519531, -0.014232635498046875, -0.012850761413574219, -0.011468887329101562, -0.010087013244628906, -0.00870513916015625, -0.007323265075683594, -0.0059413909912109375, -0.004559516906738281, -0.003177642822265625, -0.0017957687377929688, -0.0004138946533203125, 0.0009679794311523438, 0.002349853515625, 0.0037317276000976562, 0.0051136016845703125, 0.006495475769042969, 0.007877349853515625, 0.009259223937988281, 0.010641098022460938, 0.012022972106933594, 0.01340484619140625, 0.014786720275878906, 0.016168594360351562, 0.01755046844482422, 0.018932342529296875, 0.02031421661376953, 0.021696090698242188, 0.023077964782714844, 0.0244598388671875, 0.025841712951660156, 0.027223587036132812, 0.02860546112060547, 0.029987335205078125, 0.03136920928955078, 0.03275108337402344, 0.034132957458496094, 0.03551483154296875, 0.036896705627441406, 0.03827857971191406, 0.03966045379638672, 0.041042327880859375, 0.04242420196533203, 0.04380607604980469, 0.045187950134277344, 0.04656982421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 10.0, 9.0, 13.0, 14.0, 19.0, 26.0, 44.0, 42.0, 59.0, 99.0, 135.0, 214.0, 371.0, 526.0, 865.0, 1661.0, 3525.0, 13330.0, 136016.0, 808719.0, 67775.0, 8687.0, 2841.0, 1322.0, 804.0, 476.0, 291.0, 201.0, 146.0, 80.0, 69.0, 41.0, 36.0, 25.0, 14.0, 17.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1904296875, -0.1841602325439453, -0.17789077758789062, -0.17162132263183594, -0.16535186767578125, -0.15908241271972656, -0.15281295776367188, -0.1465435028076172, -0.1402740478515625, -0.1340045928955078, -0.12773513793945312, -0.12146568298339844, -0.11519622802734375, -0.10892677307128906, -0.10265731811523438, -0.09638786315917969, -0.090118408203125, -0.08384895324707031, -0.07757949829101562, -0.07131004333496094, -0.06504058837890625, -0.05877113342285156, -0.052501678466796875, -0.04623222351074219, -0.0399627685546875, -0.03369331359863281, -0.027423858642578125, -0.021154403686523438, -0.01488494873046875, -0.008615493774414062, -0.002346038818359375, 0.0039234161376953125, 0.01019287109375, 0.016462326049804688, 0.022731781005859375, 0.029001235961914062, 0.03527069091796875, 0.04154014587402344, 0.047809600830078125, 0.05407905578613281, 0.0603485107421875, 0.06661796569824219, 0.07288742065429688, 0.07915687561035156, 0.08542633056640625, 0.09169578552246094, 0.09796524047851562, 0.10423469543457031, 0.110504150390625, 0.11677360534667969, 0.12304306030273438, 0.12931251525878906, 0.13558197021484375, 0.14185142517089844, 0.14812088012695312, 0.1543903350830078, 0.1606597900390625, 0.1669292449951172, 0.17319869995117188, 0.17946815490722656, 0.18573760986328125, 0.19200706481933594, 0.19827651977539062, 0.2045459747314453, 0.2108154296875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 4.0, 7.0, 10.0, 7.0, 11.0, 13.0, 10.0, 23.0, 26.0, 22.0, 42.0, 32.0, 43.0, 46.0, 42.0, 42.0, 53.0, 62.0, 62.0, 62.0, 51.0, 41.0, 39.0, 40.0, 30.0, 34.0, 37.0, 21.0, 23.0, 16.0, 13.0, 10.0, 10.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.255126953125, -0.24761390686035156, -0.24010086059570312, -0.2325878143310547, -0.22507476806640625, -0.2175617218017578, -0.21004867553710938, -0.20253562927246094, -0.1950225830078125, -0.18750953674316406, -0.17999649047851562, -0.1724834442138672, -0.16497039794921875, -0.1574573516845703, -0.14994430541992188, -0.14243125915527344, -0.134918212890625, -0.12740516662597656, -0.11989212036132812, -0.11237907409667969, -0.10486602783203125, -0.09735298156738281, -0.08983993530273438, -0.08232688903808594, -0.0748138427734375, -0.06730079650878906, -0.059787750244140625, -0.05227470397949219, -0.04476165771484375, -0.03724861145019531, -0.029735565185546875, -0.022222518920898438, -0.01470947265625, -0.0071964263916015625, 0.000316619873046875, 0.007829666137695312, 0.01534271240234375, 0.022855758666992188, 0.030368804931640625, 0.03788185119628906, 0.0453948974609375, 0.05290794372558594, 0.060420989990234375, 0.06793403625488281, 0.07544708251953125, 0.08296012878417969, 0.09047317504882812, 0.09798622131347656, 0.105499267578125, 0.11301231384277344, 0.12052536010742188, 0.1280384063720703, 0.13555145263671875, 0.1430644989013672, 0.15057754516601562, 0.15809059143066406, 0.1656036376953125, 0.17311668395996094, 0.18062973022460938, 0.1881427764892578, 0.19565582275390625, 0.2031688690185547, 0.21068191528320312, 0.21819496154785156, 0.2257080078125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 7.0, 8.0, 7.0, 16.0, 21.0, 26.0, 42.0, 60.0, 98.0, 145.0, 336.0, 634.0, 1345.0, 3411.0, 12180.0, 75445.0, 796866.0, 132442.0, 17775.0, 4467.0, 1581.0, 732.0, 366.0, 210.0, 124.0, 66.0, 46.0, 24.0, 25.0, 24.0, 5.0, 5.0, 4.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08697509765625, -0.08382606506347656, -0.08067703247070312, -0.07752799987792969, -0.07437896728515625, -0.07122993469238281, -0.06808090209960938, -0.06493186950683594, -0.0617828369140625, -0.05863380432128906, -0.055484771728515625, -0.05233573913574219, -0.04918670654296875, -0.04603767395019531, -0.042888641357421875, -0.03973960876464844, -0.036590576171875, -0.03344154357910156, -0.030292510986328125, -0.027143478393554688, -0.02399444580078125, -0.020845413208007812, -0.017696380615234375, -0.014547348022460938, -0.0113983154296875, -0.008249282836914062, -0.005100250244140625, -0.0019512176513671875, 0.00119781494140625, 0.0043468475341796875, 0.007495880126953125, 0.010644912719726562, 0.0137939453125, 0.016942977905273438, 0.020092010498046875, 0.023241043090820312, 0.02639007568359375, 0.029539108276367188, 0.032688140869140625, 0.03583717346191406, 0.0389862060546875, 0.04213523864746094, 0.045284271240234375, 0.04843330383300781, 0.05158233642578125, 0.05473136901855469, 0.057880401611328125, 0.06102943420410156, 0.064178466796875, 0.06732749938964844, 0.07047653198242188, 0.07362556457519531, 0.07677459716796875, 0.07992362976074219, 0.08307266235351562, 0.08622169494628906, 0.0893707275390625, 0.09251976013183594, 0.09566879272460938, 0.09881782531738281, 0.10196685791015625, 0.10511589050292969, 0.10826492309570312, 0.11141395568847656, 0.11456298828125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0, 5.0, 7.0, 11.0, 7.0, 7.0, 12.0, 13.0, 18.0, 21.0, 23.0, 33.0, 32.0, 62.0, 70.0, 99.0, 84.0, 92.0, 73.0, 63.0, 48.0, 32.0, 28.0, 30.0, 16.0, 16.0, 15.0, 15.0, 9.0, 11.0, 4.0, 9.0, 8.0, 3.0, 5.0, 0.0, 3.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.030632019042969e-05, -4.888884723186493e-05, -4.747137427330017e-05, -4.605390131473541e-05, -4.4636428356170654e-05, -4.3218955397605896e-05, -4.180148243904114e-05, -4.038400948047638e-05, -3.896653652191162e-05, -3.754906356334686e-05, -3.6131590604782104e-05, -3.4714117646217346e-05, -3.329664468765259e-05, -3.187917172908783e-05, -3.046169877052307e-05, -2.9044225811958313e-05, -2.7626752853393555e-05, -2.6209279894828796e-05, -2.4791806936264038e-05, -2.337433397769928e-05, -2.195686101913452e-05, -2.0539388060569763e-05, -1.9121915102005005e-05, -1.7704442143440247e-05, -1.6286969184875488e-05, -1.486949622631073e-05, -1.3452023267745972e-05, -1.2034550309181213e-05, -1.0617077350616455e-05, -9.199604392051697e-06, -7.782131433486938e-06, -6.36465847492218e-06, -4.947185516357422e-06, -3.5297125577926636e-06, -2.1122395992279053e-06, -6.94766640663147e-07, 7.227063179016113e-07, 2.1401792764663696e-06, 3.557652235031128e-06, 4.975125193595886e-06, 6.3925981521606445e-06, 7.810071110725403e-06, 9.227544069290161e-06, 1.064501702785492e-05, 1.2062489986419678e-05, 1.3479962944984436e-05, 1.4897435903549194e-05, 1.6314908862113953e-05, 1.773238182067871e-05, 1.914985477924347e-05, 2.0567327737808228e-05, 2.1984800696372986e-05, 2.3402273654937744e-05, 2.4819746613502502e-05, 2.623721957206726e-05, 2.765469253063202e-05, 2.9072165489196777e-05, 3.0489638447761536e-05, 3.1907111406326294e-05, 3.332458436489105e-05, 3.474205732345581e-05, 3.615953028202057e-05, 3.757700324058533e-05, 3.8994476199150085e-05, 4.0411949157714844e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 7.0, 2.0, 12.0, 6.0, 13.0, 11.0, 27.0, 34.0, 52.0, 70.0, 109.0, 186.0, 295.0, 568.0, 1277.0, 3257.0, 12319.0, 91100.0, 839366.0, 82592.0, 11603.0, 3036.0, 1185.0, 562.0, 318.0, 183.0, 118.0, 78.0, 48.0, 39.0, 21.0, 18.0, 10.0, 11.0, 4.0, 7.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1143798828125, -0.11074638366699219, -0.10711288452148438, -0.10347938537597656, -0.09984588623046875, -0.09621238708496094, -0.09257888793945312, -0.08894538879394531, -0.0853118896484375, -0.08167839050292969, -0.07804489135742188, -0.07441139221191406, -0.07077789306640625, -0.06714439392089844, -0.06351089477539062, -0.05987739562988281, -0.056243896484375, -0.05261039733886719, -0.048976898193359375, -0.04534339904785156, -0.04170989990234375, -0.03807640075683594, -0.034442901611328125, -0.030809402465820312, -0.0271759033203125, -0.023542404174804688, -0.019908905029296875, -0.016275405883789062, -0.01264190673828125, -0.009008407592773438, -0.005374908447265625, -0.0017414093017578125, 0.00189208984375, 0.0055255889892578125, 0.009159088134765625, 0.012792587280273438, 0.01642608642578125, 0.020059585571289062, 0.023693084716796875, 0.027326583862304688, 0.0309600830078125, 0.03459358215332031, 0.038227081298828125, 0.04186058044433594, 0.04549407958984375, 0.04912757873535156, 0.052761077880859375, 0.05639457702636719, 0.060028076171875, 0.06366157531738281, 0.06729507446289062, 0.07092857360839844, 0.07456207275390625, 0.07819557189941406, 0.08182907104492188, 0.08546257019042969, 0.0890960693359375, 0.09272956848144531, 0.09636306762695312, 0.09999656677246094, 0.10363006591796875, 0.10726356506347656, 0.11089706420898438, 0.11453056335449219, 0.1181640625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 8.0, 7.0, 9.0, 12.0, 11.0, 19.0, 24.0, 28.0, 36.0, 43.0, 60.0, 69.0, 124.0, 129.0, 105.0, 63.0, 58.0, 61.0, 30.0, 25.0, 20.0, 16.0, 11.0, 7.0, 3.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0958251953125, -0.092864990234375, -0.08990478515625, -0.086944580078125, -0.083984375, -0.081024169921875, -0.07806396484375, -0.075103759765625, -0.0721435546875, -0.069183349609375, -0.06622314453125, -0.063262939453125, -0.060302734375, -0.057342529296875, -0.05438232421875, -0.051422119140625, -0.0484619140625, -0.045501708984375, -0.04254150390625, -0.039581298828125, -0.03662109375, -0.033660888671875, -0.03070068359375, -0.027740478515625, -0.0247802734375, -0.021820068359375, -0.01885986328125, -0.015899658203125, -0.012939453125, -0.009979248046875, -0.00701904296875, -0.004058837890625, -0.0010986328125, 0.001861572265625, 0.00482177734375, 0.007781982421875, 0.0107421875, 0.013702392578125, 0.01666259765625, 0.019622802734375, 0.0225830078125, 0.025543212890625, 0.02850341796875, 0.031463623046875, 0.034423828125, 0.037384033203125, 0.04034423828125, 0.043304443359375, 0.0462646484375, 0.049224853515625, 0.05218505859375, 0.055145263671875, 0.05810546875, 0.061065673828125, 0.06402587890625, 0.066986083984375, 0.0699462890625, 0.072906494140625, 0.07586669921875, 0.078826904296875, 0.081787109375, 0.084747314453125, 0.08770751953125, 0.090667724609375, 0.0936279296875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 3.0, 9.0, 25.0, 71.0, 325.0, 379.0, 129.0, 34.0, 7.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.515934944152832, -2.4263272285461426, -2.336719512939453, -2.2471117973327637, -2.157503843307495, -2.0678961277008057, -1.9782884120941162, -1.8886806964874268, -1.7990728616714478, -1.7094651460647583, -1.6198573112487793, -1.5302495956420898, -1.4406418800354004, -1.3510340452194214, -1.261426329612732, -1.171818494796753, -1.0822107791900635, -0.9926030039787292, -0.902995228767395, -0.8133875131607056, -0.7237797379493713, -0.6341719627380371, -0.5445642471313477, -0.4549564719200134, -0.3653486967086792, -0.27574092149734497, -0.18613317608833313, -0.09652543067932129, -0.0069176554679870605, 0.08269011974334717, 0.17229783535003662, 0.26190561056137085, 0.3515133857727051, 0.4411211609840393, 0.5307289361953735, 0.620336651802063, 0.7099444270133972, 0.7995522022247314, 0.8891599178314209, 0.9787676930427551, 1.0683754682540894, 1.1579831838607788, 1.2475910186767578, 1.3371987342834473, 1.4268064498901367, 1.5164142847061157, 1.6060220003128052, 1.6956298351287842, 1.7852375507354736, 1.874845266342163, 1.964453101158142, 2.054060935974121, 2.1436686515808105, 2.2332763671875, 2.3228840827941895, 2.412491798400879, 2.5020995140075684, 2.591707229614258, 2.6813149452209473, 2.7709226608276367, 2.8605306148529053, 2.9501383304595947, 3.039746046066284, 3.1293537616729736, 3.218961715698242]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 9.0, 9.0, 8.0, 8.0, 17.0, 20.0, 25.0, 25.0, 23.0, 29.0, 35.0, 24.0, 33.0, 37.0, 39.0, 55.0, 71.0, 62.0, 64.0, 63.0, 31.0, 46.0, 37.0, 28.0, 25.0, 30.0, 21.0, 24.0, 24.0, 9.0, 13.0, 12.0, 12.0, 10.0, 7.0, 7.0, 2.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7732662558555603, -0.7464436888694763, -0.7196211218833923, -0.6927986145019531, -0.6659760475158691, -0.6391534805297852, -0.6123309135437012, -0.5855083465576172, -0.5586857795715332, -0.5318632125854492, -0.5050406455993652, -0.47821810841560364, -0.45139557123184204, -0.42457300424575806, -0.3977504372596741, -0.3709278702735901, -0.3441053628921509, -0.3172827959060669, -0.2904602587223053, -0.2636376917362213, -0.23681513965129852, -0.20999258756637573, -0.18317002058029175, -0.15634746849536896, -0.12952491641044617, -0.10270236432552338, -0.07587980479001999, -0.0490572452545166, -0.02223469316959381, 0.0045878589153289795, 0.031410425901412964, 0.058232977986335754, 0.08505558967590332, 0.11187814176082611, 0.1387006938457489, 0.16552326083183289, 0.19234581291675568, 0.21916836500167847, 0.24599093198776245, 0.27281349897384644, 0.29963603615760803, 0.326458603143692, 0.3532811403274536, 0.3801037073135376, 0.4069262742996216, 0.4337488114833832, 0.46057137846946716, 0.48739391565322876, 0.5142164826393127, 0.5410390496253967, 0.5678616166114807, 0.5946841239929199, 0.6215066909790039, 0.6483292579650879, 0.6751518249511719, 0.7019743919372559, 0.7287969589233398, 0.7556195259094238, 0.7824420928955078, 0.8092646598815918, 0.836087167263031, 0.862909734249115, 0.889732301235199, 0.916554868221283, 0.9433773756027222]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 16.0, 19.0, 35.0, 65.0, 125.0, 276.0, 681.0, 1916.0, 7597.0, 50952.0, 987539.0, 2924841.0, 198368.0, 16905.0, 3121.0, 983.0, 399.0, 183.0, 95.0, 58.0, 47.0, 25.0, 11.0, 16.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0872802734375, -0.08368110656738281, -0.08008193969726562, -0.07648277282714844, -0.07288360595703125, -0.06928443908691406, -0.06568527221679688, -0.06208610534667969, -0.0584869384765625, -0.05488777160644531, -0.051288604736328125, -0.04768943786621094, -0.04409027099609375, -0.04049110412597656, -0.036891937255859375, -0.03329277038574219, -0.029693603515625, -0.026094436645507812, -0.022495269775390625, -0.018896102905273438, -0.01529693603515625, -0.011697769165039062, -0.008098602294921875, -0.0044994354248046875, -0.0009002685546875, 0.0026988983154296875, 0.006298065185546875, 0.009897232055664062, 0.01349639892578125, 0.017095565795898438, 0.020694732666015625, 0.024293899536132812, 0.02789306640625, 0.03149223327636719, 0.035091400146484375, 0.03869056701660156, 0.04228973388671875, 0.04588890075683594, 0.049488067626953125, 0.05308723449707031, 0.0566864013671875, 0.06028556823730469, 0.06388473510742188, 0.06748390197753906, 0.07108306884765625, 0.07468223571777344, 0.07828140258789062, 0.08188056945800781, 0.085479736328125, 0.08907890319824219, 0.09267807006835938, 0.09627723693847656, 0.09987640380859375, 0.10347557067871094, 0.10707473754882812, 0.11067390441894531, 0.1142730712890625, 0.11787223815917969, 0.12147140502929688, 0.12507057189941406, 0.12866973876953125, 0.13226890563964844, 0.13586807250976562, 0.1394672393798828, 0.14306640625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 14.0, 18.0, 16.0, 19.0, 29.0, 42.0, 40.0, 57.0, 65.0, 79.0, 74.0, 67.0, 74.0, 67.0, 71.0, 46.0, 53.0, 43.0, 35.0, 26.0, 22.0, 19.0, 10.0, 9.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044891357421875, -0.04262971878051758, -0.040368080139160156, -0.038106441497802734, -0.03584480285644531, -0.03358316421508789, -0.03132152557373047, -0.029059886932373047, -0.026798248291015625, -0.024536609649658203, -0.02227497100830078, -0.02001333236694336, -0.017751693725585938, -0.015490055084228516, -0.013228416442871094, -0.010966777801513672, -0.00870513916015625, -0.006443500518798828, -0.004181861877441406, -0.0019202232360839844, 0.0003414154052734375, 0.0026030540466308594, 0.004864692687988281, 0.007126331329345703, 0.009387969970703125, 0.011649608612060547, 0.013911247253417969, 0.01617288589477539, 0.018434524536132812, 0.020696163177490234, 0.022957801818847656, 0.025219440460205078, 0.0274810791015625, 0.029742717742919922, 0.032004356384277344, 0.034265995025634766, 0.03652763366699219, 0.03878927230834961, 0.04105091094970703, 0.04331254959106445, 0.045574188232421875, 0.0478358268737793, 0.05009746551513672, 0.05235910415649414, 0.05462074279785156, 0.056882381439208984, 0.059144020080566406, 0.06140565872192383, 0.06366729736328125, 0.06592893600463867, 0.0681905746459961, 0.07045221328735352, 0.07271385192871094, 0.07497549057006836, 0.07723712921142578, 0.0794987678527832, 0.08176040649414062, 0.08402204513549805, 0.08628368377685547, 0.08854532241821289, 0.09080696105957031, 0.09306859970092773, 0.09533023834228516, 0.09759187698364258, 0.099853515625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 10.0, 8.0, 10.0, 20.0, 21.0, 43.0, 59.0, 73.0, 148.0, 231.0, 407.0, 840.0, 2924.0, 42171.0, 3618722.0, 512206.0, 12454.0, 2114.0, 836.0, 424.0, 248.0, 122.0, 73.0, 46.0, 18.0, 20.0, 9.0, 8.0, 5.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.235107421875, -0.22814369201660156, -0.22117996215820312, -0.2142162322998047, -0.20725250244140625, -0.2002887725830078, -0.19332504272460938, -0.18636131286621094, -0.1793975830078125, -0.17243385314941406, -0.16547012329101562, -0.1585063934326172, -0.15154266357421875, -0.1445789337158203, -0.13761520385742188, -0.13065147399902344, -0.123687744140625, -0.11672401428222656, -0.10976028442382812, -0.10279655456542969, -0.09583282470703125, -0.08886909484863281, -0.08190536499023438, -0.07494163513183594, -0.0679779052734375, -0.06101417541503906, -0.054050445556640625, -0.04708671569824219, -0.04012298583984375, -0.03315925598144531, -0.026195526123046875, -0.019231796264648438, -0.01226806640625, -0.0053043365478515625, 0.001659393310546875, 0.008623123168945312, 0.01558685302734375, 0.022550582885742188, 0.029514312744140625, 0.03647804260253906, 0.0434417724609375, 0.05040550231933594, 0.057369232177734375, 0.06433296203613281, 0.07129669189453125, 0.07826042175292969, 0.08522415161132812, 0.09218788146972656, 0.099151611328125, 0.10611534118652344, 0.11307907104492188, 0.12004280090332031, 0.12700653076171875, 0.1339702606201172, 0.14093399047851562, 0.14789772033691406, 0.1548614501953125, 0.16182518005371094, 0.16878890991210938, 0.1757526397705078, 0.18271636962890625, 0.1896800994873047, 0.19664382934570312, 0.20360755920410156, 0.2105712890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 17.0, 31.0, 76.0, 234.0, 709.0, 1406.0, 964.0, 373.0, 143.0, 56.0, 30.0, 19.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2276611328125, -0.21877098083496094, -0.20988082885742188, -0.2009906768798828, -0.19210052490234375, -0.1832103729248047, -0.17432022094726562, -0.16543006896972656, -0.1565399169921875, -0.14764976501464844, -0.13875961303710938, -0.1298694610595703, -0.12097930908203125, -0.11208915710449219, -0.10319900512695312, -0.09430885314941406, -0.085418701171875, -0.07652854919433594, -0.06763839721679688, -0.05874824523925781, -0.04985809326171875, -0.04096794128417969, -0.032077789306640625, -0.023187637329101562, -0.0142974853515625, -0.0054073333740234375, 0.003482818603515625, 0.012372970581054688, 0.02126312255859375, 0.030153274536132812, 0.039043426513671875, 0.04793357849121094, 0.05682373046875, 0.06571388244628906, 0.07460403442382812, 0.08349418640136719, 0.09238433837890625, 0.10127449035644531, 0.11016464233398438, 0.11905479431152344, 0.1279449462890625, 0.13683509826660156, 0.14572525024414062, 0.1546154022216797, 0.16350555419921875, 0.1723957061767578, 0.18128585815429688, 0.19017601013183594, 0.199066162109375, 0.20795631408691406, 0.21684646606445312, 0.2257366180419922, 0.23462677001953125, 0.2435169219970703, 0.2524070739746094, 0.26129722595214844, 0.2701873779296875, 0.27907752990722656, 0.2879676818847656, 0.2968578338623047, 0.30574798583984375, 0.3146381378173828, 0.3235282897949219, 0.33241844177246094, 0.34130859375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 10.0, 28.0, 97.0, 371.0, 347.0, 114.0, 21.0, 9.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7645204067230225, -1.6708967685699463, -1.5772731304168701, -1.483649492263794, -1.3900258541107178, -1.2964022159576416, -1.2027784585952759, -1.1091548204421997, -1.0155311822891235, -0.9219075441360474, -0.8282839059829712, -0.7346602082252502, -0.6410365700721741, -0.5474129319190979, -0.45378923416137695, -0.3601655960083008, -0.2665419578552246, -0.17291830480098724, -0.07929465174674988, 0.014329016208648682, 0.10795265436172485, 0.20157629251480103, 0.295199990272522, 0.38882362842559814, 0.4824472665786743, 0.5760709047317505, 0.6696945428848267, 0.7633182406425476, 0.8569418787956238, 0.9505655169487, 1.044189214706421, 1.137812852859497, 1.2314367294311523, 1.3250603675842285, 1.4186840057373047, 1.5123076438903809, 1.605931282043457, 1.6995549201965332, 1.793178677558899, 1.886802315711975, 1.9804259538650513, 2.074049711227417, 2.167673349380493, 2.2612969875335693, 2.3549206256866455, 2.4485442638397217, 2.542167901992798, 2.635791540145874, 2.72941517829895, 2.8230388164520264, 2.9166624546051025, 3.0102860927581787, 3.103909730911255, 3.197533369064331, 3.2911572456359863, 3.3847808837890625, 3.4784045219421387, 3.572028160095215, 3.665651798248291, 3.759275436401367, 3.8528990745544434, 3.9465227127075195, 4.040146350860596, 4.133769989013672, 4.227393627166748]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 8.0, 15.0, 18.0, 29.0, 38.0, 49.0, 69.0, 83.0, 92.0, 100.0, 97.0, 86.0, 84.0, 44.0, 64.0, 45.0, 27.0, 26.0, 12.0, 10.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3682739734649658, -1.3293551206588745, -1.2904363870620728, -1.2515175342559814, -1.2125988006591797, -1.1736799478530884, -1.1347612142562866, -1.0958423614501953, -1.0569236278533936, -1.0180047750473022, -0.9790860414505005, -0.940167248249054, -0.9012484550476074, -0.8623296022415161, -0.8234108090400696, -0.784492015838623, -0.7455731630325317, -0.7066543698310852, -0.6677355766296387, -0.6288167834281921, -0.5898979902267456, -0.5509791374206543, -0.5120603442192078, -0.47314155101776123, -0.4342227578163147, -0.39530396461486816, -0.35638517141342163, -0.3174663484096527, -0.2785475552082062, -0.23962876200675964, -0.20070995390415192, -0.1617911458015442, -0.12287235260009766, -0.08395355194807053, -0.045034751296043396, -0.006115950644016266, 0.032802850008010864, 0.0717216432094574, 0.11064045131206512, 0.14955925941467285, 0.18847805261611938, 0.22739684581756592, 0.26631563901901245, 0.30523446202278137, 0.3441532552242279, 0.38307204842567444, 0.42199087142944336, 0.4609096646308899, 0.4998284578323364, 0.538747251033783, 0.5776660442352295, 0.616584837436676, 0.6555036306381226, 0.6944224834442139, 0.7333412766456604, 0.7722600698471069, 0.8111788630485535, 0.85009765625, 0.8890164494514465, 0.9279352426528931, 0.9668540954589844, 1.0057728290557861, 1.0446916818618774, 1.0836105346679688, 1.1225292682647705]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 2.0, 5.0, 4.0, 7.0, 19.0, 14.0, 34.0, 49.0, 65.0, 94.0, 165.0, 333.0, 755.0, 1912.0, 5211.0, 17304.0, 71587.0, 397155.0, 442785.0, 82461.0, 19348.0, 5626.0, 1939.0, 791.0, 344.0, 181.0, 102.0, 83.0, 51.0, 30.0, 28.0, 12.0, 12.0, 13.0, 7.0, 11.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.133544921875, -0.1295032501220703, -0.12546157836914062, -0.12141990661621094, -0.11737823486328125, -0.11333656311035156, -0.10929489135742188, -0.10525321960449219, -0.1012115478515625, -0.09716987609863281, -0.09312820434570312, -0.08908653259277344, -0.08504486083984375, -0.08100318908691406, -0.07696151733398438, -0.07291984558105469, -0.068878173828125, -0.06483650207519531, -0.060794830322265625, -0.05675315856933594, -0.05271148681640625, -0.04866981506347656, -0.044628143310546875, -0.04058647155761719, -0.0365447998046875, -0.03250312805175781, -0.028461456298828125, -0.024419784545898438, -0.02037811279296875, -0.016336441040039062, -0.012294769287109375, -0.008253097534179688, -0.00421142578125, -0.0001697540283203125, 0.003871917724609375, 0.007913589477539062, 0.01195526123046875, 0.015996932983398438, 0.020038604736328125, 0.024080276489257812, 0.0281219482421875, 0.03216361999511719, 0.036205291748046875, 0.04024696350097656, 0.04428863525390625, 0.04833030700683594, 0.052371978759765625, 0.05641365051269531, 0.060455322265625, 0.06449699401855469, 0.06853866577148438, 0.07258033752441406, 0.07662200927734375, 0.08066368103027344, 0.08470535278320312, 0.08874702453613281, 0.0927886962890625, 0.09683036804199219, 0.10087203979492188, 0.10491371154785156, 0.10895538330078125, 0.11299705505371094, 0.11703872680664062, 0.12108039855957031, 0.1251220703125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 10.0, 8.0, 6.0, 12.0, 9.0, 17.0, 18.0, 21.0, 23.0, 21.0, 23.0, 33.0, 53.0, 41.0, 45.0, 53.0, 40.0, 43.0, 54.0, 53.0, 34.0, 45.0, 52.0, 46.0, 42.0, 28.0, 28.0, 23.0, 25.0, 22.0, 16.0, 9.0, 14.0, 8.0, 6.0, 4.0, 6.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.044677734375, -0.04303312301635742, -0.041388511657714844, -0.039743900299072266, -0.03809928894042969, -0.03645467758178711, -0.03481006622314453, -0.03316545486450195, -0.031520843505859375, -0.029876232147216797, -0.02823162078857422, -0.02658700942993164, -0.024942398071289062, -0.023297786712646484, -0.021653175354003906, -0.020008563995361328, -0.01836395263671875, -0.016719341278076172, -0.015074729919433594, -0.013430118560791016, -0.011785507202148438, -0.01014089584350586, -0.008496284484863281, -0.006851673126220703, -0.005207061767578125, -0.003562450408935547, -0.0019178390502929688, -0.0002732276916503906, 0.0013713836669921875, 0.0030159950256347656, 0.004660606384277344, 0.006305217742919922, 0.0079498291015625, 0.009594440460205078, 0.011239051818847656, 0.012883663177490234, 0.014528274536132812, 0.01617288589477539, 0.01781749725341797, 0.019462108612060547, 0.021106719970703125, 0.022751331329345703, 0.02439594268798828, 0.02604055404663086, 0.027685165405273438, 0.029329776763916016, 0.030974388122558594, 0.03261899948120117, 0.03426361083984375, 0.03590822219848633, 0.037552833557128906, 0.039197444915771484, 0.04084205627441406, 0.04248666763305664, 0.04413127899169922, 0.0457758903503418, 0.047420501708984375, 0.04906511306762695, 0.05070972442626953, 0.05235433578491211, 0.05399894714355469, 0.055643558502197266, 0.057288169860839844, 0.05893278121948242, 0.060577392578125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 5.0, 10.0, 15.0, 17.0, 22.0, 29.0, 44.0, 68.0, 103.0, 146.0, 199.0, 325.0, 622.0, 1056.0, 2327.0, 7467.0, 50186.0, 855039.0, 112956.0, 11594.0, 3105.0, 1294.0, 700.0, 431.0, 244.0, 163.0, 112.0, 67.0, 60.0, 36.0, 30.0, 11.0, 13.0, 10.0, 8.0, 10.0, 10.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2340087890625, -0.22522544860839844, -0.21644210815429688, -0.2076587677001953, -0.19887542724609375, -0.1900920867919922, -0.18130874633789062, -0.17252540588378906, -0.1637420654296875, -0.15495872497558594, -0.14617538452148438, -0.1373920440673828, -0.12860870361328125, -0.11982536315917969, -0.11104202270507812, -0.10225868225097656, -0.093475341796875, -0.08469200134277344, -0.07590866088867188, -0.06712532043457031, -0.05834197998046875, -0.04955863952636719, -0.040775299072265625, -0.03199195861816406, -0.0232086181640625, -0.014425277709960938, -0.005641937255859375, 0.0031414031982421875, 0.01192474365234375, 0.020708084106445312, 0.029491424560546875, 0.03827476501464844, 0.04705810546875, 0.05584144592285156, 0.06462478637695312, 0.07340812683105469, 0.08219146728515625, 0.09097480773925781, 0.09975814819335938, 0.10854148864746094, 0.1173248291015625, 0.12610816955566406, 0.13489151000976562, 0.1436748504638672, 0.15245819091796875, 0.1612415313720703, 0.17002487182617188, 0.17880821228027344, 0.187591552734375, 0.19637489318847656, 0.20515823364257812, 0.2139415740966797, 0.22272491455078125, 0.2315082550048828, 0.24029159545898438, 0.24907493591308594, 0.2578582763671875, 0.26664161682128906, 0.2754249572753906, 0.2842082977294922, 0.29299163818359375, 0.3017749786376953, 0.3105583190917969, 0.31934165954589844, 0.328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 0.0, 4.0, 11.0, 6.0, 3.0, 13.0, 21.0, 17.0, 20.0, 37.0, 27.0, 52.0, 56.0, 49.0, 53.0, 54.0, 58.0, 66.0, 70.0, 51.0, 58.0, 38.0, 62.0, 29.0, 27.0, 30.0, 14.0, 13.0, 17.0, 9.0, 6.0, 7.0, 7.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.23583984375, -0.22736358642578125, -0.2188873291015625, -0.21041107177734375, -0.201934814453125, -0.19345855712890625, -0.1849822998046875, -0.17650604248046875, -0.16802978515625, -0.15955352783203125, -0.1510772705078125, -0.14260101318359375, -0.134124755859375, -0.12564849853515625, -0.1171722412109375, -0.10869598388671875, -0.1002197265625, -0.09174346923828125, -0.0832672119140625, -0.07479095458984375, -0.066314697265625, -0.05783843994140625, -0.0493621826171875, -0.04088592529296875, -0.03240966796875, -0.02393341064453125, -0.0154571533203125, -0.00698089599609375, 0.001495361328125, 0.00997161865234375, 0.0184478759765625, 0.02692413330078125, 0.035400390625, 0.04387664794921875, 0.0523529052734375, 0.06082916259765625, 0.069305419921875, 0.07778167724609375, 0.0862579345703125, 0.09473419189453125, 0.10321044921875, 0.11168670654296875, 0.1201629638671875, 0.12863922119140625, 0.137115478515625, 0.14559173583984375, 0.1540679931640625, 0.16254425048828125, 0.1710205078125, 0.17949676513671875, 0.1879730224609375, 0.19644927978515625, 0.204925537109375, 0.21340179443359375, 0.2218780517578125, 0.23035430908203125, 0.23883056640625, 0.24730682373046875, 0.2557830810546875, 0.26425933837890625, 0.272735595703125, 0.28121185302734375, 0.2896881103515625, 0.29816436767578125, 0.306640625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 5.0, 6.0, 15.0, 12.0, 20.0, 26.0, 31.0, 59.0, 101.0, 194.0, 373.0, 997.0, 3551.0, 25026.0, 826887.0, 176226.0, 11378.0, 2165.0, 727.0, 291.0, 167.0, 95.0, 55.0, 41.0, 29.0, 21.0, 17.0, 9.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.214599609375, -0.2078571319580078, -0.20111465454101562, -0.19437217712402344, -0.18762969970703125, -0.18088722229003906, -0.17414474487304688, -0.1674022674560547, -0.1606597900390625, -0.1539173126220703, -0.14717483520507812, -0.14043235778808594, -0.13368988037109375, -0.12694740295410156, -0.12020492553710938, -0.11346244812011719, -0.106719970703125, -0.09997749328613281, -0.09323501586914062, -0.08649253845214844, -0.07975006103515625, -0.07300758361816406, -0.06626510620117188, -0.05952262878417969, -0.0527801513671875, -0.04603767395019531, -0.039295196533203125, -0.03255271911621094, -0.02581024169921875, -0.019067764282226562, -0.012325286865234375, -0.0055828094482421875, 0.00115966796875, 0.007902145385742188, 0.014644622802734375, 0.021387100219726562, 0.02812957763671875, 0.03487205505371094, 0.041614532470703125, 0.04835700988769531, 0.0550994873046875, 0.06184196472167969, 0.06858444213867188, 0.07532691955566406, 0.08206939697265625, 0.08881187438964844, 0.09555435180664062, 0.10229682922363281, 0.109039306640625, 0.11578178405761719, 0.12252426147460938, 0.12926673889160156, 0.13600921630859375, 0.14275169372558594, 0.14949417114257812, 0.1562366485595703, 0.1629791259765625, 0.1697216033935547, 0.17646408081054688, 0.18320655822753906, 0.18994903564453125, 0.19669151306152344, 0.20343399047851562, 0.2101764678955078, 0.2169189453125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 10.0, 7.0, 6.0, 5.0, 15.0, 8.0, 18.0, 16.0, 15.0, 28.0, 35.0, 52.0, 69.0, 100.0, 86.0, 104.0, 115.0, 85.0, 60.0, 44.0, 22.0, 24.0, 13.0, 17.0, 15.0, 5.0, 9.0, 11.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.941225051879883e-05, -4.766322672367096e-05, -4.591420292854309e-05, -4.416517913341522e-05, -4.2416155338287354e-05, -4.0667131543159485e-05, -3.8918107748031616e-05, -3.716908395290375e-05, -3.542006015777588e-05, -3.367103636264801e-05, -3.192201256752014e-05, -3.0172988772392273e-05, -2.8423964977264404e-05, -2.6674941182136536e-05, -2.4925917387008667e-05, -2.31768935918808e-05, -2.142786979675293e-05, -1.967884600162506e-05, -1.7929822206497192e-05, -1.6180798411369324e-05, -1.4431774616241455e-05, -1.2682750821113586e-05, -1.0933727025985718e-05, -9.184703230857849e-06, -7.4356794357299805e-06, -5.686655640602112e-06, -3.937631845474243e-06, -2.1886080503463745e-06, -4.3958425521850586e-07, 1.3094395399093628e-06, 3.0584633350372314e-06, 4.8074871301651e-06, 6.556510925292969e-06, 8.305534720420837e-06, 1.0054558515548706e-05, 1.1803582310676575e-05, 1.3552606105804443e-05, 1.5301629900932312e-05, 1.705065369606018e-05, 1.879967749118805e-05, 2.0548701286315918e-05, 2.2297725081443787e-05, 2.4046748876571655e-05, 2.5795772671699524e-05, 2.7544796466827393e-05, 2.929382026195526e-05, 3.104284405708313e-05, 3.2791867852211e-05, 3.454089164733887e-05, 3.6289915442466736e-05, 3.8038939237594604e-05, 3.978796303272247e-05, 4.153698682785034e-05, 4.328601062297821e-05, 4.503503441810608e-05, 4.678405821323395e-05, 4.8533082008361816e-05, 5.0282105803489685e-05, 5.2031129598617554e-05, 5.378015339374542e-05, 5.552917718887329e-05, 5.727820098400116e-05, 5.902722477912903e-05, 6.07762485742569e-05, 6.252527236938477e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 1.0, 5.0, 13.0, 21.0, 11.0, 12.0, 33.0, 36.0, 73.0, 109.0, 178.0, 316.0, 537.0, 1174.0, 3487.0, 16858.0, 190371.0, 786561.0, 39249.0, 6042.0, 1749.0, 747.0, 372.0, 185.0, 128.0, 98.0, 57.0, 35.0, 22.0, 25.0, 18.0, 12.0, 2.0, 7.0, 5.0, 7.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1781005859375, -0.17331314086914062, -0.16852569580078125, -0.16373825073242188, -0.1589508056640625, -0.15416336059570312, -0.14937591552734375, -0.14458847045898438, -0.139801025390625, -0.13501358032226562, -0.13022613525390625, -0.12543869018554688, -0.1206512451171875, -0.11586380004882812, -0.11107635498046875, -0.10628890991210938, -0.10150146484375, -0.09671401977539062, -0.09192657470703125, -0.08713912963867188, -0.0823516845703125, -0.07756423950195312, -0.07277679443359375, -0.06798934936523438, -0.063201904296875, -0.058414459228515625, -0.05362701416015625, -0.048839569091796875, -0.0440521240234375, -0.039264678955078125, -0.03447723388671875, -0.029689788818359375, -0.02490234375, -0.020114898681640625, -0.01532745361328125, -0.010540008544921875, -0.0057525634765625, -0.000965118408203125, 0.00382232666015625, 0.008609771728515625, 0.013397216796875, 0.018184661865234375, 0.02297210693359375, 0.027759552001953125, 0.0325469970703125, 0.037334442138671875, 0.04212188720703125, 0.046909332275390625, 0.05169677734375, 0.056484222412109375, 0.06127166748046875, 0.06605911254882812, 0.0708465576171875, 0.07563400268554688, 0.08042144775390625, 0.08520889282226562, 0.089996337890625, 0.09478378295898438, 0.09957122802734375, 0.10435867309570312, 0.1091461181640625, 0.11393356323242188, 0.11872100830078125, 0.12350845336914062, 0.1282958984375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 14.0, 6.0, 6.0, 15.0, 13.0, 9.0, 16.0, 33.0, 47.0, 60.0, 84.0, 119.0, 129.0, 125.0, 81.0, 71.0, 33.0, 21.0, 17.0, 19.0, 18.0, 13.0, 14.0, 7.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1097412109375, -0.10673236846923828, -0.10372352600097656, -0.10071468353271484, -0.09770584106445312, -0.0946969985961914, -0.09168815612792969, -0.08867931365966797, -0.08567047119140625, -0.08266162872314453, -0.07965278625488281, -0.0766439437866211, -0.07363510131835938, -0.07062625885009766, -0.06761741638183594, -0.06460857391357422, -0.0615997314453125, -0.05859088897705078, -0.05558204650878906, -0.052573204040527344, -0.049564361572265625, -0.046555519104003906, -0.04354667663574219, -0.04053783416748047, -0.03752899169921875, -0.03452014923095703, -0.03151130676269531, -0.028502464294433594, -0.025493621826171875, -0.022484779357910156, -0.019475936889648438, -0.01646709442138672, -0.013458251953125, -0.010449409484863281, -0.0074405670166015625, -0.004431724548339844, -0.001422882080078125, 0.0015859603881835938, 0.0045948028564453125, 0.007603645324707031, 0.01061248779296875, 0.013621330261230469, 0.016630172729492188, 0.019639015197753906, 0.022647857666015625, 0.025656700134277344, 0.028665542602539062, 0.03167438507080078, 0.0346832275390625, 0.03769207000732422, 0.04070091247558594, 0.043709754943847656, 0.046718597412109375, 0.049727439880371094, 0.05273628234863281, 0.05574512481689453, 0.05875396728515625, 0.06176280975341797, 0.06477165222167969, 0.0677804946899414, 0.07078933715820312, 0.07379817962646484, 0.07680702209472656, 0.07981586456298828, 0.08282470703125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 7.0, 22.0, 68.0, 291.0, 398.0, 135.0, 31.0, 12.0, 7.0, 7.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8678526878356934, -1.7646770477294922, -1.6615012884140015, -1.5583256483078003, -1.4551498889923096, -1.3519742488861084, -1.2487986087799072, -1.1456228494644165, -1.0424470901489258, -0.9392713904380798, -0.8360956907272339, -0.7329200506210327, -0.629744291305542, -0.5265686511993408, -0.4233929514884949, -0.3202172517776489, -0.21704161167144775, -0.1138659194111824, -0.010690227150917053, 0.0924854576587677, 0.19566115736961365, 0.2988368272781372, 0.40201252698898315, 0.5051882266998291, 0.608363926410675, 0.711539626121521, 0.8147153258323669, 0.9178910255432129, 1.021066665649414, 1.1242423057556152, 1.227418065071106, 1.3305938243865967, 1.4337694644927979, 1.536945104598999, 1.6401208639144897, 1.743296504020691, 1.8464722633361816, 1.9496479034423828, 2.052823543548584, 2.155999183654785, 2.2591750621795654, 2.3623507022857666, 2.4655263423919678, 2.568702220916748, 2.671877861022949, 2.7750535011291504, 2.8782291412353516, 2.9814047813415527, 3.084580421447754, 3.187756061553955, 3.2909317016601562, 3.3941075801849365, 3.4972832202911377, 3.600458860397339, 3.70363450050354, 3.8068103790283203, 3.9099860191345215, 4.013161659240723, 4.116337299346924, 4.219512939453125, 4.322688579559326, 4.425864219665527, 4.529040336608887, 4.632215976715088, 4.735391616821289]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 7.0, 3.0, 2.0, 7.0, 8.0, 11.0, 12.0, 20.0, 20.0, 20.0, 23.0, 21.0, 32.0, 37.0, 39.0, 45.0, 45.0, 68.0, 82.0, 72.0, 58.0, 34.0, 45.0, 33.0, 28.0, 37.0, 28.0, 20.0, 17.0, 22.0, 24.0, 17.0, 9.0, 10.0, 9.0, 7.0, 7.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8480085730552673, -0.8180218935012817, -0.7880352139472961, -0.7580485343933105, -0.7280619144439697, -0.6980751752853394, -0.6680885553359985, -0.6381018757820129, -0.6081151962280273, -0.5781285166740417, -0.5481418371200562, -0.5181551575660706, -0.48816850781440735, -0.45818182826042175, -0.42819517850875854, -0.39820849895477295, -0.36822181940078735, -0.33823513984680176, -0.30824846029281616, -0.27826181054115295, -0.24827513098716736, -0.21828845143318176, -0.18830178678035736, -0.15831512212753296, -0.12832844257354736, -0.09834177047014236, -0.06835509836673737, -0.03836842626333237, -0.008381754159927368, 0.021604925394058228, 0.05159159004688263, 0.08157825469970703, 0.1115649938583374, 0.141551673412323, 0.1715383380651474, 0.2015250027179718, 0.2315116822719574, 0.261498361825943, 0.2914850115776062, 0.3214716911315918, 0.3514583706855774, 0.381445050239563, 0.4114317297935486, 0.4414183795452118, 0.4714050590991974, 0.5013917684555054, 0.5313783884048462, 0.5613650679588318, 0.5913517475128174, 0.621338427066803, 0.6513251066207886, 0.6813117861747742, 0.7112984657287598, 0.7412850856781006, 0.7712717652320862, 0.8012584447860718, 0.8312451243400574, 0.861231803894043, 0.8912184834480286, 0.9212051630020142, 0.951191782951355, 0.9811785221099854, 1.0111651420593262, 1.041151762008667, 1.0711385011672974]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 5.0, 11.0, 13.0, 23.0, 30.0, 49.0, 85.0, 102.0, 201.0, 378.0, 768.0, 1714.0, 4226.0, 14790.0, 91707.0, 1459955.0, 2429215.0, 164035.0, 19089.0, 4530.0, 1608.0, 724.0, 408.0, 220.0, 147.0, 89.0, 47.0, 27.0, 25.0, 16.0, 13.0, 11.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1112060546875, -0.10763263702392578, -0.10405921936035156, -0.10048580169677734, -0.09691238403320312, -0.0933389663696289, -0.08976554870605469, -0.08619213104248047, -0.08261871337890625, -0.07904529571533203, -0.07547187805175781, -0.0718984603881836, -0.06832504272460938, -0.06475162506103516, -0.06117820739746094, -0.05760478973388672, -0.0540313720703125, -0.05045795440673828, -0.04688453674316406, -0.043311119079589844, -0.039737701416015625, -0.036164283752441406, -0.03259086608886719, -0.02901744842529297, -0.02544403076171875, -0.02187061309814453, -0.018297195434570312, -0.014723777770996094, -0.011150360107421875, -0.007576942443847656, -0.0040035247802734375, -0.00043010711669921875, 0.003143310546875, 0.006716728210449219, 0.010290145874023438, 0.013863563537597656, 0.017436981201171875, 0.021010398864746094, 0.024583816528320312, 0.02815723419189453, 0.03173065185546875, 0.03530406951904297, 0.03887748718261719, 0.042450904846191406, 0.046024322509765625, 0.049597740173339844, 0.05317115783691406, 0.05674457550048828, 0.0603179931640625, 0.06389141082763672, 0.06746482849121094, 0.07103824615478516, 0.07461166381835938, 0.0781850814819336, 0.08175849914550781, 0.08533191680908203, 0.08890533447265625, 0.09247875213623047, 0.09605216979980469, 0.0996255874633789, 0.10319900512695312, 0.10677242279052734, 0.11034584045410156, 0.11391925811767578, 0.11749267578125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 5.0, 7.0, 9.0, 12.0, 9.0, 16.0, 21.0, 31.0, 51.0, 45.0, 55.0, 76.0, 69.0, 76.0, 78.0, 73.0, 66.0, 48.0, 59.0, 42.0, 51.0, 29.0, 18.0, 15.0, 14.0, 8.0, 10.0, 5.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05584716796875, -0.05336570739746094, -0.050884246826171875, -0.04840278625488281, -0.04592132568359375, -0.04343986511230469, -0.040958404541015625, -0.03847694396972656, -0.0359954833984375, -0.03351402282714844, -0.031032562255859375, -0.028551101684570312, -0.02606964111328125, -0.023588180541992188, -0.021106719970703125, -0.018625259399414062, -0.016143798828125, -0.013662338256835938, -0.011180877685546875, -0.008699417114257812, -0.00621795654296875, -0.0037364959716796875, -0.001255035400390625, 0.0012264251708984375, 0.0037078857421875, 0.0061893463134765625, 0.008670806884765625, 0.011152267456054688, 0.01363372802734375, 0.016115188598632812, 0.018596649169921875, 0.021078109741210938, 0.0235595703125, 0.026041030883789062, 0.028522491455078125, 0.031003952026367188, 0.03348541259765625, 0.03596687316894531, 0.038448333740234375, 0.04092979431152344, 0.0434112548828125, 0.04589271545410156, 0.048374176025390625, 0.05085563659667969, 0.05333709716796875, 0.05581855773925781, 0.058300018310546875, 0.06078147888183594, 0.063262939453125, 0.06574440002441406, 0.06822586059570312, 0.07070732116699219, 0.07318878173828125, 0.07567024230957031, 0.07815170288085938, 0.08063316345214844, 0.0831146240234375, 0.08559608459472656, 0.08807754516601562, 0.09055900573730469, 0.09304046630859375, 0.09552192687988281, 0.09800338745117188, 0.10048484802246094, 0.10296630859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 10.0, 8.0, 18.0, 23.0, 39.0, 53.0, 80.0, 118.0, 191.0, 384.0, 1032.0, 4371.0, 93621.0, 4058113.0, 31368.0, 3268.0, 849.0, 335.0, 142.0, 99.0, 57.0, 32.0, 16.0, 22.0, 10.0, 8.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.52197265625, -0.5096549987792969, -0.49733734130859375, -0.4850196838378906, -0.4727020263671875, -0.4603843688964844, -0.44806671142578125, -0.4357490539550781, -0.423431396484375, -0.4111137390136719, -0.39879608154296875, -0.3864784240722656, -0.3741607666015625, -0.3618431091308594, -0.34952545166015625, -0.3372077941894531, -0.32489013671875, -0.3125724792480469, -0.30025482177734375, -0.2879371643066406, -0.2756195068359375, -0.2633018493652344, -0.25098419189453125, -0.23866653442382812, -0.226348876953125, -0.21403121948242188, -0.20171356201171875, -0.18939590454101562, -0.1770782470703125, -0.16476058959960938, -0.15244293212890625, -0.14012527465820312, -0.1278076171875, -0.11548995971679688, -0.10317230224609375, -0.09085464477539062, -0.0785369873046875, -0.06621932983398438, -0.05390167236328125, -0.041584014892578125, -0.029266357421875, -0.016948699951171875, -0.00463104248046875, 0.007686614990234375, 0.0200042724609375, 0.032321929931640625, 0.04463958740234375, 0.056957244873046875, 0.06927490234375, 0.08159255981445312, 0.09391021728515625, 0.10622787475585938, 0.1185455322265625, 0.13086318969726562, 0.14318084716796875, 0.15549850463867188, 0.167816162109375, 0.18013381958007812, 0.19245147705078125, 0.20476913452148438, 0.2170867919921875, 0.22940444946289062, 0.24172210693359375, 0.2540397644042969, 0.266357421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 9.0, 11.0, 16.0, 29.0, 51.0, 82.0, 199.0, 486.0, 899.0, 1034.0, 682.0, 292.0, 132.0, 65.0, 28.0, 14.0, 13.0, 8.0, 8.0, 2.0, 3.0, 9.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.23779296875, -0.23082733154296875, -0.2238616943359375, -0.21689605712890625, -0.209930419921875, -0.20296478271484375, -0.1959991455078125, -0.18903350830078125, -0.18206787109375, -0.17510223388671875, -0.1681365966796875, -0.16117095947265625, -0.154205322265625, -0.14723968505859375, -0.1402740478515625, -0.13330841064453125, -0.1263427734375, -0.11937713623046875, -0.1124114990234375, -0.10544586181640625, -0.098480224609375, -0.09151458740234375, -0.0845489501953125, -0.07758331298828125, -0.07061767578125, -0.06365203857421875, -0.0566864013671875, -0.04972076416015625, -0.042755126953125, -0.03578948974609375, -0.0288238525390625, -0.02185821533203125, -0.014892578125, -0.00792694091796875, -0.0009613037109375, 0.00600433349609375, 0.012969970703125, 0.01993560791015625, 0.0269012451171875, 0.03386688232421875, 0.04083251953125, 0.04779815673828125, 0.0547637939453125, 0.06172943115234375, 0.068695068359375, 0.07566070556640625, 0.0826263427734375, 0.08959197998046875, 0.0965576171875, 0.10352325439453125, 0.1104888916015625, 0.11745452880859375, 0.124420166015625, 0.13138580322265625, 0.1383514404296875, 0.14531707763671875, 0.15228271484375, 0.15924835205078125, 0.1662139892578125, 0.17317962646484375, 0.180145263671875, 0.18711090087890625, 0.1940765380859375, 0.20104217529296875, 0.2080078125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 9.0, 10.0, 33.0, 138.0, 350.0, 319.0, 84.0, 25.0, 13.0, 10.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6513679027557373, -3.549821615219116, -3.448275327682495, -3.346729040145874, -3.245182752609253, -3.143636465072632, -3.0420901775360107, -2.9405438899993896, -2.8389976024627686, -2.7374513149261475, -2.6359050273895264, -2.5343587398529053, -2.432812452316284, -2.331266164779663, -2.229719877243042, -2.128173589706421, -2.0266273021698, -1.9250810146331787, -1.8235347270965576, -1.7219884395599365, -1.6204421520233154, -1.5188958644866943, -1.4173495769500732, -1.3158032894134521, -1.214257001876831, -1.11271071434021, -1.0111644268035889, -0.9096181392669678, -0.8080718517303467, -0.7065255641937256, -0.6049792766571045, -0.5034329891204834, -0.4018867015838623, -0.3003404140472412, -0.19879412651062012, -0.09724783897399902, 0.00429844856262207, 0.10584473609924316, 0.20739102363586426, 0.30893731117248535, 0.41048359870910645, 0.5120298862457275, 0.6135761737823486, 0.7151224613189697, 0.8166687488555908, 0.9182150363922119, 1.019761323928833, 1.121307611465454, 1.2228538990020752, 1.3244001865386963, 1.4259464740753174, 1.5274927616119385, 1.6290390491485596, 1.7305853366851807, 1.8321316242218018, 1.9336779117584229, 2.035224199295044, 2.136770486831665, 2.238316774368286, 2.3398630619049072, 2.4414093494415283, 2.5429556369781494, 2.6445019245147705, 2.7460482120513916, 2.8475944995880127]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 5.0, 2.0, 7.0, 15.0, 15.0, 15.0, 18.0, 28.0, 31.0, 33.0, 55.0, 57.0, 59.0, 65.0, 65.0, 68.0, 65.0, 53.0, 59.0, 55.0, 39.0, 33.0, 30.0, 28.0, 27.0, 12.0, 13.0, 11.0, 9.0, 9.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9541041851043701, -0.9271227717399597, -0.9001412987709045, -0.8731598854064941, -0.8461784720420837, -0.8191969990730286, -0.7922155857086182, -0.765234112739563, -0.7382526993751526, -0.7112712860107422, -0.684289813041687, -0.6573083996772766, -0.6303269863128662, -0.603345513343811, -0.5763640999794006, -0.5493826866149902, -0.5224012136459351, -0.49541977047920227, -0.46843835711479187, -0.4414569139480591, -0.4144754707813263, -0.3874940276145935, -0.3605126142501831, -0.3335311710834503, -0.3065497875213623, -0.2795683443546295, -0.2525869309902191, -0.22560548782348633, -0.19862404465675354, -0.17164261639118195, -0.14466118812561035, -0.11767974495887756, -0.09069830179214478, -0.06371686607599258, -0.03673543408513069, -0.009754002094268799, 0.017227433621883392, 0.044208869338035583, 0.07119029760360718, 0.09817174077033997, 0.12515316903591156, 0.15213459730148315, 0.17911604046821594, 0.20609746873378754, 0.23307889699935913, 0.2600603401660919, 0.2870417833328247, 0.3140231966972351, 0.3410046398639679, 0.3679860830307007, 0.3949674963951111, 0.42194893956184387, 0.44893038272857666, 0.47591179609298706, 0.5028932094573975, 0.5298746824264526, 0.556856095790863, 0.5838375091552734, 0.6108189821243286, 0.637800395488739, 0.6647818088531494, 0.6917632818222046, 0.718744695186615, 0.7457261085510254, 0.7727075815200806]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 6.0, 5.0, 11.0, 16.0, 21.0, 32.0, 54.0, 60.0, 118.0, 220.0, 334.0, 787.0, 1890.0, 5194.0, 18033.0, 85540.0, 434305.0, 401460.0, 75910.0, 16181.0, 4929.0, 1831.0, 758.0, 333.0, 174.0, 130.0, 57.0, 52.0, 29.0, 19.0, 17.0, 8.0, 8.0, 3.0, 7.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.099853515625, -0.096282958984375, -0.09271240234375, -0.089141845703125, -0.0855712890625, -0.082000732421875, -0.07843017578125, -0.074859619140625, -0.0712890625, -0.067718505859375, -0.06414794921875, -0.060577392578125, -0.0570068359375, -0.053436279296875, -0.04986572265625, -0.046295166015625, -0.042724609375, -0.039154052734375, -0.03558349609375, -0.032012939453125, -0.0284423828125, -0.024871826171875, -0.02130126953125, -0.017730712890625, -0.01416015625, -0.010589599609375, -0.00701904296875, -0.003448486328125, 0.0001220703125, 0.003692626953125, 0.00726318359375, 0.010833740234375, 0.014404296875, 0.017974853515625, 0.02154541015625, 0.025115966796875, 0.0286865234375, 0.032257080078125, 0.03582763671875, 0.039398193359375, 0.04296875, 0.046539306640625, 0.05010986328125, 0.053680419921875, 0.0572509765625, 0.060821533203125, 0.06439208984375, 0.067962646484375, 0.071533203125, 0.075103759765625, 0.07867431640625, 0.082244873046875, 0.0858154296875, 0.089385986328125, 0.09295654296875, 0.096527099609375, 0.10009765625, 0.103668212890625, 0.10723876953125, 0.110809326171875, 0.1143798828125, 0.117950439453125, 0.12152099609375, 0.125091552734375, 0.128662109375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 8.0, 7.0, 23.0, 35.0, 35.0, 37.0, 46.0, 68.0, 54.0, 83.0, 71.0, 72.0, 80.0, 67.0, 63.0, 50.0, 57.0, 37.0, 36.0, 24.0, 14.0, 7.0, 13.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09454345703125, -0.09170722961425781, -0.08887100219726562, -0.08603477478027344, -0.08319854736328125, -0.08036231994628906, -0.07752609252929688, -0.07468986511230469, -0.0718536376953125, -0.06901741027832031, -0.06618118286132812, -0.06334495544433594, -0.06050872802734375, -0.05767250061035156, -0.054836273193359375, -0.05200004577636719, -0.049163818359375, -0.04632759094238281, -0.043491363525390625, -0.04065513610839844, -0.03781890869140625, -0.03498268127441406, -0.032146453857421875, -0.029310226440429688, -0.0264739990234375, -0.023637771606445312, -0.020801544189453125, -0.017965316772460938, -0.01512908935546875, -0.012292861938476562, -0.009456634521484375, -0.0066204071044921875, -0.0037841796875, -0.0009479522705078125, 0.001888275146484375, 0.0047245025634765625, 0.00756072998046875, 0.010396957397460938, 0.013233184814453125, 0.016069412231445312, 0.0189056396484375, 0.021741867065429688, 0.024578094482421875, 0.027414321899414062, 0.03025054931640625, 0.03308677673339844, 0.035923004150390625, 0.03875923156738281, 0.041595458984375, 0.04443168640136719, 0.047267913818359375, 0.05010414123535156, 0.05294036865234375, 0.05577659606933594, 0.058612823486328125, 0.06144905090332031, 0.0642852783203125, 0.06712150573730469, 0.06995773315429688, 0.07279396057128906, 0.07563018798828125, 0.07846641540527344, 0.08130264282226562, 0.08413887023925781, 0.08697509765625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 14.0, 19.0, 32.0, 51.0, 70.0, 128.0, 261.0, 622.0, 2097.0, 11284.0, 182640.0, 804528.0, 40105.0, 4708.0, 1111.0, 416.0, 169.0, 106.0, 65.0, 42.0, 17.0, 13.0, 13.0, 15.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.179443359375, -0.17204666137695312, -0.16464996337890625, -0.15725326538085938, -0.1498565673828125, -0.14245986938476562, -0.13506317138671875, -0.12766647338867188, -0.120269775390625, -0.11287307739257812, -0.10547637939453125, -0.09807968139648438, -0.0906829833984375, -0.08328628540039062, -0.07588958740234375, -0.06849288940429688, -0.06109619140625, -0.053699493408203125, -0.04630279541015625, -0.038906097412109375, -0.0315093994140625, -0.024112701416015625, -0.01671600341796875, -0.009319305419921875, -0.001922607421875, 0.005474090576171875, 0.01287078857421875, 0.020267486572265625, 0.0276641845703125, 0.035060882568359375, 0.04245758056640625, 0.049854278564453125, 0.0572509765625, 0.06464767456054688, 0.07204437255859375, 0.07944107055664062, 0.0868377685546875, 0.09423446655273438, 0.10163116455078125, 0.10902786254882812, 0.116424560546875, 0.12382125854492188, 0.13121795654296875, 0.13861465454101562, 0.1460113525390625, 0.15340805053710938, 0.16080474853515625, 0.16820144653320312, 0.17559814453125, 0.18299484252929688, 0.19039154052734375, 0.19778823852539062, 0.2051849365234375, 0.21258163452148438, 0.21997833251953125, 0.22737503051757812, 0.234771728515625, 0.24216842651367188, 0.24956512451171875, 0.2569618225097656, 0.2643585205078125, 0.2717552185058594, 0.27915191650390625, 0.2865486145019531, 0.2939453125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 4.0, 1.0, 6.0, 6.0, 8.0, 9.0, 7.0, 16.0, 20.0, 19.0, 26.0, 17.0, 28.0, 33.0, 37.0, 45.0, 49.0, 42.0, 36.0, 61.0, 50.0, 57.0, 57.0, 42.0, 59.0, 37.0, 45.0, 27.0, 28.0, 23.0, 17.0, 20.0, 22.0, 7.0, 12.0, 7.0, 5.0, 8.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.233154296875, -0.22554779052734375, -0.2179412841796875, -0.21033477783203125, -0.202728271484375, -0.19512176513671875, -0.1875152587890625, -0.17990875244140625, -0.17230224609375, -0.16469573974609375, -0.1570892333984375, -0.14948272705078125, -0.141876220703125, -0.13426971435546875, -0.1266632080078125, -0.11905670166015625, -0.1114501953125, -0.10384368896484375, -0.0962371826171875, -0.08863067626953125, -0.081024169921875, -0.07341766357421875, -0.0658111572265625, -0.05820465087890625, -0.05059814453125, -0.04299163818359375, -0.0353851318359375, -0.02777862548828125, -0.020172119140625, -0.01256561279296875, -0.0049591064453125, 0.00264739990234375, 0.01025390625, 0.01786041259765625, 0.0254669189453125, 0.03307342529296875, 0.040679931640625, 0.04828643798828125, 0.0558929443359375, 0.06349945068359375, 0.07110595703125, 0.07871246337890625, 0.0863189697265625, 0.09392547607421875, 0.101531982421875, 0.10913848876953125, 0.1167449951171875, 0.12435150146484375, 0.1319580078125, 0.13956451416015625, 0.1471710205078125, 0.15477752685546875, 0.162384033203125, 0.16999053955078125, 0.1775970458984375, 0.18520355224609375, 0.19281005859375, 0.20041656494140625, 0.2080230712890625, 0.21562957763671875, 0.223236083984375, 0.23084259033203125, 0.2384490966796875, 0.24605560302734375, 0.253662109375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 9.0, 9.0, 11.0, 25.0, 26.0, 43.0, 64.0, 113.0, 202.0, 353.0, 669.0, 1326.0, 2878.0, 6432.0, 18569.0, 71373.0, 537056.0, 320540.0, 60790.0, 16487.0, 6201.0, 2603.0, 1251.0, 671.0, 368.0, 192.0, 113.0, 61.0, 46.0, 18.0, 19.0, 14.0, 10.0, 5.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047454833984375, -0.045626163482666016, -0.04379749298095703, -0.04196882247924805, -0.04014015197753906, -0.03831148147583008, -0.036482810974121094, -0.03465414047241211, -0.032825469970703125, -0.03099679946899414, -0.029168128967285156, -0.027339458465576172, -0.025510787963867188, -0.023682117462158203, -0.02185344696044922, -0.020024776458740234, -0.01819610595703125, -0.016367435455322266, -0.014538764953613281, -0.012710094451904297, -0.010881423950195312, -0.009052753448486328, -0.007224082946777344, -0.005395412445068359, -0.003566741943359375, -0.0017380714416503906, 9.059906005859375e-05, 0.0019192695617675781, 0.0037479400634765625, 0.005576610565185547, 0.007405281066894531, 0.009233951568603516, 0.0110626220703125, 0.012891292572021484, 0.014719963073730469, 0.016548633575439453, 0.018377304077148438, 0.020205974578857422, 0.022034645080566406, 0.02386331558227539, 0.025691986083984375, 0.02752065658569336, 0.029349327087402344, 0.031177997589111328, 0.03300666809082031, 0.0348353385925293, 0.03666400909423828, 0.038492679595947266, 0.04032135009765625, 0.042150020599365234, 0.04397869110107422, 0.0458073616027832, 0.04763603210449219, 0.04946470260620117, 0.051293373107910156, 0.05312204360961914, 0.054950714111328125, 0.05677938461303711, 0.058608055114746094, 0.06043672561645508, 0.06226539611816406, 0.06409406661987305, 0.06592273712158203, 0.06775140762329102, 0.069580078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 6.0, 6.0, 13.0, 19.0, 27.0, 33.0, 33.0, 58.0, 71.0, 62.0, 62.0, 92.0, 82.0, 81.0, 77.0, 52.0, 49.0, 44.0, 29.0, 19.0, 20.0, 12.0, 11.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.540515899658203e-05, -3.441609442234039e-05, -3.3427029848098755e-05, -3.243796527385712e-05, -3.144890069961548e-05, -3.045983612537384e-05, -2.9470771551132202e-05, -2.8481706976890564e-05, -2.7492642402648926e-05, -2.6503577828407288e-05, -2.551451325416565e-05, -2.452544867992401e-05, -2.3536384105682373e-05, -2.2547319531440735e-05, -2.1558254957199097e-05, -2.056919038295746e-05, -1.958012580871582e-05, -1.8591061234474182e-05, -1.7601996660232544e-05, -1.6612932085990906e-05, -1.5623867511749268e-05, -1.463480293750763e-05, -1.3645738363265991e-05, -1.2656673789024353e-05, -1.1667609214782715e-05, -1.0678544640541077e-05, -9.689480066299438e-06, -8.7004154920578e-06, -7.711350917816162e-06, -6.722286343574524e-06, -5.733221769332886e-06, -4.7441571950912476e-06, -3.7550926208496094e-06, -2.766028046607971e-06, -1.776963472366333e-06, -7.878988981246948e-07, 2.0116567611694336e-07, 1.1902302503585815e-06, 2.1792948246002197e-06, 3.168359398841858e-06, 4.157423973083496e-06, 5.146488547325134e-06, 6.1355531215667725e-06, 7.124617695808411e-06, 8.113682270050049e-06, 9.102746844291687e-06, 1.0091811418533325e-05, 1.1080875992774963e-05, 1.2069940567016602e-05, 1.305900514125824e-05, 1.4048069715499878e-05, 1.5037134289741516e-05, 1.6026198863983154e-05, 1.7015263438224792e-05, 1.800432801246643e-05, 1.899339258670807e-05, 1.9982457160949707e-05, 2.0971521735191345e-05, 2.1960586309432983e-05, 2.294965088367462e-05, 2.393871545791626e-05, 2.4927780032157898e-05, 2.5916844606399536e-05, 2.6905909180641174e-05, 2.7894973754882812e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 11.0, 2.0, 16.0, 21.0, 31.0, 35.0, 86.0, 159.0, 250.0, 569.0, 1247.0, 2825.0, 7651.0, 24656.0, 111185.0, 651373.0, 193221.0, 37927.0, 10512.0, 3760.0, 1579.0, 669.0, 340.0, 176.0, 91.0, 58.0, 28.0, 28.0, 17.0, 12.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06671142578125, -0.06466865539550781, -0.06262588500976562, -0.06058311462402344, -0.05854034423828125, -0.05649757385253906, -0.054454803466796875, -0.05241203308105469, -0.0503692626953125, -0.04832649230957031, -0.046283721923828125, -0.04424095153808594, -0.04219818115234375, -0.04015541076660156, -0.038112640380859375, -0.03606986999511719, -0.034027099609375, -0.03198432922363281, -0.029941558837890625, -0.027898788452148438, -0.02585601806640625, -0.023813247680664062, -0.021770477294921875, -0.019727706909179688, -0.0176849365234375, -0.015642166137695312, -0.013599395751953125, -0.011556625366210938, -0.00951385498046875, -0.0074710845947265625, -0.005428314208984375, -0.0033855438232421875, -0.0013427734375, 0.0006999969482421875, 0.002742767333984375, 0.0047855377197265625, 0.00682830810546875, 0.008871078491210938, 0.010913848876953125, 0.012956619262695312, 0.0149993896484375, 0.017042160034179688, 0.019084930419921875, 0.021127700805664062, 0.02317047119140625, 0.025213241577148438, 0.027256011962890625, 0.029298782348632812, 0.031341552734375, 0.03338432312011719, 0.035427093505859375, 0.03746986389160156, 0.03951263427734375, 0.04155540466308594, 0.043598175048828125, 0.04564094543457031, 0.0476837158203125, 0.04972648620605469, 0.051769256591796875, 0.05381202697753906, 0.05585479736328125, 0.05789756774902344, 0.059940338134765625, 0.06198310852050781, 0.06402587890625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 5.0, 8.0, 15.0, 11.0, 12.0, 18.0, 25.0, 36.0, 50.0, 54.0, 60.0, 103.0, 91.0, 99.0, 85.0, 69.0, 47.0, 37.0, 34.0, 18.0, 21.0, 19.0, 16.0, 7.0, 7.0, 11.0, 3.0, 3.0, 2.0, 4.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.060394287109375, -0.058629512786865234, -0.05686473846435547, -0.0550999641418457, -0.05333518981933594, -0.05157041549682617, -0.049805641174316406, -0.04804086685180664, -0.046276092529296875, -0.04451131820678711, -0.042746543884277344, -0.04098176956176758, -0.03921699523925781, -0.03745222091674805, -0.03568744659423828, -0.033922672271728516, -0.03215789794921875, -0.030393123626708984, -0.02862834930419922, -0.026863574981689453, -0.025098800659179688, -0.023334026336669922, -0.021569252014160156, -0.01980447769165039, -0.018039703369140625, -0.01627492904663086, -0.014510154724121094, -0.012745380401611328, -0.010980606079101562, -0.009215831756591797, -0.007451057434082031, -0.005686283111572266, -0.0039215087890625, -0.0021567344665527344, -0.00039196014404296875, 0.0013728141784667969, 0.0031375885009765625, 0.004902362823486328, 0.006667137145996094, 0.00843191146850586, 0.010196685791015625, 0.01196146011352539, 0.013726234436035156, 0.015491008758544922, 0.017255783081054688, 0.019020557403564453, 0.02078533172607422, 0.022550106048583984, 0.02431488037109375, 0.026079654693603516, 0.02784442901611328, 0.029609203338623047, 0.03137397766113281, 0.03313875198364258, 0.034903526306152344, 0.03666830062866211, 0.038433074951171875, 0.04019784927368164, 0.041962623596191406, 0.04372739791870117, 0.04549217224121094, 0.0472569465637207, 0.04902172088623047, 0.050786495208740234, 0.05255126953125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 11.0, 46.0, 148.0, 396.0, 247.0, 97.0, 27.0, 7.0, 8.0, 5.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.970097064971924, -2.8990728855133057, -2.8280487060546875, -2.7570247650146484, -2.6860005855560303, -2.614976406097412, -2.543952465057373, -2.472928285598755, -2.4019041061401367, -2.3308799266815186, -2.2598557472229004, -2.1888318061828613, -2.117807626724243, -2.046783447265625, -1.9757593870162964, -1.9047353267669678, -1.8337111473083496, -1.7626869678497314, -1.6916629076004028, -1.6206388473510742, -1.549614667892456, -1.478590488433838, -1.4075664281845093, -1.3365423679351807, -1.2655181884765625, -1.1944940090179443, -1.1234699487686157, -1.052445888519287, -0.981421709060669, -0.9103975892066956, -0.8393734693527222, -0.7683493494987488, -0.6973253488540649, -0.6263012290000916, -0.5552771091461182, -0.4842529892921448, -0.4132288694381714, -0.342204749584198, -0.2711806297302246, -0.20015650987625122, -0.12913239002227783, -0.05810827016830444, 0.012915849685668945, 0.08393996953964233, 0.15496408939361572, 0.2259882092475891, 0.2970123291015625, 0.3680364489555359, 0.4390605688095093, 0.5100846886634827, 0.581108808517456, 0.6521329283714294, 0.7231570482254028, 0.7941811680793762, 0.8652052879333496, 0.936229407787323, 1.0072535276412964, 1.078277587890625, 1.1493017673492432, 1.2203259468078613, 1.29135000705719, 1.3623740673065186, 1.4333982467651367, 1.5044224262237549, 1.5754464864730835]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 3.0, 6.0, 4.0, 11.0, 9.0, 3.0, 16.0, 15.0, 16.0, 23.0, 24.0, 29.0, 40.0, 39.0, 43.0, 57.0, 65.0, 97.0, 93.0, 78.0, 47.0, 36.0, 30.0, 41.0, 31.0, 22.0, 26.0, 15.0, 19.0, 15.0, 20.0, 6.0, 7.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9863627552986145, -0.952122688293457, -0.9178825616836548, -0.8836424350738525, -0.8494023680686951, -0.8151623010635376, -0.7809221744537354, -0.7466820478439331, -0.7124419808387756, -0.6782019138336182, -0.6439617872238159, -0.6097216606140137, -0.5754815936088562, -0.5412415266036987, -0.5070013999938965, -0.4727613031864166, -0.43852120637893677, -0.4042811095714569, -0.37004101276397705, -0.3358009159564972, -0.30156081914901733, -0.2673207223415375, -0.23308062553405762, -0.19884052872657776, -0.1646004319190979, -0.13036033511161804, -0.09612023830413818, -0.061880141496658325, -0.027640044689178467, 0.006600052118301392, 0.04084014892578125, 0.07508024573326111, 0.10932040214538574, 0.1435604989528656, 0.17780059576034546, 0.21204069256782532, 0.24628078937530518, 0.28052088618278503, 0.3147609829902649, 0.34900107979774475, 0.3832411766052246, 0.41748127341270447, 0.4517213702201843, 0.4859614670276642, 0.520201563835144, 0.5544416904449463, 0.5886817574501038, 0.6229218244552612, 0.6571619510650635, 0.6914020776748657, 0.7256421446800232, 0.7598822116851807, 0.7941223382949829, 0.8283624649047852, 0.8626025319099426, 0.8968425989151001, 0.9310827255249023, 0.9653228521347046, 0.9995629191398621, 1.0338029861450195, 1.0680431127548218, 1.102283239364624, 1.1365232467651367, 1.170763373374939, 1.2050034999847412]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 13.0, 12.0, 26.0, 44.0, 72.0, 125.0, 245.0, 476.0, 1103.0, 2684.0, 7327.0, 31737.0, 276997.0, 2526750.0, 1227678.0, 96956.0, 15236.0, 4107.0, 1474.0, 573.0, 281.0, 153.0, 82.0, 48.0, 32.0, 20.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.098388671875, -0.094970703125, -0.091552734375, -0.088134765625, -0.084716796875, -0.081298828125, -0.077880859375, -0.074462890625, -0.071044921875, -0.067626953125, -0.064208984375, -0.060791015625, -0.057373046875, -0.053955078125, -0.050537109375, -0.047119140625, -0.043701171875, -0.040283203125, -0.036865234375, -0.033447265625, -0.030029296875, -0.026611328125, -0.023193359375, -0.019775390625, -0.016357421875, -0.012939453125, -0.009521484375, -0.006103515625, -0.002685546875, 0.000732421875, 0.004150390625, 0.007568359375, 0.010986328125, 0.014404296875, 0.017822265625, 0.021240234375, 0.024658203125, 0.028076171875, 0.031494140625, 0.034912109375, 0.038330078125, 0.041748046875, 0.045166015625, 0.048583984375, 0.052001953125, 0.055419921875, 0.058837890625, 0.062255859375, 0.065673828125, 0.069091796875, 0.072509765625, 0.075927734375, 0.079345703125, 0.082763671875, 0.086181640625, 0.089599609375, 0.093017578125, 0.096435546875, 0.099853515625, 0.103271484375, 0.106689453125, 0.110107421875, 0.113525390625, 0.116943359375, 0.120361328125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 14.0, 8.0, 17.0, 18.0, 40.0, 35.0, 27.0, 49.0, 46.0, 64.0, 72.0, 69.0, 67.0, 73.0, 70.0, 54.0, 69.0, 54.0, 35.0, 29.0, 27.0, 16.0, 11.0, 14.0, 7.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.063232421875, -0.06053733825683594, -0.057842254638671875, -0.05514717102050781, -0.05245208740234375, -0.04975700378417969, -0.047061920166015625, -0.04436683654785156, -0.0416717529296875, -0.03897666931152344, -0.036281585693359375, -0.03358650207519531, -0.03089141845703125, -0.028196334838867188, -0.025501251220703125, -0.022806167602539062, -0.020111083984375, -0.017416000366210938, -0.014720916748046875, -0.012025833129882812, -0.00933074951171875, -0.0066356658935546875, -0.003940582275390625, -0.0012454986572265625, 0.0014495849609375, 0.0041446685791015625, 0.006839752197265625, 0.009534835815429688, 0.01222991943359375, 0.014925003051757812, 0.017620086669921875, 0.020315170288085938, 0.02301025390625, 0.025705337524414062, 0.028400421142578125, 0.031095504760742188, 0.03379058837890625, 0.03648567199707031, 0.039180755615234375, 0.04187583923339844, 0.0445709228515625, 0.04726600646972656, 0.049961090087890625, 0.05265617370605469, 0.05535125732421875, 0.05804634094238281, 0.060741424560546875, 0.06343650817871094, 0.066131591796875, 0.06882667541503906, 0.07152175903320312, 0.07421684265136719, 0.07691192626953125, 0.07960700988769531, 0.08230209350585938, 0.08499717712402344, 0.0876922607421875, 0.09038734436035156, 0.09308242797851562, 0.09577751159667969, 0.09847259521484375, 0.10116767883300781, 0.10386276245117188, 0.10655784606933594, 0.1092529296875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 2.0, 8.0, 10.0, 16.0, 19.0, 24.0, 33.0, 38.0, 51.0, 110.0, 145.0, 261.0, 473.0, 1060.0, 3314.0, 20402.0, 1041847.0, 3078606.0, 40206.0, 4774.0, 1434.0, 627.0, 330.0, 171.0, 97.0, 57.0, 30.0, 26.0, 25.0, 20.0, 15.0, 11.0, 10.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.2861328125, -0.2784252166748047, -0.2707176208496094, -0.26301002502441406, -0.25530242919921875, -0.24759483337402344, -0.23988723754882812, -0.2321796417236328, -0.2244720458984375, -0.2167644500732422, -0.20905685424804688, -0.20134925842285156, -0.19364166259765625, -0.18593406677246094, -0.17822647094726562, -0.1705188751220703, -0.162811279296875, -0.1551036834716797, -0.14739608764648438, -0.13968849182128906, -0.13198089599609375, -0.12427330017089844, -0.11656570434570312, -0.10885810852050781, -0.1011505126953125, -0.09344291687011719, -0.08573532104492188, -0.07802772521972656, -0.07032012939453125, -0.06261253356933594, -0.054904937744140625, -0.04719734191894531, -0.03948974609375, -0.03178215026855469, -0.024074554443359375, -0.016366958618164062, -0.00865936279296875, -0.0009517669677734375, 0.006755828857421875, 0.014463424682617188, 0.0221710205078125, 0.029878616333007812, 0.037586212158203125, 0.04529380798339844, 0.05300140380859375, 0.06070899963378906, 0.06841659545898438, 0.07612419128417969, 0.083831787109375, 0.09153938293457031, 0.09924697875976562, 0.10695457458496094, 0.11466217041015625, 0.12236976623535156, 0.13007736206054688, 0.1377849578857422, 0.1454925537109375, 0.1532001495361328, 0.16090774536132812, 0.16861534118652344, 0.17632293701171875, 0.18403053283691406, 0.19173812866210938, 0.1994457244873047, 0.2071533203125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 8.0, 9.0, 17.0, 29.0, 43.0, 76.0, 166.0, 338.0, 608.0, 927.0, 779.0, 493.0, 248.0, 142.0, 75.0, 41.0, 22.0, 18.0, 15.0, 5.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.23828125, -0.2319660186767578, -0.22565078735351562, -0.21933555603027344, -0.21302032470703125, -0.20670509338378906, -0.20038986206054688, -0.1940746307373047, -0.1877593994140625, -0.1814441680908203, -0.17512893676757812, -0.16881370544433594, -0.16249847412109375, -0.15618324279785156, -0.14986801147460938, -0.1435527801513672, -0.137237548828125, -0.1309223175048828, -0.12460708618164062, -0.11829185485839844, -0.11197662353515625, -0.10566139221191406, -0.09934616088867188, -0.09303092956542969, -0.0867156982421875, -0.08040046691894531, -0.07408523559570312, -0.06777000427246094, -0.06145477294921875, -0.05513954162597656, -0.048824310302734375, -0.04250907897949219, -0.03619384765625, -0.029878616333007812, -0.023563385009765625, -0.017248153686523438, -0.01093292236328125, -0.0046176910400390625, 0.001697540283203125, 0.008012771606445312, 0.0143280029296875, 0.020643234252929688, 0.026958465576171875, 0.03327369689941406, 0.03958892822265625, 0.04590415954589844, 0.052219390869140625, 0.05853462219238281, 0.064849853515625, 0.07116508483886719, 0.07748031616210938, 0.08379554748535156, 0.09011077880859375, 0.09642601013183594, 0.10274124145507812, 0.10905647277832031, 0.1153717041015625, 0.12168693542480469, 0.12800216674804688, 0.13431739807128906, 0.14063262939453125, 0.14694786071777344, 0.15326309204101562, 0.1595783233642578, 0.1658935546875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 8.0, 11.0, 12.0, 36.0, 78.0, 127.0, 153.0, 152.0, 146.0, 97.0, 70.0, 56.0, 18.0, 11.0, 12.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.031156063079834, -0.9883733987808228, -0.9455907344818115, -0.9028080701828003, -0.8600254058837891, -0.8172427415847778, -0.7744601368904114, -0.7316774725914001, -0.6888948082923889, -0.6461121439933777, -0.6033294796943665, -0.560546875, -0.5177642107009888, -0.47498151659965515, -0.4321988821029663, -0.3894162178039551, -0.34663355350494385, -0.3038508892059326, -0.2610682249069214, -0.21828559041023254, -0.1755029261112213, -0.13272026181221008, -0.08993762731552124, -0.04715496301651001, -0.004372298717498779, 0.038410358130931854, 0.08119301497936249, 0.12397566437721252, 0.16675832867622375, 0.20954099297523499, 0.25232362747192383, 0.29510629177093506, 0.33788883686065674, 0.38067150115966797, 0.4234541654586792, 0.46623679995536804, 0.5090194940567017, 0.5518021583557129, 0.5945847630500793, 0.6373674273490906, 0.6801500916481018, 0.722932755947113, 0.7657154202461243, 0.8084980249404907, 0.851280689239502, 0.8940633535385132, 0.9368460178375244, 0.9796286821365356, 1.0224113464355469, 1.065194010734558, 1.1079766750335693, 1.1507593393325806, 1.1935420036315918, 1.236324667930603, 1.2791073322296143, 1.321889877319336, 1.3646726608276367, 1.407455325126648, 1.4502379894256592, 1.4930206537246704, 1.5358033180236816, 1.5785859823226929, 1.621368646621704, 1.6641511917114258, 1.706933856010437]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 4.0, 9.0, 5.0, 9.0, 10.0, 11.0, 18.0, 27.0, 29.0, 33.0, 47.0, 43.0, 31.0, 50.0, 36.0, 42.0, 57.0, 43.0, 50.0, 43.0, 49.0, 38.0, 34.0, 38.0, 26.0, 43.0, 39.0, 23.0, 18.0, 19.0, 15.0, 13.0, 16.0, 11.0, 5.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7162737846374512, -0.6934219598770142, -0.6705701351165771, -0.6477183103561401, -0.6248664855957031, -0.6020146608352661, -0.5791628360748291, -0.5563110113143921, -0.5334591865539551, -0.5106073617935181, -0.48775553703308105, -0.46490371227264404, -0.44205188751220703, -0.41920006275177, -0.396348237991333, -0.373496413230896, -0.35064461827278137, -0.32779279351234436, -0.30494096875190735, -0.28208914399147034, -0.2592373192310333, -0.2363854944705963, -0.2135336846113205, -0.19068185985088348, -0.16783003509044647, -0.14497821033000946, -0.12212638556957245, -0.09927456825971603, -0.07642274349927902, -0.05357091873884201, -0.030719101428985596, -0.007867276668548584, 0.014984548091888428, 0.03783637285232544, 0.06068819388747215, 0.08354001492261887, 0.10639183968305588, 0.1292436718940735, 0.1520954817533493, 0.17494730651378632, 0.19779913127422333, 0.22065095603466034, 0.24350278079509735, 0.26635459065437317, 0.2892064154148102, 0.3120582401752472, 0.3349100649356842, 0.3577618896961212, 0.3806137144565582, 0.40346553921699524, 0.42631736397743225, 0.44916918873786926, 0.4720210134983063, 0.4948728382587433, 0.5177246332168579, 0.5405764579772949, 0.5634282827377319, 0.586280107498169, 0.609131932258606, 0.631983757019043, 0.65483558177948, 0.677687406539917, 0.700539231300354, 0.723391056060791, 0.746242880821228]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 8.0, 10.0, 9.0, 13.0, 12.0, 40.0, 48.0, 130.0, 178.0, 415.0, 965.0, 2394.0, 7858.0, 33882.0, 250450.0, 630194.0, 97321.0, 17081.0, 4713.0, 1581.0, 609.0, 294.0, 135.0, 74.0, 55.0, 23.0, 20.0, 14.0, 11.0, 9.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1531982421875, -0.1484527587890625, -0.143707275390625, -0.1389617919921875, -0.13421630859375, -0.1294708251953125, -0.124725341796875, -0.1199798583984375, -0.115234375, -0.1104888916015625, -0.105743408203125, -0.1009979248046875, -0.09625244140625, -0.0915069580078125, -0.086761474609375, -0.0820159912109375, -0.0772705078125, -0.0725250244140625, -0.067779541015625, -0.0630340576171875, -0.05828857421875, -0.0535430908203125, -0.048797607421875, -0.0440521240234375, -0.039306640625, -0.0345611572265625, -0.029815673828125, -0.0250701904296875, -0.02032470703125, -0.0155792236328125, -0.010833740234375, -0.0060882568359375, -0.0013427734375, 0.0034027099609375, 0.008148193359375, 0.0128936767578125, 0.01763916015625, 0.0223846435546875, 0.027130126953125, 0.0318756103515625, 0.03662109375, 0.0413665771484375, 0.046112060546875, 0.0508575439453125, 0.05560302734375, 0.0603485107421875, 0.065093994140625, 0.0698394775390625, 0.0745849609375, 0.0793304443359375, 0.084075927734375, 0.0888214111328125, 0.09356689453125, 0.0983123779296875, 0.103057861328125, 0.1078033447265625, 0.112548828125, 0.1172943115234375, 0.122039794921875, 0.1267852783203125, 0.13153076171875, 0.1362762451171875, 0.141021728515625, 0.1457672119140625, 0.1505126953125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 1.0, 5.0, 7.0, 11.0, 11.0, 16.0, 16.0, 25.0, 28.0, 18.0, 38.0, 37.0, 42.0, 49.0, 52.0, 42.0, 48.0, 39.0, 49.0, 67.0, 48.0, 45.0, 48.0, 39.0, 27.0, 34.0, 38.0, 27.0, 16.0, 18.0, 16.0, 9.0, 11.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.056304931640625, -0.054135799407958984, -0.05196666717529297, -0.04979753494262695, -0.04762840270996094, -0.04545927047729492, -0.043290138244628906, -0.04112100601196289, -0.038951873779296875, -0.03678274154663086, -0.034613609313964844, -0.03244447708129883, -0.030275344848632812, -0.028106212615966797, -0.02593708038330078, -0.023767948150634766, -0.02159881591796875, -0.019429683685302734, -0.01726055145263672, -0.015091419219970703, -0.012922286987304688, -0.010753154754638672, -0.008584022521972656, -0.006414890289306641, -0.004245758056640625, -0.0020766258239746094, 9.250640869140625e-05, 0.002261638641357422, 0.0044307708740234375, 0.006599903106689453, 0.008769035339355469, 0.010938167572021484, 0.0131072998046875, 0.015276432037353516, 0.01744556427001953, 0.019614696502685547, 0.021783828735351562, 0.023952960968017578, 0.026122093200683594, 0.02829122543334961, 0.030460357666015625, 0.03262948989868164, 0.034798622131347656, 0.03696775436401367, 0.03913688659667969, 0.0413060188293457, 0.04347515106201172, 0.045644283294677734, 0.04781341552734375, 0.049982547760009766, 0.05215167999267578, 0.0543208122253418, 0.05648994445800781, 0.05865907669067383, 0.060828208923339844, 0.06299734115600586, 0.06516647338867188, 0.06733560562133789, 0.0695047378540039, 0.07167387008666992, 0.07384300231933594, 0.07601213455200195, 0.07818126678466797, 0.08035039901733398, 0.08251953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 4.0, 8.0, 7.0, 13.0, 14.0, 24.0, 35.0, 40.0, 61.0, 83.0, 143.0, 195.0, 349.0, 547.0, 1070.0, 3002.0, 10158.0, 71729.0, 829160.0, 112227.0, 13210.0, 3523.0, 1248.0, 679.0, 337.0, 212.0, 142.0, 108.0, 69.0, 37.0, 34.0, 21.0, 14.0, 13.0, 8.0, 10.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.191162109375, -0.18470001220703125, -0.1782379150390625, -0.17177581787109375, -0.165313720703125, -0.15885162353515625, -0.1523895263671875, -0.14592742919921875, -0.13946533203125, -0.13300323486328125, -0.1265411376953125, -0.12007904052734375, -0.113616943359375, -0.10715484619140625, -0.1006927490234375, -0.09423065185546875, -0.0877685546875, -0.08130645751953125, -0.0748443603515625, -0.06838226318359375, -0.061920166015625, -0.05545806884765625, -0.0489959716796875, -0.04253387451171875, -0.03607177734375, -0.02960968017578125, -0.0231475830078125, -0.01668548583984375, -0.010223388671875, -0.00376129150390625, 0.0027008056640625, 0.00916290283203125, 0.015625, 0.02208709716796875, 0.0285491943359375, 0.03501129150390625, 0.041473388671875, 0.04793548583984375, 0.0543975830078125, 0.06085968017578125, 0.06732177734375, 0.07378387451171875, 0.0802459716796875, 0.08670806884765625, 0.093170166015625, 0.09963226318359375, 0.1060943603515625, 0.11255645751953125, 0.1190185546875, 0.12548065185546875, 0.1319427490234375, 0.13840484619140625, 0.144866943359375, 0.15132904052734375, 0.1577911376953125, 0.16425323486328125, 0.17071533203125, 0.17717742919921875, 0.1836395263671875, 0.19010162353515625, 0.196563720703125, 0.20302581787109375, 0.2094879150390625, 0.21595001220703125, 0.222412109375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 9.0, 5.0, 5.0, 6.0, 6.0, 19.0, 15.0, 19.0, 16.0, 22.0, 33.0, 35.0, 48.0, 44.0, 54.0, 55.0, 57.0, 72.0, 73.0, 55.0, 56.0, 58.0, 54.0, 29.0, 33.0, 25.0, 28.0, 14.0, 13.0, 6.0, 10.0, 7.0, 6.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2371826171875, -0.2278270721435547, -0.21847152709960938, -0.20911598205566406, -0.19976043701171875, -0.19040489196777344, -0.18104934692382812, -0.1716938018798828, -0.1623382568359375, -0.1529827117919922, -0.14362716674804688, -0.13427162170410156, -0.12491607666015625, -0.11556053161621094, -0.10620498657226562, -0.09684944152832031, -0.087493896484375, -0.07813835144042969, -0.06878280639648438, -0.05942726135253906, -0.05007171630859375, -0.04071617126464844, -0.031360626220703125, -0.022005081176757812, -0.0126495361328125, -0.0032939910888671875, 0.006061553955078125, 0.015417098999023438, 0.02477264404296875, 0.03412818908691406, 0.043483734130859375, 0.05283927917480469, 0.06219482421875, 0.07155036926269531, 0.08090591430664062, 0.09026145935058594, 0.09961700439453125, 0.10897254943847656, 0.11832809448242188, 0.1276836395263672, 0.1370391845703125, 0.1463947296142578, 0.15575027465820312, 0.16510581970214844, 0.17446136474609375, 0.18381690979003906, 0.19317245483398438, 0.2025279998779297, 0.211883544921875, 0.2212390899658203, 0.23059463500976562, 0.23995018005371094, 0.24930572509765625, 0.25866127014160156, 0.2680168151855469, 0.2773723602294922, 0.2867279052734375, 0.2960834503173828, 0.3054389953613281, 0.31479454040527344, 0.32415008544921875, 0.33350563049316406, 0.3428611755371094, 0.3522167205810547, 0.361572265625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 3.0, 5.0, 13.0, 17.0, 19.0, 36.0, 41.0, 59.0, 99.0, 155.0, 310.0, 559.0, 1171.0, 2871.0, 7771.0, 25337.0, 119808.0, 757269.0, 98881.0, 22087.0, 7065.0, 2594.0, 1147.0, 515.0, 305.0, 138.0, 74.0, 59.0, 37.0, 29.0, 18.0, 10.0, 7.0, 8.0, 4.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06622314453125, -0.06397438049316406, -0.061725616455078125, -0.05947685241699219, -0.05722808837890625, -0.05497932434082031, -0.052730560302734375, -0.05048179626464844, -0.0482330322265625, -0.04598426818847656, -0.043735504150390625, -0.04148674011230469, -0.03923797607421875, -0.03698921203613281, -0.034740447998046875, -0.03249168395996094, -0.030242919921875, -0.027994155883789062, -0.025745391845703125, -0.023496627807617188, -0.02124786376953125, -0.018999099731445312, -0.016750335693359375, -0.014501571655273438, -0.0122528076171875, -0.010004043579101562, -0.007755279541015625, -0.0055065155029296875, -0.00325775146484375, -0.0010089874267578125, 0.001239776611328125, 0.0034885406494140625, 0.0057373046875, 0.007986068725585938, 0.010234832763671875, 0.012483596801757812, 0.01473236083984375, 0.016981124877929688, 0.019229888916015625, 0.021478652954101562, 0.0237274169921875, 0.025976181030273438, 0.028224945068359375, 0.030473709106445312, 0.03272247314453125, 0.03497123718261719, 0.037220001220703125, 0.03946876525878906, 0.041717529296875, 0.04396629333496094, 0.046215057373046875, 0.04846382141113281, 0.05071258544921875, 0.05296134948730469, 0.055210113525390625, 0.05745887756347656, 0.0597076416015625, 0.06195640563964844, 0.06420516967773438, 0.06645393371582031, 0.06870269775390625, 0.07095146179199219, 0.07320022583007812, 0.07544898986816406, 0.07769775390625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 5.0, 5.0, 6.0, 12.0, 12.0, 13.0, 15.0, 21.0, 32.0, 33.0, 65.0, 76.0, 99.0, 114.0, 103.0, 82.0, 99.0, 47.0, 39.0, 31.0, 18.0, 17.0, 7.0, 7.0, 8.0, 6.0, 3.0, 1.0, 6.0, 7.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.343820571899414e-05, -3.2315030694007874e-05, -3.1191855669021606e-05, -3.006868064403534e-05, -2.8945505619049072e-05, -2.7822330594062805e-05, -2.6699155569076538e-05, -2.557598054409027e-05, -2.4452805519104004e-05, -2.3329630494117737e-05, -2.220645546913147e-05, -2.1083280444145203e-05, -1.9960105419158936e-05, -1.883693039417267e-05, -1.77137553691864e-05, -1.6590580344200134e-05, -1.5467405319213867e-05, -1.43442302942276e-05, -1.3221055269241333e-05, -1.2097880244255066e-05, -1.0974705219268799e-05, -9.851530194282532e-06, -8.728355169296265e-06, -7.6051801443099976e-06, -6.4820051193237305e-06, -5.358830094337463e-06, -4.235655069351196e-06, -3.112480044364929e-06, -1.989305019378662e-06, -8.66129994392395e-07, 2.5704503059387207e-07, 1.3802200555801392e-06, 2.5033950805664062e-06, 3.6265701055526733e-06, 4.7497451305389404e-06, 5.8729201555252075e-06, 6.996095180511475e-06, 8.119270205497742e-06, 9.242445230484009e-06, 1.0365620255470276e-05, 1.1488795280456543e-05, 1.261197030544281e-05, 1.3735145330429077e-05, 1.4858320355415344e-05, 1.598149538040161e-05, 1.710467040538788e-05, 1.8227845430374146e-05, 1.9351020455360413e-05, 2.047419548034668e-05, 2.1597370505332947e-05, 2.2720545530319214e-05, 2.384372055530548e-05, 2.4966895580291748e-05, 2.6090070605278015e-05, 2.7213245630264282e-05, 2.833642065525055e-05, 2.9459595680236816e-05, 3.0582770705223083e-05, 3.170594573020935e-05, 3.282912075519562e-05, 3.3952295780181885e-05, 3.507547080516815e-05, 3.619864583015442e-05, 3.7321820855140686e-05, 3.844499588012695e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 10.0, 20.0, 14.0, 36.0, 52.0, 88.0, 125.0, 160.0, 293.0, 504.0, 1075.0, 2445.0, 6532.0, 20530.0, 86604.0, 719486.0, 162882.0, 31819.0, 9420.0, 3355.0, 1451.0, 680.0, 384.0, 188.0, 133.0, 88.0, 53.0, 31.0, 31.0, 17.0, 13.0, 11.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.08050537109375, -0.07831001281738281, -0.07611465454101562, -0.07391929626464844, -0.07172393798828125, -0.06952857971191406, -0.06733322143554688, -0.06513786315917969, -0.0629425048828125, -0.06074714660644531, -0.058551788330078125, -0.05635643005371094, -0.05416107177734375, -0.05196571350097656, -0.049770355224609375, -0.04757499694824219, -0.045379638671875, -0.04318428039550781, -0.040988922119140625, -0.03879356384277344, -0.03659820556640625, -0.03440284729003906, -0.032207489013671875, -0.030012130737304688, -0.0278167724609375, -0.025621414184570312, -0.023426055908203125, -0.021230697631835938, -0.01903533935546875, -0.016839981079101562, -0.014644622802734375, -0.012449264526367188, -0.01025390625, -0.008058547973632812, -0.005863189697265625, -0.0036678314208984375, -0.00147247314453125, 0.0007228851318359375, 0.002918243408203125, 0.0051136016845703125, 0.0073089599609375, 0.009504318237304688, 0.011699676513671875, 0.013895034790039062, 0.01609039306640625, 0.018285751342773438, 0.020481109619140625, 0.022676467895507812, 0.024871826171875, 0.027067184448242188, 0.029262542724609375, 0.03145790100097656, 0.03365325927734375, 0.03584861755371094, 0.038043975830078125, 0.04023933410644531, 0.0424346923828125, 0.04463005065917969, 0.046825408935546875, 0.04902076721191406, 0.05121612548828125, 0.05341148376464844, 0.055606842041015625, 0.05780220031738281, 0.05999755859375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 10.0, 8.0, 5.0, 4.0, 6.0, 16.0, 17.0, 23.0, 14.0, 22.0, 31.0, 40.0, 62.0, 69.0, 112.0, 115.0, 109.0, 80.0, 67.0, 39.0, 35.0, 26.0, 13.0, 11.0, 13.0, 5.0, 7.0, 12.0, 2.0, 5.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053070068359375, -0.05121183395385742, -0.049353599548339844, -0.047495365142822266, -0.04563713073730469, -0.04377889633178711, -0.04192066192626953, -0.04006242752075195, -0.038204193115234375, -0.0363459587097168, -0.03448772430419922, -0.03262948989868164, -0.030771255493164062, -0.028913021087646484, -0.027054786682128906, -0.025196552276611328, -0.02333831787109375, -0.021480083465576172, -0.019621849060058594, -0.017763614654541016, -0.015905380249023438, -0.01404714584350586, -0.012188911437988281, -0.010330677032470703, -0.008472442626953125, -0.006614208221435547, -0.004755973815917969, -0.0028977394104003906, -0.0010395050048828125, 0.0008187294006347656, 0.0026769638061523438, 0.004535198211669922, 0.0063934326171875, 0.008251667022705078, 0.010109901428222656, 0.011968135833740234, 0.013826370239257812, 0.01568460464477539, 0.01754283905029297, 0.019401073455810547, 0.021259307861328125, 0.023117542266845703, 0.02497577667236328, 0.02683401107788086, 0.028692245483398438, 0.030550479888916016, 0.032408714294433594, 0.03426694869995117, 0.03612518310546875, 0.03798341751098633, 0.039841651916503906, 0.041699886322021484, 0.04355812072753906, 0.04541635513305664, 0.04727458953857422, 0.0491328239440918, 0.050991058349609375, 0.05284929275512695, 0.05470752716064453, 0.05656576156616211, 0.05842399597167969, 0.060282230377197266, 0.062140464782714844, 0.06399869918823242, 0.06585693359375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 11.0, 26.0, 79.0, 178.0, 428.0, 159.0, 57.0, 23.0, 10.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1976826190948486, -1.1246161460876465, -1.0515496730804443, -0.978483259677887, -0.9054167866706848, -0.8323503136634827, -0.7592839002609253, -0.6862174272537231, -0.613150954246521, -0.5400844812393188, -0.4670180380344391, -0.3939515948295593, -0.3208851218223572, -0.24781864881515503, -0.17475220561027527, -0.10168576240539551, -0.02861928939819336, 0.044447168707847595, 0.11751362681388855, 0.1905800849199295, 0.26364654302597046, 0.3367130160331726, 0.40977945923805237, 0.48284590244293213, 0.5559123754501343, 0.6289788484573364, 0.7020453214645386, 0.775111734867096, 0.8481782078742981, 0.9212446808815002, 0.9943110942840576, 1.0673775672912598, 1.140444278717041, 1.2135107517242432, 1.2865772247314453, 1.3596436977386475, 1.4327101707458496, 1.5057766437530518, 1.5788429975509644, 1.6519094705581665, 1.7249759435653687, 1.7980424165725708, 1.871108889579773, 1.944175362586975, 2.0172417163848877, 2.09030818939209, 2.163374662399292, 2.236441135406494, 2.3095076084136963, 2.3825740814208984, 2.4556405544281006, 2.5287070274353027, 2.601773500442505, 2.674839973449707, 2.747906446456909, 2.8209729194641113, 2.8940391540527344, 2.9671056270599365, 3.0401721000671387, 3.113238573074341, 3.186305046081543, 3.259371519088745, 3.3324379920959473, 3.4055042266845703, 3.4785709381103516]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 4.0, 9.0, 12.0, 10.0, 17.0, 15.0, 18.0, 28.0, 21.0, 30.0, 25.0, 34.0, 36.0, 41.0, 48.0, 68.0, 102.0, 97.0, 56.0, 36.0, 42.0, 27.0, 27.0, 30.0, 19.0, 27.0, 17.0, 11.0, 14.0, 5.0, 10.0, 12.0, 6.0, 7.0, 4.0, 3.0, 9.0, 7.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.9578191041946411, -0.9285763502120972, -0.8993335962295532, -0.8700907826423645, -0.8408480286598206, -0.8116052746772766, -0.7823624610900879, -0.753119707107544, -0.723876953125, -0.694634199142456, -0.6653914451599121, -0.6361486315727234, -0.6069058775901794, -0.5776631236076355, -0.5484203100204468, -0.5191775560379028, -0.4899348020553589, -0.46069204807281494, -0.4314492642879486, -0.4022064805030823, -0.37296372652053833, -0.3437209725379944, -0.31447818875312805, -0.2852354049682617, -0.2559926509857178, -0.22674988210201263, -0.1975071132183075, -0.16826434433460236, -0.13902157545089722, -0.10977880656719208, -0.08053603768348694, -0.0512932687997818, -0.022050559520721436, 0.007192209362983704, 0.03643497824668884, 0.06567774713039398, 0.09492051601409912, 0.12416328489780426, 0.1534060537815094, 0.18264882266521454, 0.21189159154891968, 0.24113436043262482, 0.27037712931632996, 0.2996199131011963, 0.32886266708374023, 0.3581054210662842, 0.3873482048511505, 0.41659098863601685, 0.4458337426185608, 0.47507649660110474, 0.5043193101882935, 0.5335620641708374, 0.5628048181533813, 0.5920475721359253, 0.6212903261184692, 0.650533139705658, 0.6797758936882019, 0.7090186476707458, 0.7382614612579346, 0.7675042152404785, 0.7967469692230225, 0.8259897232055664, 0.8552324771881104, 0.8844752907752991, 0.913718044757843]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 3.0, 8.0, 13.0, 21.0, 28.0, 40.0, 46.0, 118.0, 176.0, 312.0, 534.0, 947.0, 2025.0, 4342.0, 10732.0, 35334.0, 174955.0, 1082611.0, 2188372.0, 568699.0, 90244.0, 21382.0, 7190.0, 3010.0, 1392.0, 777.0, 414.0, 240.0, 117.0, 76.0, 40.0, 42.0, 8.0, 11.0, 9.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08355712890625, -0.08088970184326172, -0.07822227478027344, -0.07555484771728516, -0.07288742065429688, -0.0702199935913086, -0.06755256652832031, -0.06488513946533203, -0.06221771240234375, -0.05955028533935547, -0.05688285827636719, -0.054215431213378906, -0.051548004150390625, -0.048880577087402344, -0.04621315002441406, -0.04354572296142578, -0.0408782958984375, -0.03821086883544922, -0.03554344177246094, -0.032876014709472656, -0.030208587646484375, -0.027541160583496094, -0.024873733520507812, -0.02220630645751953, -0.01953887939453125, -0.01687145233154297, -0.014204025268554688, -0.011536598205566406, -0.008869171142578125, -0.006201744079589844, -0.0035343170166015625, -0.0008668899536132812, 0.001800537109375, 0.004467964172363281, 0.0071353912353515625, 0.009802818298339844, 0.012470245361328125, 0.015137672424316406, 0.017805099487304688, 0.02047252655029297, 0.02313995361328125, 0.02580738067626953, 0.028474807739257812, 0.031142234802246094, 0.033809661865234375, 0.036477088928222656, 0.03914451599121094, 0.04181194305419922, 0.0444793701171875, 0.04714679718017578, 0.04981422424316406, 0.052481651306152344, 0.055149078369140625, 0.057816505432128906, 0.06048393249511719, 0.06315135955810547, 0.06581878662109375, 0.06848621368408203, 0.07115364074707031, 0.0738210678100586, 0.07648849487304688, 0.07915592193603516, 0.08182334899902344, 0.08449077606201172, 0.087158203125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 12.0, 9.0, 12.0, 24.0, 30.0, 35.0, 33.0, 38.0, 54.0, 57.0, 59.0, 89.0, 88.0, 83.0, 63.0, 58.0, 38.0, 51.0, 52.0, 34.0, 22.0, 23.0, 15.0, 4.0, 5.0, 5.0, 2.0, 5.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0631103515625, -0.060146331787109375, -0.05718231201171875, -0.054218292236328125, -0.0512542724609375, -0.048290252685546875, -0.04532623291015625, -0.042362213134765625, -0.039398193359375, -0.036434173583984375, -0.03347015380859375, -0.030506134033203125, -0.0275421142578125, -0.024578094482421875, -0.02161407470703125, -0.018650054931640625, -0.01568603515625, -0.012722015380859375, -0.00975799560546875, -0.006793975830078125, -0.0038299560546875, -0.000865936279296875, 0.00209808349609375, 0.005062103271484375, 0.008026123046875, 0.010990142822265625, 0.01395416259765625, 0.016918182373046875, 0.0198822021484375, 0.022846221923828125, 0.02581024169921875, 0.028774261474609375, 0.03173828125, 0.034702301025390625, 0.03766632080078125, 0.040630340576171875, 0.0435943603515625, 0.046558380126953125, 0.04952239990234375, 0.052486419677734375, 0.055450439453125, 0.058414459228515625, 0.06137847900390625, 0.06434249877929688, 0.0673065185546875, 0.07027053833007812, 0.07323455810546875, 0.07619857788085938, 0.07916259765625, 0.08212661743164062, 0.08509063720703125, 0.08805465698242188, 0.0910186767578125, 0.09398269653320312, 0.09694671630859375, 0.09991073608398438, 0.102874755859375, 0.10583877563476562, 0.10880279541015625, 0.11176681518554688, 0.1147308349609375, 0.11769485473632812, 0.12065887451171875, 0.12362289428710938, 0.1265869140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 9.0, 7.0, 20.0, 31.0, 32.0, 77.0, 149.0, 298.0, 736.0, 2227.0, 15852.0, 1506701.0, 2644804.0, 19582.0, 2408.0, 719.0, 274.0, 142.0, 79.0, 42.0, 28.0, 28.0, 11.0, 8.0, 8.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32666015625, -0.31578826904296875, -0.3049163818359375, -0.29404449462890625, -0.283172607421875, -0.27230072021484375, -0.2614288330078125, -0.25055694580078125, -0.23968505859375, -0.22881317138671875, -0.2179412841796875, -0.20706939697265625, -0.196197509765625, -0.18532562255859375, -0.1744537353515625, -0.16358184814453125, -0.1527099609375, -0.14183807373046875, -0.1309661865234375, -0.12009429931640625, -0.109222412109375, -0.09835052490234375, -0.0874786376953125, -0.07660675048828125, -0.06573486328125, -0.05486297607421875, -0.0439910888671875, -0.03311920166015625, -0.022247314453125, -0.01137542724609375, -0.0005035400390625, 0.01036834716796875, 0.021240234375, 0.03211212158203125, 0.0429840087890625, 0.05385589599609375, 0.064727783203125, 0.07559967041015625, 0.0864715576171875, 0.09734344482421875, 0.10821533203125, 0.11908721923828125, 0.1299591064453125, 0.14083099365234375, 0.151702880859375, 0.16257476806640625, 0.1734466552734375, 0.18431854248046875, 0.1951904296875, 0.20606231689453125, 0.2169342041015625, 0.22780609130859375, 0.238677978515625, 0.24954986572265625, 0.2604217529296875, 0.27129364013671875, 0.28216552734375, 0.29303741455078125, 0.3039093017578125, 0.31478118896484375, 0.325653076171875, 0.33652496337890625, 0.3473968505859375, 0.35826873779296875, 0.369140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 5.0, 8.0, 14.0, 13.0, 22.0, 38.0, 45.0, 67.0, 137.0, 191.0, 359.0, 568.0, 805.0, 634.0, 489.0, 254.0, 153.0, 75.0, 62.0, 39.0, 30.0, 19.0, 11.0, 9.0, 8.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.26220703125, -0.25620174407958984, -0.2501964569091797, -0.24419116973876953, -0.23818588256835938, -0.23218059539794922, -0.22617530822753906, -0.2201700210571289, -0.21416473388671875, -0.2081594467163086, -0.20215415954589844, -0.19614887237548828, -0.19014358520507812, -0.18413829803466797, -0.1781330108642578, -0.17212772369384766, -0.1661224365234375, -0.16011714935302734, -0.1541118621826172, -0.14810657501220703, -0.14210128784179688, -0.13609600067138672, -0.13009071350097656, -0.1240854263305664, -0.11808013916015625, -0.1120748519897461, -0.10606956481933594, -0.10006427764892578, -0.09405899047851562, -0.08805370330810547, -0.08204841613769531, -0.07604312896728516, -0.070037841796875, -0.06403255462646484, -0.05802726745605469, -0.05202198028564453, -0.046016693115234375, -0.04001140594482422, -0.03400611877441406, -0.028000831604003906, -0.02199554443359375, -0.015990257263183594, -0.009984970092773438, -0.003979682922363281, 0.002025604248046875, 0.008030891418457031, 0.014036178588867188, 0.020041465759277344, 0.0260467529296875, 0.032052040100097656, 0.03805732727050781, 0.04406261444091797, 0.050067901611328125, 0.05607318878173828, 0.06207847595214844, 0.0680837631225586, 0.07408905029296875, 0.0800943374633789, 0.08609962463378906, 0.09210491180419922, 0.09811019897460938, 0.10411548614501953, 0.11012077331542969, 0.11612606048583984, 0.12213134765625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 12.0, 11.0, 29.0, 59.0, 217.0, 349.0, 218.0, 68.0, 23.0, 10.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.563542366027832, -4.4676690101623535, -4.371795654296875, -4.2759222984313965, -4.180048942565918, -4.084176063537598, -3.98830246925354, -3.8924291133880615, -3.796555995941162, -3.7006826400756836, -3.604809284210205, -3.5089359283447266, -3.413062810897827, -3.3171894550323486, -3.22131609916687, -3.1254427433013916, -3.029569387435913, -2.9336960315704346, -2.837822675704956, -2.7419495582580566, -2.646076202392578, -2.5502028465270996, -2.454329490661621, -2.3584561347961426, -2.262582778930664, -2.1667094230651855, -2.070836067199707, -1.974962830543518, -1.879089593887329, -1.7832162380218506, -1.687342882156372, -1.5914695262908936, -1.4955964088439941, -1.3997230529785156, -1.3038498163223267, -1.2079764604568481, -1.1121032238006592, -1.0162298679351807, -0.9203565120697021, -0.8244832158088684, -0.7286099195480347, -0.6327366232872009, -0.5368633270263672, -0.44098997116088867, -0.34511667490005493, -0.2492433786392212, -0.15337002277374268, -0.057496726512908936, 0.038376569747924805, 0.13424988090991974, 0.23012319207191467, 0.3259965181350708, 0.42186981439590454, 0.5177431106567383, 0.6136164665222168, 0.7094897627830505, 0.8053630590438843, 0.901236355304718, 0.9971096515655518, 1.0929830074310303, 1.1888563632965088, 1.2847295999526978, 1.3806029558181763, 1.4764761924743652, 1.5723495483398438]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 11.0, 9.0, 11.0, 9.0, 18.0, 19.0, 25.0, 27.0, 28.0, 46.0, 43.0, 73.0, 56.0, 60.0, 63.0, 62.0, 58.0, 57.0, 62.0, 50.0, 33.0, 35.0, 31.0, 22.0, 16.0, 19.0, 14.0, 7.0, 13.0, 9.0, 5.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0179316997528076, -0.9879207611083984, -0.9579098224639893, -0.9278988838195801, -0.8978880047798157, -0.8678770661354065, -0.8378661274909973, -0.8078551888465881, -0.7778443098068237, -0.7478333711624146, -0.7178224325180054, -0.6878114938735962, -0.6578006148338318, -0.6277896761894226, -0.5977787375450134, -0.5677677989006042, -0.5377568602561951, -0.5077459216117859, -0.4777350127696991, -0.4477240741252899, -0.4177131652832031, -0.38770222663879395, -0.35769128799438477, -0.3276803493499756, -0.2976694405078888, -0.2676585018634796, -0.23764759302139282, -0.20763665437698364, -0.17762573063373566, -0.14761480689048767, -0.11760386824607849, -0.0875929445028305, -0.057582080364227295, -0.02757115289568901, 0.0024397745728492737, 0.032450705766677856, 0.06246162950992584, 0.09247255325317383, 0.12248349189758301, 0.152494415640831, 0.18250533938407898, 0.21251626312732697, 0.24252718687057495, 0.27253812551498413, 0.3025490641593933, 0.3325599730014801, 0.3625709116458893, 0.3925818204879761, 0.42259275913238525, 0.45260369777679443, 0.4826146066188812, 0.5126255750656128, 0.5426364541053772, 0.5726473927497864, 0.6026583313941956, 0.6326692700386047, 0.6626801490783691, 0.6926910877227783, 0.7227020263671875, 0.7527129650115967, 0.7827238440513611, 0.8127347826957703, 0.8427457213401794, 0.8727566599845886, 0.9027675986289978]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 10.0, 19.0, 29.0, 34.0, 67.0, 144.0, 276.0, 499.0, 1063.0, 2170.0, 5002.0, 12422.0, 35572.0, 137296.0, 526812.0, 242752.0, 54593.0, 17353.0, 6874.0, 2907.0, 1328.0, 649.0, 286.0, 161.0, 99.0, 38.0, 37.0, 18.0, 9.0, 16.0, 2.0, 4.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10223388671875, -0.09840106964111328, -0.09456825256347656, -0.09073543548583984, -0.08690261840820312, -0.0830698013305664, -0.07923698425292969, -0.07540416717529297, -0.07157135009765625, -0.06773853302001953, -0.06390571594238281, -0.060072898864746094, -0.056240081787109375, -0.052407264709472656, -0.04857444763183594, -0.04474163055419922, -0.0409088134765625, -0.03707599639892578, -0.03324317932128906, -0.029410362243652344, -0.025577545166015625, -0.021744728088378906, -0.017911911010742188, -0.014079093933105469, -0.01024627685546875, -0.006413459777832031, -0.0025806427001953125, 0.0012521743774414062, 0.005084991455078125, 0.008917808532714844, 0.012750625610351562, 0.01658344268798828, 0.020416259765625, 0.02424907684326172, 0.028081893920898438, 0.031914710998535156, 0.035747528076171875, 0.039580345153808594, 0.04341316223144531, 0.04724597930908203, 0.05107879638671875, 0.05491161346435547, 0.05874443054199219, 0.0625772476196289, 0.06641006469726562, 0.07024288177490234, 0.07407569885253906, 0.07790851593017578, 0.0817413330078125, 0.08557415008544922, 0.08940696716308594, 0.09323978424072266, 0.09707260131835938, 0.1009054183959961, 0.10473823547363281, 0.10857105255126953, 0.11240386962890625, 0.11623668670654297, 0.12006950378417969, 0.1239023208618164, 0.12773513793945312, 0.13156795501708984, 0.13540077209472656, 0.13923358917236328, 0.14306640625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 4.0, 6.0, 6.0, 9.0, 15.0, 15.0, 19.0, 14.0, 14.0, 30.0, 28.0, 34.0, 39.0, 46.0, 40.0, 52.0, 51.0, 43.0, 66.0, 64.0, 53.0, 38.0, 48.0, 29.0, 33.0, 39.0, 24.0, 14.0, 16.0, 23.0, 13.0, 20.0, 13.0, 11.0, 6.0, 6.0, 11.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06524658203125, -0.06293392181396484, -0.06062126159667969, -0.05830860137939453, -0.055995941162109375, -0.05368328094482422, -0.05137062072753906, -0.049057960510253906, -0.04674530029296875, -0.044432640075683594, -0.04211997985839844, -0.03980731964111328, -0.037494659423828125, -0.03518199920654297, -0.03286933898925781, -0.030556678771972656, -0.0282440185546875, -0.025931358337402344, -0.023618698120117188, -0.02130603790283203, -0.018993377685546875, -0.01668071746826172, -0.014368057250976562, -0.012055397033691406, -0.00974273681640625, -0.007430076599121094, -0.0051174163818359375, -0.0028047561645507812, -0.000492095947265625, 0.0018205642700195312, 0.0041332244873046875, 0.006445884704589844, 0.008758544921875, 0.011071205139160156, 0.013383865356445312, 0.01569652557373047, 0.018009185791015625, 0.02032184600830078, 0.022634506225585938, 0.024947166442871094, 0.02725982666015625, 0.029572486877441406, 0.03188514709472656, 0.03419780731201172, 0.036510467529296875, 0.03882312774658203, 0.04113578796386719, 0.043448448181152344, 0.0457611083984375, 0.048073768615722656, 0.05038642883300781, 0.05269908905029297, 0.055011749267578125, 0.05732440948486328, 0.05963706970214844, 0.061949729919433594, 0.06426239013671875, 0.0665750503540039, 0.06888771057128906, 0.07120037078857422, 0.07351303100585938, 0.07582569122314453, 0.07813835144042969, 0.08045101165771484, 0.082763671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 4.0, 5.0, 8.0, 13.0, 14.0, 21.0, 17.0, 31.0, 43.0, 51.0, 76.0, 133.0, 192.0, 266.0, 428.0, 760.0, 1706.0, 5134.0, 32094.0, 852371.0, 138751.0, 10913.0, 2776.0, 1121.0, 546.0, 328.0, 217.0, 151.0, 98.0, 81.0, 56.0, 41.0, 34.0, 18.0, 17.0, 8.0, 10.0, 7.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.30615234375, -0.29734039306640625, -0.2885284423828125, -0.27971649169921875, -0.270904541015625, -0.26209259033203125, -0.2532806396484375, -0.24446868896484375, -0.23565673828125, -0.22684478759765625, -0.2180328369140625, -0.20922088623046875, -0.200408935546875, -0.19159698486328125, -0.1827850341796875, -0.17397308349609375, -0.1651611328125, -0.15634918212890625, -0.1475372314453125, -0.13872528076171875, -0.129913330078125, -0.12110137939453125, -0.1122894287109375, -0.10347747802734375, -0.09466552734375, -0.08585357666015625, -0.0770416259765625, -0.06822967529296875, -0.059417724609375, -0.05060577392578125, -0.0417938232421875, -0.03298187255859375, -0.024169921875, -0.01535797119140625, -0.0065460205078125, 0.00226593017578125, 0.011077880859375, 0.01988983154296875, 0.0287017822265625, 0.03751373291015625, 0.04632568359375, 0.05513763427734375, 0.0639495849609375, 0.07276153564453125, 0.081573486328125, 0.09038543701171875, 0.0991973876953125, 0.10800933837890625, 0.1168212890625, 0.12563323974609375, 0.1344451904296875, 0.14325714111328125, 0.152069091796875, 0.16088104248046875, 0.1696929931640625, 0.17850494384765625, 0.18731689453125, 0.19612884521484375, 0.2049407958984375, 0.21375274658203125, 0.222564697265625, 0.23137664794921875, 0.2401885986328125, 0.24900054931640625, 0.2578125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 9.0, 7.0, 8.0, 10.0, 10.0, 12.0, 17.0, 21.0, 18.0, 21.0, 28.0, 45.0, 41.0, 55.0, 55.0, 44.0, 67.0, 50.0, 55.0, 58.0, 51.0, 48.0, 45.0, 33.0, 30.0, 33.0, 21.0, 23.0, 10.0, 18.0, 12.0, 11.0, 12.0, 8.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.323486328125, -0.3136711120605469, -0.30385589599609375, -0.2940406799316406, -0.2842254638671875, -0.2744102478027344, -0.26459503173828125, -0.2547798156738281, -0.244964599609375, -0.23514938354492188, -0.22533416748046875, -0.21551895141601562, -0.2057037353515625, -0.19588851928710938, -0.18607330322265625, -0.17625808715820312, -0.16644287109375, -0.15662765502929688, -0.14681243896484375, -0.13699722290039062, -0.1271820068359375, -0.11736679077148438, -0.10755157470703125, -0.09773635864257812, -0.087921142578125, -0.07810592651367188, -0.06829071044921875, -0.058475494384765625, -0.0486602783203125, -0.038845062255859375, -0.02902984619140625, -0.019214630126953125, -0.0093994140625, 0.000415802001953125, 0.01023101806640625, 0.020046234130859375, 0.0298614501953125, 0.039676666259765625, 0.04949188232421875, 0.059307098388671875, 0.069122314453125, 0.07893753051757812, 0.08875274658203125, 0.09856796264648438, 0.1083831787109375, 0.11819839477539062, 0.12801361083984375, 0.13782882690429688, 0.14764404296875, 0.15745925903320312, 0.16727447509765625, 0.17708969116210938, 0.1869049072265625, 0.19672012329101562, 0.20653533935546875, 0.21635055541992188, 0.226165771484375, 0.23598098754882812, 0.24579620361328125, 0.2556114196777344, 0.2654266357421875, 0.2752418518066406, 0.28505706787109375, 0.2948722839355469, 0.3046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 7.0, 7.0, 12.0, 15.0, 17.0, 22.0, 23.0, 33.0, 68.0, 70.0, 121.0, 214.0, 366.0, 777.0, 1813.0, 5246.0, 18469.0, 135999.0, 823251.0, 46395.0, 10015.0, 3132.0, 1171.0, 559.0, 289.0, 160.0, 92.0, 46.0, 39.0, 39.0, 23.0, 13.0, 20.0, 4.0, 8.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0875244140625, -0.08442878723144531, -0.08133316040039062, -0.07823753356933594, -0.07514190673828125, -0.07204627990722656, -0.06895065307617188, -0.06585502624511719, -0.0627593994140625, -0.05966377258300781, -0.056568145751953125, -0.05347251892089844, -0.05037689208984375, -0.04728126525878906, -0.044185638427734375, -0.04109001159667969, -0.037994384765625, -0.03489875793457031, -0.031803131103515625, -0.028707504272460938, -0.02561187744140625, -0.022516250610351562, -0.019420623779296875, -0.016324996948242188, -0.0132293701171875, -0.010133743286132812, -0.007038116455078125, -0.0039424896240234375, -0.00084686279296875, 0.0022487640380859375, 0.005344390869140625, 0.008440017700195312, 0.01153564453125, 0.014631271362304688, 0.017726898193359375, 0.020822525024414062, 0.02391815185546875, 0.027013778686523438, 0.030109405517578125, 0.03320503234863281, 0.0363006591796875, 0.03939628601074219, 0.042491912841796875, 0.04558753967285156, 0.04868316650390625, 0.05177879333496094, 0.054874420166015625, 0.05797004699707031, 0.061065673828125, 0.06416130065917969, 0.06725692749023438, 0.07035255432128906, 0.07344818115234375, 0.07654380798339844, 0.07963943481445312, 0.08273506164550781, 0.0858306884765625, 0.08892631530761719, 0.09202194213867188, 0.09511756896972656, 0.09821319580078125, 0.10130882263183594, 0.10440444946289062, 0.10750007629394531, 0.110595703125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 2.0, 8.0, 2.0, 10.0, 10.0, 10.0, 14.0, 25.0, 23.0, 45.0, 55.0, 67.0, 107.0, 97.0, 109.0, 99.0, 77.0, 60.0, 35.0, 27.0, 21.0, 17.0, 13.0, 19.0, 10.0, 4.0, 5.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.844499588012695e-05, -3.712717443704605e-05, -3.580935299396515e-05, -3.449153155088425e-05, -3.3173710107803345e-05, -3.185588866472244e-05, -3.053806722164154e-05, -2.922024577856064e-05, -2.7902424335479736e-05, -2.6584602892398834e-05, -2.5266781449317932e-05, -2.394896000623703e-05, -2.2631138563156128e-05, -2.1313317120075226e-05, -1.9995495676994324e-05, -1.867767423391342e-05, -1.735985279083252e-05, -1.6042031347751617e-05, -1.4724209904670715e-05, -1.3406388461589813e-05, -1.2088567018508911e-05, -1.0770745575428009e-05, -9.452924132347107e-06, -8.135102689266205e-06, -6.817281246185303e-06, -5.499459803104401e-06, -4.1816383600234985e-06, -2.8638169169425964e-06, -1.5459954738616943e-06, -2.2817403078079224e-07, 1.0896474123001099e-06, 2.407468855381012e-06, 3.725290298461914e-06, 5.043111741542816e-06, 6.360933184623718e-06, 7.67875462770462e-06, 8.996576070785522e-06, 1.0314397513866425e-05, 1.1632218956947327e-05, 1.2950040400028229e-05, 1.4267861843109131e-05, 1.5585683286190033e-05, 1.6903504729270935e-05, 1.8221326172351837e-05, 1.953914761543274e-05, 2.085696905851364e-05, 2.2174790501594543e-05, 2.3492611944675446e-05, 2.4810433387756348e-05, 2.612825483083725e-05, 2.7446076273918152e-05, 2.8763897716999054e-05, 3.0081719160079956e-05, 3.139954060316086e-05, 3.271736204624176e-05, 3.403518348932266e-05, 3.5353004932403564e-05, 3.6670826375484467e-05, 3.798864781856537e-05, 3.930646926164627e-05, 4.062429070472717e-05, 4.1942112147808075e-05, 4.325993359088898e-05, 4.457775503396988e-05, 4.589557647705078e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 8.0, 5.0, 11.0, 19.0, 26.0, 47.0, 82.0, 130.0, 234.0, 442.0, 887.0, 2376.0, 9017.0, 57550.0, 830214.0, 126325.0, 15210.0, 3508.0, 1270.0, 511.0, 273.0, 171.0, 96.0, 46.0, 34.0, 14.0, 6.0, 11.0, 8.0, 3.0, 7.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1002197265625, -0.09732818603515625, -0.0944366455078125, -0.09154510498046875, -0.088653564453125, -0.08576202392578125, -0.0828704833984375, -0.07997894287109375, -0.07708740234375, -0.07419586181640625, -0.0713043212890625, -0.06841278076171875, -0.065521240234375, -0.06262969970703125, -0.0597381591796875, -0.05684661865234375, -0.053955078125, -0.05106353759765625, -0.0481719970703125, -0.04528045654296875, -0.042388916015625, -0.03949737548828125, -0.0366058349609375, -0.03371429443359375, -0.03082275390625, -0.02793121337890625, -0.0250396728515625, -0.02214813232421875, -0.019256591796875, -0.01636505126953125, -0.0134735107421875, -0.01058197021484375, -0.0076904296875, -0.00479888916015625, -0.0019073486328125, 0.00098419189453125, 0.003875732421875, 0.00676727294921875, 0.0096588134765625, 0.01255035400390625, 0.01544189453125, 0.01833343505859375, 0.0212249755859375, 0.02411651611328125, 0.027008056640625, 0.02989959716796875, 0.0327911376953125, 0.03568267822265625, 0.03857421875, 0.04146575927734375, 0.0443572998046875, 0.04724884033203125, 0.050140380859375, 0.05303192138671875, 0.0559234619140625, 0.05881500244140625, 0.06170654296875, 0.06459808349609375, 0.0674896240234375, 0.07038116455078125, 0.073272705078125, 0.07616424560546875, 0.0790557861328125, 0.08194732666015625, 0.0848388671875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 5.0, 6.0, 5.0, 9.0, 6.0, 8.0, 12.0, 15.0, 21.0, 26.0, 28.0, 39.0, 75.0, 82.0, 95.0, 109.0, 119.0, 80.0, 68.0, 58.0, 42.0, 18.0, 20.0, 10.0, 14.0, 12.0, 5.0, 5.0, 3.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.072265625, -0.07023000717163086, -0.06819438934326172, -0.06615877151489258, -0.06412315368652344, -0.0620875358581543, -0.060051918029785156, -0.058016300201416016, -0.055980682373046875, -0.053945064544677734, -0.051909446716308594, -0.04987382888793945, -0.04783821105957031, -0.04580259323120117, -0.04376697540283203, -0.04173135757446289, -0.03969573974609375, -0.03766012191772461, -0.03562450408935547, -0.03358888626098633, -0.03155326843261719, -0.029517650604248047, -0.027482032775878906, -0.025446414947509766, -0.023410797119140625, -0.021375179290771484, -0.019339561462402344, -0.017303943634033203, -0.015268325805664062, -0.013232707977294922, -0.011197090148925781, -0.00916147232055664, -0.0071258544921875, -0.005090236663818359, -0.0030546188354492188, -0.0010190010070800781, 0.0010166168212890625, 0.003052234649658203, 0.005087852478027344, 0.007123470306396484, 0.009159088134765625, 0.011194705963134766, 0.013230323791503906, 0.015265941619873047, 0.017301559448242188, 0.019337177276611328, 0.02137279510498047, 0.02340841293334961, 0.02544403076171875, 0.02747964859008789, 0.02951526641845703, 0.03155088424682617, 0.03358650207519531, 0.03562211990356445, 0.037657737731933594, 0.039693355560302734, 0.041728973388671875, 0.043764591217041016, 0.045800209045410156, 0.0478358268737793, 0.04987144470214844, 0.05190706253051758, 0.05394268035888672, 0.05597829818725586, 0.058013916015625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 12.0, 51.0, 297.0, 507.0, 87.0, 18.0, 7.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44856595993042, -4.309902191162109, -4.171238422393799, -4.032574653625488, -3.8939108848571777, -3.755247116088867, -3.6165833473205566, -3.477919578552246, -3.3392558097839355, -3.200592041015625, -3.0619282722473145, -2.923264503479004, -2.7846007347106934, -2.645936965942383, -2.5072731971740723, -2.3686094284057617, -2.229945659637451, -2.0912818908691406, -1.95261812210083, -1.8139543533325195, -1.675290584564209, -1.5366268157958984, -1.397963047027588, -1.2592992782592773, -1.1206355094909668, -0.9819717407226562, -0.8433079719543457, -0.7046442031860352, -0.5659804344177246, -0.42731666564941406, -0.2886528968811035, -0.14998912811279297, -0.011325836181640625, 0.12733793258666992, 0.26600170135498047, 0.404665470123291, 0.5433292388916016, 0.6819930076599121, 0.8206567764282227, 0.9593205451965332, 1.0979843139648438, 1.2366480827331543, 1.3753118515014648, 1.5139756202697754, 1.652639389038086, 1.7913031578063965, 1.929966926574707, 2.0686306953430176, 2.207294464111328, 2.3459582328796387, 2.484622001647949, 2.6232857704162598, 2.7619495391845703, 2.900613307952881, 3.0392770767211914, 3.177940845489502, 3.3166046142578125, 3.455268383026123, 3.5939321517944336, 3.732595920562744, 3.8712596893310547, 4.009923458099365, 4.148587226867676, 4.287250995635986, 4.425914764404297]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 8.0, 9.0, 6.0, 12.0, 13.0, 13.0, 11.0, 7.0, 8.0, 17.0, 21.0, 19.0, 17.0, 31.0, 26.0, 24.0, 26.0, 34.0, 47.0, 109.0, 141.0, 67.0, 39.0, 30.0, 29.0, 28.0, 19.0, 24.0, 27.0, 16.0, 17.0, 10.0, 17.0, 11.0, 8.0, 10.0, 11.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-1.1509994268417358, -1.1173025369644165, -1.0836055278778076, -1.0499086380004883, -1.016211748123169, -0.9825147390365601, -0.9488178491592407, -0.9151208996772766, -0.8814239501953125, -0.8477270007133484, -0.8140300512313843, -0.7803331613540649, -0.7466362118721008, -0.7129392623901367, -0.6792423725128174, -0.6455454230308533, -0.6118484735488892, -0.578151524066925, -0.5444545745849609, -0.5107576847076416, -0.4770607352256775, -0.4433637857437134, -0.40966686606407166, -0.37596994638442993, -0.3422729969024658, -0.3085760474205017, -0.27487912774086, -0.24118219316005707, -0.20748525857925415, -0.17378832399845123, -0.14009138941764832, -0.1063944548368454, -0.07269763946533203, -0.039000704884529114, -0.005303770303726196, 0.02839316427707672, 0.06209009885787964, 0.09578703343868256, 0.12948396801948547, 0.1631809026002884, 0.1968778371810913, 0.23057477176189423, 0.26427170634269714, 0.29796862602233887, 0.331665575504303, 0.3653625249862671, 0.3990594446659088, 0.43275636434555054, 0.46645331382751465, 0.5001502633094788, 0.5338472127914429, 0.5675441026687622, 0.6012410521507263, 0.6349380016326904, 0.6686348915100098, 0.7023318409919739, 0.736028790473938, 0.7697257399559021, 0.8034226894378662, 0.8371195793151855, 0.8708165287971497, 0.9045134782791138, 0.9382103681564331, 0.9719073176383972, 1.0056042671203613]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 12.0, 15.0, 25.0, 37.0, 40.0, 62.0, 142.0, 235.0, 407.0, 855.0, 1597.0, 3412.0, 8807.0, 29689.0, 164248.0, 1170160.0, 2223179.0, 492834.0, 70971.0, 16703.0, 5873.0, 2399.0, 1181.0, 635.0, 308.0, 187.0, 85.0, 51.0, 45.0, 28.0, 24.0, 9.0, 10.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.162109375, -0.157379150390625, -0.15264892578125, -0.147918701171875, -0.1431884765625, -0.138458251953125, -0.13372802734375, -0.128997802734375, -0.124267578125, -0.119537353515625, -0.11480712890625, -0.110076904296875, -0.1053466796875, -0.100616455078125, -0.09588623046875, -0.091156005859375, -0.08642578125, -0.081695556640625, -0.07696533203125, -0.072235107421875, -0.0675048828125, -0.062774658203125, -0.05804443359375, -0.053314208984375, -0.048583984375, -0.043853759765625, -0.03912353515625, -0.034393310546875, -0.0296630859375, -0.024932861328125, -0.02020263671875, -0.015472412109375, -0.0107421875, -0.006011962890625, -0.00128173828125, 0.003448486328125, 0.0081787109375, 0.012908935546875, 0.01763916015625, 0.022369384765625, 0.027099609375, 0.031829833984375, 0.03656005859375, 0.041290283203125, 0.0460205078125, 0.050750732421875, 0.05548095703125, 0.060211181640625, 0.06494140625, 0.069671630859375, 0.07440185546875, 0.079132080078125, 0.0838623046875, 0.088592529296875, 0.09332275390625, 0.098052978515625, 0.102783203125, 0.107513427734375, 0.11224365234375, 0.116973876953125, 0.1217041015625, 0.126434326171875, 0.13116455078125, 0.135894775390625, 0.140625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 12.0, 12.0, 9.0, 16.0, 14.0, 19.0, 41.0, 25.0, 18.0, 43.0, 46.0, 42.0, 34.0, 40.0, 51.0, 39.0, 52.0, 41.0, 59.0, 44.0, 41.0, 29.0, 31.0, 33.0, 31.0, 27.0, 28.0, 23.0, 16.0, 15.0, 16.0, 7.0, 16.0, 4.0, 3.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.07440185546875, -0.07224845886230469, -0.07009506225585938, -0.06794166564941406, -0.06578826904296875, -0.06363487243652344, -0.061481475830078125, -0.05932807922363281, -0.0571746826171875, -0.05502128601074219, -0.052867889404296875, -0.05071449279785156, -0.04856109619140625, -0.04640769958496094, -0.044254302978515625, -0.04210090637207031, -0.039947509765625, -0.03779411315917969, -0.035640716552734375, -0.03348731994628906, -0.03133392333984375, -0.029180526733398438, -0.027027130126953125, -0.024873733520507812, -0.0227203369140625, -0.020566940307617188, -0.018413543701171875, -0.016260147094726562, -0.01410675048828125, -0.011953353881835938, -0.009799957275390625, -0.0076465606689453125, -0.0054931640625, -0.0033397674560546875, -0.001186370849609375, 0.0009670257568359375, 0.00312042236328125, 0.0052738189697265625, 0.007427215576171875, 0.009580612182617188, 0.0117340087890625, 0.013887405395507812, 0.016040802001953125, 0.018194198608398438, 0.02034759521484375, 0.022500991821289062, 0.024654388427734375, 0.026807785034179688, 0.028961181640625, 0.031114578247070312, 0.033267974853515625, 0.03542137145996094, 0.03757476806640625, 0.03972816467285156, 0.041881561279296875, 0.04403495788574219, 0.0461883544921875, 0.04834175109863281, 0.050495147705078125, 0.05264854431152344, 0.05480194091796875, 0.05695533752441406, 0.059108734130859375, 0.06126213073730469, 0.06341552734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 8.0, 8.0, 13.0, 35.0, 54.0, 126.0, 310.0, 808.0, 2482.0, 64368.0, 4115554.0, 8126.0, 1473.0, 517.0, 209.0, 77.0, 42.0, 23.0, 7.0, 12.0, 7.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.23828125, -1.2021484375, -1.166015625, -1.1298828125, -1.09375, -1.0576171875, -1.021484375, -0.9853515625, -0.94921875, -0.9130859375, -0.876953125, -0.8408203125, -0.8046875, -0.7685546875, -0.732421875, -0.6962890625, -0.66015625, -0.6240234375, -0.587890625, -0.5517578125, -0.515625, -0.4794921875, -0.443359375, -0.4072265625, -0.37109375, -0.3349609375, -0.298828125, -0.2626953125, -0.2265625, -0.1904296875, -0.154296875, -0.1181640625, -0.08203125, -0.0458984375, -0.009765625, 0.0263671875, 0.0625, 0.0986328125, 0.134765625, 0.1708984375, 0.20703125, 0.2431640625, 0.279296875, 0.3154296875, 0.3515625, 0.3876953125, 0.423828125, 0.4599609375, 0.49609375, 0.5322265625, 0.568359375, 0.6044921875, 0.640625, 0.6767578125, 0.712890625, 0.7490234375, 0.78515625, 0.8212890625, 0.857421875, 0.8935546875, 0.9296875, 0.9658203125, 1.001953125, 1.0380859375, 1.07421875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 9.0, 27.0, 46.0, 145.0, 378.0, 957.0, 1412.0, 662.0, 261.0, 105.0, 46.0, 16.0, 11.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79052734375, -0.7681121826171875, -0.745697021484375, -0.7232818603515625, -0.70086669921875, -0.6784515380859375, -0.656036376953125, -0.6336212158203125, -0.6112060546875, -0.5887908935546875, -0.566375732421875, -0.5439605712890625, -0.52154541015625, -0.4991302490234375, -0.476715087890625, -0.4542999267578125, -0.431884765625, -0.4094696044921875, -0.387054443359375, -0.3646392822265625, -0.34222412109375, -0.3198089599609375, -0.297393798828125, -0.2749786376953125, -0.2525634765625, -0.2301483154296875, -0.207733154296875, -0.1853179931640625, -0.16290283203125, -0.1404876708984375, -0.118072509765625, -0.0956573486328125, -0.0732421875, -0.0508270263671875, -0.028411865234375, -0.0059967041015625, 0.01641845703125, 0.0388336181640625, 0.061248779296875, 0.0836639404296875, 0.1060791015625, 0.1284942626953125, 0.150909423828125, 0.1733245849609375, 0.19573974609375, 0.2181549072265625, 0.240570068359375, 0.2629852294921875, 0.285400390625, 0.3078155517578125, 0.330230712890625, 0.3526458740234375, 0.37506103515625, 0.3974761962890625, 0.419891357421875, 0.4423065185546875, 0.4647216796875, 0.4871368408203125, 0.509552001953125, 0.5319671630859375, 0.55438232421875, 0.5767974853515625, 0.599212646484375, 0.6216278076171875, 0.64404296875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 8.0, 7.0, 11.0, 8.0, 20.0, 43.0, 97.0, 156.0, 221.0, 179.0, 113.0, 53.0, 29.0, 11.0, 8.0, 6.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2617931365966797, -3.134150505065918, -3.0065078735351562, -2.8788652420043945, -2.751222610473633, -2.623579978942871, -2.4959373474121094, -2.3682947158813477, -2.240652084350586, -2.113009452819824, -1.9853668212890625, -1.8577241897583008, -1.730081558227539, -1.6024389266967773, -1.4747962951660156, -1.347153663635254, -1.2195110321044922, -1.0918684005737305, -0.9642257690429688, -0.836583137512207, -0.7089405059814453, -0.5812978744506836, -0.4536552429199219, -0.32601261138916016, -0.19836997985839844, -0.07072734832763672, 0.056915283203125, 0.18455791473388672, 0.31220054626464844, 0.43984317779541016, 0.5674858093261719, 0.6951284408569336, 0.8227715492248535, 0.9504141807556152, 1.078056812286377, 1.2056994438171387, 1.3333420753479004, 1.460984706878662, 1.5886273384094238, 1.7162699699401855, 1.8439126014709473, 1.971555233001709, 2.0991978645324707, 2.2268404960632324, 2.354483127593994, 2.482125759124756, 2.6097683906555176, 2.7374110221862793, 2.865053653717041, 2.9926962852478027, 3.1203389167785645, 3.247981548309326, 3.375624179840088, 3.5032668113708496, 3.6309094429016113, 3.758552074432373, 3.8861947059631348, 4.0138373374938965, 4.141479969024658, 4.26912260055542, 4.396765232086182, 4.524407863616943, 4.652050495147705, 4.779693126678467, 4.9073357582092285]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 5.0, 14.0, 8.0, 18.0, 26.0, 52.0, 41.0, 80.0, 64.0, 101.0, 114.0, 96.0, 82.0, 60.0, 58.0, 49.0, 36.0, 27.0, 20.0, 12.0, 3.0, 11.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.90010666847229, -1.7998974323272705, -1.699688196182251, -1.5994789600372314, -1.499269723892212, -1.3990604877471924, -1.2988513708114624, -1.1986421346664429, -1.0984328985214233, -0.9982236623764038, -0.8980144262313843, -0.7978052496910095, -0.69759601354599, -0.5973867774009705, -0.4971776008605957, -0.39696836471557617, -0.29675912857055664, -0.1965499073266983, -0.09634068608283997, 0.0038685202598571777, 0.10407775640487671, 0.20428699254989624, 0.304496169090271, 0.4047054052352905, 0.5049146413803101, 0.6051238775253296, 0.7053331136703491, 0.8055422902107239, 0.9057515263557434, 1.0059607028961182, 1.1061699390411377, 1.2063791751861572, 1.3065886497497559, 1.4067978858947754, 1.507007122039795, 1.6072163581848145, 1.707425594329834, 1.8076348304748535, 1.9078439474105835, 2.0080533027648926, 2.108262538909912, 2.2084717750549316, 2.308681011199951, 2.4088902473449707, 2.5090994834899902, 2.6093087196350098, 2.7095179557800293, 2.809727191925049, 2.9099361896514893, 3.010145425796509, 3.1103546619415283, 3.210563898086548, 3.3107731342315674, 3.410982370376587, 3.5111913681030273, 3.611400604248047, 3.7116098403930664, 3.811819076538086, 3.9120283126831055, 4.012237548828125, 4.1124467849731445, 4.212656021118164, 4.312865257263184, 4.413074493408203, 4.513283729553223]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 3.0, 7.0, 15.0, 19.0, 18.0, 39.0, 43.0, 90.0, 149.0, 301.0, 605.0, 1170.0, 2796.0, 7762.0, 29899.0, 197669.0, 703247.0, 79990.0, 16069.0, 4928.0, 1908.0, 836.0, 451.0, 207.0, 123.0, 67.0, 48.0, 34.0, 15.0, 12.0, 13.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1817626953125, -0.17595291137695312, -0.17014312744140625, -0.16433334350585938, -0.1585235595703125, -0.15271377563476562, -0.14690399169921875, -0.14109420776367188, -0.135284423828125, -0.12947463989257812, -0.12366485595703125, -0.11785507202148438, -0.1120452880859375, -0.10623550415039062, -0.10042572021484375, -0.09461593627929688, -0.08880615234375, -0.08299636840820312, -0.07718658447265625, -0.07137680053710938, -0.0655670166015625, -0.059757232666015625, -0.05394744873046875, -0.048137664794921875, -0.042327880859375, -0.036518096923828125, -0.03070831298828125, -0.024898529052734375, -0.0190887451171875, -0.013278961181640625, -0.00746917724609375, -0.001659393310546875, 0.004150390625, 0.009960174560546875, 0.01576995849609375, 0.021579742431640625, 0.0273895263671875, 0.033199310302734375, 0.03900909423828125, 0.044818878173828125, 0.050628662109375, 0.056438446044921875, 0.06224822998046875, 0.06805801391601562, 0.0738677978515625, 0.07967758178710938, 0.08548736572265625, 0.09129714965820312, 0.09710693359375, 0.10291671752929688, 0.10872650146484375, 0.11453628540039062, 0.1203460693359375, 0.12615585327148438, 0.13196563720703125, 0.13777542114257812, 0.143585205078125, 0.14939498901367188, 0.15520477294921875, 0.16101455688476562, 0.1668243408203125, 0.17263412475585938, 0.17844390869140625, 0.18425369262695312, 0.1900634765625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 8.0, 6.0, 11.0, 17.0, 17.0, 28.0, 31.0, 39.0, 44.0, 43.0, 57.0, 73.0, 91.0, 89.0, 81.0, 71.0, 65.0, 52.0, 33.0, 33.0, 23.0, 37.0, 10.0, 9.0, 12.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.158203125, -0.15298080444335938, -0.14775848388671875, -0.14253616333007812, -0.1373138427734375, -0.13209152221679688, -0.12686920166015625, -0.12164688110351562, -0.116424560546875, -0.11120223999023438, -0.10597991943359375, -0.10075759887695312, -0.0955352783203125, -0.09031295776367188, -0.08509063720703125, -0.07986831665039062, -0.07464599609375, -0.06942367553710938, -0.06420135498046875, -0.058979034423828125, -0.0537567138671875, -0.048534393310546875, -0.04331207275390625, -0.038089752197265625, -0.032867431640625, -0.027645111083984375, -0.02242279052734375, -0.017200469970703125, -0.0119781494140625, -0.006755828857421875, -0.00153350830078125, 0.003688812255859375, 0.0089111328125, 0.014133453369140625, 0.01935577392578125, 0.024578094482421875, 0.0298004150390625, 0.035022735595703125, 0.04024505615234375, 0.045467376708984375, 0.050689697265625, 0.055912017822265625, 0.06113433837890625, 0.06635665893554688, 0.0715789794921875, 0.07680130004882812, 0.08202362060546875, 0.08724594116210938, 0.09246826171875, 0.09769058227539062, 0.10291290283203125, 0.10813522338867188, 0.1133575439453125, 0.11857986450195312, 0.12380218505859375, 0.12902450561523438, 0.134246826171875, 0.13946914672851562, 0.14469146728515625, 0.14991378784179688, 0.1551361083984375, 0.16035842895507812, 0.16558074951171875, 0.17080307006835938, 0.176025390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 8.0, 8.0, 7.0, 18.0, 23.0, 25.0, 42.0, 66.0, 74.0, 121.0, 213.0, 397.0, 773.0, 2306.0, 12642.0, 323128.0, 691439.0, 13169.0, 2334.0, 778.0, 340.0, 207.0, 142.0, 88.0, 56.0, 36.0, 27.0, 25.0, 16.0, 8.0, 7.0, 6.0, 3.0, 3.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.27783203125, -0.26966285705566406, -0.2614936828613281, -0.2533245086669922, -0.24515533447265625, -0.2369861602783203, -0.22881698608398438, -0.22064781188964844, -0.2124786376953125, -0.20430946350097656, -0.19614028930664062, -0.1879711151123047, -0.17980194091796875, -0.1716327667236328, -0.16346359252929688, -0.15529441833496094, -0.147125244140625, -0.13895606994628906, -0.13078689575195312, -0.12261772155761719, -0.11444854736328125, -0.10627937316894531, -0.09811019897460938, -0.08994102478027344, -0.0817718505859375, -0.07360267639160156, -0.06543350219726562, -0.05726432800292969, -0.04909515380859375, -0.04092597961425781, -0.032756805419921875, -0.024587631225585938, -0.01641845703125, -0.008249282836914062, -8.0108642578125e-05, 0.008089065551757812, 0.01625823974609375, 0.024427413940429688, 0.032596588134765625, 0.04076576232910156, 0.0489349365234375, 0.05710411071777344, 0.06527328491210938, 0.07344245910644531, 0.08161163330078125, 0.08978080749511719, 0.09794998168945312, 0.10611915588378906, 0.114288330078125, 0.12245750427246094, 0.13062667846679688, 0.1387958526611328, 0.14696502685546875, 0.1551342010498047, 0.16330337524414062, 0.17147254943847656, 0.1796417236328125, 0.18781089782714844, 0.19598007202148438, 0.2041492462158203, 0.21231842041015625, 0.2204875946044922, 0.22865676879882812, 0.23682594299316406, 0.2449951171875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 11.0, 9.0, 12.0, 6.0, 13.0, 17.0, 22.0, 21.0, 29.0, 25.0, 35.0, 34.0, 40.0, 63.0, 75.0, 77.0, 66.0, 85.0, 48.0, 51.0, 45.0, 44.0, 18.0, 22.0, 20.0, 18.0, 11.0, 13.0, 9.0, 8.0, 10.0, 11.0, 2.0, 2.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.436767578125, -0.42220306396484375, -0.4076385498046875, -0.39307403564453125, -0.378509521484375, -0.36394500732421875, -0.3493804931640625, -0.33481597900390625, -0.32025146484375, -0.30568695068359375, -0.2911224365234375, -0.27655792236328125, -0.261993408203125, -0.24742889404296875, -0.2328643798828125, -0.21829986572265625, -0.2037353515625, -0.18917083740234375, -0.1746063232421875, -0.16004180908203125, -0.145477294921875, -0.13091278076171875, -0.1163482666015625, -0.10178375244140625, -0.08721923828125, -0.07265472412109375, -0.0580902099609375, -0.04352569580078125, -0.028961181640625, -0.01439666748046875, 0.0001678466796875, 0.01473236083984375, 0.029296875, 0.04386138916015625, 0.0584259033203125, 0.07299041748046875, 0.087554931640625, 0.10211944580078125, 0.1166839599609375, 0.13124847412109375, 0.14581298828125, 0.16037750244140625, 0.1749420166015625, 0.18950653076171875, 0.204071044921875, 0.21863555908203125, 0.2332000732421875, 0.24776458740234375, 0.2623291015625, 0.27689361572265625, 0.2914581298828125, 0.30602264404296875, 0.320587158203125, 0.33515167236328125, 0.3497161865234375, 0.36428070068359375, 0.37884521484375, 0.39340972900390625, 0.4079742431640625, 0.42253875732421875, 0.437103271484375, 0.45166778564453125, 0.4662322998046875, 0.48079681396484375, 0.495361328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 6.0, 4.0, 2.0, 9.0, 12.0, 9.0, 24.0, 28.0, 38.0, 47.0, 70.0, 99.0, 164.0, 246.0, 449.0, 837.0, 1822.0, 4302.0, 14074.0, 66201.0, 857625.0, 77845.0, 15938.0, 4791.0, 1831.0, 861.0, 427.0, 268.0, 166.0, 124.0, 64.0, 43.0, 29.0, 24.0, 10.0, 14.0, 16.0, 8.0, 3.0, 7.0, 2.0, 6.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0], "bins": [-0.033477783203125, -0.03253579139709473, -0.03159379959106445, -0.03065180778503418, -0.029709815979003906, -0.028767824172973633, -0.02782583236694336, -0.026883840560913086, -0.025941848754882812, -0.02499985694885254, -0.024057865142822266, -0.023115873336791992, -0.02217388153076172, -0.021231889724731445, -0.020289897918701172, -0.0193479061126709, -0.018405914306640625, -0.01746392250061035, -0.016521930694580078, -0.015579938888549805, -0.014637947082519531, -0.013695955276489258, -0.012753963470458984, -0.011811971664428711, -0.010869979858398438, -0.009927988052368164, -0.00898599624633789, -0.008044004440307617, -0.007102012634277344, -0.00616002082824707, -0.005218029022216797, -0.0042760372161865234, -0.00333404541015625, -0.0023920536041259766, -0.0014500617980957031, -0.0005080699920654297, 0.00043392181396484375, 0.0013759136199951172, 0.0023179054260253906, 0.003259897232055664, 0.0042018890380859375, 0.005143880844116211, 0.006085872650146484, 0.007027864456176758, 0.007969856262207031, 0.008911848068237305, 0.009853839874267578, 0.010795831680297852, 0.011737823486328125, 0.012679815292358398, 0.013621807098388672, 0.014563798904418945, 0.015505790710449219, 0.016447782516479492, 0.017389774322509766, 0.01833176612854004, 0.019273757934570312, 0.020215749740600586, 0.02115774154663086, 0.022099733352661133, 0.023041725158691406, 0.02398371696472168, 0.024925708770751953, 0.025867700576782227, 0.0268096923828125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 10.0, 6.0, 8.0, 12.0, 11.0, 17.0, 16.0, 28.0, 19.0, 26.0, 26.0, 35.0, 43.0, 47.0, 59.0, 72.0, 68.0, 72.0, 66.0, 57.0, 41.0, 31.0, 47.0, 21.0, 20.0, 17.0, 19.0, 12.0, 20.0, 13.0, 12.0, 7.0, 8.0, 4.0, 4.0, 4.0, 2.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3603439331054688e-05, -2.292729914188385e-05, -2.2251158952713013e-05, -2.1575018763542175e-05, -2.0898878574371338e-05, -2.02227383852005e-05, -1.9546598196029663e-05, -1.8870458006858826e-05, -1.8194317817687988e-05, -1.751817762851715e-05, -1.6842037439346313e-05, -1.6165897250175476e-05, -1.548975706100464e-05, -1.4813616871833801e-05, -1.4137476682662964e-05, -1.3461336493492126e-05, -1.2785196304321289e-05, -1.2109056115150452e-05, -1.1432915925979614e-05, -1.0756775736808777e-05, -1.008063554763794e-05, -9.404495358467102e-06, -8.728355169296265e-06, -8.052214980125427e-06, -7.37607479095459e-06, -6.6999346017837524e-06, -6.023794412612915e-06, -5.347654223442078e-06, -4.67151403427124e-06, -3.995373845100403e-06, -3.3192336559295654e-06, -2.643093466758728e-06, -1.9669532775878906e-06, -1.2908130884170532e-06, -6.146728992462158e-07, 6.146728992462158e-08, 7.37607479095459e-07, 1.4137476682662964e-06, 2.089887857437134e-06, 2.766028046607971e-06, 3.4421682357788086e-06, 4.118308424949646e-06, 4.794448614120483e-06, 5.470588803291321e-06, 6.146728992462158e-06, 6.822869181632996e-06, 7.499009370803833e-06, 8.17514955997467e-06, 8.851289749145508e-06, 9.527429938316345e-06, 1.0203570127487183e-05, 1.087971031665802e-05, 1.1555850505828857e-05, 1.2231990694999695e-05, 1.2908130884170532e-05, 1.358427107334137e-05, 1.4260411262512207e-05, 1.4936551451683044e-05, 1.5612691640853882e-05, 1.628883183002472e-05, 1.6964972019195557e-05, 1.7641112208366394e-05, 1.831725239753723e-05, 1.899339258670807e-05, 1.9669532775878906e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 12.0, 22.0, 21.0, 32.0, 46.0, 57.0, 102.0, 156.0, 278.0, 496.0, 873.0, 1589.0, 3334.0, 7394.0, 19243.0, 67570.0, 801957.0, 103562.0, 24596.0, 9043.0, 3944.0, 1891.0, 987.0, 506.0, 318.0, 198.0, 105.0, 73.0, 43.0, 31.0, 20.0, 14.0, 11.0, 6.0, 8.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0258331298828125, -0.02498936653137207, -0.02414560317993164, -0.02330183982849121, -0.02245807647705078, -0.02161431312561035, -0.020770549774169922, -0.019926786422729492, -0.019083023071289062, -0.018239259719848633, -0.017395496368408203, -0.016551733016967773, -0.015707969665527344, -0.014864206314086914, -0.014020442962646484, -0.013176679611206055, -0.012332916259765625, -0.011489152908325195, -0.010645389556884766, -0.009801626205444336, -0.008957862854003906, -0.008114099502563477, -0.007270336151123047, -0.006426572799682617, -0.0055828094482421875, -0.004739046096801758, -0.003895282745361328, -0.0030515193939208984, -0.0022077560424804688, -0.001363992691040039, -0.0005202293395996094, 0.0003235340118408203, 0.00116729736328125, 0.0020110607147216797, 0.0028548240661621094, 0.003698587417602539, 0.004542350769042969, 0.0053861141204833984, 0.006229877471923828, 0.007073640823364258, 0.007917404174804688, 0.008761167526245117, 0.009604930877685547, 0.010448694229125977, 0.011292457580566406, 0.012136220932006836, 0.012979984283447266, 0.013823747634887695, 0.014667510986328125, 0.015511274337768555, 0.016355037689208984, 0.017198801040649414, 0.018042564392089844, 0.018886327743530273, 0.019730091094970703, 0.020573854446411133, 0.021417617797851562, 0.022261381149291992, 0.023105144500732422, 0.02394890785217285, 0.02479267120361328, 0.02563643455505371, 0.02648019790649414, 0.02732396125793457, 0.028167724609375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 6.0, 13.0, 7.0, 12.0, 14.0, 22.0, 33.0, 67.0, 61.0, 89.0, 120.0, 122.0, 113.0, 94.0, 63.0, 42.0, 29.0, 29.0, 16.0, 17.0, 11.0, 6.0, 9.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.044403076171875, -0.042996883392333984, -0.04159069061279297, -0.04018449783325195, -0.03877830505371094, -0.03737211227416992, -0.035965919494628906, -0.03455972671508789, -0.033153533935546875, -0.03174734115600586, -0.030341148376464844, -0.028934955596923828, -0.027528762817382812, -0.026122570037841797, -0.02471637725830078, -0.023310184478759766, -0.02190399169921875, -0.020497798919677734, -0.01909160614013672, -0.017685413360595703, -0.016279220581054688, -0.014873027801513672, -0.013466835021972656, -0.01206064224243164, -0.010654449462890625, -0.00924825668334961, -0.007842063903808594, -0.006435871124267578, -0.0050296783447265625, -0.003623485565185547, -0.0022172927856445312, -0.0008111000061035156, 0.0005950927734375, 0.0020012855529785156, 0.0034074783325195312, 0.004813671112060547, 0.0062198638916015625, 0.007626056671142578, 0.009032249450683594, 0.01043844223022461, 0.011844635009765625, 0.01325082778930664, 0.014657020568847656, 0.016063213348388672, 0.017469406127929688, 0.018875598907470703, 0.02028179168701172, 0.021687984466552734, 0.02309417724609375, 0.024500370025634766, 0.02590656280517578, 0.027312755584716797, 0.028718948364257812, 0.030125141143798828, 0.031531333923339844, 0.03293752670288086, 0.034343719482421875, 0.03574991226196289, 0.037156105041503906, 0.03856229782104492, 0.03996849060058594, 0.04137468338012695, 0.04278087615966797, 0.044187068939208984, 0.04559326171875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 10.0, 11.0, 19.0, 37.0, 78.0, 359.0, 314.0, 69.0, 43.0, 21.0, 22.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1238476037979126, -1.064666986465454, -1.0054864883422852, -0.9463058710098267, -0.8871253728866577, -0.8279447555541992, -0.7687641978263855, -0.7095836400985718, -0.6504030823707581, -0.5912225246429443, -0.5320419669151306, -0.4728613793849945, -0.4136808216571808, -0.35450026392936707, -0.29531967639923096, -0.23613911867141724, -0.17695856094360352, -0.1177779957652092, -0.05859743058681488, 0.0005831420421600342, 0.059763699769973755, 0.11894425749778748, 0.17812484502792358, 0.2373054027557373, 0.296485960483551, 0.35566651821136475, 0.41484707593917847, 0.4740276634693146, 0.5332082509994507, 0.5923887491226196, 0.6515693664550781, 0.7107499241828918, 0.769930362701416, 0.8291109204292297, 0.8882914781570435, 0.947472095489502, 1.006652593612671, 1.0658332109451294, 1.125013828277588, 1.1841943264007568, 1.2433748245239258, 1.3025554418563843, 1.3617359399795532, 1.4209165573120117, 1.4800970554351807, 1.5392776727676392, 1.5984582901000977, 1.6576387882232666, 1.716819405555725, 1.7760000228881836, 1.8351805210113525, 1.894361138343811, 1.95354163646698, 2.0127222537994385, 2.0719027519226074, 2.1310834884643555, 2.1902639865875244, 2.2494444847106934, 2.3086252212524414, 2.3678057193756104, 2.4269862174987793, 2.4861667156219482, 2.5453474521636963, 2.6045279502868652, 2.663708448410034]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 10.0, 11.0, 13.0, 19.0, 18.0, 34.0, 38.0, 52.0, 67.0, 456.0, 65.0, 45.0, 49.0, 26.0, 31.0, 18.0, 16.0, 13.0, 7.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.0652060508728027, -2.983243227005005, -2.901280641555786, -2.8193178176879883, -2.7373549938201904, -2.6553921699523926, -2.573429584503174, -2.491466760635376, -2.409503936767578, -2.3275411128997803, -2.2455785274505615, -2.1636157035827637, -2.081652879714966, -1.9996901750564575, -1.9177274703979492, -1.8357646465301514, -1.7538020610809326, -1.6718393564224243, -1.5898765325546265, -1.5079138278961182, -1.4259510040283203, -1.343988299369812, -1.2620255947113037, -1.1800627708435059, -1.0981000661849976, -1.0161373615264893, -0.9341745376586914, -0.8522118330001831, -0.77024906873703, -0.688286304473877, -0.6063235998153687, -0.5243608355522156, -0.4423980712890625, -0.3604353070259094, -0.27847257256507874, -0.19650982320308685, -0.11454707384109497, -0.032584309577941895, 0.049378424882888794, 0.13134115934371948, 0.21330392360687256, 0.29526668787002563, 0.3772294223308563, 0.459192156791687, 0.5411549210548401, 0.6231176853179932, 0.7050803899765015, 0.7870431542396545, 0.8690059185028076, 0.9509686827659607, 1.0329314470291138, 1.114894151687622, 1.19685697555542, 1.2788196802139282, 1.3607823848724365, 1.4427452087402344, 1.5247079133987427, 1.606670618057251, 1.6886334419250488, 1.7705961465835571, 1.8525588512420654, 1.9345216751098633, 2.016484498977661, 2.09844708442688, 2.1804099082946777]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 2.0, 4.0, 4.0, 6.0, 8.0, 6.0, 12.0, 6.0, 20.0, 22.0, 16.0, 29.0, 25.0, 35.0, 46.0, 62.0, 160.0, 190.0, 59.0, 37.0, 30.0, 41.0, 30.0, 31.0, 21.0, 24.0, 29.0, 6.0, 2.0, 13.0, 4.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.123779296875, -0.11978340148925781, -0.11578750610351562, -0.11179161071777344, -0.10779571533203125, -0.10379981994628906, -0.09980392456054688, -0.09580802917480469, -0.0918121337890625, -0.08781623840332031, -0.08382034301757812, -0.07982444763183594, -0.07582855224609375, -0.07183265686035156, -0.06783676147460938, -0.06384086608886719, -0.059844970703125, -0.05584907531738281, -0.051853179931640625, -0.04785728454589844, -0.04386138916015625, -0.03986549377441406, -0.035869598388671875, -0.03187370300292969, -0.0278778076171875, -0.023881912231445312, -0.019886016845703125, -0.015890121459960938, -0.01189422607421875, -0.007898330688476562, -0.003902435302734375, 9.34600830078125e-05, 0.00408935546875, 0.008085250854492188, 0.012081146240234375, 0.016077041625976562, 0.02007293701171875, 0.024068832397460938, 0.028064727783203125, 0.03206062316894531, 0.0360565185546875, 0.04005241394042969, 0.044048309326171875, 0.04804420471191406, 0.05204010009765625, 0.05603599548339844, 0.060031890869140625, 0.06402778625488281, 0.068023681640625, 0.07201957702636719, 0.07601547241210938, 0.08001136779785156, 0.08400726318359375, 0.08800315856933594, 0.09199905395507812, 0.09599494934082031, 0.0999908447265625, 0.10398674011230469, 0.10798263549804688, 0.11197853088378906, 0.11597442626953125, 0.11997032165527344, 0.12396621704101562, 0.1279621124267578, 0.1319580078125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 5.0, 7.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 6.0, 13.0, 11.0, 12.0, 13.0, 25.0, 25.0, 51.0, 52.0, 109.0, 162.0, 336.0, 1140.0, 5338.0, 596042.0, 7777448.0, 5688.0, 1207.0, 383.0, 157.0, 130.0, 55.0, 45.0, 20.0, 17.0, 13.0, 14.0, 9.0, 3.0, 6.0, 8.0, 3.0, 0.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0761479139328003, -1.0425422191619873, -1.0089366436004639, -0.9753309488296509, -0.9417252540588379, -0.9081196188926697, -0.8745139837265015, -0.8409082889556885, -0.8073025941848755, -0.7736969590187073, -0.7400912642478943, -0.7064856290817261, -0.6728799343109131, -0.6392742991447449, -0.6056686639785767, -0.5720629692077637, -0.5384573340415955, -0.5048516988754272, -0.47124600410461426, -0.43764036893844604, -0.40403467416763306, -0.37042903900146484, -0.33682337403297424, -0.30321770906448364, -0.26961204409599304, -0.23600637912750244, -0.20240071415901184, -0.16879506409168243, -0.13518939912319183, -0.10158373415470123, -0.06797808408737183, -0.034372419118881226, -0.000766754150390625, 0.03283890709280968, 0.06644456833600998, 0.10005022585391998, 0.13365589082241058, 0.16726155579090118, 0.2008672058582306, 0.2344728708267212, 0.2680785357952118, 0.3016842007637024, 0.335289865732193, 0.3688955307006836, 0.4025011658668518, 0.4361068606376648, 0.469712495803833, 0.503318190574646, 0.5369238257408142, 0.5705294609069824, 0.6041351556777954, 0.6377407908439636, 0.6713464856147766, 0.7049521207809448, 0.7385578155517578, 0.772163450717926, 0.8057690858840942, 0.8393747210502625, 0.8729804158210754, 0.9065860509872437, 0.9401917457580566, 0.9737973809242249, 1.007403016090393, 1.041008710861206, 1.074614405632019]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 6.0, 4.0, 4.0, 4.0, 5.0, 4.0, 5.0, 3.0, 4.0, 9.0, 6.0, 5.0, 3.0, 3.0, 2.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.217621088027954, -2.162781000137329, -2.107941150665283, -2.053101062774658, -1.9982612133026123, -1.9434212446212769, -1.8885812759399414, -1.8337411880493164, -1.7789013385772705, -1.724061369895935, -1.6692214012145996, -1.6143814325332642, -1.5595414638519287, -1.5047014951705933, -1.4498615264892578, -1.3950214385986328, -1.3401814699172974, -1.285341501235962, -1.2305015325546265, -1.175661563873291, -1.1208215951919556, -1.0659816265106201, -1.0111415386199951, -0.9563016295433044, -0.901461660861969, -0.8466216921806335, -0.7917817234992981, -0.7369416952133179, -0.6821017265319824, -0.627261757850647, -0.5724217891693115, -0.5175818204879761, -0.4627417325973511, -0.4079017639160156, -0.3530617952346802, -0.29822179675102234, -0.2433818280696869, -0.18854185938835144, -0.1337018609046936, -0.07886189222335815, -0.024021923542022705, 0.03081805258989334, 0.08565802872180939, 0.14049801230430603, 0.19533798098564148, 0.25017794966697693, 0.30501794815063477, 0.3598579168319702, 0.41469788551330566, 0.4695378541946411, 0.5243778228759766, 0.579217791557312, 0.6340577602386475, 0.6888977289199829, 0.7437377572059631, 0.7985777258872986, 0.853417694568634, 0.9082576632499695, 0.9630976319313049, 1.0179376602172852, 1.0727776288986206, 1.127617597579956, 1.1824575662612915, 1.237297534942627, 1.2921375036239624]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 2.0, 9.0, 7.0, 5.0, 16.0, 10.0, 15.0, 14.0, 21.0, 26.0, 37.0, 32.0, 51.0, 53.0, 53.0, 63.0, 62.0, 59.0, 71.0, 51.0, 61.0, 31.0, 44.0, 42.0, 32.0, 24.0, 21.0, 17.0, 12.0, 9.0, 13.0, 11.0, 4.0, 4.0, 2.0, 7.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07977294921875, -0.07704925537109375, -0.0743255615234375, -0.07160186767578125, -0.068878173828125, -0.06615447998046875, -0.0634307861328125, -0.06070709228515625, -0.0579833984375, -0.05525970458984375, -0.0525360107421875, -0.04981231689453125, -0.047088623046875, -0.04436492919921875, -0.0416412353515625, -0.03891754150390625, -0.03619384765625, -0.03347015380859375, -0.0307464599609375, -0.02802276611328125, -0.025299072265625, -0.02257537841796875, -0.0198516845703125, -0.01712799072265625, -0.014404296875, -0.01168060302734375, -0.0089569091796875, -0.00623321533203125, -0.003509521484375, -0.00078582763671875, 0.0019378662109375, 0.00466156005859375, 0.00738525390625, 0.01010894775390625, 0.0128326416015625, 0.01555633544921875, 0.018280029296875, 0.02100372314453125, 0.0237274169921875, 0.02645111083984375, 0.0291748046875, 0.03189849853515625, 0.0346221923828125, 0.03734588623046875, 0.040069580078125, 0.04279327392578125, 0.0455169677734375, 0.04824066162109375, 0.05096435546875, 0.05368804931640625, 0.0564117431640625, 0.05913543701171875, 0.061859130859375, 0.06458282470703125, 0.0673065185546875, 0.07003021240234375, 0.07275390625, 0.07547760009765625, 0.0782012939453125, 0.08092498779296875, 0.083648681640625, 0.08637237548828125, 0.0890960693359375, 0.09181976318359375, 0.09454345703125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 9.0, 3.0, 10.0, 18.0, 12.0, 25.0, 22.0, 44.0, 67.0, 96.0, 147.0, 221.0, 379.0, 595.0, 1126.0, 2235.0, 5134.0, 12525.0, 32900.0, 93674.0, 193510.0, 114282.0, 40177.0, 14841.0, 5933.0, 2664.0, 1436.0, 757.0, 437.0, 305.0, 181.0, 136.0, 100.0, 57.0, 61.0, 43.0, 30.0, 18.0, 17.0, 11.0, 6.0, 3.0, 5.0, 7.0, 3.0, 5.0, 3.0, 2.0], "bins": [-0.74609375, -0.7257080078125, -0.705322265625, -0.6849365234375, -0.66455078125, -0.6441650390625, -0.623779296875, -0.6033935546875, -0.5830078125, -0.5626220703125, -0.542236328125, -0.5218505859375, -0.50146484375, -0.4810791015625, -0.460693359375, -0.4403076171875, -0.419921875, -0.3995361328125, -0.379150390625, -0.3587646484375, -0.33837890625, -0.3179931640625, -0.297607421875, -0.2772216796875, -0.2568359375, -0.2364501953125, -0.216064453125, -0.1956787109375, -0.17529296875, -0.1549072265625, -0.134521484375, -0.1141357421875, -0.09375, -0.0733642578125, -0.052978515625, -0.0325927734375, -0.01220703125, 0.0081787109375, 0.028564453125, 0.0489501953125, 0.0693359375, 0.0897216796875, 0.110107421875, 0.1304931640625, 0.15087890625, 0.1712646484375, 0.191650390625, 0.2120361328125, 0.232421875, 0.2528076171875, 0.273193359375, 0.2935791015625, 0.31396484375, 0.3343505859375, 0.354736328125, 0.3751220703125, 0.3955078125, 0.4158935546875, 0.436279296875, 0.4566650390625, 0.47705078125, 0.4974365234375, 0.517822265625, 0.5382080078125, 0.55859375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 8.0, 17.0, 10.0, 12.0, 23.0, 20.0, 28.0, 36.0, 24.0, 51.0, 42.0, 62.0, 60.0, 49.0, 50.0, 43.0, 66.0, 54.0, 46.0, 45.0, 41.0, 31.0, 29.0, 21.0, 23.0, 15.0, 15.0, 13.0, 8.0, 8.0, 7.0, 4.0, 6.0, 7.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0931396484375, -0.0901346206665039, -0.08712959289550781, -0.08412456512451172, -0.08111953735351562, -0.07811450958251953, -0.07510948181152344, -0.07210445404052734, -0.06909942626953125, -0.06609439849853516, -0.06308937072753906, -0.06008434295654297, -0.057079315185546875, -0.05407428741455078, -0.05106925964355469, -0.048064231872558594, -0.0450592041015625, -0.042054176330566406, -0.03904914855957031, -0.03604412078857422, -0.033039093017578125, -0.03003406524658203, -0.027029037475585938, -0.024024009704589844, -0.02101898193359375, -0.018013954162597656, -0.015008926391601562, -0.012003898620605469, -0.008998870849609375, -0.005993843078613281, -0.0029888153076171875, 1.621246337890625e-05, 0.003021240234375, 0.006026268005371094, 0.009031295776367188, 0.012036323547363281, 0.015041351318359375, 0.01804637908935547, 0.021051406860351562, 0.024056434631347656, 0.02706146240234375, 0.030066490173339844, 0.03307151794433594, 0.03607654571533203, 0.039081573486328125, 0.04208660125732422, 0.04509162902832031, 0.048096656799316406, 0.0511016845703125, 0.054106712341308594, 0.05711174011230469, 0.06011676788330078, 0.06312179565429688, 0.06612682342529297, 0.06913185119628906, 0.07213687896728516, 0.07514190673828125, 0.07814693450927734, 0.08115196228027344, 0.08415699005126953, 0.08716201782226562, 0.09016704559326172, 0.09317207336425781, 0.0961771011352539, 0.09918212890625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 6.0, 1.0, 12.0, 27.0, 44.0, 69.0, 76.0, 85.0, 57.0, 39.0, 26.0, 11.0, 7.0, 12.0, 3.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.044643759727478, -1.0165958404541016, -0.9885479807853699, -0.9605000615119934, -0.9324522018432617, -0.9044042825698853, -0.8763564229011536, -0.8483085036277771, -0.8202606439590454, -0.792212724685669, -0.7641648650169373, -0.7361169457435608, -0.7080690860748291, -0.6800211668014526, -0.651973307132721, -0.6239253878593445, -0.5958775281906128, -0.5678296089172363, -0.5397817492485046, -0.5117338299751282, -0.4836859703063965, -0.45563805103302, -0.42759019136428833, -0.39954227209091187, -0.3714943528175354, -0.3434464633464813, -0.31539857387542725, -0.28735068440437317, -0.2593027949333191, -0.23125489056110382, -0.20320700109004974, -0.17515911161899567, -0.14711123704910278, -0.1190633475780487, -0.09101545810699463, -0.06296756118535995, -0.03491967171430588, -0.006871774792671204, 0.021176114678382874, 0.04922400414943695, 0.07727189362049103, 0.1053197830915451, 0.13336767256259918, 0.16141557693481445, 0.18946346640586853, 0.2175113558769226, 0.24555924534797668, 0.27360713481903076, 0.30165502429008484, 0.3297029137611389, 0.357750803232193, 0.38579869270324707, 0.41384658217430115, 0.4418944716453552, 0.4699423909187317, 0.4979902505874634, 0.5260381698608398, 0.5540860891342163, 0.582133948802948, 0.6101818680763245, 0.6382297277450562, 0.6662776470184326, 0.6943255066871643, 0.7223734259605408, 0.7504212856292725]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 7.0, 6.0, 7.0, 13.0, 19.0, 50.0, 44.0, 71.0, 55.0, 50.0, 29.0, 31.0, 15.0, 12.0, 7.0, 6.0, 5.0, 5.0, 4.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42098671197891235, -0.4044722318649292, -0.38795772194862366, -0.3714432418346405, -0.35492876172065735, -0.3384142518043518, -0.32189977169036865, -0.3053852915763855, -0.28887081146240234, -0.2723563313484192, -0.25584182143211365, -0.2393273413181305, -0.22281286120414734, -0.206298366189003, -0.18978387117385864, -0.1732693910598755, -0.15675488114356995, -0.1402403861284256, -0.12372590601444244, -0.1072114109992981, -0.09069692343473434, -0.0741824358701706, -0.057667940855026245, -0.041153453290462494, -0.024638965725898743, -0.008124476298689842, 0.008390013128519058, 0.024904504418373108, 0.04141899198293686, 0.05793347954750061, 0.07444797456264496, 0.09096246212720871, 0.10747694969177246, 0.12399143725633621, 0.14050592482089996, 0.1570204198360443, 0.17353489995002747, 0.19004939496517181, 0.20656388998031616, 0.22307837009429932, 0.23959286510944366, 0.256107360124588, 0.27262184023857117, 0.2891363501548767, 0.30565083026885986, 0.322165310382843, 0.33867979049682617, 0.3551943004131317, 0.37170878052711487, 0.388223260641098, 0.40473777055740356, 0.4212522506713867, 0.4377667307853699, 0.454281210899353, 0.47079572081565857, 0.4873102009296417, 0.5038247108459473, 0.5203391909599304, 0.5368536710739136, 0.5533682107925415, 0.5698826909065247, 0.5863971710205078, 0.602911651134491, 0.6194261312484741, 0.6359406113624573]}, "_wandb": {"runtime": 2391}} \ No newline at end of file